From 7bbd7e84c136e67fb854ff3b0fe951222a718ff7 Mon Sep 17 00:00:00 2001
From: "Documenter.jl"
Date: Wed, 3 Jul 2024 16:16:43 +0000
Subject: [PATCH] build based on 5ca73e4

Home · JudiLing.jl

JudiLing

JudiLing: An implementation for Linear Discriminative Learning in Julia

Maintainer: Maria Heitmeier @MariaHei
Original codebase: Xuefeng Luo @MegamindHenry

Installation

You can install JudiLing with the following commands:

using Pkg
Pkg.add("JudiLing")

For brave adventurers, install the test version of JudiLing with:

julia> Pkg.add(url="https://github.com/quantling/JudiLing.jl.git")

Or from the Julia REPL, type ] to enter the Pkg REPL mode and run

pkg> add https://github.com/quantling/JudiLing.jl.git

Running Julia with multiple threads

JudiLing supports the use of multiple threads. Simply start up Julia in your terminal as follows:

$ julia -t your_num_of_threads

For detailed information on using Julia with threads, see the Julia documentation on multi-threading.
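You can confirm the thread count from inside Julia (a quick sanity check, not part of the original instructions):

julia> Threads.nthreads()
4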

Include packages

Before we start, we first need to load the JudiLing package:

using JudiLing

Note: As of JudiLing 0.8.0, PyCall and Flux have become optional dependencies. This means that all code in JudiLing which requires calls to Python is only available if PyCall is loaded first, like this:

using PyCall
using JudiLing

Likewise, the code involving deep learning is only available if Julia's deep learning library Flux is loaded first, like this:

using Flux
using JudiLing

Note that Flux and PyCall have to be installed separately, and the newest version of Flux requires at least Julia 1.9. If you want to run deep learning on a GPU, make sure to also install and import CUDA.

Quick start example

The Latin dataset latin.csv contains lexemes and inflectional features for 672 inflected Latin verb forms for 8 lexemes from 4 conjugation classes. Word forms are inflected for person, number, tense, voice and mood.

"","Word","Lexeme","Person","Number","Tense","Voice","Mood"
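The full quick start walks through building the cue and semantic matrices, learning the mappings, and evaluating them; only its final accuracy check survives in this diff. As a rough sketch of that workflow (a minimal example following the JudiLing API documented in the manual pages, not the verbatim quick-start code):

using JudiLing, CSV, DataFrames

latin = DataFrame(CSV.File("latin.csv"))

# build the cue matrix C from triphones of the word forms
cue_obj = JudiLing.make_cue_matrix(latin, grams = 3, target_col = :Word)

# simulate a semantic matrix S from lexemes and inflectional features
S = JudiLing.make_S_matrix(latin, [:Lexeme],
    [:Person, :Number, :Tense, :Voice, :Mood], ncol = size(cue_obj.C, 2))

# learn the comprehension (F) and production (G) mappings
F = JudiLing.make_transform_matrix(cue_obj.C, S)
G = JudiLing.make_transform_matrix(S, cue_obj.C)

# evaluate comprehension and production accuracy
@show JudiLing.eval_SC(cue_obj.C * F, S)
@show JudiLing.eval_SC(S * G, cue_obj.C)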
@show acc_build_val

Output:

acc_learn_train = 0.9983
acc_learn_val = 0.6866
acc_build_train = 1.0
acc_build_val = 0.3284

Alternatively, we provide a wrapper function that incorporates all of the above functionality. With this function, you can quickly explore datasets under different parameter settings. Please find more details in the Test Combo Introduction.

Supports

The outputs contain two types of support: an utterance-level support and a set of supports for each cue. The former is also called "synthesis-by-analysis" support; it is calculated from the predicted and original S vectors and is used to select the best paths. Cue-level supports are slices of the Yt matrices at each timestep; they are used to determine whether a cue is eligible for constructing paths.

Acknowledgments

This project was supported by the ERC advanced grant WIDE-742545 and by the Deutsche Forschungsgemeinschaft (DFG, German Research Foundation) under Germany’s Excellence Strategy - EXC number 2064/1 - Project number 390727645.

Citation

If you find this package helpful, please cite it as follows:

Luo, X., Heitmeier, M., Chuang, Y. Y., Baayen, R. H. JudiLing: an implementation of the Discriminative Lexicon Model in Julia. Eberhard Karls Universität Tübingen, Seminar für Sprachwissenschaft.

The following studies have made use of several algorithms now implemented in JudiLing instead of WpmWithLdl:

  • Baayen, R. H., Chuang, Y. Y., Shafaei-Bajestan, E., and Blevins, J. P. (2019). The discriminative lexicon: A unified computational model for the lexicon and lexical processing in comprehension and production grounded not in (de)composition but in linear discriminative learning. Complexity, 2019, 1-39.

  • Baayen, R. H., Chuang, Y. Y., and Blevins, J. P. (2018). Inflectional morphology with linear mappings. The Mental Lexicon, 13 (2), 232-270.

  • Chuang, Y.-Y., Lõo, K., Blevins, J. P., and Baayen, R. H. (2020). Estonian case inflection made simple. A case study in Word and Paradigm morphology with Linear Discriminative Learning. In Körtvélyessy, L., and Štekauer, P. (Eds.) Complex Words: Advances in Morphology, 1-19.

  • Chuang, Y.-Y., Bell, M. J., Banke, I., and Baayen, R. H. (2020). Bilingual and multilingual mental lexicon: a modeling study with Linear Discriminative Learning. Language Learning, 1-55.

  • Heitmeier, M., Chuang, Y.-Y., and Baayen, R. H. (2021). Modeling morphology with Linear Discriminative Learning: considerations and design choices. Frontiers in Psychology, 12, 4929.

  • Denistia, K., and Baayen, R. H. (2022). The morphology of Indonesian: Data and quantitative modeling. In Shei, C., and Li, S. (Eds.) The Routledge Handbook of Asian Linguistics, (pp. 605-634). Routledge, London.

  • Heitmeier, M., Chuang, Y.-Y., and Baayen, R. H. (2023). How trial-to-trial learning shapes mappings in the mental lexicon: Modelling lexical decision with linear discriminative learning. Cognitive Psychology, 1-30.

  • Chuang, Y. Y., Kang, M., Luo, X. F. and Baayen, R. H. (2023). Vector Space Morphology with Linear Discriminative Learning. In Crepaldi, D. (Ed.) Linguistic morphology in the mind and brain.

  • Heitmeier, M., Chuang, Y. Y., Axen, S. D., & Baayen, R. H. (2024). Frequency effects in linear discriminative learning. Frontiers in Human Neuroscience, 17, 1242720.

  • Plag, I., Heitmeier, M. & Domahs, F. (to appear). German nominal number interpretation in an impaired mental lexicon: A naive discriminative learning perspective. The Mental Lexicon.

All Manual index · JudiLing.jl

Cholesky · JudiLing.jl

Cholesky

JudiLing.make_transform_facFunction

The first part of making the transformation matrix, usually used by the learn_paths function to save time and computing resources.

source
JudiLing.make_transform_matrixMethod
make_transform_matrix(fac::Union{LinearAlgebra.Cholesky, SuiteSparse.CHOLMOD.Factor}, X::Union{SparseMatrixCSC, Matrix}, Y::Union{SparseMatrixCSC, Matrix})

Second step in calculating the Cholesky decomposition for the transformation matrix.

source
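To see how the two steps fit together, here is a minimal sketch (reusing the cue_obj and S names from the examples in this manual; this is not an example from the original docstring):

# step 1: factorize the C matrix once
fac_C = JudiLing.make_transform_fac(cue_obj.C)

# step 2: reuse the factorization to solve for the mapping from C to S
F = JudiLing.make_transform_matrix(fac_C, cue_obj.C, S)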
JudiLing.make_transform_matrixMethod
make_transform_matrix(X::SparseMatrixCSC, Y::Matrix)

Use Cholesky decomposition to calculate the transformation matrix from X to Y, where X is a sparse matrix and Y is a dense matrix.

Obligatory Arguments

  • X::SparseMatrixCSC: the X matrix, where X is a sparse matrix
  • Y::Matrix: the Y matrix, where Y is a dense matrix

Optional Arguments

  • method::Symbol = :additive: whether :additive or :multiplicative decomposition is required
  • shift::Float64 = 0.02: shift value for :additive decomposition
  • multiplier::Float64 = 1.01: multiplier value for :multiplicative decomposition
  • output_format::Symbol = :auto: force the output format to dense (:dense) or sparse (:sparse); with :auto the format is determined by the program
  • sparse_ratio::Float64 = 0.05: the ratio to decide whether a matrix is sparse
  • verbose::Bool = false: if true, more information will be printed out

Examples

# additive mode
 JudiLing.make_transform_matrix(
     C,
     S,
   ...
     output_format = :auto,
     sparse_ratio = 0.05,
    ...)
source
JudiLing.make_transform_matrixMethod
make_transform_matrix(X::Matrix, Y::Union{SparseMatrixCSC, Matrix})

Use the Cholesky decomposition to calculate the transformation matrix from X to Y, where X is a dense matrix and Y is either a dense matrix or a sparse matrix.

Obligatory Arguments

  • X::Matrix: the X matrix, where X is a dense matrix
  • Y::Union{SparseMatrixCSC, Matrix}: the Y matrix, where Y is either a sparse or a dense matrix

Optional Arguments

  • method::Symbol = :additive: whether :additive or :multiplicative decomposition is required
  • shift::Float64 = 0.02: shift value for :additive decomposition
  • multiplier::Float64 = 1.01: multiplier value for :multiplicative decomposition
  • output_format::Symbol = :auto: force the output format to dense (:dense) or sparse (:sparse); with :auto the format is determined by the program
  • sparse_ratio::Float64 = 0.05: the ratio to decide whether a matrix is sparse
  • verbose::Bool = false: if true, more information will be printed out

Examples

# additive mode
 JudiLing.make_transform_matrix(
     C,
     S,
     ...
     output_format = :auto,
     sparse_ratio = 0.05,
    ...)
source
JudiLing.make_transform_matrixMethod
make_transform_matrix(X::SparseMatrixCSC, Y::SparseMatrixCSC)

Use the Cholesky decomposition to calculate the transformation matrix from X to Y, where X is a sparse matrix and Y is a sparse matrix.

Obligatory Arguments

  • X::SparseMatrixCSC: the X matrix, where X is a sparse matrix
  • Y::SparseMatrixCSC: the Y matrix, where Y is a sparse matrix

Optional Arguments

  • method::Symbol = :additive: whether :additive or :multiplicative decomposition is required
  • shift::Float64 = 0.02: shift value for :additive decomposition
  • multiplier::Float64 = 1.01: multiplier value for :multiplicative decomposition
  • output_format::Symbol = :auto: force the output format to dense (:dense) or sparse (:sparse); with :auto the format is determined by the program
  • sparse_ratio::Float64 = 0.05: the ratio to decide whether a matrix is sparse
  • verbose::Bool = false: if true, more information will be printed out

Examples

# additive mode
 JudiLing.make_transform_matrix(
     C,
     S,
     ...
     output_format = :auto,
     sparse_ratio = 0.05,
    ...)
source
JudiLing.format_matrixFunction
format_matrix(M::Union{SparseMatrixCSC, Matrix}, output_format=:auto)

Convert output matrix format to either a dense matrix or a sparse matrix.

source
Deep learning · JudiLing.jl

Deep learning in JudiLing

JudiLing.predict_from_deep_modelMethod
predict_from_deep_model(model::Chain,
                        X::Union{SparseMatrixCSC,Matrix})

Generates output of a model given input X.

Obligatory arguments

  • model::Chain: Model of type Flux.Chain, as generated by get_and_train_model
  • X::Union{SparseMatrixCSC,Matrix}: Input matrix of size (number_of_samples, inp_dim) where inp_dim is the input dimension of model
source
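A minimal usage sketch (assuming res is the named tuple returned by get_and_train_model below, and cue_obj_val and S_val are the validation cue object and semantic matrix; not from the original docstring):

Shat_val = JudiLing.predict_from_deep_model(res.model, cue_obj_val.C)
JudiLing.eval_SC(Shat_val, S_val)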
JudiLing.predict_shatMethod
predict_shat(model::Chain,
+             ci::Vector{Int})

Predicts the semantic vector shat, given a deep learning comprehension model (model) and a list of ngram indices (ci).

Obligatory arguments

  • model::Chain: Deep learning comprehension model as generated by get_and_train_model
  • ci::Vector{Int}: Vector of indices of ngrams in c vector. Essentially, this is a vector indicating which ngrams in a c vector are absent and which are present.
source
JudiLing.get_and_train_modelMethod
get_and_train_model(X_train::Union{SparseMatrixCSC,Matrix},
                     Y_train::Union{SparseMatrixCSC,Matrix},
                     X_val::Union{SparseMatrixCSC,Matrix,Missing},
                     Y_val::Union{SparseMatrixCSC,Matrix,Missing},
                     ...kargs
                     )

Trains a deep learning model from X_train to Y_train, saving the model with either the highest validation accuracy or lowest validation loss (depending on optimise_for_acc) to model_outpath.

The default model looks like this:

inp_dim = size(X_train, 2)
 out_dim = size(Y_train, 2)
Chain(Dense(inp_dim => hidden_dim, relu), Dense(hidden_dim => out_dim))

Any other model with the same input and output dimensions can be provided to the function with the model argument. The default loss function is mean squared error, but any other loss function can be provided, as long as it fits with the model architecture.

By default the adam optimizer (Kingma and Ba, 2015) with learning rate 0.001 is used. You can provide any other optimizer. If you want to use a different learning rate, e.g. 0.01, provide optimizer=Flux.Adam(0.01). If you do not want to use an optimizer at all, and simply use normal gradient descent, provide optimizer=Descent(0.001), again replacing the learning rate with the learning rate of your preference.

Returns a named tuple with the following values:

  • model: the trained model
  • data_train: the training data, including any measures if computed by measures_func
  • data_val: the validation data, including any measures if computed by measures_func
  • losses_train: The losses of the training data for each epoch.
  • losses_val: The losses of the validation data after each epoch.
  • accs_train: The accuracies of the training data after each epoch, if return_train_acc=true.
  • accs_val: The accuracies of the validation data after each epoch.

Obligatory arguments

  • X_train::Union{SparseMatrixCSC,Matrix}: training input matrix of dimension m x n
  • Y_train::Union{SparseMatrixCSC,Matrix}: training output/target matrix of dimension m x k
  • X_val::Union{SparseMatrixCSC,Matrix,Missing}: validation input matrix of dimension l x n
  • Y_val::Union{SparseMatrixCSC,Matrix,Missing}: validation output/target matrix of dimension l x k
  • data_train::DataFrame: training data
  • data_val::DataFrame: validation data
  • target_col::Union{Symbol, String}: column with target wordforms in data_train and data_val
  • model_outpath::String: filepath to where final model should be stored (in .bson format)

Optional arguments

  • hidden_dim::Int=1000: hidden dimension of the model
  • n_epochs::Int=100: number of epochs for which the model should be trained
  • batchsize::Int=64: batchsize during training
  • loss_func::Function=Flux.mse: Loss function. Per default this is the mse loss, but other options might be a crossentropy loss (Flux.crossentropy). Make sure the model makes sense with the loss function!
  • optimizer=Flux.Adam(0.001): optimizer to use for training
  • model::Union{Missing, Chain} = missing: A custom model can be provided for training. Its requirements are that it has to correspond to the input and output size of the training and validation data
  • early_stopping::Union{Missing, Int}=missing: If missing, no early stopping is used. Otherwise early_stopping indicates how many epochs have to pass without improvement in validation accuracy before the training is stopped.
  • optimise_for_acc::Bool=false: if true, keep model with highest validation accuracy. If false, keep model with lowest validation loss.
  • return_losses::Bool=false: whether, in addition to the model, the per-epoch losses for the training and validation data as well as the per-epoch accuracies on the validation data should be returned
  • verbose::Bool=true: Turn on verbose mode
  • measures_func::Union{Missing, Function}=missing: A measures function which is run at the end of every epoch. For more information see The measures_func argument. If a measure is tagged for each epoch, the one tagged with "final" will be the one for the finally returned model.
  • return_train_acc::Bool=false: If true, a vector with training accuracies is returned at the end of the training.
  • ...kargs: any additional keyword arguments are passed to the measures_func
source
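A usage sketch with a train/validation split (the matrix and data names follow the quick start; the hyperparameter values are illustrative, not recommendations from the original docstring):

using Flux, JudiLing

res = JudiLing.get_and_train_model(
    cue_obj_train.C, S_train, cue_obj_val.C, S_val,
    latin_train, latin_val, :Word, "latin_model.bson",
    n_epochs = 100, early_stopping = 10, optimise_for_acc = true)

res.model     # the trained Flux chain
res.accs_val  # per-epoch validation accuracies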
JudiLing.get_and_train_modelMethod
get_and_train_model(X_train::Union{SparseMatrixCSC,Matrix},
                     Y_train::Union{SparseMatrixCSC,Matrix},
                     model_outpath::String;
                     data_train::Union{Missing, DataFrame}=missing,
                     return_train_acc::Bool=false,
                     ...kargs)

Trains a deep learning model from X_train to Y_train, saving the model after n_epochs epochs. The default model looks like this:

inp_dim = size(X_train, 2)
 out_dim = size(Y_train, 2)
Chain(Dense(inp_dim => hidden_dim, relu), Dense(hidden_dim => out_dim))

Any other model with the same input and output dimensions can be provided to the function with the model argument. The default loss function is mean squared error, but any other loss function can be provided, as long as it fits with the model architecture.

By default the adam optimizer (Kingma and Ba, 2015) with learning rate 0.001 is used. You can provide any other optimizer. If you want to use a different learning rate, e.g. 0.01, provide optimizer=Flux.Adam(0.01). If you do not want to use an optimizer at all, and simply use normal gradient descent, provide optimizer=Descent(0.001), again replacing the learning rate with the learning rate of your preference.

Returns a named tuple with the following values:

  • model: the trained model
  • data_train: the data, including any measures if computed by measures_func
  • data_val: missing for this function
  • losses_train: The losses of the training data for each epoch.
  • losses_val: missing for this function
  • accs_train: The accuracies of the training data after each epoch, if return_train_acc=true.
  • accs_val: missing for this function

Obligatory arguments

  • X_train::Union{SparseMatrixCSC,Matrix}: training input matrix of dimension m x n
  • Y_train::Union{SparseMatrixCSC,Matrix}: training output/target matrix of dimension m x k
  • model_outpath::String: filepath to where final model should be stored (in .bson format)

Optional arguments

  • data_train::Union{Missing, DataFrame}=missing: The training data. Only necessary if a measures_func is included or return_train_acc=true.
  • target_col::Union{Missing, Symbol, String}=missing: The column with target word forms in the training data. Only necessary if a measures_func is included or return_train_acc=true.
  • hidden_dim::Int=1000: hidden dimension of the model
  • n_epochs::Int=100: number of epochs for which the model should be trained
  • batchsize::Int=64: batchsize during training
  • loss_func::Function=Flux.mse: Loss function. Per default this is the mse loss, but other options might be a crossentropy loss (Flux.crossentropy). Make sure the model makes sense with the loss function!
  • optimizer=Flux.Adam(0.001): optimizer to use for training
  • model::Union{Missing, Chain} = missing: A custom model can be provided for training. Its requirements are that it has to correspond to the input and output size of the training and validation data
  • return_losses::Bool=false: whether, in addition to the model, the per-epoch losses for the training and validation data as well as the per-epoch accuracies on the validation data should be returned
  • verbose::Bool=true: Turn on verbose mode
  • measures_func::Union{Missing, Function}=missing: A measures function which is run at the end of every epoch. For more information see The measures_func argument.
  • return_train_acc::Bool=false: If true, a vector with training accuracies is returned at the end of the training.
  • ...kargs: any additional keyword arguments are passed to the measures_func
source
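A usage sketch for this train-only method (cue_obj, S and latin as in the quick start; the hyperparameter values are illustrative):

using Flux, JudiLing

res = JudiLing.get_and_train_model(cue_obj.C, S, "latin_model.bson",
    data_train = latin, target_col = :Word,
    hidden_dim = 500, n_epochs = 50, batchsize = 32)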
JudiLing.fiddlMethod
fiddl(X_train::Union{SparseMatrixCSC,Matrix},
         Y_train::Union{SparseMatrixCSC,Matrix},
         learn_seq::Vector,
         data::DataFrame,
         n_batch_eval::Int=100,
         compute_accuracy::Bool=true,
         measures_func::Union{Function, Missing}=missing,
        kargs...)

Trains a deep learning model using the FIDDL method (frequency-informed deep discriminative learning). Optionally, measures_func can be run every n_batch_eval batches to compute measures which are then added to the data.

Note

If you get an OutOfMemory error, chances are that this is due to the eval_SC function being evaluated every n_batch_eval batches. Setting compute_accuracy=false disables computing the mapping accuracy.

Returns a named tuple with the following values:

  • model: the trained model
  • data: the data, including any measures if computed by measures_func
  • losses_train: The losses of the data the model is trained on within each n_batch_eval batches.
  • losses: The losses of the full dataset after each n_batch_eval batches.
  • accs: The accuracies of the full dataset after each n_batch_eval batches.

Obligatory arguments

  • X_train::Union{SparseMatrixCSC,Matrix}: training input matrix of dimension m x n
  • Y_train::Union{SparseMatrixCSC,Matrix}: training output/target matrix of dimension m x k
  • learn_seq::Vector: List of indices in the order that the vectors in X_train and Y_train should be presented to the model for training.
  • data::DataFrame: The full data.
  • target_col::Union{Symbol, String}: The column with target word forms in the data.
  • model_outpath::String: filepath to where final model should be stored (in .bson format)

Optional arguments

  • hidden_dim::Int=1000: hidden dimension of the model
  • n_epochs::Int=100: number of epochs for which the model should be trained
  • batchsize::Int=64: batchsize during training
  • loss_func::Function=Flux.mse: Loss function. Per default this is the mse loss, but other options might be a crossentropy loss (Flux.crossentropy). Make sure the model makes sense with the loss function!
  • optimizer=Flux.Adam(0.001): optimizer to use for training
  • model::Union{Missing, Chain} = missing: A custom model can be provided for training. Its requirements are that it has to correspond to the input and output size of the training and validation data
  • return_losses::Bool=false: whether, in addition to the model, the per-epoch losses for the training and validation data as well as the per-epoch accuracies on the validation data should be returned
  • verbose::Bool=true: Turn on verbose mode
  • n_batch_eval::Int=100: Loss, accuracy and measures_func are evaluated every n_batch_eval batches.
  • compute_accuracy::Bool=true: Whether accuracy should be computed every n_batch_eval batches.
  • measures_func::Union{Missing, Function}=missing: A measures function which is run every n_batch_eval batches. For more information see The measures_func argument.
source
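A usage sketch (the learn_seq construction assumes a hypothetical Frequency column; build the learning sequence however your data defines it):

using Random, DataFrames

# present each word as often as its (hypothetical) frequency, in random order
learn_seq = shuffle(vcat([fill(i, latin.Frequency[i]) for i in 1:nrow(latin)]...))

res_fiddl = JudiLing.fiddl(cue_obj.C, S, learn_seq, latin, :Word,
    "latin_fiddl.bson", n_batch_eval = 50)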
Display · JudiLing.jl


Display

JudiLing.display_matrixMethod
display_matrix(data, target_col, cue_pS_obj, M, M_type)

Display a matrix with row names and column names.

Obligatory Arguments

  • data::DataFrame: the dataset
  • target_col::Union{String, Symbol}: the target column name
  • cue_pS_obj::Union{Cue_Matrix_Struct,PS_Matrix_Struct}: the cue matrix or pS matrix structure
  • M::Union{SparseMatrixCSC, Matrix}: the matrix
  • M_type::Union{String, Symbol}: the type of the matrix; currently supported are :C, :S, :F, :G, :Chat, :Shat, :A, :R and :pS

Optional Arguments

  • nrow::Int64 = 6: the number of rows to display
  • ncol::Int64 = 6: the number of columns to display
  • return_matrix::Bool = false: whether the created dataframe should be returned (and not only displayed)

Examples

JudiLing.display_matrix(latin, :Word, cue_obj, cue_obj.C, :C)
 JudiLing.display_matrix(latin, :Word, cue_obj, S, :S)
 JudiLing.display_matrix(latin, :Word, cue_obj, G, :G)
 JudiLing.display_matrix(latin, :Word, cue_obj, Chat, :Chat)
 JudiLing.display_matrix(latin, :Word, cue_obj, Shat, :Shat)
 JudiLing.display_matrix(latin, :Word, cue_obj, A, :A)
 JudiLing.display_matrix(latin, :Word, cue_obj, R, :R)
JudiLing.display_matrix(latin, :Word, pS_obj, pS_obj.pS, :pS)
source
Evaluation · JudiLing.jl


Evaluation

JudiLing.eval_SCFunction

Assess model accuracy on the basis of the correlations of row vectors of Chat and C or Shat and S. Ideally the target words have highest correlations on the diagonal of the pertinent correlation matrices. A homophone-support option is implemented.

source
JudiLing.eval_SC_looseFunction

Assess model accuracy on the basis of the correlations of row vectors of Chat and C or Shat and S. Count it as correct if one of the top k candidates is correct. A homophone-support option is implemented.

source
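For instance, a top-5 evaluation might look like this (a sketch, with Shat_val and S_val as in the quick start and the third positional argument taken to be k):

JudiLing.eval_SC_loose(Shat_val, S_val, 5)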
JudiLing.accuracy_comprehensionMethod
accuracy_comprehension(S, Shat, data)

Evaluate comprehension accuracy for training data.

Note

In case of homophones/homographs in the dataset, the correct/incorrect values for base and inflections may be misleading! See below for more information.

Obligatory Arguments

  • S::Matrix: the (gold standard) S matrix
  • Shat::Matrix: the (predicted) Shat matrix
  • data::DataFrame: the dataset

Optional Arguments

  • target_col::Union{String, Symbol}=:Words: the column name for target strings
  • base::Vector=nothing: base features (typically a lexeme)
  • inflections::Union{Nothing, Vector}=nothing: other features (typically in inflectional features)

Examples

accuracy_comprehension(
     S_train,
     Shat_train,
     latin_val,
     target_col=:Words,
     base=[:Lexeme],
     inflections=[:Person, :Number, :Tense, :Voice, :Mood]
    )

Note

In case of homophones/homographs in the dataset, the correct/incorrect values for base and inflections may be misleading! Consider the following example: The wordform "Äpfel" in German can be nominative plural, genitive plural and accusative plural. Let's assume we have a dataset in which "Äpfel" occurs in all three case/number combinations (i.e. there are homographs). If all these wordforms have the same semantic vectors (e.g. because they are derived from word2vec or fasttext which typically have a single vector per unique wordform), the predicted semantic vector of the wordform "Äpfel" will be equally correlated with all three case/number combinations in the dataset. In such cases, while the algorithm in this function can unambiguously conclude that the correct surface form "Äpfel" was comprehended, which of the three possible rows is the correct one will be picked somewhat non-deterministically (see https://docs.julialang.org/en/v1/base/collections/#Base.argmax). It is thus possible that the algorithm will then use the genitive plural instead of the intended nominative plural as the ground truth, and will report that "case" was comprehended incorrectly.

source
JudiLing.accuracy_comprehensionMethod
accuracy_comprehension(
     S_val,
     S_train,
     Shat_val,
     target_col=:Words,
     base=[:Lexeme],
     inflections=[:Person, :Number, :Tense, :Voice, :Mood]
    )

Note

In case of homophones/homographs in the dataset, the correct/incorrect values for base and inflections may be misleading! Consider the following example: The wordform "Äpfel" in German can be nominative plural, genitive plural and accusative plural. Let's assume we have a dataset in which "Äpfel" occurs in all three case/number combinations (i.e. there are homographs). If all these wordforms have the same semantic vectors (e.g. because they are derived from word2vec or fasttext which typically have a single vector per unique wordform), the predicted semantic vector of the wordform "Äpfel" will be equally correlated with all three case/number combinations in the dataset. In such cases, while the algorithm in this function can unambiguously conclude that the correct surface form "Äpfel" was comprehended, which of the three possible rows is the correct one will be picked somewhat non-deterministically (see https://docs.julialang.org/en/v1/base/collections/#Base.argmax). It is thus possible that the algorithm will then use the genitive plural instead of the intended nominative plural as the ground truth, and will report that "case" was comprehended incorrectly.

source
JudiLing.eval_SCMethod
eval_SC(SChat::AbstractArray, SC::AbstractArray)

Assess model accuracy on the basis of the correlations (or Euclidean distances or Cosine Similarities) of row vectors of Chat and C or Shat and S. Ideally the target words have highest correlations (lowest distance/highest similarity) on the diagonal of the pertinent correlation (distance/similarity) matrices.

If freq is added, token-based accuracy is computed. Token-based accuracy weighs accuracy values according to words' frequency, i.e. if a word has a frequency of 30 and overall there are 3000 tokens (the frequencies of all types sum to 3000), this token's accuracy will contribute 30/3000.

Note

If there are homophones/homographs in the dataset, this evaluation method may be misleading: the predicted vector will be equally correlated with the target vector of both words and the one on the diagonal will not necessarily be selected as the most correlated. In such cases, supplying the dataset and target_col is recommended, as this enables taking homophones/homographs into account.

Obligatory Arguments

  • SChat::Union{SparseMatrixCSC, Matrix}: the Chat or Shat matrix
  • SC::Union{SparseMatrixCSC, Matrix}: the C or S matrix

Optional Arguments

  • digits: the specified number of digits after the decimal place (or before if negative)
  • R::Bool=false: if true, the pairwise correlation/distance/similarity matrix R is returned
  • freq::Union{Missing, Array{Int64, 1}, Array{Float64,1}}=missing: list of frequencies of the wordforms in X and Y
  • method::Union{Symbol, String}=:correlation: Method for computing similarities, one of {:correlation, :euclidean, :cosine}.
Examples

eval_SC(Chat_train, cue_obj_train.C)
 eval_SC(Chat_val, cue_obj_val.C)
 eval_SC(Shat_train, S_train)
eval_SC(Shat_val, S_val)
source
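As an illustration of token-based accuracy (assuming a hypothetical Frequency column in the dataset):

JudiLing.eval_SC(Shat_train, S_train, freq = latin.Frequency)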
JudiLing.eval_SCMethod
eval_SC(SChat::AbstractArray, SC::AbstractArray, SC_rest::AbstractArray)

Assess model accuracy on the basis of the correlations (or Euclidean distances or Cosine Similarities) of row vectors of Chat and C or Shat and S. Ideally the target words have highest correlations (lowest distance/highest similarity) on the diagonal of the pertinent correlation (distance/similarity) matrices.

If freq is added, token-based accuracy is computed. Token-based accuracy weighs accuracy values according to words' frequency, i.e. if a word has a frequency of 30 and overall there are 3000 tokens (the frequencies of all types sum to 3000), this token's accuracy will contribute 30/3000.

Note

The order is important. The first gold standard matrix has to correspond to the SChat matrix, as in eval_SC(Shat_train, S_train, S_val) or eval_SC(Shat_val, S_val, S_train).

Note

If there are homophones/homographs in the dataset, this evaluation method may be misleading: the predicted vector will be equally correlated with the target vector of both words and the one on the diagonal will not necessarily be selected as the most correlated. In such cases, supplying the dataset and target_col is recommended, as this enables taking homophones/homographs into account.

Obligatory Arguments

  • SChat::Union{SparseMatrixCSC, Matrix}: the Chat or Shat matrix
  • SC::Union{SparseMatrixCSC, Matrix}: the training/validation C or S matrix
  • SC_rest::Union{SparseMatrixCSC, Matrix}: the validation/training C or S matrix

Optional Arguments

  • digits: the specified number of digits after the decimal place (or before if negative)
  • R::Bool=false: if true, pairwise correlation/distance/similarity matrix R is return
  • freq::Union{Missing, Array{Int64, 1}, Array{Float64,1}}=missing: list of frequencies of the wordforms in X and Y
  • method::Union{Symbol, String}=:correlation: Method for computing similarities, one of {:correlation, :euclidean, :cosine}.
eval_SC(Chat_train, cue_obj_train.C, cue_obj_val.C)
 eval_SC(Chat_val, cue_obj_val.C, cue_obj_train.C)
 eval_SC(Shat_train, S_train, S_val)
-eval_SC(Shat_val, S_val, S_train)
source
JudiLing.eval_SCMethod
eval_SC(SChat::AbstractArray, SC::AbstractArray, data::DataFrame, target_col::Union{String, Symbol})

Assess model accuracy on the basis of the correlations (or Euclidean distances or Cosine Similarities) of row vectors of Chat and C or Shat and S. Ideally the target words have highest correlations (lowest distance/highest similarity) on the diagonal of the pertinent correlation (distance/similarity) matrices. Support for homophones.

If freq is added, token-based accuracy is computed. Token-based accuracy weighs accuracy values according to words' frequency, i.e. if a word has a frequency of 30 and overall there are 3000 tokens (the frequencies of all types sum to 3000), this token's accuracy will contribute 30/3000.

Obligatory Arguments

  • SChat::Union{SparseMatrixCSC, Matrix}: the Chat or Shat matrix
  • SC::Union{SparseMatrixCSC, Matrix}: the C or S matrix
  • data::DataFrame: datasets
  • target_col::Union{String, Symbol}: target column name

Optional Arguments

  • digits: the specified number of digits after the decimal place (or before if negative)
  • R::Bool=false: if true, pairwise correlation/distance/similarity matrix R is return
  • freq::Union{Missing, Array{Int64, 1}, Array{Float64,1}}=missing: list of frequencies of the wordforms in X and Y
  • method::Union{Symbol, String}=:correlation: Method for computing similarities, one of {:correlation, :euclidean, :cosine}.
eval_SC(Chat_train, cue_obj_train.C, latin, :Word)
+eval_SC(Shat_val, S_val, S_train)
source
JudiLing.eval_SCMethod
eval_SC(SChat::AbstractArray, SC::AbstractArray, data::DataFrame, target_col::Union{String, Symbol})

Assess model accuracy on the basis of the correlations (or Euclidean distances or Cosine Similarities) of row vectors of Chat and C or Shat and S. Ideally the target words have highest correlations (lowest distance/highest similarity) on the diagonal of the pertinent correlation (distance/similarity) matrices. Support for homophones.

If freq is provided, token-based accuracy is computed. Token-based accuracy weights each word's accuracy by its frequency: if a word has a frequency of 30 and overall there are 3000 tokens (the frequencies of all types sum to 3000), this word contributes with weight 30/3000.

Obligatory Arguments

  • SChat::Union{SparseMatrixCSC, Matrix}: the Chat or Shat matrix
  • SC::Union{SparseMatrixCSC, Matrix}: the C or S matrix
  • data::DataFrame: datasets
  • target_col::Union{String, Symbol}: target column name

Optional Arguments

  • digits: the specified number of digits after the decimal place (or before if negative)
  • R::Bool=false: if true, the pairwise correlation/distance/similarity matrix R is returned
  • freq::Union{Missing, Array{Int64, 1}, Array{Float64,1}}=missing: list of frequencies of the wordforms in SChat and SC
  • method::Union{Symbol, String}=:correlation: Method for computing similarities, one of {:correlation, :euclidean, :cosine}.
eval_SC(Chat_train, cue_obj_train.C, latin, :Word)
 eval_SC(Chat_val, cue_obj_val.C, latin, :Word)
 eval_SC(Shat_train, S_train, latin, :Word)
eval_SC(Shat_val, S_val, latin, :Word)
source
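
The following toy sketch (hypothetical data, not JudiLing internals) illustrates why comparing predicted word forms rather than row indices handles homographs: rows 2 and 3 share the form "bank" and have identical target vectors, so either row may win the argmax, yet both count as correct when forms are compared.

using Statistics

words = ["walk", "bank", "bank", "run"]
S    = [1.0 0.0 0.2; 0.3 0.7 0.1; 0.3 0.7 0.1; 0.0 0.2 1.0]
Shat = [0.9 0.1 0.2; 0.3 0.6 0.2; 0.25 0.65 0.15; 0.1 0.2 0.9]

acc = mean(1:length(words)) do i
    best = argmax([cor(Shat[i, :], S[j, :]) for j in 1:size(S, 1)])
    words[best] == words[i]   # compare word forms, not row indices
end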
JudiLing.eval_SCMethod
eval_SC(SChat::AbstractArray, SC::AbstractArray, SC_rest::AbstractArray, data::DataFrame, data_rest::DataFrame, target_col::Union{String, Symbol})

Assess model accuracy on the basis of the correlations (or Euclidean distances or Cosine Similarities) of row vectors of Chat and C or Shat and S. Ideally the target words have highest correlations (lowest distance/highest similarity) on the diagonal of the pertinent correlation (distance/similarity) matrices.

If freq is provided, token-based accuracy is computed. Token-based accuracy weights each word's accuracy by its frequency: if a word has a frequency of 30 and overall there are 3000 tokens (the frequencies of all types sum to 3000), this word contributes with weight 30/3000.

Note

The order is important: the first gold standard matrix has to correspond to the SChat matrix, as in eval_SC(Shat_train, S_train, S_val, latin, :Word) or eval_SC(Shat_val, S_val, S_train, latin, :Word).

Obligatory Arguments

  • SChat::Union{SparseMatrixCSC, Matrix}: the Chat or Shat matrix
  • SC::Union{SparseMatrixCSC, Matrix}: the training/validation C or S matrix
  • SC_rest::Union{SparseMatrixCSC, Matrix}: the validation/training C or S matrix
  • data::DataFrame: the training/validation datasets
  • data_rest::DataFrame: the validation/training datasets
  • target_col::Union{String, Symbol}: target column name

Optional Arguments

  • digits: the specified number of digits after the decimal place (or before if negative)
  • R::Bool=false: if true, the pairwise correlation/distance/similarity matrix R is returned
  • freq::Union{Missing, Array{Int64, 1}, Array{Float64,1}}=missing: list of frequencies of the wordforms in SChat and SC
  • method::Union{Symbol, String}=:correlation: Method for computing similarities, one of {:correlation, :euclidean, :cosine}.
eval_SC(Chat_train, cue_obj_train.C, cue_obj_val.C, latin, :Word)
 eval_SC(Chat_val, cue_obj_val.C, cue_obj_train.C, latin, :Word)
 eval_SC(Shat_train, S_train, S_val, latin, :Word)
eval_SC(Shat_val, S_val, S_train, latin, :Word)
source
JudiLing.eval_SCMethod
eval_SC(SChat::AbstractArray, SC::AbstractArray, batch_size::Int64)

Assess model accuracy on the basis of the correlations of row vectors of Chat and C or Shat and S. Ideally the target words have highest correlations on the diagonal of the pertinent correlation matrices. For large datasets, pass batch_size to process evaluation in chunks.

Note

If there are homophones/homographs in the dataset, this evaluation method may be misleading: the predicted vector will be equally correlated with the target vector of both words and the one on the diagonal will not necessarily be selected as the most correlated. In such cases, supplying the dataset and target_col is recommended which enables taking into account homophones/homographs.

Note

Currently only available for correlation.

Obligatory Arguments

  • SChat: the Chat or Shat matrix
  • SC: the C or S matrix
  • batch_size: batch size

Optional Arguments

  • digits: the specified number of digits after the decimal place (or before if negative)
  • verbose::Bool=false: if true, more information is printed
eval_SC(Chat_train, cue_obj_train.C, 5000)
eval_SC(Chat_val, cue_obj_val.C, 5000)
eval_SC(Shat_train, S_train, 5000)
eval_SC(Shat_val, S_val, 5000)
source
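
A rough sketch of the batching idea (hypothetical helper, not JudiLing's implementation): correlations are computed block by block, so the full n-by-n correlation matrix never has to be held in memory at once.

using Statistics

function chunked_accuracy(Shat::Matrix, S::Matrix; batch_size::Int=1000)
    n = size(Shat, 1)
    correct = 0
    for lo in 1:batch_size:n
        hi = min(lo + batch_size - 1, n)
        R = cor(Shat[lo:hi, :]', S')   # block of correlations: (hi-lo+1) x n
        for (k, i) in enumerate(lo:hi)
            correct += argmax(R[k, :]) == i
        end
    end
    correct / n
end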
JudiLing.eval_SCMethod
eval_SC(SChat::AbstractArray, SC::AbstractArray, data::DataFrame, target_col::Union{String, Symbol}, batch_size::Int64)

Assess model accuracy on the basis of the correlations of row vectors of Chat and C or Shat and S. Ideally the target words have highest correlations on the diagonal of the pertinent correlation matrices. For large datasets, pass batch_size to process evaluation in chunks. Supports homophones.

Note

Currently only available for correlation.

Obligatory Arguments

  • SChat::AbstractArray: the Chat or Shat matrix
  • SC::AbstractArray: the C or S matrix
  • data::DataFrame: datasets
  • target_col::Union{String, Symbol}: target column name
  • batch_size::Int64: batch size

Optional Arguments

  • digits: the specified number of digits after the decimal place (or before if negative)
  • verbose::Bool=false: if true, more information is printed
eval_SC(Chat_train, cue_obj_train.C, latin, :Word, 5000)
 eval_SC(Chat_val, cue_obj_val.C, latin, :Word, 5000)
 eval_SC(Shat_train, S_train, latin, :Word, 5000)
eval_SC(Shat_val, S_val, latin, :Word, 5000)
source
JudiLing.eval_SC_looseMethod
eval_SC_loose(SChat, SC, k)

Assess model accuracy on the basis of the correlations (or Euclidean distances or Cosine Similarities) of row vectors of Chat and C or Shat and S. Ideally the target words have highest correlations (lowest distance/highest similarity) on the diagonal of the pertinent correlation (distance/similarity) matrices. A prediction is counted as correct if the target is among the top k candidates.

Note

If there are homophones/homographs in the dataset, this evaluation method may be misleading: the predicted vector will be equally correlated with the target vector of both words and it is not guaranteed that the target on the diagonal will be among the k neighbours. In particular, eval_SC and eval_SC_loose with k=1 are not guaranteed to give the same result. In such cases, supplying the dataset and target_col is recommended which enables taking into account homophones/homographs.

Obligatory Arguments

  • SChat::Union{SparseMatrixCSC, Matrix}: the Chat or Shat matrix
  • SC::Union{SparseMatrixCSC, Matrix}: the C or S matrix
  • k: top k candidates

Optional Arguments

  • digits: the specified number of digits after the decimal place (or before if negative)
  • method::Union{Symbol, String}=:correlation: Method for computing similarities, one of {:correlation, :euclidean, :cosine}.
eval_SC_loose(Chat, cue_obj.C, k)
eval_SC_loose(Shat, S, k)
source
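
A minimal sketch of the loose criterion (hypothetical helper, not the library code): a row counts as correct when its own index is among the k highest-correlated candidates.

using Statistics

function loose_accuracy(Shat::Matrix, S::Matrix, k::Int)
    R = cor(Shat', S')   # n x n: row i holds correlations of prediction i with all targets
    n = size(R, 1)
    count(i -> i in partialsortperm(R[i, :], 1:k, rev=true), 1:n) / n
end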
JudiLing.eval_SC_looseMethod
eval_SC_loose(SChat, SC, k, data, target_col)

Assess model accuracy on the basis of the correlations (or Euclidean distances or Cosine Similarities) of row vectors of Chat and C or Shat and S. Ideally the target words have highest correlations (lowest distance/highest similarity) on the diagonal of the pertinent correlation (distance/similarity) matrices. A prediction is counted as correct if the target is among the top k candidates. Supports homophones.

Obligatory Arguments

  • SChat::Union{SparseMatrixCSC, Matrix}: the Chat or Shat matrix
  • SC::Union{SparseMatrixCSC, Matrix}: the C or S matrix
  • k: top k candidates
  • data: datasets
  • target_col: target column name

Optional Arguments

  • digits: the specified number of digits after the decimal place (or before if negative)
  • method::Union{Symbol, String}=:correlation: Method for computing similarities, one of {:correlation, :euclidean, :cosine}.
eval_SC_loose(Chat, cue_obj.C, k, latin, :Word)
eval_SC_loose(Shat, S, k, latin, :Word)
source
JudiLing.eval_manualMethod
eval_manual(res, data, i2f)

Create extensive reports for the outputs from build_paths and learn_paths.

source
JudiLing.eval_accMethod
eval_acc(res, gold_inds::Array)

Evaluate the accuracy of the results from learn_paths or build_paths.

Obligatory Arguments

  • res::Array: the results from learn_paths or build_paths
  • gold_inds::Array: the gold paths' indices

Optional Arguments

  • digits: the specified number of digits after the decimal place (or before if negative)
  • verbose::Bool=false: if true, more information is printed

Examples

# evaluation on training data
acc_train = JudiLing.eval_acc(
    res_train,
    cue_obj_train.gold_ind,
    verbose=false
)

# evaluation on validation data
acc_val = JudiLing.eval_acc(
    res_val,
    cue_obj_val.gold_ind,
    verbose=false
)
source
JudiLing.eval_accMethod
eval_acc(res, cue_obj::Cue_Matrix_Struct)

Evaluate the accuracy of the results from learn_paths or build_paths.

Obligatory Arguments

  • res::Array: the results from learn_paths or build_paths
  • cue_obj::Cue_Matrix_Struct: the C matrix object

Optional Arguments

  • digits: the specified number of digits after the decimal place (or before if negative)
  • verbose::Bool=false: if true, more information is printed

Examples

acc = JudiLing.eval_acc(res, cue_obj)
source
JudiLing.eval_acc_looseMethod
eval_acc_loose(res, gold_inds)

Lenient evaluation of the accuracy of the results from learn_paths or build_paths, counting a prediction as correct when the correlation of the predicted and gold standard semantic vectors is among the n top correlations, where n is equal to max_can in the learn_paths or build_paths function.

Obligatory Arguments

  • res::Array: the results from learn_paths or build_paths
  • gold_inds::Array: the gold paths' indices

Optional Arguments

  • digits: the specified number of digits after the decimal place (or before if negative)
  • verbose::Bool=false: if true, more information is printed

Examples

# evaluation on training data
acc_train_loose = JudiLing.eval_acc_loose(
    res_train,
    cue_obj_train.gold_ind,
    verbose=false
)

# evaluation on validation data
acc_val_loose = JudiLing.eval_acc_loose(
    res_val,
    cue_obj_val.gold_ind,
    verbose=false
)
source
JudiLing.extract_gpiFunction

extract_gpi(gpi, threshold=0.1, tolerance=(-1000.0))

Extract, using gold paths' information, how many n-grams for a gold path are below the threshold but above the tolerance.

source
diff --git a/dev/man/find_path/index.html b/dev/man/find_path/index.html index 709e836..ffc0ea4 100644 --- a/dev/man/find_path/index.html +++ b/dev/man/find_path/index.html @@ -1,5 +1,5 @@ -Find Paths · JudiLing.jl

Find Paths

Structures

JudiLing.Gold_Path_Info_StructType

Store gold paths' information, including indices, the indices' support, and total support. It can be used to evaluate how low the threshold needs to be set in order to find most of the correct paths or, if set very low, all of the correct paths.

source
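
A hypothetical usage sketch (names assumed; see extract_gpi in the evaluation section): running learn_paths with check_gold_path=true yields this gold-path information as the second return value, which can then be screened against a candidate threshold.

res, gpi = JudiLing.learn_paths(latin, cue_obj, S, F, Chat, check_gold_path=true)
gpi_stat = JudiLing.extract_gpi(gpi, 0.1, -1000.0)  # gold-path n-grams between tolerance and threshold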

Build paths

JudiLing.build_pathsFunction

The build_paths function constructs paths by only considering those n-grams that are close to the target. It first takes the predicted c-hat vector and finds the closest n neighbors in the C matrix. Then it selects all n-grams of these neighbors, and constructs all valid paths with those n-grams. The path producing the best correlation with the target semantic vector (through synthesis by analysis) is selected.

source
JudiLing.build_pathsMethod
build_paths(
     data_val,
     C_train,
     S_val,
    # ... (elided) ...
    pca_eval_M=Fo,
    n_neighbors=3,
    verbose=true
    )
source

Learn paths

JudiLing.learn_pathsFunction

A sequence finding algorithm using discrimination learning to predict, for a given word, which n-grams are best supported for a given position in the sequence of n-grams.

source

JudiLing.learn_pathsMethod
learn_paths(
     data::DataFrame,
     cue_obj::Cue_Matrix_Struct,
     S_val::Union{SparseMatrixCSC, Matrix},
    F_train::Union{SparseMatrixCSC, Matrix, Chain},
    Chat_val::Union{SparseMatrixCSC, Matrix};
    Shat_val::Union{Nothing, Matrix} = nothing,
    check_gold_path::Bool = false,
    threshold::Float64 = 0.1,
    is_tolerant::Bool = false,
    tolerance::Float64 = (-1000.0),
     max_tolerance::Int = 3,
     activation::Union{Nothing, Function} = nothing,
     ignore_nan::Bool = true,
    verbose::Bool = true)


A high-level wrapper function for learn_paths with much less control. It is aimed at users who are new to JudiLing and to the learn_paths function.

Obligatory Arguments

  • data::DataFrame: the training dataset
  • cue_obj::Cue_Matrix_Struct: the C matrix object containing all information associated with the C matrix
  • S_val::Union{SparseMatrixCSC, Matrix}: the S matrix for validation dataset
  • F_train::Union{SparseMatrixCSC, Matrix, Chain}: either the F matrix for training dataset, or a deep learning comprehension model trained on the training set
  • Chat_val::Union{SparseMatrixCSC, Matrix}: the Chat matrix for validation dataset

Optional Arguments

  • Shat_val::Union{Nothing, Matrix}=nothing: the Shat matrix for the validation dataset
  • check_gold_path::Bool=false: if true, return a list of support values for the gold path; this information is returned as second output value
  • threshold::Float64=0.1: the value set for the support such that if the support of an n-gram is higher than this value, the n-gram will be taken into consideration
  • is_tolerant::Bool=false: if true, select a specified number (given by max_tolerance) of n-grams whose supports are below threshold but above a second tolerance threshold to be added to the path
  • tolerance::Float64=(-1000.0): the value set for the second threshold (in tolerant mode) such that if the support for an n-gram is in between this value and the threshold and the max_tolerance number has not been reached, then allow this n-gram to be added to the path
  • max_tolerance::Int64=4: maximum number of n-grams allowed in a path
  • activation::Function=nothing: the activation function you want to pass
  • ignore_nan::Bool=true: whether to ignore NaN when comparing correlations; otherwise NaN will be selected as the max correlation value
  • verbose::Bool=false: if true, more information is printed

Examples

res = learn_paths(latin, cue_obj, S, F, Chat)
source
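
For orientation, a hedged end-to-end sketch of where the wrapper's inputs might come from (latin and the column names are assumptions; make_transform_matrix estimates the linear mappings):

cue_obj = JudiLing.make_cue_matrix(latin, grams=3, target_col=:Word)
S = JudiLing.make_S_matrix(latin, ["Lexeme"], ["Person","Number","Tense","Voice","Mood"])
F = JudiLing.make_transform_matrix(cue_obj.C, S)   # comprehension mapping: C -> S
G = JudiLing.make_transform_matrix(S, cue_obj.C)   # production mapping: S -> C
Chat = S * G
res = JudiLing.learn_paths(latin, cue_obj, S, F, Chat)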
JudiLing.learn_pathsMethod
learn_paths(
     data_train::DataFrame,
     data_val::DataFrame,
     C_train::Union{Matrix, SparseMatrixCSC},
    # ... (elided) ...
    if_pca=true,
    pca_eval_M=Fo,
    verbose=true);
source
JudiLing.learn_paths_rpiMethod
learn_paths_rpi(
     data_train::DataFrame,
     data_val::DataFrame,
     C_train::Union{Matrix, SparseMatrixCSC},
    # ... (elided) ...
     ignore_nan::Bool = true,
     check_threshold_stat::Bool = false,
     verbose::Bool = false
)


Calculate learn_paths, returning the supports for the result indices as well.

Obligatory Arguments

  • data::DataFrame: the training dataset
  • data_val::DataFrame: the validation dataset
  • C_train::Union{SparseMatrixCSC, Matrix}: the C matrix for training dataset
  • S_val::Union{SparseMatrixCSC, Matrix}: the S matrix for validation dataset
  • F_train::Union{SparseMatrixCSC, Matrix, Chain}: the F matrix for training dataset, or a deep learning comprehension model trained on the training data
  • Chat_val::Union{SparseMatrixCSC, Matrix}: the Chat matrix for validation dataset
  • A::SparseMatrixCSC: the adjacency matrix
  • i2f::Dict: the dictionary returning features given indices
  • f2i::Dict: the dictionary returning indices given features

Optional Arguments

  • gold_ind::Union{Nothing, Vector}=nothing: gold paths' indices
  • Shat_val::Union{Nothing, Matrix}=nothing: the Shat matrix for the validation dataset
  • check_gold_path::Bool=false: if true, return a list of support values for the gold path; this information is returned as second output value
  • max_t::Int64=15: maximum timestep
  • max_can::Int64=10: maximum number of candidates to consider
  • threshold::Float64=0.1: the value set for the support such that if the support of an n-gram is higher than this value, the n-gram will be taken into consideration
  • is_tolerant::Bool=false: if true, select a specified number (given by max_tolerance) of n-grams whose supports are below threshold but above a second tolerance threshold to be added to the path
  • tolerance::Float64=(-1000.0): the value set for the second threshold (in tolerant mode) such that if the support for an n-gram is in between this value and the threshold and the max_tolerance number has not been reached, then allow this n-gram to be added to the path
  • max_tolerance::Int64=4: maximum number of n-grams allowed in a path
  • grams::Int64=3: the number n of grams that make up an n-gram
  • tokenized::Bool=false: if true, the dataset target is tokenized
  • sep_token::Union{Nothing, String, Char}=nothing: separator token
  • keep_sep::Bool=false: if true, keep separators in cues
  • target_col::Union{String, Symbol}=:Words: the column name for target strings
  • start_end_token::Union{String, Char}="#": start and end token in boundary cues
  • issparse::Union{Symbol, Bool}=:auto: controls whether the output Mt matrix is a dense matrix or a sparse matrix
  • sparse_ratio::Float64=0.05: the ratio to decide whether a matrix is sparse
  • if_pca::Bool=false: turn on to enable pca mode
  • pca_eval_M::Matrix=nothing: pass original F for pca mode
  • activation::Function=nothing: the activation function you want to pass
  • ignore_nan::Bool=true: whether to ignore NaN when comparing correlations, otherwise NaN will be selected as the max correlation value
  • check_threshold_stat::Bool=false: if true, return a threshold and tolerance proportion for each timestep
  • verbose::Bool=false: if true, more information is printed
source

Utility functions

JudiLing.eval_canMethod
eval_can(candidates, S, F::Union{Matrix,SparseMatrixCSC, Chain}, i2f, max_can, if_pca, pca_eval_M)

Calculate for each candidate path the correlation between predicted semantic vector and the gold standard semantic vector, and select as target for production the path with the highest correlation.

source
JudiLing.predict_shatMethod
predict_shat(F::Union{Matrix, SparseMatrixCSC},
             ci::Vector{Int})

Predicts semantic vector shat given a comprehension matrix F and a list of indices of ngrams ci.

Obligatory arguments

  • F::Union{Matrix, SparseMatrixCSC}: Comprehension matrix F.
  • ci::Vector{Int}: Vector of indices of ngrams in c vector. Essentially, this is a vector indicating which ngrams in a c vector are absent and which are present.
source
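
The underlying idea, as a toy sketch (values hypothetical): with a binary cue vector that is 1 exactly at the indices in ci, the predicted semantic vector amounts to the sum of the corresponding rows of F.

F  = [0.1 0.2; 0.3 0.4; 0.5 0.6]   # 3 cues, 2 semantic dimensions
ci = [1, 3]                        # cues 1 and 3 are present
shat = vec(sum(F[ci, :], dims=1))  # [0.6, 0.8]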
diff --git a/dev/man/input/index.html b/dev/man/input/index.html index 7aff442..a9141d6 100644 --- a/dev/man/input/index.html +++ b/dev/man/input/index.html @@ -2,7 +2,7 @@ Loading data · JudiLing.jl

Loading data

JudiLing.load_datasetMethod
load_dataset(filepath::String;
             delim::String=",",
             kargs...)

Load a dataset from file, usually comma- or tab-separated. Returns a DataFrame.

Obligatory arguments

  • filepath::String: Path to file to be loaded.

Optional arguments

  • delim::String=",": Delimiter in the file (usually either "," or "\t").
  • kargs...: Further keyword arguments are passed to CSV.File().

Example

latin = JudiLing.load_dataset("latin.csv")
first(latin, 10)
source
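
For a tab-separated file, the delimiter can be passed through (file name hypothetical):

latin = JudiLing.load_dataset("latin.tsv", delim="\t")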
JudiLing.loading_data_randomly_splitMethod
loading_data_randomly_split(
     data_path::String,
     output_dir_path::String,
     data_prefix::String;
    # ... (elided) ...
    "careful",
    "latin",
    ["Lexeme","Person","Number","Tense","Voice","Mood"]
)
source
JudiLing.loading_data_careful_splitMethod
loading_data_careful_split(
     data_path::String,
     data_prefix::String,
     output_dir_path::String,
    # ... (elided) ...
    "latin",
    "careful",
    ["Lexeme","Person","Number","Tense","Voice","Mood"]
)
source
diff --git a/dev/man/make_adjacency_matrix/index.html b/dev/man/make_adjacency_matrix/index.html index f016f8d..99ac529 100644 --- a/dev/man/make_adjacency_matrix/index.html +++ b/dev/man/make_adjacency_matrix/index.html
JudiLing.make_full_adjacency_matrixMethod
make_adjacency_matrix(i2f)

Make full adjacency matrix based only on the form of n-grams regardless of whether they are seen in the training data. This usually takes hours for large datasets, as all possible combinations are considered.

Obligatory Arguments

  • i2f::Dict: the dictionary returning features given indices

Optional Arguments

  • tokenized::Bool=false: if true, the dataset target is assumed to be tokenized
  • sep_token::Union{Nothing, String, Char}=nothing: separator token
  • verbose::Bool=false: if true, more information will be printed

Examples

# without tokenization
 i2f = Dict([(1, "#ab"), (2, "abc"), (3, "bc#"), (4, "#bc"), (5, "ab#")])
 JudiLing.make_adjacency_matrix(i2f)
 
# ... (elided) ...
JudiLing.make_adjacency_matrix(
    i2f,
    tokenized=true,
    sep_token="-")
source
JudiLing.make_combined_adjacency_matrixMethod
make_combined_adjacency_matrix(data_train, data_val)

Make combined adjacency matrix.

Obligatory Arguments

  • data_train::DataFrame: training dataset
  • data_val::DataFrame: validation dataset

Optional Arguments

  • grams=3: the number of grams for cues
  • target_col=:Words: the column name for target strings
  • tokenized=false: if true, the dataset target is assumed to be tokenized
  • sep_token=nothing: separator
  • keep_sep=false: if true, keep separators in cues
  • start_end_token="#": start and end token in boundary cues
  • verbose=false: if true, more information is printed

Examples

JudiLing.make_combined_adjacency_matrix(
     latin_train,
     latin_val,
     grams=3,
     target_col=:Word,
     tokenized=false,
     keep_sep=false
    )
source
diff --git a/dev/man/make_cue_matrix/index.html b/dev/man/make_cue_matrix/index.html index 38af40f..3e8bc69 100644 --- a/dev/man/make_cue_matrix/index.html +++ b/dev/man/make_cue_matrix/index.html


Make Cue Matrix

JudiLing.Cue_Matrix_StructType

A structure that stores information created by make_cue_matrix: C is the cue matrix; f2i is a dictionary returning the indices for features; i2f is a dictionary returning the features for indices; gold_ind is a list of indices of gold paths; A is the adjacency matrix; grams is the number of grams for cues; target_col is the column name for target strings; tokenized indicates whether the dataset target is tokenized; sep_token is the separator; keep_sep indicates whether to keep separators in cues; start_end_token is the start and end token in boundary cues.

source
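
For example (assuming cue_obj was created by one of the make_cue_matrix methods below; the cue string is hypothetical):

cue_obj.C              # the cue matrix
cue_obj.f2i["#ab"]     # index of the cue "#ab"
cue_obj.i2f[1]         # cue stored at index 1
cue_obj.gold_ind       # gold-path indices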
JudiLing.make_cue_matrixMethod
make_cue_matrix(data::DataFrame)

Make the cue matrix for training datasets and corresponding indices as well as the adjacency matrix and gold paths given a dataset in a form of dataframe.

Obligatory Arguments

  • data::DataFrame: the dataset

Optional Arguments

  • grams::Int64=3: the number of grams for cues
  • target_col::Union{String, Symbol}=:Words: the column name for target strings
  • tokenized::Bool=false: if true, the dataset target is assumed to be tokenized
  • sep_token::Union{Nothing, String, Char}=nothing: separator
  • keep_sep::Bool=false: if true, keep separators in cues
  • start_end_token::Union{String, Char}="#": start and end token in boundary cues
  • verbose::Bool=false: if true, more information is printed

Examples

# make cue matrix without tokenization
cue_obj_train = JudiLing.make_cue_matrix(
    latin_train,
    grams=3,
    # ... (elided) ...
    start_end_token="#",
    keep_sep=true,
    verbose=false
    )
source
JudiLing.make_cue_matrixMethod
make_cue_matrix(data::DataFrame, cue_obj::Cue_Matrix_Struct)

Make the cue matrix for validation datasets and corresponding indices as well as the adjacency matrix and gold paths given a dataset in a form of dataframe.

Obligatory Arguments

  • data::DataFrame: the dataset
  • cue_obj::Cue_Matrix_Struct: training cue object

Optional Arguments

  • grams::Int64=3: the number of grams for cues
  • target_col::Union{String, Symbol}=:Words: the column name for target strings
  • tokenized::Bool=false: if true, the dataset target is assumed to be tokenized
  • sep_token::Union{Nothing, String, Char}=nothing: separator
  • keep_sep::Bool=false: if true, keep separators in cues
  • start_end_token::Union{String, Char}="#": start and end token in boundary cues
  • verbose::Bool=false: if true, more information is printed

Examples

# make cue matrix without tokenization
cue_obj_val = JudiLing.make_cue_matrix(
    latin_val,
    cue_obj_train,
    # ... (elided) ...
    keep_sep=true,
    start_end_token="#",
    verbose=false
    )
source
JudiLing.make_cue_matrixMethod
make_cue_matrix(data_train::DataFrame, data_val::DataFrame)

Make the cue matrix for training and validation datasets at the same time.

Obligatory Arguments

  • data_train::DataFrame: the training dataset
  • data_val::DataFrame: the validation dataset

Optional Arguments

  • grams::Int64=3: the number of grams for cues
  • target_col::Union{String, Symbol}=:Words: the column name for target strings
  • tokenized::Bool=false: if true, the dataset target is assumed to be tokenized
  • sep_token::Union{Nothing, String, Char}=nothing: separator
  • keep_sep::Bool=false: if true, keep separators in cues
  • start_end_token::Union{String, Char}="#": start and end token in boundary cues
  • verbose::Bool=false: if true, more information is printed

Examples

# make cue matrix without tokenization
cue_obj_train, cue_obj_val = JudiLing.make_cue_matrix(
    latin_train,
    latin_val,
    # ... (elided) ...
    keep_sep=true,
    start_end_token="#",
    verbose=false
    )
source
JudiLing.make_combined_cue_matrixMethod
make_combined_cue_matrix(data_train, data_val)

Make the cue matrix for training and validation datasets at the same time, where the features and adjacencies are combined.

Obligatory Arguments

  • data_train::DataFrame: the training dataset
  • data_val::DataFrame: the validation dataset

Optional Arguments

  • grams::Int64=3: the number of grams for cues
  • target_col::Union{String, Symbol}=:Words: the column name for target strings
  • tokenized::Bool=false: if true, the dataset target is assumed to be tokenized
  • sep_token::Union{Nothing, String, Char}=nothing: separator
  • keep_sep::Bool=false: if true, keep separators in cues
  • start_end_token::Union{String, Char}="#": start and end token in boundary cues
  • verbose::Bool=false: if true, more information is printed

Examples

# make cue matrix without tokenization
cue_obj_train, cue_obj_val = JudiLing.make_combined_cue_matrix(
    latin_train,
    latin_val,
    # ... (elided) ...
    keep_sep=true,
    start_end_token="#",
    verbose=false
    )
source
JudiLing.make_cue_matrix_from_CFBSMethod
make_cue_matrix_from_CFBS(features::Vector{Vector{T}};
                           pad_val::T = 0.,
                          ncol::Union{Missing,Int}=missing) where {T}

Create a cue matrix from a vector of feature vectors (usually CFBS vectors). It is expected (though of course not necessary) that the vectors have varying lengths. They are consequently padded on the right with the provided pad_val.

Obligatory arguments

  • features::Vector{Vector{T}}: vector of vectors containing C-FBS features

Optional arguments

  • pad_val::T = 0.: Value with which the feature vectors will be padded
  • ncol::Union{Missing,Int}=missing: Number of columns of the C matrix. If not set, will be set to the maximum number of features

Examples

C = JudiLing.make_cue_matrix_from_CFBS(features)
source
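
A small sketch with toy feature vectors of unequal length, padded to a rectangular matrix:

features = [[0.2, 0.5, 0.1], [0.7], [0.3, 0.9]]
C = JudiLing.make_cue_matrix_from_CFBS(features)
size(C)   # (3, 3): padded on the right with pad_val to the longest vector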
JudiLing.make_combined_cue_matrix_from_CFBSMethod
make_combined_cue_matrix_from_CFBS(features_train::Vector{Vector{T}},
                                    features_test::Vector{Vector{T}};
                                    pad_val::T = 0.,
                                   ncol::Union{Missing,Int}=missing) where {T}

Create cue matrices from two vectors of feature vectors (usually CFBS vectors). It is expected (though of course not necessary) that the vectors have varying lengths. They are consequently padded on the right with the provided pad_val. The cue matrices are set to the size of the maximum number of feature values in features_train and features_test.

Obligatory arguments

  • features_train::Vector{Vector{T}}: vector of vectors containing C-FBS features
  • features_test::Vector{Vector{T}}: vector of vectors containing C-FBS features

Optional arguments

  • pad_val::T = 0.: Value with which the feature vectors will be padded
  • ncol::Union{Missing,Int}=missing: Number of columns of the C matrices. If not set, will be set to the maximum number of features in features_train and features_test

Examples

C_train, C_test = JudiLing.make_combined_cue_matrix_from_CFBS(features_train, features_test)
source
JudiLing.make_ngramsMethod
make_ngrams(tokens, grams, keep_sep, sep_token, start_end_token)

Given a list of string tokens return a list of all n-grams for these tokens.

source
diff --git a/dev/man/make_semantic_matrix/index.html b/dev/man/make_semantic_matrix/index.html index 78e322e..b26d69d 100644 --- a/dev/man/make_semantic_matrix/index.html +++ b/dev/man/make_semantic_matrix/index.html @@ -1,12 +1,12 @@ -Make Semantic Matrix · JudiLing.jl


Make Semantic Matrix

Make binary semantic vectors

JudiLing.PS_Matrix_StructType

A structure that stores the discrete semantic vectors: pS is the discrete semantic matrix; f2i is a dictionary returning the indices for features; i2f is a dictionary returning the features for indices.

source
JudiLing.make_pS_matrixMethod
make_pS_matrix(data)

Create a discrete semantic matrix given a dataframe.

Obligatory Arguments

  • data::DataFrame: the dataset

Optional Arguments

  • features_col::Symbol=:CommunicativeIntention: the column name for target
  • sep_token::String="_": separator

Examples

s_obj_train = JudiLing.make_pS_matrix(
     utterance,
     features_col=:CommunicativeIntention,
    sep_token="_")
source
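
A toy illustration (hypothetical dataframe) of the resulting binary matrix:

using DataFrames
utterance = DataFrame(CommunicativeIntention = ["greet_polite", "greet_informal"])
s_obj = JudiLing.make_pS_matrix(utterance)
# s_obj.pS is a 2 x 3 binary matrix over the features greet, polite and informal;
# s_obj.f2i and s_obj.i2f map between features and column indices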
JudiLing.make_pS_matrixMethod
make_pS_matrix(data_val, pS_obj)

Construct a discrete semantic matrix for a validation dataset, given the features in the dataframe and the pS object of the training dataset.

Obligatory Arguments

  • data_val::DataFrame: the dataset
  • pS_obj::PS_Matrix_Struct: training PS object

Optional Arguments

  • features_col::Symbol=:CommunicativeIntention: the column name for the target features
  • sep_token::String="_": separator

Examples

s_obj_val = JudiLing.make_pS_matrix(
     data_val,
     s_obj_train,
     features_col=:CommunicativeIntention,
    sep_token="_")
source
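A minimal end-to-end sketch with a made-up dataframe (the column values are hypothetical): building the validation matrix with the training pS object guarantees that both matrices use the same feature-to-index mapping.

using DataFrames
utterance = DataFrame(CommunicativeIntention = ["greet_polite", "request", "greet"])
utterance_val = DataFrame(CommunicativeIntention = ["request_polite"])

s_obj_train = JudiLing.make_pS_matrix(utterance)
s_obj_val = JudiLing.make_pS_matrix(utterance_val, s_obj_train)

# s_obj_train.pS: one row per utterance, one binary column per feature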
JudiLing.make_combined_pS_matrixMethod
make_combined_pS_matrix(
     data_train,
     data_val;
     features_col = :CommunicativeIntention,
    sep_token = "_")

Create discrete semantic matrices for a training and a validation dataset. The features are collected from both datasets, so the two matrices share the same feature-to-index mapping.

Obligatory Arguments

  • data_train::DataFrame: the training dataset
  • data_val::DataFrame: the validation dataset

Optional Arguments

  • features_col::Symbol=:CommunicativeIntention: the column name for the target features
  • sep_token::String="_": separator

Examples

s_obj_train, s_obj_val = JudiLing.make_combined_pS_matrix(
     data_train,
     data_val,
     features_col=:CommunicativeIntention,
    sep_token="_")
source
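The combined variant above collects the feature set from both dataframes before building the matrices, so validation-only features still receive a column. A minimal sketch with made-up data:

using DataFrames
data_train = DataFrame(CommunicativeIntention = ["greet_polite", "request"])
data_val = DataFrame(CommunicativeIntention = ["greet", "request_polite"])

s_obj_train, s_obj_val = JudiLing.make_combined_pS_matrix(data_train, data_val)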

Simulate semantic vectors

JudiLing.L_Matrix_StructType

A structure that stores lexome semantic vectors: L is the lexome semantic matrix; f2i is a dictionary returning the indices for features; i2f is a dictionary returning the features for indices.

source
JudiLing.make_S_matrixMethod
make_S_matrix(data::DataFrame, base::Vector, inflections::Vector)

Create a simulated semantic matrix for the training dataset, given a vector specifying the context lexemes and a vector specifying the grammatical lexemes. The semantic vector of a word form is constructed by summing the semantic vectors of its context and grammatical lexemes.

Obligatory Arguments

  • data::DataFrame: the dataset
  • base::Vector: context lexemes
  • inflections::Vector: grammatical lexemes

Optional Arguments

  • ncol::Int64=200: the dimension of the semantic vectors, usually the same as that of the cue vectors
  • sd_base_mean::Int64=1: the sd of the means of the base features
  • sd_inflection_mean::Int64=1: the sd of the means of the inflectional features
  • sd_base::Int64=4: the sd of the base features
  • sd_inflection::Int64=4: the sd of the inflectional features
  • seed::Int64=314: the random seed
  • isdeep::Bool=true: if true, the mean of each feature is also randomized
  • add_noise::Bool=true: if true, additional Gaussian noise is added
  • sd_noise::Int64=1: the sd of the Gaussian noise
  • normalized::Bool=false: if true, most values fall between -1 and 1; they may slightly exceed -1 or 1 depending on the sd

Examples

# basic usage
 S_train = JudiLing.make_S_matrix(
     french,
     ["Lexeme"],
    ...
     sd_base=4,
     sd_inflection=4,
     sd_noise=1,
    ...)
source
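A fuller call spelling out the keyword arguments documented above; french and the inflectional column names are assumptions standing in for a real dataset:

S_train = JudiLing.make_S_matrix(
    french,
    ["Lexeme"],
    ["Tense", "Person", "Number"],  # hypothetical inflectional columns
    ncol=200,
    sd_base=4,
    sd_inflection=4,
    add_noise=true,
    sd_noise=1,
    seed=314)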
JudiLing.make_S_matrixMethod
make_S_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector, inflections::Vector)

Create a simulated semantic matrix for the validation dataset, given a vector specifying the context lexemes and a vector specifying the grammatical lexemes. The semantic vector of a word form is constructed by summing the semantic vectors of its context and grammatical lexemes.

Obligatory Arguments

  • data_train::DataFrame: the training dataset
  • data_val::DataFrame: the validation dataset
  • base::Vector: context lexemes
  • inflections::Vector: grammatical lexemes

Optional Arguments

  • ncol::Int64=200: the dimension of the semantic vectors, usually the same as that of the cue vectors
  • sd_base_mean::Int64=1: the sd of the means of the base features
  • sd_inflection_mean::Int64=1: the sd of the means of the inflectional features
  • sd_base::Int64=4: the sd of the base features
  • sd_inflection::Int64=4: the sd of the inflectional features
  • seed::Int64=314: the random seed
  • isdeep::Bool=true: if true, the mean of each feature is also randomized
  • add_noise::Bool=true: if true, additional Gaussian noise is added
  • sd_noise::Int64=1: the sd of the Gaussian noise
  • normalized::Bool=false: if true, most values fall between -1 and 1; they may slightly exceed -1 or 1 depending on the sd

Examples

# basic usage
 S_train, S_val = JudiLing.make_S_matrix(
     french,
     french_val,
    ...
     sd_base=4,
     sd_inflection=4,
     sd_noise=1,
    ...)
source
JudiLing.make_S_matrixMethod
make_S_matrix(data::DataFrame, base::Vector)

Create a simulated semantic matrix for the training dataset using only base features, given a vector specifying the context lexemes. The semantic vector of a word form is constructed by summing the semantic vectors of its context lexemes.

Obligatory Arguments

  • data::DataFrame: the dataset
  • base::Vector: context lexemes

Optional Arguments

  • ncol::Int64=200: the dimension of the semantic vectors, usually the same as that of the cue vectors
  • sd_base_mean::Int64=1: the sd of the means of the base features
  • sd_base::Int64=4: the sd of the base features
  • seed::Int64=314: the random seed
  • isdeep::Bool=true: if true, the mean of each feature is also randomized
  • add_noise::Bool=true: if true, additional Gaussian noise is added
  • sd_noise::Int64=1: the sd of the Gaussian noise
  • normalized::Bool=false: if true, most values fall between -1 and 1; they may slightly exceed -1 or 1 depending on the sd

Examples

# basic usage
 S_train = JudiLing.make_S_matrix(
     french,
     ["Lexeme"],
    ...
     sd_base=4,
     sd_inflection=4,
     sd_noise=1,
    ...)
source
JudiLing.make_S_matrixMethod
make_S_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector)

Create a simulated semantic matrix for the validation dataset using only base features, given a vector specifying the context lexemes. The semantic vector of a word form is constructed by summing the semantic vectors of its context lexemes.

Obligatory Arguments

  • data_train::DataFrame: the training dataset
  • data_val::DataFrame: the validation dataset
  • base::Vector: context lexemes

Optional Arguments

  • ncol::Int64=200: the dimension of the semantic vectors, usually the same as that of the cue vectors
  • sd_base_mean::Int64=1: the sd of the means of the base features
  • sd_base::Int64=4: the sd of the base features
  • seed::Int64=314: the random seed
  • isdeep::Bool=true: if true, the mean of each feature is also randomized
  • add_noise::Bool=true: if true, additional Gaussian noise is added
  • sd_noise::Int64=1: the sd of the Gaussian noise
  • normalized::Bool=false: if true, most values fall between -1 and 1; they may slightly exceed -1 or 1 depending on the sd

Examples

# basic usage
 S_train, S_val = JudiLing.make_S_matrix(
     french,
     french_val,
    ...
     sd_base=4,
     sd_inflection=4,
     sd_noise=1,
    ...)
source
JudiLing.make_S_matrixMethod
make_S_matrix(data_train::DataFrame, base::Vector, inflections::Vector, L::L_Matrix_Struct)

Create a simulated semantic matrix, given an existing lexome matrix.

Obligatory Arguments

  • data::DataFrame: the dataset
  • base::Vector: context lexemes
  • inflections::Vector: grammatical lexemes
  • L::L_Matrix_Struct: the lexome matrix

Optional Arguments

  • add_noise::Bool=true: if true, additional Gaussian noise is added
  • sd_noise::Int64=1: the sd of the Gaussian noise
  • normalized::Bool=false: if true, most values fall between -1 and 1; they may slightly exceed -1 or 1 depending on the sd

Examples

# basic usage
 S1 = JudiLing.make_S_matrix(
     latin,
     ["Lexeme"],
    ...
      add_noise=true,
     sd_noise=1,
     normalized=false
    )
source
JudiLing.make_S_matrixMethod
make_S_matrix(data_train::DataFrame, data_val::Union{DataFrame, Nothing}, base::Vector, L::L_Matrix_Struct)

Create a simulated semantic matrix, given an existing lexome matrix.

Obligatory Arguments

  • data_train::DataFrame: the training dataset
  • data_val::DataFrame: the validation dataset
  • base::Vector: context lexemes
  • L::L_Matrix_Struct: the lexome matrix

Optional Arguments

  • add_noise::Bool=true: if true, additional Gaussian noise is added
  • sd_noise::Int64=1: the sd of the Gaussian noise
  • normalized::Bool=false: if true, most values fall between -1 and 1; they may slightly exceed -1 or 1 depending on the sd

Examples

# basic usage
 S1, S2 = JudiLing.make_S_matrix(
      latin,
     latin_val,
    ...
     add_noise=true,
     sd_noise=1,
     normalized=false
    )
source
JudiLing.make_S_matrixMethod
make_S_matrix(data::DataFrame, base::Vector, L::L_Matrix_Struct)

Create a simulated semantic matrix, given an existing lexome matrix.

Obligatory Arguments

  • data::DataFrame: the dataset
  • base::Vector: context lexemes
  • L::L_Matrix_Struct: the lexome matrix

Optional Arguments

  • add_noise::Bool=true: if true, additional Gaussian noise is added
  • sd_noise::Int64=1: the sd of the Gaussian noise
  • normalized::Bool=false: if true, most values fall between -1 and 1; they may slightly exceed -1 or 1 depending on the sd

Examples

# basic usage
 S1 = JudiLing.make_S_matrix(
     latin,
     ["Lexeme"],
    ...
     add_noise=true,
     sd_noise=1,
     normalized=false
    )
source
JudiLing.make_S_matrixMethod
make_S_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector, inflections::Vector, L::L_Matrix_Struct)

Create a simulated semantic matrix, given an existing lexome matrix.

Obligatory Arguments

  • data_train::DataFrame: the training dataset
  • data_val::DataFrame: the validation dataset
  • base::Vector: context lexemes
  • inflections::Vector: grammatical lexemes
  • L::L_Matrix_Struct: the lexome matrix

Optional Arguments

  • add_noise::Bool=true: if true, additional Gaussian noise is added
  • sd_noise::Int64=1: the sd of the Gaussian noise
  • normalized::Bool=false: if true, most values fall between -1 and 1; they may slightly exceed -1 or 1 depending on the sd

Examples

# basic usage
 S1, S2 = JudiLing.make_S_matrix(
     latin,
     latin_val,
    ...
     add_noise=true,
     sd_noise=1,
     normalized=false
    )
source
JudiLing.make_L_matrixMethod
make_L_matrix(data::DataFrame, base::Vector)

Create a lexome matrix with simulated semantic vectors, using only base features.

Obligatory Arguments

  • data::DataFrame: the dataset
  • base::Vector: context lexemes

Optional Arguments

  • ncol::Int64=200: the dimension of the semantic vectors, usually the same as that of the cue vectors
  • sd_base_mean::Int64=1: the sd of the means of the base features
  • sd_base::Int64=4: the sd of the base features
  • seed::Int64=314: the random seed
  • isdeep::Bool=true: if true, the mean of each feature is also randomized

Examples

# basic usage
 L = JudiLing.make_L_matrix(
     latin,
     ["Lexeme"],
    ncol=200)
source
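Because the lexome matrix fixes the semantic vector of each feature, reusing one L across several calls keeps the simulated vectors comparable. A small sketch, assuming latin is already loaded:

L = JudiLing.make_L_matrix(
    latin,
    ["Lexeme"],
    ncol=200)

# S1 draws its lexeme vectors from L, so repeated calls stay consistent
S1 = JudiLing.make_S_matrix(latin, ["Lexeme"], L, add_noise=true, sd_noise=1)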
JudiLing.make_combined_S_matrixMethod
make_combined_S_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector, inflections::Vector, L::L_Matrix_Struct)

Create simulated semantic matrices for the training and validation datasets from an existing lexome matrix, where the features are combined from both datasets.

Obligatory Arguments

  • data_train::DataFrame: the training dataset
  • data_val::DataFrame: the validation dataset
  • base::Vector: context lexemes
  • inflections::Vector: grammatical lexemes
  • L::L_Matrix_Struct: the lexome matrix

Optional Arguments

  • add_noise::Bool=true: if true, additional Gaussian noise is added
  • sd_noise::Int64=1: the sd of the Gaussian noise
  • normalized::Bool=false: if true, most values fall between -1 and 1; they may slightly exceed -1 or 1 depending on the sd

Examples

# basic usage
 S_train, S_val = JudiLing.make_combined_S_matrix(
     latin_train,
     latin_val,
     ["Lexeme"],
     ["Person","Number","Tense","Voice","Mood"],
    L)
source
JudiLing.make_combined_S_matrixMethod
make_combined_S_matrix(data_train::DataFrame, data_val::Union{DataFrame, Nothing}, base::Vector, L::L_Matrix_Struct)

Create simulated semantic matrices for the training and validation datasets from an existing lexome matrix, where the features are combined from both datasets.

Obligatory Arguments

  • data_train::DataFrame: the training dataset
  • data_val::DataFrame: the validation dataset
  • base::Vector: context lexemes
  • L::L_Matrix_Struct: the lexome matrix

Optional Arguments

  • add_noise::Bool=true: if true, additional Gaussian noise is added
  • sd_noise::Int64=1: the sd of the Gaussian noise
  • normalized::Bool=false: if true, most values fall between -1 and 1; they may slightly exceed -1 or 1 depending on the sd

Examples

# basic usage
 S_train, S_val = JudiLing.make_combined_S_matrix(
     latin_train,
     latin_val,
     ["Lexeme"],
     ["Person","Number","Tense","Voice","Mood"],
    L)
source
JudiLing.make_combined_S_matrixMethod
make_combined_S_matrix(  data_train::DataFrame, data_val::DataFrame, base::Vector, inflections::Vector)

Create simulated semantic matrices for the training and validation datasets, where the features are combined from both datasets.

Obligatory Arguments

  • data_train::DataFrame: the training dataset
  • data_val::DataFrame: the validation dataset
  • base::Vector: context lexemes
  • inflections::Vector: grammatical lexemes

Optional Arguments

  • ncol::Int64=200: the dimension of the semantic vectors, usually the same as that of the cue vectors
  • sd_base_mean::Int64=1: the sd of the means of the base features
  • sd_inflection_mean::Int64=1: the sd of the means of the inflectional features
  • sd_base::Int64=4: the sd of the base features
  • sd_inflection::Int64=4: the sd of the inflectional features
  • seed::Int64=314: the random seed
  • isdeep::Bool=true: if true, the mean of each feature is also randomized
  • add_noise::Bool=true: if true, additional Gaussian noise is added
  • sd_noise::Int64=1: the sd of the Gaussian noise
  • normalized::Bool=false: if true, most values fall between -1 and 1; they may slightly exceed -1 or 1 depending on the sd

Examples

# basic usage
 S_train, S_val = JudiLing.make_combined_S_matrix(
     latin_train,
     latin_val,
     ["Lexeme"],
     ["Person","Number","Tense","Voice","Mood"],
    ncol=n_features)
source
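A typical pipeline first builds a combined lexome matrix and then derives aligned semantic matrices from it; latin_train and latin_val are assumed to be a train/validation split:

L = JudiLing.make_combined_L_matrix(
    latin_train,
    latin_val,
    ["Lexeme"],
    ["Person","Number","Tense","Voice","Mood"],
    ncol=200)

S_train, S_val = JudiLing.make_combined_S_matrix(
    latin_train,
    latin_val,
    ["Lexeme"],
    ["Person","Number","Tense","Voice","Mood"],
    L)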
JudiLing.make_combined_S_matrixMethod
make_combined_S_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector)

Create simulated semantic matrices for the training and validation datasets, where the features are combined from both datasets.

Obligatory Arguments

  • data_train::DataFrame: the training dataset
  • data_val::DataFrame: the validation dataset
  • base::Vector: context lexemes

Optional Arguments

  • ncol::Int64=200: the dimension of the semantic vectors, usually the same as that of the cue vectors
  • sd_base_mean::Int64=1: the sd of the means of the base features
  • sd_inflection_mean::Int64=1: the sd of the means of the inflectional features
  • sd_base::Int64=4: the sd of the base features
  • sd_inflection::Int64=4: the sd of the inflectional features
  • seed::Int64=314: the random seed
  • isdeep::Bool=true: if true, the mean of each feature is also randomized
  • add_noise::Bool=true: if true, additional Gaussian noise is added
  • sd_noise::Int64=1: the sd of the Gaussian noise
  • normalized::Bool=false: if true, most values fall between -1 and 1; they may slightly exceed -1 or 1 depending on the sd

Examples

# basic usage
 S_train, S_val = JudiLing.make_combined_S_matrix(
     latin_train,
     latin_val,
     ["Lexeme"],
     ["Person","Number","Tense","Voice","Mood"],
    ncol=n_features)
source
JudiLing.make_combined_L_matrixMethod
make_combined_L_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector, inflections::Vector)

Create a lexome matrix with simulated semantic vectors, where the features are combined from both the training and validation datasets.

Obligatory Arguments

  • data_train::DataFrame: the training dataset
  • data_val::DataFrame: the validation dataset
  • base::Vector: context lexemes
  • inflections::Vector: grammatical lexemes

Optional Arguments

  • ncol::Int64=200: the dimension of the semantic vectors, usually the same as that of the cue vectors
  • sd_base_mean::Int64=1: the sd of the means of the base features
  • sd_inflection_mean::Int64=1: the sd of the means of the inflectional features
  • sd_base::Int64=4: the sd of the base features
  • sd_inflection::Int64=4: the sd of the inflectional features
  • seed::Int64=314: the random seed
  • isdeep::Bool=true: if true, the mean of each feature is also randomized

Examples

# basic usage
 L = JudiLing.make_combined_L_matrix(
     latin_train,
     latin_val,
     ["Lexeme"],
     ["Person","Number","Tense","Voice","Mood"],
    ncol=n_features)
source
JudiLing.make_combined_L_matrixMethod
make_combined_L_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector)

Create a lexome matrix with simulated semantic vectors, where the features are combined from both the training and validation datasets.

Obligatory Arguments

  • data_train::DataFrame: the training dataset
  • data_val::DataFrame: the validation dataset
  • base::Vector: context lexemes

Optional Arguments

  • ncol::Int64=200: the dimension of the semantic vectors, usually the same as that of the cue vectors
  • sd_base_mean::Int64=1: the sd of the means of the base features
  • sd_inflection_mean::Int64=1: the sd of the means of the inflectional features
  • sd_base::Int64=4: the sd of the base features
  • sd_inflection::Int64=4: the sd of the inflectional features
  • seed::Int64=314: the random seed
  • isdeep::Bool=true: if true, the mean of each feature is also randomized

Examples

# basic usage
 L = JudiLing.make_combined_L_matrix(
     latin_train,
     latin_val,
     ["Lexeme"],
    ncol=n_features)
source
JudiLing.L_Matrix_StructMethod
L_Matrix_Struct(L, sd_base, sd_base_mean, sd_inflection, sd_inflection_mean, base_f, infl_f, base_f2i, infl_f2i, n_base_f, n_infl_f, ncol)

Construct L_Matrix_Struct in deep mode.

source
JudiLing.L_Matrix_StructMethod
L_Matrix_Struct(L, sd_base, sd_inflection, base_f, infl_f, base_f2i, infl_f2i, n_base_f, n_infl_f, ncol)

Construct L_Matrix_Struct without deep mode.

source

Load from word2vec, fasttext or similar

JudiLing.load_S_matrix_from_fasttextMethod
load_S_matrix_from_fasttext(data::DataFrame,
                                  language::Symbol;
                                  target_col=:Word,
                                  default_file::Int=1)

Load a semantic matrix from fasttext, using the Embeddings.jl package. The fasttext vectors are subset to include only the words in target_col of data, and data is subset to include only the words in target_col for which a semantic vector is available.

The last parameter, default_file, specifies which vectors are loaded. To learn about all available vectors, use the following commands:

using Embeddings
 language_files(FastText_Text{:nl})

replacing the language code (here :nl) with the language you are interested in. In general, for all languages other than English, these files are available:

  • default_file=1 loads from https://fasttext.cc/docs/en/crawl-vectors.html, paper: E. Grave, P. Bojanowski, P. Gupta, A. Joulin, T. Mikolov, Learning Word Vectors for 157 Languages License: CC BY-SA 3.0 https://creativecommons.org/licenses/by-sa/3.0/
  • default_file=2 loads from https://fasttext.cc/docs/en/pretrained-vectors.html paper: P. Bojanowski, E. Grave, A. Joulin, T. Mikolov, Enriching Word Vectors with Subword Information License: CC BY-SA 3.0 https://creativecommons.org/licenses/by-sa/3.0/

Obligatory Arguments

  • data::DataFrame: the dataset
  • language::Symbol: the language of the words in the dataset. Officially this is an ISO 639-2 code (see https://github.com/JuliaText/Embeddings.jl/issues/34#issuecomment-782604523), but in practice ISO 639-1 codes appear to be used, with ISO 639-2 codes used only when no ISO 639-1 code is available (see https://en.wikipedia.org/wiki/List_of_ISO_639-2_codes)

Optional Arguments

  • target_col=:Word: column with orthographic representation of words in data
  • default_file::Int=1: source of vectors, for more information see above and here: https://github.com/JuliaText/Embeddings.jl#loading-different-embeddings

Examples

# basic usage
latin_small, S = JudiLing.load_S_matrix_from_fasttext(latin, :la, target_col=:Word)
source
JudiLing.load_S_matrix_from_fasttextMethod
load_S_matrix_from_fasttext(data_train::DataFrame,
                                  data_val::DataFrame,
                                  language::Symbol;
                                  target_col=:Word,
                                  default_file::Int=1)

Load semantic matrices for a training and a validation dataset from fasttext, loaded using the Embeddings.jl package. The fasttext vectors are subset to include only the words in target_col of data_train and data_val, and both datasets are subset to include only the words for which a semantic vector is available. For the language codes and the default_file argument, see the method above.

Examples

# basic usage
 latin_small_train, latin_small_val, S_train, S_val = JudiLing.load_S_matrix_from_fasttext(latin_train,
                                                       latin_val,
                                                       :la,
                                                      target_col=:Word)
source
JudiLing.load_S_matrix_from_word2vec_fileMethod
load_S_matrix_from_word2vec_file(data::DataFrame,
                             filepath::String;
                            target_col=:Word)

Load a semantic matrix from a word2vec file at filepath. The word2vec vectors are subset to include only the words in target_col of data, and data is subset to include only the words for which a semantic vector is available. Returns the subsetted data and the semantic matrix.

Obligatory Arguments

  • data::DataFrame: the training dataset
  • filepath::String: path to file with word2vec vectors in .txt (not compressed in any way)

Optional Arguments

  • target_col=:Word: column with orthographic representation of words in data
source
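A minimal sketch; the filepath below is a placeholder for a plain-text word2vec vector file, and latin is assumed to be loaded:

latin_subset, S = JudiLing.load_S_matrix_from_word2vec_file(
    latin,
    "/path/to/word2vec_vectors.txt",
    target_col=:Word)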
JudiLing.load_S_matrix_from_word2vec_fileMethod
load_S_matrix_from_word2vec_file(data_train::DataFrame,
                             data_val::DataFrame,
                             filepath::String;
                            target_col=:Word)

Load semantic matrices from a word2vec file at filepath. The word2vec vectors are subset to include only the words in target_col of data_train and data_val, and both datasets are subset to include only the words for which a semantic vector is available. Returns the subsetted train and val data and the train and val semantic matrices.

Obligatory Arguments

  • data_train::DataFrame: the training dataset
  • data_val::DataFrame: the validation dataset
  • filepath::String: path to file with word2vec vectors in .txt (not compressed in any way)

Optional Arguments

  • target_col=:Word: column with orthographic representation of words in data
source
JudiLing.load_S_matrix_from_fasttext_fileMethod
load_S_matrix_from_fasttext_file(data::DataFrame,
                             filepath::String;
                            target_col=:Word)

Load a semantic matrix from a fasttext file at filepath. The fasttext vectors are subset to include only the words in target_col of data, and data is subset to include only the words for which a semantic vector is available. Returns the subsetted data and the semantic matrix.

Obligatory Arguments

  • data::DataFrame: the training dataset
  • filepath::String: path to file with fasttext vectors in .txt or .vec (not compressed in any way)

Optional Arguments

  • target_col=:Word: column with orthographic representation of words in data
source
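A minimal sketch; "cc.la.300.vec" is a placeholder for a downloaded fasttext vector file, and latin is assumed to be loaded:

latin_subset, S = JudiLing.load_S_matrix_from_fasttext_file(
    latin,
    "cc.la.300.vec",
    target_col=:Word)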
JudiLing.load_S_matrix_from_fasttext_fileMethod
load_S_matrix_from_fasttext_file(data_train::DataFrame,
                             data_val::DataFrame,
                             filepath::String;
                            target_col=:Word)

Load semantic matrices from a fasttext file at filepath. The fasttext vectors are subset to include only the words in target_col of data_train and data_val, and both datasets are subset to include only the words for which a semantic vector is available. Returns the subsetted train and val data and the train and val semantic matrices.

Obligatory Arguments

  • data_train::DataFrame: the training dataset
  • data_val::DataFrame: the validation dataset
  • filepath::String: path to file with fasttext vectors in .txt or .vec (not compressed in any way)

Optional Arguments

  • target_col=:Word: column with orthographic representation of words in data
source

Utility functions

JudiLing.merge_f2iMethod
merge_f2i(base_f2i, infl_f2i, n_base_f, n_infl_f)

Merge base f2i dictionary and inflectional f2i dictionary.

source
JudiLing.make_StMethod
make_St(L, n, data, base, inflections)

Make S transpose matrix with inflections.

source
Make Yt Matrix · JudiLing.jl

Make Yt Matrix

JudiLing.make_Yt_matrixMethod
make_Yt_matrix(t, data, f2i)

Make Yt matrix for timestep t. A given column of the Yt matrix specifies the support for the corresponding n-gram predicted for timestep t for each of the observations (rows of Yt).

Obligatory Arguments

  • t::Int64: the timestep t
  • data::DataFrame: the dataset
  • f2i::Dict: the dictionary returning indices given features

Optional Arguments

  • tokenized::Bool=false: if true, the dataset target is assumed to be tokenized
  • sep_token::Union{Nothing, String, Char}=nothing: separator token
  • verbose::Bool=false: if verbose, more information will be printed

Examples

latin = DataFrame(CSV.File(joinpath("data", "latin_mini.csv")))
JudiLing.make_Yt_matrix(2, latin, f2i)
source
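A fuller sketch of where the f2i dictionary comes from: it is part of the cue object, so the columns of the Yt matrix line up with the columns of the C matrix. The file path and keyword values follow the examples elsewhere in this manual:

latin = DataFrame(CSV.File(joinpath("data", "latin_mini.csv")))
cue_obj = JudiLing.make_cue_matrix(latin, grams=3, target_col=:Word)

# support for each n-gram at timestep 2, one row per word form
Yt2 = JudiLing.make_Yt_matrix(2, latin, cue_obj.f2i)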
Measures func · JudiLing.jl

Note: the `kargs` are just keyword arguments that are passed on from the parameters of `get_and_train_model` to the `measures_func`. For example, this could be a suffix that should be added to each added column in `measures_func`.

## Output

The function has to return the dataset.
Output · JudiLing.jl

Output

JudiLing.write2csvFunction

Write results into a csv file. This function takes as input the results from the learn_paths and build_paths functions, including the information on gold paths that is optionally returned as second output result.

source
JudiLing.write2dfFunction

Reformat results into a dataframe. This function takes as input the results from the learn_paths and build_paths functions, including the information on gold paths that is optionally returned as second output result.

source
JudiLing.write2csvMethod
write2csv(res, data, cue_obj_train, cue_obj_val, filename)

Write results into csv file for the results from learn_paths and build_paths.

Obligatory Arguments

  • res::Array{Array{Result_Path_Info_Struct,1},1}: the results from learn_paths or build_paths
  • data::DataFrame: the dataset
  • cue_obj_train::Cue_Matrix_Struct: the cue object for training dataset
  • cue_obj_val::Cue_Matrix_Struct: the cue object for validation dataset
  • filename::String: the filename

Optional Arguments

  • grams::Int64=3: the number n in n-gram cues
  • tokenized::Bool=false: if true, the dataset target is tokenized
  • sep_token::Union{Nothing, String, Char}=nothing: separator
  • start_end_token::Union{String, Char}="#": start and end token in boundary cues
  • output_sep_token::Union{String, Char}="": output separator
  • path_sep_token::Union{String, Char}=":": path separator
  • target_col::Union{String, Symbol}=:Words: the column name for target strings
  • root_dir::String=".": dir path for project root dir
  • output_dir::String=".": output dir inside root dir

Examples

# writing results for training data
 JudiLing.write2csv(
     res_train,
     latin_train,
    ...
     path_sep_token=":",
     target_col=:Word,
     root_dir=".",
    output_dir="test_out")
source
JudiLing.write2csvMethod
write2csv(gpi::Vector{Gold_Path_Info_Struct}, filename)

Write results into csv file for the gold paths' information optionally returned by learn_paths and build_paths.

Obligatory Arguments

  • gpi::Vector{Gold_Path_Info_Struct}: the gold paths' information
  • filename::String: the filename

Optional Arguments

  • root_dir::String=".": dir path for project root dir
  • output_dir::String=".": output dir inside root dir

Examples

# write gold standard paths to csv for training data
 JudiLing.write2csv(
     gpi_train,
     "gpi_latin_train.csv",
    root_dir=".",
    output_dir="test_out"
    )

# write gold standard paths to csv for validation data
JudiLing.write2csv(
    gpi_val,
     "gpi_latin_val.csv",
     root_dir=".",
     output_dir="test_out"
    )
source
JudiLing.write2csvMethod
write2csv(ts::Threshold_Stat_Struct, filename)

Write threshold and tolerance proportions for each timestep into a csv file.

Obligatory Arguments

  • ts::Threshold_Stat_Struct: the threshold and tolerance proportions
  • filename::String: the filename

Optional Arguments

  • root_dir::String=".": dir path for project root dir
  • output_dir::String=".": output dir inside root dir

Examples

JudiLing.write2csv(ts, "ts.csv", root_dir = @__DIR__, output_dir="out")
source
JudiLing.write2dfMethod
write2df(res, data, cue_obj_train, cue_obj_val)

Reformat results into a dataframe for the results from the learn_paths and build_paths functions.

Obligatory Arguments

  • res: output of learn_paths or build_paths
  • data::DataFrame: the dataset
  • cue_obj_train: cue object of the training data set
  • cue_obj_val: cue object of the validation data set

Optional Arguments

  • grams::Int64=3: the number n in n-gram cues
  • tokenized::Bool=false: if true, the dataset target is tokenized
  • sep_token::Union{Nothing, String, Char}=nothing: separator
  • start_end_token::Union{String, Char}="#": start and end token in boundary cues
  • output_sep_token::Union{String, Char}="": output separator
  • path_sep_token::Union{String, Char}=":": path separator
  • target_col::Union{String, Symbol}=:Words: the column name for target strings

Examples

# writing results for training data
 JudiLing.write2df(
     res_train,
     latin_train,
    ...
     start_end_token="#",
     output_sep_token="",
     path_sep_token=":",
    target_col=:Word)
source
JudiLing.write2dfMethod
write2df(gpi::Vector{Gold_Path_Info_Struct})

Write results into a dataframe for the gold paths' information optionally returned by learn_paths and build_paths.

Obligatory Arguments

  • gpi::Vector{Gold_Path_Info_Struct}: the gold paths' information

Examples

# write gold standard paths to df for training data
JudiLing.write2df(gpi_train)
 
 # write gold standard paths to df for validation data
JudiLing.write2df(gpi_val)
source
JudiLing.write2dfMethod
write2df(ts::Threshold_Stat_Struct)

Write threshold and tolerance proportions for each timestep into a dataframe.

Obligatory Arguments

  • ts::Threshold_Stat_Struct: the threshold and tolerance proportion

Examples

JudiLing.write2df(ts)
source
JudiLing.write_comprehension_evalMethod
write_comprehension_eval(SChat, SC, data, target_col, filename)

Write comprehension evaluation into a CSV file, include target and predicted ids and indentifiers and their correlations.

Obligatory Arguments

  • SChat::Matrix: the Shat/Chat matrix
  • SC::Matrix: the S/C matrix
  • data::DataFrame: the data
  • target_col::Symbol: the name of target column
  • filename::String: the filename/filepath

Optional Arguments

  • k: top k candidates
  • root_dir::String=".": dir path for project root dir
  • output_dir::String=".": output dir inside root dir

Examples

JudiLing.write_comprehension_eval(Chat, cue_obj.C, latin, :Word, "output.csv",
+    k=10, root_dir=@__DIR__, output_dir="out")
source
JudiLing.write_comprehension_evalMethod
write_comprehension_eval(SChat, SC, SC_rest, data, data_rest, target_col, filename)

Write comprehension evaluation into a CSV file for both training and validation datasets, include target and predicted ids and indentifiers and their correlations.

Obligatory Arguments

  • SChat::Matrix: the Shat/Chat matrix
  • SC::Matrix: the S/C matrix
  • SC_rest::Matrix: the rest S/C matrix
  • data::DataFrame: the data
  • data_rest::DataFrame: the rest data
  • target_col::Symbol: the name of target column
  • filename::String: the filename/filepath

Optional Arguments

  • k: top k candidates
  • root_dir::String=".": dir path for project root dir
  • output_dir::String=".": output dir inside root dir

Examples

JudiLing.write_comprehension_eval(Shat_val, S_val, S_train, latin_val, latin_train,
+    :Word, "all_output.csv", k=10, root_dir=@__DIR__, output_dir="out")
source
JudiLing.save_L_matrixMethod
save_L_matrix(L, filename)

Save lexome matrix into csv file.

Obligatory Arguments

  • L::L_Matrix_Struct: the lexome matrix struct
  • filename::String: the filename/filepath

Examples

JudiLing.save_L_matrix(L, joinpath(@__DIR__, "L.csv"))
source
JudiLing.load_L_matrixMethod
load_L_matrix(filename)

Load lexome matrix from csv file.

Obligatory Arguments

  • filename::String: the filename/filepath

Optional Arguments

  • header::Bool=false: header in csv

Examples

L_load = JudiLing.load_L_matrix(joinpath(@__DIR__, "L.csv"))
source
JudiLing.save_S_matrixMethod
save_S_matrix(S, filename, data, target_col)

Save S matrix into a csv file.

Obligatory Arguments

  • S::Matrix: the S matrix
  • filename::String: the filename/filepath
  • data::DataFrame: the data
  • target_col::Symbol: the name of target column

Optional Arguments

  • sep::Bool=" ": separator in CSV file

Examples

JudiLing.save_S_matrix(S, joinpath(@__DIR__, "S.csv"), latin, :Word)
source
JudiLing.load_S_matrixMethod
load_S_matrix(filename)

Load S matrix from a csv file.

Obligatory Arguments

  • filename::String: the filename/filepath

Optional Arguments

  • header::Bool=false: header in csv
  • sep::Bool=" ": separator in CSV file

Examples

JudiLing.load_S_matrix(joinpath(@__DIR__, "S.csv"))
source
diff --git a/dev/man/pickle/index.html b/dev/man/pickle/index.html
Pickle · JudiLing.jl

diff --git a/dev/man/preprocess/index.html b/dev/man/preprocess/index.html
Preprocess · JudiLing.jl

Preprocess
diff --git a/dev/man/pyndl/index.html b/dev/man/pyndl/index.html
Pyndl · JudiLing.jl

Note: For pyndl to be available in JudiLing, PyCall has to be imported before JudiLing:

using PyCall
using JudiLing

Calling pyndl from JudiLing

JudiLing.Pyndl_Weight_StructType
Pyndl_Weight_Struct
     cues::Vector{String}
     outcomes::Vector{String}
     weight::Matrix{Float64}
  • cues::Vector{String}: Vector of cues, in the order that they appear in the weight matrix.
  • outcomes::Vector{String}: Vector of outcomes, in the order that they appear in the weight matrix.
  • weight::Matrix{Float64}: Weight matrix.
source
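For quick inspection, the fields of the struct can be accessed directly once weights have been computed with pyndl (documented below; the path is a placeholder):

weights = JudiLing.pyndl("data/latin_train_events.tab.gz")
length(weights.cues), length(weights.outcomes), size(weights.weight)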
JudiLing.pyndlMethod
pyndl(
     data_path::String;
     alpha::Float64 = 0.1,
     betas::Tuple{Float64,Float64} = (0.1, 0.1),
     method::String = "openmp"
)

Compute weights using pyndl. See the documentation of pyndl for more information: https://pyndl.readthedocs.io/en/latest/

Obligatory arguments

  • data_path::String: Path to an events file as generated by pyndl's preprocess.create_event_file

Optional arguments

  • alpha::Float64 = 0.1: α learning rate.
  • betas::Tuple{Float64,Float64} = (0.1, 0.1): β1 and β2 learning rates
  • method::String = "openmp": One of {"openmp", "threading"}. "openmp" only works on Linux.

Example

weights = JudiLing.pyndl("data/latin_train_events.tab.gz")
source

Translating output of pyndl to cue and semantic matrices in JudiLing

With the weights in hand, the cue and semantic matrices can be computed:

JudiLing.make_cue_matrixMethod
make_cue_matrix(
     data::DataFrame,
     pyndl_weights::Pyndl_Weight_Struct;
     grams = 3,
     target_col = "Words",
     tokenized = false,
     sep_token = nothing,
     keep_sep = false,
     start_end_token = "#",
     verbose = false,
 )

Make the cue matrix based on a dataframe and weights computed with pyndl. Practically this means that the cues are extracted from the weights object and translated to the JudiLing format.

Obligatory arguments

  • data::DataFrame: Dataset with all the word types on which the weights were trained.
  • pyndl_weights::Pyndl_Weight_Struct: Weights trained with JudiLing.pyndl

Optional arguments

  • grams = 3: N-gram size (has to match the n-gram granularity of the cues on which the weights were trained).
  • target_col = "Words": Column with target words.
  • tokenized = false: Whether the target words are already tokenized
  • sep_token = nothing: The string separating the tokens (only used if tokenized=true).
  • keep_sep = false: Whether the sep_token should be retained in the cues.
  • start_end_token = "#": The string with which to mark word boundaries.
  • verbose = false: Verbose mode.

Example

weights = JudiLing.pyndl("data/latin_train_events.tab.gz")
latin_train = DataFrame(CSV.File("latin_train.csv"))
cue_obj = JudiLing.make_cue_matrix(latin_train, weights,
                                   grams = 3,
                                   target_col = "Word")
source
JudiLing.make_S_matrixMethod
make_S_matrix(
     data::DataFrame,
     pyndl_weights::Pyndl_Weight_Struct,
     n_features_columns::Vector;
     tokenized::Bool=false,
     sep_token::String="_"
 )

Create a semantic matrix based on a dataframe and weights computed with pyndl. Practically this means that the semantic features are extracted from the weights object and translated to the JudiLing format.

Obligatory arguments

  • data::DataFrame: The dataset with word types.
  • pyndl_weights::Pyndl_Weight_Struct: Weights trained with JudiLing.pyndl.
  • n_features_columns::Vector: Vector of columns with the features in the dataset.

Optional arguments

  • tokenized=false: Whether the features in n_features_columns columns are already tokenized (e.g. "feature1_feature2_feature3")
  • sep_token="_": The string with which the features are separated (only used if tokenized=false).

Example

weights = JudiLing.pyndl("data/latin_train_events.tab.gz")
 S = JudiLing.make_S_matrix(data,
                             weights_latin,
                             ["Lexeme", "Person", "Number", "Tense", "Voice", "Mood"],
                            tokenized=false)
source
JudiLing.make_S_matrixMethod
make_S_matrix(
     data_train::DataFrame,
     data_val::DataFrame,
     pyndl_weights::Pyndl_Weight_Struct,
     n_features_columns::Vector;
     tokenized::Bool=false,
     sep_token::String="_"
 )

Create a semantic matrix based on a training and validation dataframe and weights computed with pyndl. Practically this means that the semantic features are extracted from the weights object and translated to the JudiLing format.

Obligatory arguments

  • data_train::DataFrame: The training dataset.
  • data_val::DataFrame: The validation dataset.
  • pyndl_weights::Pyndl_Weight_Struct: Weights trained with JudiLing.pyndl.
  • n_features_columns::Vector: Vector of columns with the features in the training and validation datasets.

Optional arguments

  • tokenized=false: Whether the features in n_features_columns columns are already tokenized (e.g. "feature1_feature2_feature3")
  • sep_token="_": The string with which the features are separated (only used if tokenized=false).

Example

weights = JudiLing.pyndl("data/latin_train_events.tab.gz")
S_train, S_val = JudiLing.make_S_matrix(train,
                             val,
                             weights_latin,
                             ["Lexeme", "Person", "Number", "Tense", "Voice", "Mood"],
                            tokenized=false)
source
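Putting this page together, a minimal end-to-end sketch (file paths are placeholders, and PyCall must be loaded before JudiLing for pyndl to be available):

using PyCall                 # must come before JudiLing for pyndl support
using JudiLing, CSV, DataFrames

weights = JudiLing.pyndl("data/latin_train_events.tab.gz")
latin_train = DataFrame(CSV.File("latin_train.csv"))
cue_obj = JudiLing.make_cue_matrix(latin_train, weights,
                                   grams = 3, target_col = "Word")
S = JudiLing.make_S_matrix(latin_train, weights,
                           ["Lexeme", "Person", "Number", "Tense", "Voice", "Mood"],
                           tokenized = false)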
diff --git a/dev/man/test_combo/index.html b/dev/man/test_combo/index.html
Test Combo · JudiLing.jl

Test Combo

JudiLing.test_comboMethod
test_combo(test_mode;kwargs...)

A wrapper function for a full model for a specific combination of parameters. A detailed introduction is in Test Combo Introduction

Note

test_combo is deprecated. While it will remain in the package, it is no longer actively maintained.

Obligatory Arguments

  • test_mode::Symbol: which test mode, currently supports :train_only, :pre_split, :careful_split and :random_split.

Optional Arguments

  • train_sample_size::Int64=0: the desired number of training data
  • val_sample_size::Int64=0: the desired number of validation data
  • val_ratio::Float64=0.0: the desired proportion of validation data; works only if val_sample_size is 0
  • extension::String=".csv": the extension for data files
  • n_grams_target_col::Union{String, Symbol}=:Word: the column name for target strings
  • n_grams_tokenized::Boolean=false: if true, the dataset target is assumed to be tokenized
  • n_grams_sep_token::String=nothing: separator
  • grams::Int64=3: the number of grams for cues
  • n_grams_keep_sep::Boolean=false: if true, keep separators in cues
  • start_end_token::String=":": start and end token in boundary cues
  • path_sep_token::String=":": path separator in the assembled path
  • random_seed::Int64=314: the random seed
  • sd_base_mean::Int64=1: the sd mean of base features
  • sd_inflection_mean::Int64=1: the sd mean of inflectional features
  • sd_base::Int64=4: the sd of base features
  • sd_inflection::Int64=4: the sd of inflectional features
  • isdeep::Boolean=true: if true, mean of each feature is also randomized
  • add_noise::Boolean=true: if true, add additional Gaussian noise
  • sd_noise::Int64=1: the sd of the Gaussian noise
  • normalized::Boolean=false: if true, most of the values range between -1 and 1; they may slightly exceed this range depending on the sd
  • if_combined::Boolean=false: if true, then features are combined with both training and validation data
  • learn_mode::Symbol=:cholesky: which learning mode, currently supports :cholesky and :wh
  • method::Symbol=:additive: whether :additive or :multiplicative decomposition is required
  • shift::Float64=0.02: shift value for :additive decomposition
  • multiplier::Float64=1.01: multiplier value for :multiplicative decomposition
  • output_format::Symbol=:auto: force the output format to dense (:dense) or sparse (:sparse), or use :auto to let the program decide
  • sparse_ratio::Float64=0.05: the ratio to decide whether a matrix is sparse
  • wh_freq::Vector=nothing: the learning sequence
  • init_weights::Matrix=nothing: the initial weights
  • eta::Float64=0.1: the learning rate
  • n_epochs::Int64=1: the number of epochs to be trained
  • max_t::Int64=0: the maximum timestep
  • A::Matrix=nothing: the adjacency matrix
  • A_mode::Symbol=:combined: the adjacency matrix mode, currently supports :combined or :train_only
  • max_can::Int64=10: the max number of candidate paths to keep in the output
  • threshold_train::Float64=0.1: the value set for the support such that if the support of an n-gram is higher than this value, the n-gram will be taken into consideration for training data
  • is_tolerant_train::Bool=false: if true, select a specified number (given by max_tolerance) of n-grams whose supports are below threshold but above a second tolerance threshold to be added to the path for training data
  • tolerance_train::Float64=-0.1: the value set for the second threshold (in tolerant mode) such that if the support for an n-gram is in between this value and the threshold and the max_tolerance number has not been reached, then allow this n-gram to be added to the path for training data
  • max_tolerance_train::Int64=2: maximum number of n-grams allowed in a path for training data
  • threshold_val::Float64=0.1: the value set for the support such that if the support of an n-gram is higher than this value, the n-gram will be taken into consideration for validation data
  • is_tolerant_val::Bool=false: if true, select a specified number (given by max_tolerance) of n-grams whose supports are below threshold but above a second tolerance threshold to be added to the path for validation data
  • tolerance_val::Float64=-0.1: the value set for the second threshold (in tolerant mode) such that if the support for an n-gram is in between this value and the threshold and the max_tolerance number has not been reached, then allow this n-gram to be added to the path for validation data
  • max_tolerance_val::Int64=2: maximum number of n-grams allowed in a path for validation data
  • n_neighbors_train::Int64=10: the top n form neighbors to be considered for training data
  • n_neighbors_val::Int64=20: the top n form neighbors to be considered for validation data
  • issparse::Bool=false: if true, keep sparse matrix format when learning paths
  • output_dir::String="out": the output directory
  • verbose::Bool=false: if true, more information will be printed
source
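The docstring gives no usage example, so here is a hypothetical minimal invocation using only keywords documented above; a real run additionally needs the dataset-specific arguments for your data files:

JudiLing.test_combo(
    :train_only,
    n_grams_target_col = :Word,
    grams = 3,
    learn_mode = :cholesky,
    output_dir = "out",
    verbose = true,
)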
diff --git a/dev/man/utils/index.html b/dev/man/utils/index.html
Utils · JudiLing.jl

Utils

JudiLing.is_truly_sparseFunction

Check whether a matrix is truly sparse regardless of its format, where M is originally in a sparse matrix format.

source

Check whether a matrix is truly sparse regardless of its format, where M is originally in a dense matrix format.

source
JudiLing.cal_max_timestepFunction
function cal_max_timestep(
     data_train::DataFrame,
     data_val::DataFrame,
     target_col::Union{String, Symbol};
     tokenized::Bool = false,
     sep_token::Union{Nothing, String, Char} = "",
)

Calculate the max timestep given training and validation datasets.

Obligatory Arguments

  • data_train::DataFrame: the training dataset
  • data_val::DataFrame: the validation dataset
  • target_col::Union{String, Symbol}: the column with the target word forms

Optional Arguments

  • tokenized::Bool = false: Whether the word forms in the target_col are already tokenized
  • sep_token::Union{Nothing, String, Char} = "": The token with which the word forms are tokenized

Examples

JudiLing.cal_max_timestep(latin_train, latin_val, :Word)
source
function cal_max_timestep(
     data::DataFrame,
     target_col::Union{String, Symbol};
     tokenized::Bool = false,
     sep_token::Union{Nothing, String, Char} = "",
)

Calculate the max timestep given training dataset.

Obligatory Arguments

  • data::DataFrame: the dataset
  • target_col::Union{String, Symbol}: the column with the target word forms

Optional Arguments

  • tokenized::Bool = false: Whether the word forms in the target_col are already tokenized
  • sep_token::Union{Nothing, String, Char} = "": The token with which the word forms are tokenized

Examples

JudiLing.cal_max_timestep(latin, :Word)
source
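A sketch of typical usage: the returned value is forwarded as the max_t argument of functions that iterate over timesteps, such as learn_paths:

max_t = JudiLing.cal_max_timestep(latin, :Word)
# e.g. learn_paths(..., max_t = max_t, ...)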
diff --git a/dev/man/wh/index.html b/dev/man/wh/index.html
Widrow-Hoff Learning · JudiLing.jl

JudiLing.wh_learnMethod
wh_learn(
    X,
    Y;
    eta = 0.01,
    n_epochs = 1,
    weights = nothing,
    learn_seq = nothing,
    save_history = false,
    history_cols = nothing,
    history_rows = nothing,
    verbose = false,
)

Widrow-Hoff Learning.

Obligatory Arguments

  • X: the input matrix
  • Y: the output/target matrix

Optional Arguments

  • eta::Float64=0.01: the learning rate
  • n_epochs::Int64=1: the number of epochs to be trained
  • weights::Matrix=nothing: the initial weights
  • learn_seq::Vector=nothing: the learning sequence
  • save_history::Bool=false: if true, a partial training history will be saved
  • history_cols::Vector=nothing: the column indices to save in the history, e.g. [1,32,42] or [2]
  • history_rows::Vector=nothing: the row indices to save in the history, e.g. [1,32,42] or [2]
  • verbose::Bool=false: if true, more information will be printed out

source
JudiLing.make_learn_seqMethod
make_learn_seq(freq; random_seed = 314)

Make a Widrow-Hoff learning sequence from frequencies. Creates a randomly ordered sequence of indices in which each index appears according to its frequency.

Obligatory arguments

  • freq: Vector with frequencies.

Optional arguments

  • random_seed = 314: Random seed to control randomness.

Example

learn_seq = JudiLing.make_learn_seq(data.frequency)
source
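make_learn_seq is typically paired with wh_learn (documented above): the frequency-ordered sequence determines the order in which rows of X and Y are presented. A sketch, assuming a dataset latin with a Frequency column and an existing cue/semantic matrix pair:

learn_seq = JudiLing.make_learn_seq(latin.Frequency)
F = JudiLing.wh_learn(cue_obj.C, S,
                      eta = 0.01,
                      n_epochs = 1,
                      learn_seq = learn_seq)
Shat = cue_obj.C * F    # comprehension predictions with the learned mapping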
      diff --git a/dev/search_index.js b/dev/search_index.js index ff02ab3..7fdce6e 100644 --- a/dev/search_index.js +++ b/dev/search_index.js @@ -1,3 +1,3 @@ var documenterSearchIndex = {"docs": -[{"location":"man/deep_learning/","page":"Deep learning","title":"Deep learning","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/deep_learning/#Deep-learning-in-JudiLing","page":"Deep learning","title":"Deep learning in JudiLing","text":"","category":"section"},{"location":"man/deep_learning/","page":"Deep learning","title":"Deep learning","text":"predict_from_deep_model(model::Flux.Chain,\n X::Union{SparseMatrixCSC,Matrix})\npredict_shat(model::Flux.Chain,\n ci::Vector{Int})\nget_and_train_model(X_train::Union{SparseMatrixCSC,Matrix},\n Y_train::Union{SparseMatrixCSC,Matrix},\n X_val::Union{SparseMatrixCSC,Matrix,Missing},\n Y_val::Union{SparseMatrixCSC,Matrix,Missing},\n data_train::Union{DataFrame,Missing},\n data_val::Union{DataFrame,Missing},\n target_col::Union{Symbol, String,Missing},\n model_outpath::String;\n hidden_dim::Int=1000,\n n_epochs::Int=100,\n batchsize::Int=64,\n loss_func::Function=Flux.mse,\n optimizer=Flux.Adam(0.001),\n model::Union{Missing, Flux.Chain} = missing,\n early_stopping::Union{Missing, Int}=missing,\n optimise_for_acc::Bool=false,\n return_losses::Bool=false,\n verbose::Bool=true,\n measures_func::Union{Missing, Function}=missing,\n return_train_acc::Bool=false,\n kargs...)\nget_and_train_model(X_train::Union{SparseMatrixCSC,Matrix},\n Y_train::Union{SparseMatrixCSC,Matrix},\n model_outpath::String;\n data_train::Union{Missing, DataFrame}=missing,\n target_col::Union{Missing, Symbol, String}=missing,\n hidden_dim::Int=1000,\n n_epochs::Int=100,\n batchsize::Int=64,\n loss_func::Function=Flux.mse,\n optimizer=Flux.Adam(0.001),\n model::Union{Missing, Flux.Chain} = missing,\n return_losses::Bool=false,\n verbose::Bool=true,\n measures_func::Union{Missing, Function}=missing,\n return_train_acc::Bool=false,\n kargs...)\nfiddl(X_train::Union{SparseMatrixCSC,Matrix},\n Y_train::Union{SparseMatrixCSC,Matrix},\n learn_seq::Vector,\n data::DataFrame,\n target_col::Union{Symbol, String},\n model_outpath::String;\n hidden_dim::Int=1000,\n batchsize::Int=64,\n loss_func::Function=Flux.mse,\n optimizer=Flux.Adam(0.001),\n model::Union{Missing, Chain} = missing,\n return_losses::Bool=false,\n verbose::Bool=true,\n n_batch_eval::Int=100,\n measures_func::Union{Function, Missing}=missing,\n kargs...)\n","category":"page"},{"location":"man/deep_learning/#JudiLing.predict_from_deep_model-Tuple{Chain, Union{SparseArrays.SparseMatrixCSC, Matrix}}","page":"Deep learning","title":"JudiLing.predict_from_deep_model","text":"predict_from_deep_model(model::Chain,\n X::Union{SparseMatrixCSC,Matrix})\n\nGenerates output of a model given input X.\n\nObligatory arguments\n\nmodel::Chain: Model of type Flux.Chain, as generated by get_and_train_model\nX::Union{SparseMatrixCSC,Matrix}: Input matrix of size (numberofsamples, inpdim) where inpdim is the input dimension of model\n\n\n\n\n\n","category":"method"},{"location":"man/deep_learning/#JudiLing.predict_shat-Tuple{Chain, Vector{Int64}}","page":"Deep learning","title":"JudiLing.predict_shat","text":"predict_shat(model::Chain,\n ci::Vector{Int})\n\nPredicts semantic vector shat given a deep learning comprehension model model and a list of indices of ngrams ci.\n\nObligatory arguments\n\nmodel::Chain: Deep learning comprehension model as generated by get_and_train_model\nci::Vector{Int}: Vector of indices of ngrams in c 
vector. Essentially, this is a vector indicating which ngrams in a c vector are absent and which are present.\n\n\n\n\n\n","category":"method"},{"location":"man/deep_learning/#JudiLing.get_and_train_model-Tuple{Union{SparseArrays.SparseMatrixCSC, Matrix}, Union{SparseArrays.SparseMatrixCSC, Matrix}, Union{Missing, SparseArrays.SparseMatrixCSC, Matrix}, Union{Missing, SparseArrays.SparseMatrixCSC, Matrix}, Union{Missing, DataFrames.DataFrame}, Union{Missing, DataFrames.DataFrame}, Union{Missing, String, Symbol}, String}","page":"Deep learning","title":"JudiLing.get_and_train_model","text":"get_and_train_model(X_train::Union{SparseMatrixCSC,Matrix},\n Y_train::Union{SparseMatrixCSC,Matrix},\n X_val::Union{SparseMatrixCSC,Matrix,Missing},\n Y_val::Union{SparseMatrixCSC,Matrix,Missing},\n data_train::Union{DataFrame,Missing},\n data_val::Union{DataFrame,Missing},\n target_col::Union{Symbol,String,Missing},\n model_outpath::String;\n hidden_dim::Int=1000,\n n_epochs::Int=100,\n batchsize::Int=64,\n loss_func::Function=Flux.mse,\n optimizer=Flux.Adam(0.001)\n model::Union{Missing, Chain}=missing,\n early_stopping::Union{Missing, Int}=missing,\n optimise_for_acc::Bool=false\n return_losses::Bool=false,\n verbose::Bool=true,\n measures_func::Union{Missing, Function}=missing,\n return_train_acc::Bool=false,\n ...kargs\n )\n\nTrains a deep learning model from X_train to Y_train, saving the model with either the highest validation accuracy or lowest validation loss (depending on optimise_for_acc) to outpath.\n\nThe default model looks like this:\n\ninp_dim = size(X_train, 2)\nout_dim = size(Y_train, 2)\nChain(Dense(inp_dim => hidden_dim, relu), Dense(hidden_dim => out_dim))\n\nAny other model with the same input and output dimensions can be provided to the function with the model argument. The default loss function is mean squared error, but any other loss function can be provded, as long as it fits with the model architecture.\n\nBy default the adam optimizer (Kingma and Ba, 2015) with learning rate 0.001 is used. You can provide any other optimizer. If you want to use a different learning rate, e.g. 0.01, provide optimizer=Flux.Adam(0.01). 
If you do not want to use an optimizer at all, and simply use normal gradient descent, provide optimizer=Descent(0.001), again replacing the learning rate with the learning rate of your preference.\n\nReturns a named tuple with the following values:\n\nmodel: the trained model\ndata_train: the training data, including any measures if computed by measures_func\ndata_val: the validation data, including any measures if computed by measures_func\nlosses_train: The losses of the training data for each epoch.\nlosses_val: The losses of the validation data after each epoch.\naccs_train: The accuracies of the training data after each epoch, if return_train_acc=true.\naccs_val: The accuracies of the validation data after each epoch.\n\nObligatory arguments\n\nX_train::Union{SparseMatrixCSC,Matrix}: training input matrix of dimension m x n\nY_train::Union{SparseMatrixCSC,Matrix}: training output/target matrix of dimension m x k\nX_train::Union{SparseMatrixCSC,Matrix}: validation input matrix of dimension l x n\nY_train::Union{SparseMatrixCSC,Matrix}: validation output/target matrix of dimension l x k\ndata_train::DataFrame: training data\ndata_val::DataFrame: validation data\ntarget_col::Union{Symbol, String}: column with target wordforms in datatrain and dataval\nmodel_outpath::String: filepath to where final model should be stored (in .bson format)\n\nOptional arguments\n\nhidden_dim::Int=1000: hidden dimension of the model\nn_epochs::Int=100: number of epochs for which the model should be trained\nbatchsize::Int=64: batchsize during training\nloss_func::Function=Flux.mse: Loss function. Per default this is the mse loss, but other options might be a crossentropy loss (Flux.crossentropy). Make sure the model makes sense with the loss function!\noptimizer=Flux.Adam(0.001): optimizer to use for training\nmodel::Union{Missing, Chain} = missing: A custom model can be provided for training. Its requirements are that it has to correspond to the input and output size of the training and validation data\nearly_stopping::Union{Missing, Int}=missing: If missing, no early stopping is used. Otherwise early_stopping indicates how many epochs have to pass without improvement in validation accuracy before the training is stopped.\noptimise_for_acc::Bool=false: if true, keep model with highest validation accuracy. If false, keep model with lowest validation loss.\nreturn_losses::Bool=false: whether additional to the model per-epoch losses for the training and test data as well as per-epoch accuracy on the validation data should be returned\nverbose::Bool=true: Turn on verbose mode\nmeasures_func::Union{Missing, Function}=missing: A measures function which is run at the end of every epoch. For more information see The measures_func argument. 
If a measure is tagged for each epoch, the one tagged with \"final\" will be the one for the finally returned model.\nreturn_train_acc::Bool=false: If true, a vector with training accuracies is returned at the end of the training.\n...kargs: any additional keyword arguments are passed to the measures_func\n\n\n\n\n\n","category":"method"},{"location":"man/deep_learning/#JudiLing.get_and_train_model-Tuple{Union{SparseArrays.SparseMatrixCSC, Matrix}, Union{SparseArrays.SparseMatrixCSC, Matrix}, String}","page":"Deep learning","title":"JudiLing.get_and_train_model","text":"get_and_train_model(X_train::Union{SparseMatrixCSC,Matrix},\n Y_train::Union{SparseMatrixCSC,Matrix},\n model_outpath::String;\n data_train::Union{Missing, DataFrame}=missing,\n target_col::Union{Missing, Symbol, String}=missing,\n hidden_dim::Int=1000,\n n_epochs::Int=100,\n batchsize::Int=64,\n loss_func::Function=Flux.mse,\n optimizer=Flux.Adam(0.001),\n model::Union{Missing, Chain} = missing,\n return_losses::Bool=false,\n verbose::Bool=true,\n measures_func::Union{Missing, Function}=missing,\n return_train_acc::Bool=false,\n ...kargs)\n\nTrains a deep learning model from X_train to Y_train, saving the model after n_epochs epochs. The default model looks like this:\n\ninp_dim = size(X_train, 2)\nout_dim = size(Y_train, 2)\nChain(Dense(inp_dim => hidden_dim, relu), Dense(hidden_dim => out_dim))\n\nAny other model with the same input and output dimensions can be provided to the function with the model argument. The default loss function is mean squared error, but any other loss function can be provded, as long as it fits with the model architecture.\n\nBy default the adam optimizer (Kingma and Ba, 2015) with learning rate 0.001 is used. You can provide any other optimizer. If you want to use a different learning rate, e.g. 0.01, provide optimizer=Flux.Adam(0.01). If you do not want to use an optimizer at all, and simply use normal gradient descent, provide optimizer=Descent(0.001), again replacing the learning rate with the learning rate of your preference.\n\nReturns a named tuple with the following values:\n\nmodel: the trained model\ndata_train: the data, including any measures if computed by measures_func\ndata_val: missing for this function\nlosses_train: The losses of the training data for each epoch.\nlosses_val: missing for this function\naccs_train: The accuracies of the training data after each epoch, if return_train_acc=true.\naccs_val: missing for this function\n\nObligatory arguments\n\nX_train::Union{SparseMatrixCSC,Matrix}: training input matrix of dimension m x n\nY_train::Union{SparseMatrixCSC,Matrix}: training output/target matrix of dimension m x k\nmodel_outpath::String: filepath to where final model should be stored (in .bson format)\n\nOptional arguments\n\ndata_train::Union{Missing, DataFrame}=missing: The training data. Only necessary if a measuresfunc is included or returntrain_acc=true.\ntarget_col::Union{Missing, Symbol, String}=missing: The column with target word forms in the training data. Only necessary if a measuresfunc is included or returntrain_acc=true.\nhidden_dim::Int=1000: hidden dimension of the model\nn_epochs::Int=100: number of epochs for which the model should be trained\nbatchsize::Int=64: batchsize during training\nloss_func::Function=Flux.mse: Loss function. Per default this is the mse loss, but other options might be a crossentropy loss (Flux.crossentropy). 
Make sure the model makes sense with the loss function!\noptimizer=Flux.Adam(0.001): optimizer to use for training\nmodel::Union{Missing, Chain} = missing: A custom model can be provided for training. Its requirements are that it has to correspond to the input and output size of the training and validation data\nreturn_losses::Bool=false: whether additional to the model per-epoch losses for the training and test data as well as per-epoch accuracy on the validation data should be returned\nverbose::Bool=true: Turn on verbose mode\nmeasures_func::Union{Missing, Function}=missing: A measures function which is run at the end of every epoch. For more information see The measures_func argument.\nreturn_train_acc::Bool=false: If true, a vector with training accuracies is returned at the end of the training.\n...kargs: any additional keyword arguments are passed to the measures_func\n\n\n\n\n\n","category":"method"},{"location":"man/deep_learning/#JudiLing.fiddl-Tuple{Union{SparseArrays.SparseMatrixCSC, Matrix}, Union{SparseArrays.SparseMatrixCSC, Matrix}, Vector, DataFrames.DataFrame, Union{String, Symbol}, String}","page":"Deep learning","title":"JudiLing.fiddl","text":"fiddl(X_train::Union{SparseMatrixCSC,Matrix},\n Y_train::Union{SparseMatrixCSC,Matrix},\n learn_seq::Vector,\n data::DataFrame,\n target_col::Union{Symbol, String},\n model_outpath::String;\n hidden_dim::Int=1000,\n batchsize::Int=64,\n loss_func::Function=Flux.mse,\n optimizer=Flux.Adam(0.001),\n model::Union{Missing, Chain} = missing,\n return_losses::Bool=false,\n verbose::Bool=true,\n n_batch_eval::Int=100,\n compute_accuracy::Bool=true,\n measures_func::Union{Function, Missing}=missing,\n kargs...)\n\nTrains a deep learning model using the FIDDL method (frequency-informed deep discriminative learning). Optionally, after each n_batch_eval batches measures_func can be run to compute any measures which are then added to the data.\n\nnote: Note\nIf you get an OutOfMemory error, chances are that this is due to the eval_SC function being evaluated after each n_batch_eval batches. Setting compute_accuracy=false disables computing the mapping accuracy.\n\nReturns a named tuple with the following values:\n\nmodel: the trained model\ndata: the data, including any measures if computed by measures_func\nlosses_train: The losses of the data the model is trained on within each n_batch_eval batches.\nlosses: The losses of the full dataset after each n_batch_eval batches.\naccs: The accuracies of the full dataset after each n_batch_eval batches.\n\nObligatory arguments\n\nX_train::Union{SparseMatrixCSC,Matrix}: training input matrix of dimension m x n\nY_train::Union{SparseMatrixCSC,Matrix}: training output/target matrix of dimension m x k\nlearn_seq::Vector: List of indices in the order that the vectors in Xtrain and Ytrain should be presented to the model for training.\ndata::DataFrame: The full data.\ntarget_col::Union{Symbol, String}: The column with target word forms in the data.\nmodel_outpath::String: filepath to where final model should be stored (in .bson format)\n\nOptional arguments\n\nhidden_dim::Int=1000: hidden dimension of the model\nn_epochs::Int=100: number of epochs for which the model should be trained\nbatchsize::Int=64: batchsize during training\nloss_func::Function=Flux.mse: Loss function. Per default this is the mse loss, but other options might be a crossentropy loss (Flux.crossentropy). 
Make sure the model makes sense with the loss function!\noptimizer=Flux.Adam(0.001): optimizer to use for training\nmodel::Union{Missing, Chain} = missing: A custom model can be provided for training. Its requirements are that it has to correspond to the input and output size of the training and validation data\nreturn_losses::Bool=false: whether additional to the model per-epoch losses for the training and test data as well as per-epoch accuracy on the validation data should be returned\nverbose::Bool=true: Turn on verbose mode\nn_batch_eval::Int=100: Loss, accuracy and measures_func are evaluated every n_batch_eval batches.\ncompute_accuracy::Bool=true: Whether accuracy should be computed every n_batch_eval batches.\nmeasures_func::Union{Missing, Function}=missing: A measures function which is run each n_batch_eval batches. For more information see The measures_func argument.\n\n\n\n\n\n","category":"method"},{"location":"man/pickle/","page":"Pickle","title":"Pickle","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/pickle/#Utils","page":"Pickle","title":"Utils","text":"","category":"section"},{"location":"man/pickle/","page":"Pickle","title":"Pickle","text":" save_pickle\n load_pickle","category":"page"},{"location":"man/pickle/#JudiLing.save_pickle","page":"Pickle","title":"JudiLing.save_pickle","text":"Save pickle from python pickle file.\n\n\n\n\n\n","category":"function"},{"location":"man/pickle/#JudiLing.load_pickle","page":"Pickle","title":"JudiLing.load_pickle","text":"Load pickle from python pickle file.\n\n\n\n\n\n","category":"function"},{"location":"man/measures_func/#The-measures_func-argument","page":"Measures function","title":"The measures_func argument","text":"","category":"section"},{"location":"man/measures_func/","page":"Measures function","title":"Measures function","text":"The deep learning functions get_and_train_model and fiddl take a measures_func as one of their arguments. This helps computing measures during the training. For this to work, the measures_func has to conform to the following format.","category":"page"},{"location":"man/measures_func/#For-get_and_train_model","page":"Measures function","title":"For get_and_train_model","text":"","category":"section"},{"location":"man/measures_func/","page":"Measures function","title":"Measures function","text":"data_train, data_val = measures_func(X_train,\n Y_train,\n X_val,\n Y_val,\n Yhat_train,\n Yhat_val,\n data_train,\n data_val,\n target_col,\n model,\n epoch;\n kargs...)\n\n## Input\n\n- `X_train`: The input training matrix.\n- `Y_train`: The target training matrix\n- `X_val`: The input validation matrix.\n- `Y_val`: The target validation matrix.\n- `Yhat_train`: The predicted training matrix.\n- `Yhat_val`: The predicted validation matrix.\n- `data_train`: The training dataset.\n- `data_val`: The validation dataset.\n- `target_col`: The name of the column with the target wordforms in the datasets.\n- `model`: The trained model.\n- `epoch`: The epoch the training is currently in.\n- `kargs...`: Any other keyword arguments that should be passed to the function.\n\nNote: the `kargs` are just keyword arguments that are passed on from the parameters of `get_and_train_model` to the `measures_func`. 
For example, this could be a suffix that should be added to each added column in `measures_func`.\n\n## Output\nThe function has to return the training and validation dataframes.","category":"page"},{"location":"man/measures_func/#Example","page":"Measures function","title":"Example","text":"","category":"section"},{"location":"man/measures_func/","page":"Measures function","title":"Measures function","text":"Define a measures_func. This one computes target correlations for both training and validation datasets.","category":"page"},{"location":"man/measures_func/","page":"Measures function","title":"Measures function","text":"function compute_target_corr(X_train, Y_train, X_val, Y_val,\n Yhat_train, Yhat_val, data_train,\n data_val, target_col, model, epoch)\n _, corr = JudiLing.eval_SC(Yhat_train, Y_train, R=true)\n data_train[!, string(\"target_corr_\", epoch)] = diag(corr)\n _, corr = JudiLing.eval_SC(Yhat_val, Y_val, R=true)\n data_val[!, string(\"target_corr_\", epoch)] = diag(corr)\n return(data_train, data_val)\nend","category":"page"},{"location":"man/measures_func/","page":"Measures function","title":"Measures function","text":"Train a model for 100 epochs, call compute_target_corr after each epoch.","category":"page"},{"location":"man/measures_func/","page":"Measures function","title":"Measures function","text":"res = JudiLing.get_and_train_model(cue_obj_train.C,\n S_train,\n cue_obj_val.C,\n S_val,\n train, val,\n :Word,\n \"test.bson\",\n return_losses=true,\n batchsize=3,\n measures_func=compute_target_corr)\n","category":"page"},{"location":"man/measures_func/#For-fiddl","page":"Measures function","title":"For fiddl","text":"","category":"section"},{"location":"man/measures_func/","page":"Measures function","title":"Measures function","text":"data = measures_func(X_train,\n Y_train,\n Yhat_train,\n data,\n target_col,\n model,\n step;\n kargs...)\n\n## Input\n\n- `X_train`: The input matrix of the full dataset.\n- `Y_train`: The target matrix of the full dataset.\n- `Yhat_train`: The predicted matrix of the full dataset at current step.\n- `data_train`: The full dataset.\n- `target_col`: The name of the column with the target wordforms in the dataset.\n- `model`: The trained model.\n- `step`: The step the training is currently in.\n- `kargs...`: Any other keyword arguments that should be passed to the function.\n\nNote: the `kargs` are just keyword arguments that are passed on from the parameters of `get_and_train_model` to the `measures_func`. For example, this could be a suffix that should be added to each added column in `measures_func`.\n\n## Output\nThe function has to return the dataset.","category":"page"},{"location":"man/pyndl/","page":"Pyndl","title":"Pyndl","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/pyndl/","page":"Pyndl","title":"Pyndl","text":"JudiLing is able to call the python package pyndl internally to compute NDL models. pyndl uses event files to compute the mapping matrices, which have to be generated manually or by using pyndl in Python, see documentation here. 
The advantage of calling pyndl from JudiLing is that the resulting weights, cue and semantic matrices can be directly translated into JudiLing format and further processing can be done in JudiLing.","category":"page"},{"location":"man/pyndl/","page":"Pyndl","title":"Pyndl","text":"note: Note\nFor pyndl to be available in JudiLing, PyCall has to be imported before JudiLing:using PyCall\nusing JudiLing","category":"page"},{"location":"man/pyndl/#Calling-pyndl-from-JudiLing","page":"Pyndl","title":"Calling pyndl from JudiLing","text":"","category":"section"},{"location":"man/pyndl/","page":"Pyndl","title":"Pyndl","text":" Pyndl_Weight_Struct\n pyndl(\n data_path::String;\n alpha::Float64 = 0.1,\n betas::Tuple{Float64,Float64} = (0.1, 0.1),\n method::String = \"openmp\"\n )","category":"page"},{"location":"man/pyndl/#JudiLing.Pyndl_Weight_Struct","page":"Pyndl","title":"JudiLing.Pyndl_Weight_Struct","text":"Pyndl_Weight_Struct\n cues::Vector{String}\n outcomes::Vector{String}\n weight::Matrix{Float64}\n\ncues::Vector{String}: Vector of cues, in the order that they appear in the weight matrix.\noutcomes::Vector{String}: Vector of outcomes, in the order that they appear in the weight matrix.\nweight::Matrix{Float64}: Weight matrix.\n\n\n\n\n\n","category":"type"},{"location":"man/pyndl/#JudiLing.pyndl-Tuple{String}","page":"Pyndl","title":"JudiLing.pyndl","text":"pyndl(\n data_path::String;\n alpha::Float64 = 0.1,\n betas::Tuple{Float64,Float64} = (0.1, 0.1),\n method::String = \"openmp\"\n)\n\nCompute weights using pyndl. See the documentation of pyndl for more information: https://pyndl.readthedocs.io/en/latest/\n\nObligatory arguments\n\ndata_path::String: Path to an events file as generated by pyndl's preprocess.createeventfile\n\nOptional arguments\n\nalpha::Float64 = 0.1: α learning rate.\nbetas::Tuple{Float64,Float64} = (0.1, 0.1): β1 and β2 learning rates\nmethod::String = \"openmp\": One of {\"openmp\", \"threading\"}. 
\"openmp\" only works on Linux.\n\nExample\n\nweights = JudiLing.pyndl(\"data/latin_train_events.tab.gz\")\n\n\n\n\n\n","category":"method"},{"location":"man/pyndl/#Translating-output-of-pyndl-to-cue-and-semantic-matrices-in-JudiLing","page":"Pyndl","title":"Translating output of pyndl to cue and semantic matrices in JudiLing","text":"","category":"section"},{"location":"man/pyndl/","page":"Pyndl","title":"Pyndl","text":"With the weights in hand, the cue and semantic matrices can be computed:","category":"page"},{"location":"man/pyndl/","page":"Pyndl","title":"Pyndl","text":" make_cue_matrix(\n data::DataFrame,\n pyndl_weights::Pyndl_Weight_Struct;\n grams = 3,\n target_col = \"Words\",\n tokenized = false,\n sep_token = nothing,\n keep_sep = false,\n start_end_token = \"#\",\n verbose = false,\n )\n make_S_matrix(\n data::DataFrame,\n pyndl_weights::Pyndl_Weight_Struct,\n n_features_columns::Vector;\n tokenized::Bool=false,\n sep_token::String=\"_\"\n )\n make_S_matrix(\n data_train::DataFrame,\n data_val::DataFrame,\n pyndl_weights::Pyndl_Weight_Struct,\n n_features_columns::Vector;\n tokenized::Bool=false,\n sep_token::String=\"_\"\n )","category":"page"},{"location":"man/pyndl/#JudiLing.make_cue_matrix-Tuple{DataFrames.DataFrame, JudiLing.Pyndl_Weight_Struct}","page":"Pyndl","title":"JudiLing.make_cue_matrix","text":"make_cue_matrix(\n data::DataFrame,\n pyndl_weights::Pyndl_Weight_Struct;\n grams = 3,\n target_col = \"Words\",\n tokenized = false,\n sep_token = nothing,\n keep_sep = false,\n start_end_token = \"#\",\n verbose = false,\n)\n\nMake the cue matrix based on a dataframe and weights computed with pyndl. Practically this means that the cues are extracted from the weights object and translated to the JudiLing format.\n\nObligatory arguments\n\ndata::DataFrame: Dataset with all the word types on which the weights were trained.\npyndl_weights::Pyndl_Weight_Struct: Weights trained with JudiLing.pyndl\n\nOptional argyments\n\ngrams = 3: N-gram size (has to match the n-gram granularity of the cues on which the weights were trained).\ntarget_col = \"Words\": Column with target words.\ntokenized = false: Whether the target words are already tokenized\nsep_token = nothing: The string separating the tokens (only used if tokenized=true).\nkeep_sep = false: Whether the sep_token should be retained in the cues.\nstart_end_token = \"#\": The string with which to mark word boundaries.\nverbose = false: Verbose mode.\n\nExample\n\nweights = JudiLing.pyndl(\"data/latin_train_events.tab.gz\")\ncue_obj = JudiLing.make_cue_matrix(\"latin_train.csv\", weights,\n grams = 3,\n target_col = \"Word\")\n\n\n\n\n\n","category":"method"},{"location":"man/pyndl/#JudiLing.make_S_matrix-Tuple{DataFrames.DataFrame, JudiLing.Pyndl_Weight_Struct, Vector}","page":"Pyndl","title":"JudiLing.make_S_matrix","text":"make_S_matrix(\n data::DataFrame,\n pyndl_weights::Pyndl_Weight_Struct,\n n_features_columns::Vector;\n tokenized::Bool=false,\n sep_token::String=\"_\"\n)\n\nCreate semantic matrix based on a dataframe and weights computed with pyndl. Practically this means that the semantic features are extracted from the weights object and translated to the JudiLing format.\n\nObligatory arguments\n\ndata::DataFrame: The dataset with word types.\npyndl_weights::Pyndl_Weight_Struct: Weights trained with JudiLing.pyndl.\nn_features_columns::Vector: Vector of columns with the features in the dataset.\n\nOptional arguments\n\ntokenized=false: Whether the features in n_features_columns columns are already tokenized (e.g. 
\"feature1_feature2_feature3\")\nsep_token=\"_\": The string with which the features are separated (only used if tokenized=false).\n\nExample\n\nweights = JudiLing.pyndl(\"data/latin_train_events.tab.gz\")\nS = JudiLing.make_S_matrix(data,\n weights_latin,\n [\"Lexeme\", \"Person\", \"Number\", \"Tense\", \"Voice\", \"Mood\"],\n tokenized=false)\n\n\n\n\n\n","category":"method"},{"location":"man/pyndl/#JudiLing.make_S_matrix-Tuple{DataFrames.DataFrame, DataFrames.DataFrame, JudiLing.Pyndl_Weight_Struct, Vector}","page":"Pyndl","title":"JudiLing.make_S_matrix","text":"make_S_matrix(\n data_train::DataFrame,\n data_val::DataFrame,\n pyndl_weights::Pyndl_Weight_Struct,\n n_features_columns::Vector;\n tokenized::Bool=false,\n sep_token::String=\"_\"\n)\n\nCreate semantic matrix based on a training and validation dataframe and weights computed with pyndl. Practically this means that the semantic features are extracted from the weights object and translated to the JudiLing format.\n\nObligatory arguments\n\ndata_train::DataFrame: The training dataset.\ndata_val::DataFrame: The validation dataset.\npyndl_weights::Pyndl_Weight_Struct: Weights trained with JudiLing.pyndl.\nn_features_columns::Vector: Vector of columns with the features in the training and validation datasets.\n\nOptional arguments\n\ntokenized=false: Whether the features in n_features_columns columns are already tokenized (e.g. \"feature1_feature2_feature3\")\nsep_token=\"_\": The string with which the features are separated (only used if tokenized=false).\n\nExample\n\nweights = JudiLing.pyndl(\"data/latin_train_events.tab.gz\")\nS_train, S_val = JudiLing.make_S_matrix(train,\n val,\n weights_latin,\n [\"Lexeme\", \"Person\", \"Number\", \"Tense\", \"Voice\", \"Mood\"],\n tokenized=false)\n\n\n\n\n\n","category":"method"},{"location":"man/wh/","page":"Widrow-Hoff Learning","title":"Widrow-Hoff Learning","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/wh/#Utils","page":"Widrow-Hoff Learning","title":"Utils","text":"","category":"section"},{"location":"man/wh/","page":"Widrow-Hoff Learning","title":"Widrow-Hoff Learning","text":" wh_learn(\n X,\n Y;\n eta = 0.01,\n n_epochs = 1,\n weights = nothing,\n learn_seq = nothing,\n save_history = false,\n history_cols = nothing,\n history_rows = nothing,\n verbose = false,\n )\n make_learn_seq(freq; random_seed = 314)","category":"page"},{"location":"man/wh/#JudiLing.wh_learn-Tuple{Any, Any}","page":"Widrow-Hoff Learning","title":"JudiLing.wh_learn","text":"wh_learn(\n X,\n Y;\n eta = 0.01,\n n_epochs = 1,\n weights = nothing,\n learn_seq = nothing,\n save_history = false,\n history_cols = nothing,\n history_rows = nothing,\n verbose = false,\n )\n\nWidrow-Hoff Learning.\n\nObligatory Arguments\n\ntest_mode::Symbol: which test mode, currently supports :trainonly, :presplit, :carefulsplit and :randomsplit.\n\nOptional Arguments\n\neta::Float64=0.1: the learning rate\nn_epochs::Int64=1: the number of epochs to be trained\nweights::Matrix=nothing: the initial weights\nlearn_seq::Vector=nothing: the learning sequence\nsave_history::Bool=false: if true, a partical training history will be saved\nhistory_cols::Vector=nothing: the list of column indices you want to saved in history, e.g. [1,32,42] or [2]\nhistory_rows::Vector=nothing: the list of row indices you want to saved in history, e.g. 
[1,32,42] or [2]\nverbose::Bool = false: if true, more information will be printed out\n\n\n\n\n\n","category":"method"},{"location":"man/wh/#JudiLing.make_learn_seq-Tuple{Any}","page":"Widrow-Hoff Learning","title":"JudiLing.make_learn_seq","text":"make_learn_seq(freq; random_seed = 314)\n\nMake Widrow-Hoff learning sequence from frequencies. Creates a randomly ordered sequences of indices where each index appears according to its frequncy.\n\nObligatory arguments\n\nfreq: Vector with frequencies.\n\nOptional arguments\n\nrandom_seed = 314: Random seed to control randomness.\n\nExample\n\nlearn_seq = JudiLing.make_learn_seq(data.frequency)\n\n\n\n\n\n","category":"method"},{"location":"man/utils/","page":"Utils","title":"Utils","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/utils/#Utils","page":"Utils","title":"Utils","text":"","category":"section"},{"location":"man/utils/","page":"Utils","title":"Utils","text":" iscorrect\n display_pred\n translate\n translate_path\n is_truly_sparse\n isattachable\n iscomplete\n isstart\n isnovel\n check_used_token\n cal_max_timestep","category":"page"},{"location":"man/utils/#JudiLing.iscorrect","page":"Utils","title":"JudiLing.iscorrect","text":"Check whether the predictions are correct.\n\n\n\n\n\n","category":"function"},{"location":"man/utils/#JudiLing.display_pred","page":"Utils","title":"JudiLing.display_pred","text":"Display prediction nicely.\n\n\n\n\n\n","category":"function"},{"location":"man/utils/#JudiLing.translate","page":"Utils","title":"JudiLing.translate","text":"Translate indices into words or utterances\n\n\n\n\n\n","category":"function"},{"location":"man/utils/#JudiLing.translate_path","page":"Utils","title":"JudiLing.translate_path","text":"Append indices together to form a path\n\n\n\n\n\n","category":"function"},{"location":"man/utils/#JudiLing.is_truly_sparse","page":"Utils","title":"JudiLing.is_truly_sparse","text":"Check whether a matrix is truly sparse regardless its format, where M is originally a sparse matrix format.\n\n\n\n\n\nCheck whether a matrix is truly sparse regardless its format, where M is originally a dense matrix format.\n\n\n\n\n\n","category":"function"},{"location":"man/utils/#JudiLing.isattachable","page":"Utils","title":"JudiLing.isattachable","text":"Check whether a gram can attach to another gram.\n\n\n\n\n\nCheck whether a gram can attach to another gram.\n\n\n\n\n\n","category":"function"},{"location":"man/utils/#JudiLing.iscomplete","page":"Utils","title":"JudiLing.iscomplete","text":"Check whether a path is complete.\n\n\n\n\n\n","category":"function"},{"location":"man/utils/#JudiLing.isstart","page":"Utils","title":"JudiLing.isstart","text":"Check whether a gram can start a path.\n\n\n\n\n\n","category":"function"},{"location":"man/utils/#JudiLing.isnovel","page":"Utils","title":"JudiLing.isnovel","text":"Check whether a predicted path is in training data.\n\n\n\n\n\n","category":"function"},{"location":"man/utils/#JudiLing.check_used_token","page":"Utils","title":"JudiLing.check_used_token","text":"Check whether there are tokens already used in dataset as n-gram components.\n\n\n\n\n\n","category":"function"},{"location":"man/utils/#JudiLing.cal_max_timestep","page":"Utils","title":"JudiLing.cal_max_timestep","text":"function cal_max_timestep(\n data_train::DataFrame,\n data_val::DataFrame,\n target_col::Union{String, Symbol};\n tokenized::Bool = false,\n sep_token::Union{Nothing, String, Char} = \"\",\n)\n\nCalculate the max timestep given training and validation 
datasets.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\ntarget_col::Union{String, Symbol}: the column with the target word forms\n\nOptional Arguments\n\ntokenized::Bool = false: Whether the word forms in the target_col are already tokenized\nsep_token::Union{Nothing, String, Char} = \"\": The token with which the word forms are tokenized\n\nExamples\n\nJudiLing.cal_max_timestep(latin_train, latin_val, :Word)\n\n\n\n\n\nfunction cal_max_timestep(\n data::DataFrame,\n target_col::Union{String, Symbol};\n tokenized::Bool = false,\n sep_token::Union{Nothing, String, Char} = \"\",\n)\n\nCalculate the max timestep given the training dataset.\n\nObligatory Arguments\n\ndata::DataFrame: the dataset\ntarget_col::Union{String, Symbol}: the column with the target word forms\n\nOptional Arguments\n\ntokenized::Bool = false: Whether the word forms in the target_col are already tokenized\nsep_token::Union{Nothing, String, Char} = \"\": The token with which the word forms are tokenized\n\nExamples\n\nJudiLing.cal_max_timestep(latin, :Word)\n\n\n\n\n\n","category":"function"},{"location":"man/make_adjacency_matrix/","page":"Make Adjacency Matrix","title":"Make Adjacency Matrix","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/make_adjacency_matrix/#Make-Adjacency-Matrix","page":"Make Adjacency Matrix","title":"Make Adjacency Matrix","text":"","category":"section"},{"location":"man/make_adjacency_matrix/","page":"Make Adjacency Matrix","title":"Make Adjacency Matrix","text":" make_full_adjacency_matrix\n make_full_adjacency_matrix(i2f)\n make_combined_adjacency_matrix(data_train, data_val)","category":"page"},{"location":"man/make_adjacency_matrix/#JudiLing.make_full_adjacency_matrix","page":"Make Adjacency Matrix","title":"JudiLing.make_full_adjacency_matrix","text":"make_adjacency_matrix(i2f)\n\nMake full adjacency matrix based only on the form of n-grams regardless of whether they are seen in the training data. This usually takes hours for large datasets, as all possible combinations are considered.\n\nObligatory Arguments\n\ni2f::Dict: the dictionary returning features given indices\n\nOptional Arguments\n\ntokenized::Bool=false: if true, the dataset target is assumed to be tokenized\nsep_token::Union{Nothing, String, Char}=nothing: separator token\nverbose::Bool=false: if true, more information will be printed\n\nExamples\n\n# without tokenization\ni2f = Dict([(1, \"#ab\"), (2, \"abc\"), (3, \"bc#\"), (4, \"#bc\"), (5, \"ab#\")])\nJudiLing.make_adjacency_matrix(i2f)\n\n# with tokenization\ni2f = Dict([(1, \"#-a-b\"), (2, \"a-b-c\"), (3, \"b-c-#\"), (4, \"#-b-c\"), (5, \"a-b-#\")])\nJudiLing.make_adjacency_matrix(\n i2f,\n tokenized=true,\n sep_token=\"-\")\n\n\n\n\n\n","category":"function"},
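In practice the i2f dictionary is rarely built by hand; it is usually taken from a cue object. A minimal sketch under that assumption, using a latin dataframe with a :Word column (the cue_obj.i2f field follows the cue object returned by make_cue_matrix; treat the exact field access as an assumption):

cue_obj = JudiLing.make_cue_matrix(latin, grams=3, target_col=:Word)
# full adjacency matrix over all n-gram cues stored in the cue object
A = JudiLing.make_adjacency_matrix(cue_obj.i2f)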
{"location":"man/make_adjacency_matrix/#JudiLing.make_full_adjacency_matrix-Tuple{Any}","page":"Make Adjacency Matrix","title":"JudiLing.make_full_adjacency_matrix","text":"make_adjacency_matrix(i2f)\n\nMake full adjacency matrix based only on the form of n-grams regardless of whether they are seen in the training data. 
This usually takes hours for large datasets, as all possible combinations are considered.\n\nObligatory Arguments\n\ni2f::Dict: the dictionary returning features given indices\n\nOptional Arguments\n\ntokenized::Bool=false: if true, the dataset target is assumed to be tokenized\nsep_token::Union{Nothing, String, Char}=nothing: separator token\nverbose::Bool=false: if true, more information will be printed\n\nExamples\n\n# without tokenization\ni2f = Dict([(1, \"#ab\"), (2, \"abc\"), (3, \"bc#\"), (4, \"#bc\"), (5, \"ab#\")])\nJudiLing.make_adjacency_matrix(i2f)\n\n# with tokenization\ni2f = Dict([(1, \"#-a-b\"), (2, \"a-b-c\"), (3, \"b-c-#\"), (4, \"#-b-c\"), (5, \"a-b-#\")])\nJudiLing.make_adjacency_matrix(\n i2f,\n tokenized=true,\n sep_token=\"-\")\n\n\n\n\n\n","category":"method"},{"location":"man/make_adjacency_matrix/#JudiLing.make_combined_adjacency_matrix-Tuple{Any, Any}","page":"Make Adjacency Matrix","title":"JudiLing.make_combined_adjacency_matrix","text":"make_combined_adjacency_matrix(data_train, data_val)\n\nMake combined adjacency matrix.\n\nObligatory Arguments\n\ndata_train::DataFrame: training dataset\ndata_val::DataFrame: validation dataset\n\nOptional Arguments\n\ngrams=3: the number of grams for cues\ntarget_col=:Words: the column name for target strings\ntokenized=false: if true, the dataset target is assumed to be tokenized\nsep_token=nothing: separator token\nkeep_sep=false: if true, keep separators in cues\nstart_end_token=\"#\": start and end token in boundary cues\nverbose=false: if true, more information is printed\n\nExamples\n\nJudiLing.make_combined_adjacency_matrix(\n latin_train,\n latin_val,\n grams=3,\n target_col=:Word,\n tokenized=false,\n keep_sep=false\n )\n\n\n\n\n\n","category":"method"},{"location":"man/cholesky/","page":"Cholesky","title":"Cholesky","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/cholesky/#Cholesky","page":"Cholesky","title":"Cholesky","text":"","category":"section"},{"location":"man/cholesky/","page":"Cholesky","title":"Cholesky","text":" make_transform_fac\n make_transform_matrix\n make_transform_fac(X::SparseMatrixCSC)\n make_transform_fac(X::Matrix)\n make_transform_matrix(fac::Union{LinearAlgebra.Cholesky, SuiteSparse.CHOLMOD.Factor}, X::Union{SparseMatrixCSC, Matrix}, Y::Union{SparseMatrixCSC, Matrix})\n make_transform_matrix(X::SparseMatrixCSC, Y::Matrix)\n make_transform_matrix(X::Matrix, Y::Union{SparseMatrixCSC, Matrix})\n make_transform_matrix(X::SparseMatrixCSC, Y::SparseMatrixCSC)\n format_matrix(M::Union{SparseMatrixCSC, Matrix}, output_format=:auto)","category":"page"},{"location":"man/cholesky/#JudiLing.make_transform_fac","page":"Cholesky","title":"JudiLing.make_transform_fac","text":"The first part of make_transform_matrix, usually used by the learn_paths function to save time and computing resources.\n\n\n\n\n\n","category":"function"},{"location":"man/cholesky/#JudiLing.make_transform_matrix","page":"Cholesky","title":"JudiLing.make_transform_matrix","text":"Use the Cholesky decomposition to calculate the transformation matrix from S to C or from C to S.\n\n\n\n\n\n","category":"function"},{"location":"man/cholesky/#JudiLing.make_transform_fac-Tuple{SparseArrays.SparseMatrixCSC}","page":"Cholesky","title":"JudiLing.make_transform_fac","text":"make_transform_fac(X::SparseMatrixCSC)\n\nCalculate the first step of Cholesky decomposition for sparse 
matrices.\n\n\n\n\n\n","category":"method"},{"location":"man/cholesky/#JudiLing.make_transform_fac-Tuple{Matrix}","page":"Cholesky","title":"JudiLing.make_transform_fac","text":"make_transform_fac(X::Matrix)\n\nCalculate the first step of Cholesky decomposition for dense matrices.\n\n\n\n\n\n","category":"method"},{"location":"man/cholesky/#JudiLing.make_transform_matrix-Tuple{Union{SparseArrays.CHOLMOD.Factor, LinearAlgebra.Cholesky}, Union{SparseArrays.SparseMatrixCSC, Matrix}, Union{SparseArrays.SparseMatrixCSC, Matrix}}","page":"Cholesky","title":"JudiLing.make_transform_matrix","text":"make_transform_matrix(fac::Union{LinearAlgebra.Cholesky, SuiteSparse.CHOLMOD.Factor}, X::Union{SparseMatrixCSC, Matrix}, Y::Union{SparseMatrixCSC, Matrix})\n\nSecond step in calculating the Cholesky decomposition for the transformation matrix.\n\n\n\n\n\n","category":"method"},
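The two-step interface is useful when the same X matrix has to be mapped onto several targets: the factorization is computed once and then reused. A minimal sketch, assuming a cue matrix C and a semantic matrix S built earlier; the variable names are illustrative:

# step 1: factorize X = C once
fac = JudiLing.make_transform_fac(C)
# step 2: solve for the comprehension mapping F such that C * F approximates S
F = JudiLing.make_transform_matrix(fac, C, S)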
{"location":"man/cholesky/#JudiLing.make_transform_matrix-Tuple{SparseArrays.SparseMatrixCSC, Matrix}","page":"Cholesky","title":"JudiLing.make_transform_matrix","text":"make_transform_matrix(X::SparseMatrixCSC, Y::Matrix)\n\nUse Cholesky decomposition to calculate the transformation matrix from X to Y, where X is a sparse matrix and Y is a dense matrix.\n\nObligatory Arguments\n\nX::SparseMatrixCSC: the X matrix, where X is a sparse matrix\nY::Matrix: the Y matrix, where Y is a dense matrix\n\nOptional Arguments\n\nmethod::Symbol = :additive: whether :additive or :multiplicative decomposition is required\nshift::Float64 = 0.02: shift value for :additive decomposition\nmultiplier::Float64 = 1.01: multiplier value for :multiplicative decomposition\noutput_format::Symbol = :auto: force the output format to dense (:dense) or sparse (:sparse), or set it to :auto to let the program decide\nsparse_ratio::Float64 = 0.05: the ratio to decide whether a matrix is sparse\nverbose::Bool = false: if true, more information will be printed out\n\nExamples\n\n# additive 
mode\nJudiLing.make_transform_matrix(\n C,\n S,\n method = :additive,\n shift = 0.02,\n verbose = false)\n\n# multiplicative mode\nJudiLing.make_transform_matrix(\n C,\n S,\n method = :multiplicative,\n multiplier = 1.01,\n verbose = false)\n\n# further control of sparsity ratio\nJudiLing.make_transform_matrix(\n ...\n output_format = :auto,\n sparse_ratio = 0.05,\n ...)\n\n\n\n\n\n","category":"method"},{"location":"man/cholesky/#JudiLing.make_transform_matrix-Tuple{Matrix, Union{SparseArrays.SparseMatrixCSC, Matrix}}","page":"Cholesky","title":"JudiLing.make_transform_matrix","text":"make_transform_matrix(X::Matrix, Y::Union{SparseMatrixCSC, Matrix})\n\nUse the Cholesky decomposition to calculate the transformation matrix from X to Y, where X is a dense matrix and Y is either a dense matrix or a sparse matrix.\n\nObligatory Arguments\n\nX::Matrix: the X matrix, where X is a dense matrix\nY::Union{SparseMatrixCSC, Matrix}: the Y matrix, where Y is either a sparse or a dense matrix\n\nOptional Arguments\n\nmethod::Symbol = :additive: whether :additive or :multiplicative decomposition is required\nshift::Float64 = 0.02: shift value for :additive decomposition\nmultiplier::Float64 = 1.01: multiplier value for :multiplicative decomposition\noutput_format::Symbol = :auto: force the output format to dense (:dense) or sparse (:sparse), or set it to :auto to let the program decide\nsparse_ratio::Float64 = 0.05: the ratio to decide whether a matrix is sparse\nverbose::Bool = false: if true, more information will be printed out\n\nExamples\n\n# additive mode\nJudiLing.make_transform_matrix(\n C,\n S,\n method = :additive,\n shift = 0.02,\n verbose = false)\n\n# multiplicative mode\nJudiLing.make_transform_matrix(\n C,\n S,\n method = :multiplicative,\n multiplier = 1.01,\n verbose = false)\n\n# further control of sparsity ratio\nJudiLing.make_transform_matrix(\n ...\n output_format = :auto,\n sparse_ratio = 0.05,\n ...)\n\n\n\n\n\n","category":"method"},{"location":"man/cholesky/#JudiLing.make_transform_matrix-Tuple{SparseArrays.SparseMatrixCSC, SparseArrays.SparseMatrixCSC}","page":"Cholesky","title":"JudiLing.make_transform_matrix","text":"make_transform_matrix(X::SparseMatrixCSC, Y::SparseMatrixCSC)\n\nUse the Cholesky decomposition to calculate the transformation matrix from X to Y, where X is a sparse matrix and Y is a sparse matrix.\n\nObligatory Arguments\n\nX::SparseMatrixCSC: the X matrix, where X is a sparse matrix\nY::SparseMatrixCSC: the Y matrix, where Y is a sparse matrix\n\nOptional Arguments\n\nmethod::Symbol = :additive: whether :additive or :multiplicative decomposition is required\nshift::Float64 = 0.02: shift value for :additive decomposition\nmultiplier::Float64 = 1.01: multiplier value for :multiplicative decomposition\noutput_format::Symbol = :auto: force the output format to dense (:dense) or sparse (:sparse), or set it to :auto to let the program decide\nsparse_ratio::Float64 = 0.05: the ratio to decide whether a matrix is sparse\nverbose::Bool = false: if true, more information will be printed out\n\nExamples\n\n# additive mode\nJudiLing.make_transform_matrix(\n C,\n S,\n method = :additive,\n shift = 0.02,\n verbose = false)\n\n# multiplicative mode\nJudiLing.make_transform_matrix(\n C,\n S,\n method = :multiplicative,\n multiplier = 1.01,\n verbose = false)\n\n# further control of sparsity ratio\nJudiLing.make_transform_matrix(\n ...\n output_format = :auto,\n sparse_ratio = 0.05,\n ...)\n\n\n\n\n\n","category":"method"},{"location":"man/cholesky/#JudiLing.format_matrix","page":"Cholesky","title":"JudiLing.format_matrix","text":"format_matrix(M::Union{SparseMatrixCSC, Matrix}, output_format=:auto)\n\nConvert output matrix format to either a dense matrix or a sparse matrix.\n\n\n\n\n\n","category":"function"},{"location":"man/make_semantic_matrix/","page":"Make Semantic Matrix","title":"Make Semantic Matrix","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/make_semantic_matrix/#Make-Semantic-Matrix","page":"Make Semantic Matrix","title":"Make Semantic Matrix","text":"","category":"section"},{"location":"man/make_semantic_matrix/#Make-binary-semantic-vectors","page":"Make Semantic Matrix","title":"Make binary semantic vectors","text":"","category":"section"},{"location":"man/make_semantic_matrix/","page":"Make Semantic Matrix","title":"Make Semantic Matrix","text":" PS_Matrix_Struct\n make_pS_matrix\n make_pS_matrix(data)\n make_pS_matrix(data_val, pS_obj)\n make_combined_pS_matrix(\n data_train,\n data_val;\n features_col = :CommunicativeIntention,\n sep_token = \"_\",\n )","category":"page"},{"location":"man/make_semantic_matrix/#JudiLing.PS_Matrix_Struct","page":"Make Semantic Matrix","title":"JudiLing.PS_Matrix_Struct","text":"A structure that stores the discrete semantic vectors: pS is the discrete semantic matrix; f2i is a dictionary returning the indices for features; i2f is a dictionary returning the features for indices.\n\n\n\n\n\n","category":"type"},{"location":"man/make_semantic_matrix/#JudiLing.make_pS_matrix","page":"Make Semantic 
Matrix","title":"JudiLing.make_pS_matrix","text":"Make discrete semantic matrix.\n\n\n\n\n\n","category":"function"},{"location":"man/make_semantic_matrix/#JudiLing.make_pS_matrix-Tuple{Any}","page":"Make Semantic Matrix","title":"JudiLing.make_pS_matrix","text":"make_pS_matrix(data)\n\nCreate a discrete semantic matrix given a dataframe.\n\nObligatory Arguments\n\ndata::DataFrame: the dataset\n\nOptional Arguments\n\nfeatures_col::Symbol=:CommunicativeIntention: the column name for target\nsep_token::String=\"_\": separator\n\nExamples\n\ns_obj_train = JudiLing.make_pS_matrix(\n utterance,\n features_col=:CommunicativeIntention,\n sep_token=\"_\")\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_pS_matrix-Tuple{Any, Any}","page":"Make Semantic Matrix","title":"JudiLing.make_pS_matrix","text":"make_pS_matrix(data_val, pS_obj)\n\nConstruct discrete semantic matrix for the validation datasets given by the exemplar in the dataframe, and given the S matrix for the training datasets.\n\nObligatory Arguments\n\ndata_val::DataFrame: the dataset\npS_obj::PS_Matrix_Struct: training PS object\n\nOptional Arguments\n\nfeatures_col::Symbol=:CommunicativeIntention: the column name for target\nsep_token::String=\"_\": separator\n\nExamples\n\ns_obj_val = JudiLing.make_pS_matrix(\n data_val,\n s_obj_train,\n features_col=:CommunicativeIntention,\n sep_token=\"_\")\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_combined_pS_matrix-Tuple{Any, Any}","page":"Make Semantic Matrix","title":"JudiLing.make_combined_pS_matrix","text":"make_combined_pS_matrix(\n data_train,\n data_val;\n features_col = :CommunicativeIntention,\n sep_token = \"_\",\n)\n\nCreate discrete semantic matrices for a train and validation dataframe.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\n\nOptional Arguments\n\nfeatures_col::Symbol=:CommunicativeIntention: the column name for target\nsep_token::String=\"_\": separator\n\nExamples\n\ns_obj_train, s_obj_val = JudiLing.make_combined_pS_matrix(\n data_train,\n data_val,\n features_col=:CommunicativeIntention,\n sep_token=\"_\")\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#Simulate-semantic-vectors","page":"Make Semantic Matrix","title":"Simulate semantic vectors","text":"","category":"section"},{"location":"man/make_semantic_matrix/","page":"Make Semantic Matrix","title":"Make Semantic Matrix","text":" L_Matrix_Struct\n make_S_matrix\n make_L_matrix\n make_combined_S_matrix\n make_combined_L_matrix\n make_S_matrix(data::DataFrame, base::Vector, inflections::Vector)\n make_S_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector, inflections::Vector)\n make_S_matrix(data::DataFrame, base::Vector)\n make_S_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector)\n make_S_matrix(data_train::DataFrame, base::Vector, inflections::Vector, L::L_Matrix_Struct)\n make_S_matrix(data_train::DataFrame, data_val::Union{DataFrame, Nothing}, base::Vector, L::L_Matrix_Struct)\n make_S_matrix(data::DataFrame, base::Vector, L::L_Matrix_Struct)\n make_S_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector, inflections::Vector, L::L_Matrix_Struct)\n make_L_matrix(data::DataFrame, base::Vector)\n make_combined_S_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector, inflections::Vector, L::L_Matrix_Struct)\n make_combined_S_matrix(data_train::DataFrame, data_val::Union{DataFrame, Nothing}, 
base::Vector, L::L_Matrix_Struct)\n make_combined_S_matrix( data_train::DataFrame, data_val::DataFrame, base::Vector, inflections::Vector)\n make_combined_S_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector)\n make_combined_L_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector, inflections::Vector)\n make_combined_L_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector)\n L_Matrix_Struct(L, sd_base, sd_base_mean, sd_inflection, sd_inflection_mean, base_f, infl_f, base_f2i, infl_f2i, n_base_f, n_infl_f, ncol)\n L_Matrix_Struct(L, sd_base, sd_inflection, base_f, infl_f, base_f2i, infl_f2i, n_base_f, n_infl_f, ncol)","category":"page"},{"location":"man/make_semantic_matrix/#JudiLing.L_Matrix_Struct","page":"Make Semantic Matrix","title":"JudiLing.L_Matrix_Struct","text":"A structure that stores lexome semantic vectors: L is the lexome semantic matrix; f2i is a dictionary returning the indices for features; i2f is a dictionary returning the features for indices.\n\n\n\n\n\n","category":"type"},{"location":"man/make_semantic_matrix/#JudiLing.make_S_matrix","page":"Make Semantic Matrix","title":"JudiLing.make_S_matrix","text":"Make simulated semantic matrix.\n\n\n\n\n\n","category":"function"},{"location":"man/make_semantic_matrix/#JudiLing.make_L_matrix","page":"Make Semantic Matrix","title":"JudiLing.make_L_matrix","text":"Make simulated lexome matrix.\n\n\n\n\n\n","category":"function"},{"location":"man/make_semantic_matrix/#JudiLing.make_combined_S_matrix","page":"Make Semantic Matrix","title":"JudiLing.make_combined_S_matrix","text":"Make combined simulated S matrices, with features combined from both training and validation datasets.\n\n\n\n\n\n","category":"function"},{"location":"man/make_semantic_matrix/#JudiLing.make_combined_L_matrix","page":"Make Semantic Matrix","title":"JudiLing.make_combined_L_matrix","text":"Make combined simulated Lexome matrix, with features combined from both training and validation datasets.\n\n\n\n\n\n","category":"function"},{"location":"man/make_semantic_matrix/#JudiLing.make_S_matrix-Tuple{DataFrames.DataFrame, Vector, Vector}","page":"Make Semantic Matrix","title":"JudiLing.make_S_matrix","text":"make_S_matrix(data::DataFrame, base::Vector, inflections::Vector)\n\nCreate simulated semantic matrix for the training dataset, given the input data, a vector specifying context lexemes, and a vector specifying grammatical lexemes. 
The semantic vector of a word form is constructed by summing the semantic vectors of content and grammatical lexemes.\n\nObligatory Arguments\n\ndata::DataFrame: the dataset\nbase::Vector: context lexemes\ninflections::Vector: grammatical lexemes\n\nOptional Arguments\n\nncol::Int64=200: dimension of semantic vectors, usually the same as that of cue vectors\nsd_base_mean::Int64=1: the sd of the mean of base features\nsd_inflection_mean::Int64=1: the sd of the mean of inflectional features\nsd_base::Int64=4: the sd of base features\nsd_inflection::Int64=4: the sd of inflectional features\nseed::Int64=314: the random seed\nisdeep::Bool=true: if true, the mean of each feature is also randomized\nadd_noise::Bool=true: if true, add additional Gaussian noise\nsd_noise::Int64=1: the sd of the Gaussian noise\nnormalized::Bool=false: if true, most of the values range between -1 and 1; they may slightly exceed these bounds depending on the sd\n\nExamples\n\n# basic usage\nS_train = JudiLing.make_S_matrix(\n french,\n [\"Lexeme\"],\n [\"Tense\",\"Aspect\",\"Person\",\"Number\",\"Gender\",\"Class\",\"Mood\"],\n ncol=200)\n\n# deep mode\nS_train = JudiLing.make_S_matrix(\n ...\n sd_base_mean=1,\n sd_inflection_mean=1,\n isdeep=true,\n ...)\n\n# non-deep mode\nS_train = JudiLing.make_S_matrix(\n ...\n isdeep=false,\n ...)\n\n# add additional Gaussian noise\nS_train = JudiLing.make_S_matrix(\n ...\n add_noise=true,\n sd_noise=1,\n ...)\n\n# further control of means and standard deviations\nS_train = JudiLing.make_S_matrix(\n ...\n sd_base_mean=1,\n sd_inflection_mean=1,\n sd_base=4,\n sd_inflection=4,\n sd_noise=1,\n ...)\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_S_matrix-Tuple{DataFrames.DataFrame, DataFrames.DataFrame, Vector, Vector}","page":"Make Semantic Matrix","title":"JudiLing.make_S_matrix","text":"make_S_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector, inflections::Vector)\n\nCreate simulated semantic matrices for the training and validation datasets, given the input data, a vector specifying context lexemes, and a vector specifying grammatical lexemes. 
The semantic vector of a word form is constructed by summing the semantic vectors of content and grammatical lexemes.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\nbase::Vector: context lexemes\ninflections::Vector: grammatical lexemes\n\nOptional Arguments\n\nncol::Int64=200: dimension of semantic vectors, usually the same as that of cue vectors\nsd_base_mean::Int64=1: the sd of the mean of base features\nsd_inflection_mean::Int64=1: the sd of the mean of inflectional features\nsd_base::Int64=4: the sd of base features\nsd_inflection::Int64=4: the sd of inflectional features\nseed::Int64=314: the random seed\nisdeep::Bool=true: if true, the mean of each feature is also randomized\nadd_noise::Bool=true: if true, add additional Gaussian noise\nsd_noise::Int64=1: the sd of the Gaussian noise\nnormalized::Bool=false: if true, most of the values range between -1 and 1; they may slightly exceed these bounds depending on the sd\n\nExamples\n\n# basic usage\nS_train, S_val = JudiLing.make_S_matrix(\n french,\n french_val,\n [\"Lexeme\"],\n [\"Tense\",\"Aspect\",\"Person\",\"Number\",\"Gender\",\"Class\",\"Mood\"],\n ncol=200)\n\n# deep mode\nS_train, S_val = JudiLing.make_S_matrix(\n ...\n sd_base_mean=1,\n sd_inflection_mean=1,\n isdeep=true,\n ...)\n\n# non-deep mode\nS_train, S_val = JudiLing.make_S_matrix(\n ...\n isdeep=false,\n ...)\n\n# add additional Gaussian noise\nS_train, S_val = JudiLing.make_S_matrix(\n ...\n add_noise=true,\n sd_noise=1,\n ...)\n\n# further control of means and standard deviations\nS_train, S_val = JudiLing.make_S_matrix(\n ...\n sd_base_mean=1,\n sd_inflection_mean=1,\n sd_base=4,\n sd_inflection=4,\n sd_noise=1,\n ...)\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_S_matrix-Tuple{DataFrames.DataFrame, Vector}","page":"Make Semantic Matrix","title":"JudiLing.make_S_matrix","text":"make_S_matrix(data::DataFrame, base::Vector)\n\nCreate simulated semantic matrix for the training dataset with only base features, given the input data and a vector specifying context lexemes. 
The semantic vector of a word form is constructed by summing the semantic vectors of content lexemes.\n\nObligatory Arguments\n\ndata::DataFrame: the dataset\nbase::Vector: context lexemes\n\nOptional Arguments\n\nncol::Int64=200: dimension of semantic vectors, usually the same as that of cue vectors\nsd_base_mean::Int64=1: the sd of the mean of base features\nsd_base::Int64=4: the sd of base features\nseed::Int64=314: the random seed\nisdeep::Bool=true: if true, the mean of each feature is also randomized\nadd_noise::Bool=true: if true, add additional Gaussian noise\nsd_noise::Int64=1: the sd of the Gaussian noise\nnormalized::Bool=false: if true, most of the values range between -1 and 1; they may slightly exceed these bounds depending on the sd\n\nExamples\n\n# basic usage\nS_train = JudiLing.make_S_matrix(\n french,\n [\"Lexeme\"],\n ncol=200)\n\n# deep mode\nS_train = JudiLing.make_S_matrix(\n ...\n sd_base_mean=1,\n sd_inflection_mean=1,\n isdeep=true,\n ...)\n\n# non-deep mode\nS_train = JudiLing.make_S_matrix(\n ...\n isdeep=false,\n ...)\n\n# add additional Gaussian noise\nS_train = JudiLing.make_S_matrix(\n ...\n add_noise=true,\n sd_noise=1,\n ...)\n\n# further control of means and standard deviations\nS_train = JudiLing.make_S_matrix(\n ...\n sd_base_mean=1,\n sd_inflection_mean=1,\n sd_base=4,\n sd_inflection=4,\n sd_noise=1,\n ...)\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_S_matrix-Tuple{DataFrames.DataFrame, DataFrames.DataFrame, Vector}","page":"Make Semantic Matrix","title":"JudiLing.make_S_matrix","text":"make_S_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector)\n\nCreate simulated semantic matrices for the training and validation datasets with only base features, given the input data and a vector specifying context lexemes. 
The semantic vector of a word form is constructed by summing the semantic vectors of content lexemes.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\nbase::Vector: context lexemes\n\nOptional Arguments\n\nncol::Int64=200: dimension of semantic vectors, usually the same as that of cue vectors\nsd_base_mean::Int64=1: the sd of the mean of base features\nsd_base::Int64=4: the sd of base features\nseed::Int64=314: the random seed\nisdeep::Bool=true: if true, the mean of each feature is also randomized\nadd_noise::Bool=true: if true, add additional Gaussian noise\nsd_noise::Int64=1: the sd of the Gaussian noise\nnormalized::Bool=false: if true, most of the values range between -1 and 1; they may slightly exceed these bounds depending on the sd\n\nExamples\n\n# basic usage\nS_train, S_val = JudiLing.make_S_matrix(\n french,\n french_val,\n [\"Lexeme\"],\n ncol=200)\n\n# deep mode\nS_train, S_val = JudiLing.make_S_matrix(\n ...\n sd_base_mean=1,\n sd_inflection_mean=1,\n isdeep=true,\n ...)\n\n# non-deep mode\nS_train, S_val = JudiLing.make_S_matrix(\n ...\n isdeep=false,\n ...)\n\n# add additional Gaussian noise\nS_train, S_val = JudiLing.make_S_matrix(\n ...\n add_noise=true,\n sd_noise=1,\n ...)\n\n# further control of means and standard deviations\nS_train, S_val = JudiLing.make_S_matrix(\n ...\n sd_base_mean=1,\n sd_inflection_mean=1,\n sd_base=4,\n sd_inflection=4,\n sd_noise=1,\n ...)\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_S_matrix-Tuple{DataFrames.DataFrame, Vector, Vector, JudiLing.L_Matrix_Struct}","page":"Make Semantic Matrix","title":"JudiLing.make_S_matrix","text":"make_S_matrix(data_train::DataFrame, base::Vector, inflections::Vector, L::L_Matrix_Struct)\n\nCreate simulated semantic matrix where a lexome matrix is available.\n\nObligatory Arguments\n\ndata::DataFrame: the dataset\nbase::Vector: context lexemes\ninflections::Vector: grammatical lexemes\nL::L_Matrix_Struct: the lexome matrix\n\nOptional Arguments\n\nadd_noise::Bool=true: if true, add additional Gaussian noise\nsd_noise::Int64=1: the sd of the Gaussian noise\nnormalized::Bool=false: if true, most of the values range between -1 and 1; they may slightly exceed these bounds depending on the sd\n\nExamples\n\n# basic usage\nS1 = JudiLing.make_S_matrix(\n latin,\n [\"Lexeme\"],\n [\"Person\",\"Number\",\"Tense\",\"Voice\",\"Mood\"],\n L1,\n add_noise=true,\n sd_noise=1,\n normalized=false\n )\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_S_matrix-Tuple{DataFrames.DataFrame, Union{Nothing, DataFrames.DataFrame}, Vector, JudiLing.L_Matrix_Struct}","page":"Make Semantic Matrix","title":"JudiLing.make_S_matrix","text":"make_S_matrix(data_train::DataFrame, data_val::Union{DataFrame, Nothing}, base::Vector, L::L_Matrix_Struct)\n\nCreate simulated semantic matrix where a lexome matrix is available.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\nbase::Vector: context lexemes\nL::L_Matrix_Struct: the lexome matrix\n\nOptional Arguments\n\nadd_noise::Bool=true: if true, add additional Gaussian noise\nsd_noise::Int64=1: the sd of the Gaussian noise\nnormalized::Bool=false: if true, most of the values range between -1 and 1; they may slightly exceed these bounds depending on the sd\n\nExamples\n\n# basic usage\nS1, S2 = JudiLing.make_S_matrix(\n latin,\n latin_val,\n [\"Lexeme\"],\n L1,\n add_noise=true,\n sd_noise=1,\n 
normalized=false\n )\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_S_matrix-Tuple{DataFrames.DataFrame, Vector, JudiLing.L_Matrix_Struct}","page":"Make Semantic Matrix","title":"JudiLing.make_S_matrix","text":"make_S_matrix(data::DataFrame, base::Vector, L::L_Matrix_Struct)\n\nCreate simulated semantic matrix where a lexome matrix is available.\n\nObligatory Arguments\n\ndata::DataFrame: the dataset\nbase::Vector: context lexemes\nL::L_Matrix_Struct: the lexome matrix\n\nOptional Arguments\n\nadd_noise::Bool=true: if true, add additional Gaussian noise\nsd_noise::Int64=1: the sd of the Gaussian noise\nnormalized::Bool=false: if true, most of the values range between -1 and 1; they may slightly exceed these bounds depending on the sd\n\nExamples\n\n# basic usage\nS1 = JudiLing.make_S_matrix(\n latin,\n [\"Lexeme\"],\n L1,\n add_noise=true,\n sd_noise=1,\n normalized=false\n )\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_S_matrix-Tuple{DataFrames.DataFrame, DataFrames.DataFrame, Vector, Vector, JudiLing.L_Matrix_Struct}","page":"Make Semantic Matrix","title":"JudiLing.make_S_matrix","text":"make_S_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector, inflections::Vector, L::L_Matrix_Struct)\n\nCreate simulated semantic matrix where a lexome matrix is available.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\nbase::Vector: context lexemes\ninflections::Vector: grammatical lexemes\nL::L_Matrix_Struct: the lexome matrix\n\nOptional Arguments\n\nadd_noise::Bool=true: if true, add additional Gaussian noise\nsd_noise::Int64=1: the sd of the Gaussian noise\nnormalized::Bool=false: if true, most of the values range between -1 and 1; they may slightly exceed these bounds depending on the sd\n\nExamples\n\n# basic usage\nS1, S2 = JudiLing.make_S_matrix(\n latin,\n latin_val,\n [\"Lexeme\"],\n [\"Person\",\"Number\",\"Tense\",\"Voice\",\"Mood\"],\n L1,\n add_noise=true,\n sd_noise=1,\n normalized=false\n )\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_L_matrix-Tuple{DataFrames.DataFrame, Vector}","page":"Make Semantic Matrix","title":"JudiLing.make_L_matrix","text":"make_L_matrix(data::DataFrame, base::Vector)\n\nCreate a Lexome Matrix with simulated semantic vectors, where there are only base features.\n\nObligatory Arguments\n\ndata::DataFrame: the dataset\nbase::Vector: context lexemes\n\nOptional Arguments\n\nncol::Int64=200: dimension of semantic vectors, usually the same as that of cue vectors\nsd_base_mean::Int64=1: the sd of the mean of base features\nsd_base::Int64=4: the sd of base features\nseed::Int64=314: the random seed\nisdeep::Bool=true: if true, the mean of each feature is also randomized\n\nExamples\n\n# basic usage\nL = JudiLing.make_L_matrix(\n latin,\n [\"Lexeme\"],\n ncol=200)\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_combined_S_matrix-Tuple{DataFrames.DataFrame, DataFrames.DataFrame, Vector, Vector, JudiLing.L_Matrix_Struct}","page":"Make Semantic Matrix","title":"JudiLing.make_combined_S_matrix","text":"make_combined_S_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector, inflections::Vector, L::L_Matrix_Struct)\n\nCreate simulated semantic matrices for the training and validation datasets with an existing Lexome matrix, where features are combined from both training and validation datasets.\n\nObligatory 
Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\nbase::Vector: context lexemes\ninflections::Vector: grammatical lexemes\nL::L_Matrix_Struct: the Lexome Matrix\n\nOptional Arguments\n\nadd_noise::Bool=true: if true, add additional Gaussian noise\nsd_noise::Int64=1: the sd of the Gaussian noise\nnormalized::Bool=false: if true, most of the values range between -1 and 1; they may slightly exceed these bounds depending on the sd\n\nExamples\n\n# basic usage\nS_train, S_val = JudiLing.make_combined_S_matrix(\n latin_train,\n latin_val,\n [\"Lexeme\"],\n [\"Person\",\"Number\",\"Tense\",\"Voice\",\"Mood\"],\n L)\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_combined_S_matrix-Tuple{DataFrames.DataFrame, Union{Nothing, DataFrames.DataFrame}, Vector, JudiLing.L_Matrix_Struct}","page":"Make Semantic Matrix","title":"JudiLing.make_combined_S_matrix","text":"make_combined_S_matrix(data_train::DataFrame, data_val::Union{DataFrame, Nothing}, base::Vector, L::L_Matrix_Struct)\n\nCreate simulated semantic matrices for the training and validation datasets with an existing Lexome matrix, where features are combined from both training and validation datasets.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\nbase::Vector: context lexemes\nL::L_Matrix_Struct: the Lexome Matrix\n\nOptional Arguments\n\nadd_noise::Bool=true: if true, add additional Gaussian noise\nsd_noise::Int64=1: the sd of the Gaussian noise\nnormalized::Bool=false: if true, most of the values range between -1 and 1; they may slightly exceed these bounds depending on the sd\n\nExamples\n\n# basic usage\nS_train, S_val = JudiLing.make_combined_S_matrix(\n latin_train,\n latin_val,\n [\"Lexeme\"],\n L)\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_combined_S_matrix-Tuple{DataFrames.DataFrame, DataFrames.DataFrame, Vector, Vector}","page":"Make Semantic Matrix","title":"JudiLing.make_combined_S_matrix","text":"make_combined_S_matrix( data_train::DataFrame, data_val::DataFrame, base::Vector, inflections::Vector)\n\nCreate simulated semantic matrices for the training and validation datasets, where features are combined from both training and validation datasets.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\nbase::Vector: context lexemes\ninflections::Vector: grammatical lexemes\n\nOptional Arguments\n\nncol::Int64=200: dimension of semantic vectors, usually the same as that of cue vectors\nsd_base_mean::Int64=1: the sd of the mean of base features\nsd_inflection_mean::Int64=1: the sd of the mean of inflectional features\nsd_base::Int64=4: the sd of base features\nsd_inflection::Int64=4: the sd of inflectional features\nseed::Int64=314: the random seed\nisdeep::Bool=true: if true, the mean of each feature is also randomized\nadd_noise::Bool=true: if true, add additional Gaussian noise\nsd_noise::Int64=1: the sd of the Gaussian noise\nnormalized::Bool=false: if true, most of the values range between -1 and 1; they may slightly exceed these bounds depending on the sd\n\nExamples\n\n# basic usage\nS_train, S_val = JudiLing.make_combined_S_matrix(\n latin_train,\n latin_val,\n [\"Lexeme\"],\n [\"Person\",\"Number\",\"Tense\",\"Voice\",\"Mood\"],\n 
ncol=n_features)\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_combined_S_matrix-Tuple{DataFrames.DataFrame, DataFrames.DataFrame, Vector}","page":"Make Semantic Matrix","title":"JudiLing.make_combined_S_matrix","text":"make_combined_S_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector)\n\nCreate simulated semantic matrices for the training and validation datasets, where features are combined from both training and validation datasets.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\nbase::Vector: context lexemes\n\nOptional Arguments\n\nncol::Int64=200: dimension of semantic vectors, usually the same as that of cue vectors\nsd_base_mean::Int64=1: the sd of the mean of base features\nsd_inflection_mean::Int64=1: the sd of the mean of inflectional features\nsd_base::Int64=4: the sd of base features\nsd_inflection::Int64=4: the sd of inflectional features\nseed::Int64=314: the random seed\nisdeep::Bool=true: if true, the mean of each feature is also randomized\nadd_noise::Bool=true: if true, add additional Gaussian noise\nsd_noise::Int64=1: the sd of the Gaussian noise\nnormalized::Bool=false: if true, most of the values range between -1 and 1; they may slightly exceed these bounds depending on the sd\n\nExamples\n\n# basic usage\nS_train, S_val = JudiLing.make_combined_S_matrix(\n latin_train,\n latin_val,\n [\"Lexeme\"],\n ncol=n_features)\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_combined_L_matrix-Tuple{DataFrames.DataFrame, DataFrames.DataFrame, Vector, Vector}","page":"Make Semantic Matrix","title":"JudiLing.make_combined_L_matrix","text":"make_combined_L_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector, inflections::Vector)\n\nCreate a Lexome Matrix with simulated semantic vectors, where features are combined from both training and validation datasets.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\nbase::Vector: context lexemes\ninflections::Vector: grammatical lexemes\n\nOptional Arguments\n\nncol::Int64=200: dimension of semantic vectors, usually the same as that of cue vectors\nsd_base_mean::Int64=1: the sd of the mean of base features\nsd_inflection_mean::Int64=1: the sd of the mean of inflectional features\nsd_base::Int64=4: the sd of base features\nsd_inflection::Int64=4: the sd of inflectional features\nseed::Int64=314: the random seed\nisdeep::Bool=true: if true, the mean of each feature is also randomized\n\nExamples\n\n# basic usage\nL = JudiLing.make_combined_L_matrix(\n latin_train,\n latin_val,\n [\"Lexeme\"],\n [\"Person\",\"Number\",\"Tense\",\"Voice\",\"Mood\"],\n ncol=n_features)\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_combined_L_matrix-Tuple{DataFrames.DataFrame, DataFrames.DataFrame, Vector}","page":"Make Semantic Matrix","title":"JudiLing.make_combined_L_matrix","text":"make_combined_L_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector)\n\nCreate a Lexome Matrix with simulated semantic vectors, where features are combined from both training and validation datasets.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\nbase::Vector: context lexemes\n\nOptional Arguments\n\nncol::Int64=200: dimension of semantic vectors, usually the same as that of cue 
vectors\nsd_base_mean::Int64=1: the sd of the mean of base features\nsd_inflection_mean::Int64=1: the sd of the mean of inflectional features\nsd_base::Int64=4: the sd of base features\nsd_inflection::Int64=4: the sd of inflectional features\nseed::Int64=314: the random seed\nisdeep::Bool=true: if true, the mean of each feature is also randomized\n\nExamples\n\n# basic usage\nL = JudiLing.make_combined_L_matrix(\n latin_train,\n latin_val,\n [\"Lexeme\"],\n ncol=n_features)\n\n\n\n\n\n","category":"method"},
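The combined L and S constructors are designed to be chained: first build a lexome matrix over the union of features in both datasets, then derive the train and validation S matrices from it. A minimal sketch, assuming latin_train and latin_val dataframes as in the examples above:

L = JudiLing.make_combined_L_matrix(
    latin_train,
    latin_val,
    ["Lexeme"],
    ["Person","Number","Tense","Voice","Mood"],
    ncol=200)
S_train, S_val = JudiLing.make_combined_S_matrix(
    latin_train,
    latin_val,
    ["Lexeme"],
    ["Person","Number","Tense","Voice","Mood"],
    L)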
{"location":"man/make_semantic_matrix/#JudiLing.L_Matrix_Struct-NTuple{12, Any}","page":"Make Semantic Matrix","title":"JudiLing.L_Matrix_Struct","text":"L_Matrix_Struct(L, sd_base, sd_base_mean, sd_inflection, sd_inflection_mean, base_f, infl_f, base_f2i, infl_f2i, n_base_f, n_infl_f, ncol)\n\nConstruct L_Matrix_Struct with deep mode.\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.L_Matrix_Struct-NTuple{10, Any}","page":"Make Semantic Matrix","title":"JudiLing.L_Matrix_Struct","text":"L_Matrix_Struct(L, sd_base, sd_inflection, base_f, infl_f, base_f2i, infl_f2i, n_base_f, n_infl_f, ncol)\n\nConstruct L_Matrix_Struct without deep mode.\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#Load-from-word2vec,-fasttext-or-similar","page":"Make Semantic Matrix","title":"Load from word2vec, fasttext or similar","text":"","category":"section"},{"location":"man/make_semantic_matrix/","page":"Make Semantic Matrix","title":"Make Semantic Matrix","text":"load_S_matrix_from_fasttext(data::DataFrame,\n language::Symbol;\n target_col=:Word,\n default_file::Int=1)\n load_S_matrix_from_fasttext(data_train::DataFrame,\n data_val::DataFrame,\n language::Symbol;\n target_col=:Word,\n default_file::Int=1)\n load_S_matrix_from_word2vec_file(data::DataFrame,\n filepath::String;\n target_col=:Word)\n load_S_matrix_from_word2vec_file(data_train::DataFrame,\n data_val::DataFrame,\n filepath::String;\n target_col=:Word)\n load_S_matrix_from_fasttext_file(data::DataFrame,\n filepath::String;\n target_col=:Word)\n load_S_matrix_from_fasttext_file(data_train::DataFrame,\n data_val::DataFrame,\n filepath::String;\n target_col=:Word)","category":"page"},{"location":"man/make_semantic_matrix/#JudiLing.load_S_matrix_from_fasttext-Tuple{DataFrames.DataFrame, Symbol}","page":"Make Semantic Matrix","title":"JudiLing.load_S_matrix_from_fasttext","text":"load_S_matrix_from_fasttext(data::DataFrame,\n language::Symbol;\n target_col=:Word,\n default_file::Int=1)\n\nLoad semantic matrix from fasttext, using the Embeddings.jl package. Subset fasttext vectors to include only words in target_col of data, and subset data to only include words in target_col for which a semantic vector is available.\n\nThe last parameter, default_file, specifies which vectors are loaded. To learn about all available vectors, use the following commands:\n\nusing Embeddings\nlanguage_files(FastText_Text{:nl})\n\nreplacing the language code (here :nl) with the language you are interested in. In general, for all languages other than English, these files are available:\n\ndefault_file=1 loads from https://fasttext.cc/docs/en/crawl-vectors.html, paper: E. Grave, P. Bojanowski, P. Gupta, A. Joulin, T. Mikolov, Learning Word Vectors for 157 Languages License: CC BY-SA 3.0 https://creativecommons.org/licenses/by-sa/3.0/\ndefault_file=2 loads from https://fasttext.cc/docs/en/pretrained-vectors.html paper: P. Bojanowski, E. Grave, A. Joulin, T. 
Mikolov, Enriching Word Vectors with Subword Information License: CC BY-SA 3.0 https://creativecommons.org/licenses/by-sa/3.0/\n\nObligatory Arguments\n\ndata::DataFrame: the dataset\nlanguage::Symbol: the language of the words in the dataset, officially ISO 639-2 (see https://github.com/JuliaText/Embeddings.jl/issues/34#issuecomment-782604523), though in practice it behaves more like ISO 639-1, with ISO 639-2 only being used if ISO 639-1 isn't available (see https://en.wikipedia.org/wiki/List_of_ISO_639-2_codes)\n\nOptional Arguments\n\ntarget_col=:Word: column with orthographic representation of words in data\ndefault_file::Int=1: source of vectors, for more information see above and here: https://github.com/JuliaText/Embeddings.jl#loading-different-embeddings\n\nExamples\n\n# basic usage\nlatin_small, S = JudiLing.load_S_matrix_from_fasttext(latin, :la, target_col=:Word)\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.load_S_matrix_from_fasttext-Tuple{DataFrames.DataFrame, DataFrames.DataFrame, Symbol}","page":"Make Semantic Matrix","title":"JudiLing.load_S_matrix_from_fasttext","text":"load_S_matrix_from_fasttext(data_train::DataFrame,\n data_val::DataFrame,\n language::Symbol;\n target_col=:Word,\n default_file::Int=1)\n\nLoad semantic matrix from fasttext, using the Embeddings.jl package. Subset fasttext vectors to include only words in target_col of data_train and data_val, and subset data to only include words in target_col for which a semantic vector is available. Returns subsetted train and val data and train and val semantic matrices.\n\nThe last parameter, default_file, specifies which vectors are loaded. To learn about all available vectors, use the following commands:\n\nusing Embeddings\nlanguage_files(FastText_Text{:nl})\n\nreplacing the language code (here :nl) with the language you are interested in. In general, for all languages other than English, these files are available:\n\ndefault_file=1 loads from https://fasttext.cc/docs/en/crawl-vectors.html, paper: E. Grave, P. Bojanowski, P. Gupta, A. Joulin, T. Mikolov, Learning Word Vectors for 157 Languages License: CC BY-SA 3.0 https://creativecommons.org/licenses/by-sa/3.0/\ndefault_file=2 loads from https://fasttext.cc/docs/en/pretrained-vectors.html paper: P. Bojanowski, E. Grave, A. Joulin, T. 
Mikolov, Enriching Word Vectors with Subword Information License: CC BY-SA 3.0 https://creativecommons.org/licenses/by-sa/3.0/\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\nlanguage::Symbol: the language of the words in the dataset, officially ISO 639-2 (see https://github.com/JuliaText/Embeddings.jl/issues/34#issuecomment-782604523), though in practice it behaves more like ISO 639-1, with ISO 639-2 only being used if ISO 639-1 isn't available (see https://en.wikipedia.org/wiki/List_of_ISO_639-2_codes)\n\nOptional Arguments\n\ntarget_col=:Word: column with orthographic representation of words in data\ndefault_file::Int=1: source of vectors, for more information see above and here: https://github.com/JuliaText/Embeddings.jl#loading-different-embeddings\n\nExamples\n\n# basic usage\nlatin_small_train, latin_small_val, S_train, S_val = JudiLing.load_S_matrix_from_fasttext(latin_train,\n latin_val,\n :la,\n target_col=:Word)\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.load_S_matrix_from_word2vec_file-Tuple{DataFrames.DataFrame, String}","page":"Make Semantic Matrix","title":"JudiLing.load_S_matrix_from_word2vec_file","text":"load_S_matrix_from_word2vec_file(data::DataFrame,\n filepath::String;\n target_col=:Word)\n\nLoad semantic matrix from a word2vec file at filepath. Subset word2vec vectors to include only words in target_col of data, and subset data to only include words in target_col for which a semantic vector is available. Returns subsetted data and semantic matrix.\n\nObligatory Arguments\n\ndata::DataFrame: the dataset\nfilepath::String: path to file with word2vec vectors in .txt (not compressed in any way)\n\nOptional Arguments\n\ntarget_col=:Word: column with orthographic representation of words in data\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.load_S_matrix_from_word2vec_file-Tuple{DataFrames.DataFrame, DataFrames.DataFrame, String}","page":"Make Semantic Matrix","title":"JudiLing.load_S_matrix_from_word2vec_file","text":"load_S_matrix_from_word2vec_file(data_train::DataFrame,\n data_val::DataFrame,\n filepath::String;\n target_col=:Word)\n\nLoad semantic matrix from a word2vec file at filepath. Subset word2vec vectors to include only words in target_col of data_train and data_val, and subset data to only include words in target_col for which a semantic vector is available. Returns subsetted train and val data and train and val semantic matrices.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\nfilepath::String: path to file with word2vec vectors in .txt (not compressed in any way)\n\nOptional Arguments\n\ntarget_col=:Word: column with orthographic representation of words in data\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.load_S_matrix_from_fasttext_file-Tuple{DataFrames.DataFrame, String}","page":"Make Semantic Matrix","title":"JudiLing.load_S_matrix_from_fasttext_file","text":"load_S_matrix_from_fasttext_file(data::DataFrame,\n filepath::String;\n target_col=:Word)\n\nLoad semantic matrix from a fasttext file at filepath. Subset fasttext vectors to include only words in target_col of data, and subset data to only include words in target_col for which a semantic vector is available. 
Returns subsetted data and semantic matrix.\n\nObligatory Arguments\n\ndata::DataFrame: the dataset\nfilepath::String: path to file with fasttext vectors in .txt or .vec (not compressed in any way)\n\nOptional Arguments\n\ntarget_col=:Word: column with orthographic representation of words in data\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.load_S_matrix_from_fasttext_file-Tuple{DataFrames.DataFrame, DataFrames.DataFrame, String}","page":"Make Semantic Matrix","title":"JudiLing.load_S_matrix_from_fasttext_file","text":"load_S_matrix_from_fasttext_file(data_train::DataFrame,\n data_val::DataFrame,\n filepath::String;\n target_col=:Word)\n\nLoad semantic matrix from a fasttext file at filepath. Subset fasttext vectors to include only words in target_col of data_train and data_val, and subset data to only include words in target_col for which a semantic vector is available. Returns subsetted train and val data and train and val semantic matrices.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\nfilepath::String: path to file with fasttext vectors in .txt (not compressed in any way)\n\nOptional Arguments\n\ntarget_col=:Word: column with orthographic representation of words in data\n\n\n\n\n\n","category":"method"},
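Since the file-based loaders have no Examples section, here is a minimal sketch of loading pretrained vectors from disk. The file paths are placeholders, not files shipped with JudiLing; the return pattern mirrors the fasttext example above:

# word2vec text format
latin_small, S = JudiLing.load_S_matrix_from_word2vec_file(
    latin,
    "data/word2vec_vectors.txt",
    target_col=:Word)

# fasttext .vec format, train/validation version
latin_small_train, latin_small_val, S_train, S_val = JudiLing.load_S_matrix_from_fasttext_file(
    latin_train,
    latin_val,
    "data/cc.la.300.vec",
    target_col=:Word)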
{"location":"man/make_semantic_matrix/#Utility-functions","page":"Make Semantic Matrix","title":"Utility functions","text":"","category":"section"},{"location":"man/make_semantic_matrix/","page":"Make Semantic Matrix","title":"Make Semantic Matrix","text":" process_features(data, feature_cols)\n comp_f_M!(L, sd, sd_mean, n_f, ncol, n_b)\n comp_f_M!(L, sd, n_f, ncol, n_b)\n merge_f2i(base_f2i, infl_f2i, n_base_f, n_infl_f)\n lexome_sum(L, features)\n make_St(L, n, data, base, inflections)\n make_St(L, n, data, base)\n add_St_noise!(St, sd_noise)\n normalize_St!(St, n_base, n_infl)\n normalize_St!(St, n_base)","category":"page"},{"location":"man/make_semantic_matrix/#JudiLing.process_features-Tuple{Any, Any}","page":"Make Semantic Matrix","title":"JudiLing.process_features","text":"process_features(data, feature_cols)\n\nCollect all features given datasets and feature column names.\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.comp_f_M!-NTuple{6, Any}","page":"Make Semantic Matrix","title":"JudiLing.comp_f_M!","text":"comp_f_M!(L, sd, sd_mean, n_f, ncol, n_b)\n\nCompose the feature matrix with deep mode.\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.comp_f_M!-NTuple{5, Any}","page":"Make Semantic Matrix","title":"JudiLing.comp_f_M!","text":"comp_f_M!(L, sd, n_f, ncol, n_b)\n\nCompose the feature matrix without deep mode.\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.merge_f2i-NTuple{4, Any}","page":"Make Semantic Matrix","title":"JudiLing.merge_f2i","text":"merge_f2i(base_f2i, infl_f2i, n_base_f, n_infl_f)\n\nMerge the base f2i dictionary and the inflectional f2i dictionary.\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.lexome_sum-Tuple{Any, Any}","page":"Make Semantic Matrix","title":"JudiLing.lexome_sum","text":"lexome_sum(L, features)\n\nSum up the semantic vector, given the lexome vector.\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_St-NTuple{5, Any}","page":"Make Semantic Matrix","title":"JudiLing.make_St","text":"make_St(L, n, data, base, inflections)\n\nMake S transpose matrix with 
inflections.\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_St-NTuple{4, Any}","page":"Make Semantic Matrix","title":"JudiLing.make_St","text":"make_St(L, n, data, base)\n\nMake S transpose matrix without inflections.\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.add_St_noise!-Tuple{Any, Any}","page":"Make Semantic Matrix","title":"JudiLing.add_St_noise!","text":"add_St_noise!(St, sd_noise)\n\nAdd noise.\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.normalize_St!-Tuple{Any, Any, Any}","page":"Make Semantic Matrix","title":"JudiLing.normalize_St!","text":"normalize_St!(St, n_base, n_infl)\n\nNormalize S transpose with inflections.\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.normalize_St!-Tuple{Any, Any}","page":"Make Semantic Matrix","title":"JudiLing.normalize_St!","text":"normalize_St!(St, n_base)\n\nNormalize S transpose without inflections.\n\n\n\n\n\n","category":"method"},{"location":"man/eval/","page":"Evaluation","title":"Evaluation","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/eval/#Evaluation","page":"Evaluation","title":"Evaluation","text":"","category":"section"},{"location":"man/eval/","page":"Evaluation","title":"Evaluation","text":" Comp_Acc_Struct\n eval_SC\n eval_SC_loose\n accuracy_comprehension(S, Shat, data)\n accuracy_comprehension(\n S_val,\n S_train,\n Shat_val,\n data_val,\n data_train;\n target_col = :Words,\n base = nothing,\n inflections = nothing,\n )\n eval_SC(SChat::AbstractArray, SC::AbstractArray)\n eval_SC(SChat::AbstractArray, SC::AbstractArray, SC_rest::AbstractArray)\n eval_SC(SChat::AbstractArray, SC::AbstractArray, data::DataFrame, target_col::Union{String, Symbol})\n eval_SC(SChat::AbstractArray, SC::AbstractArray, SC_rest::AbstractArray, data::DataFrame, data_rest::DataFrame, target_col::Union{String, Symbol})\n eval_SC(SChat::AbstractArray, SC::AbstractArray, batch_size::Int64)\n eval_SC(SChat::AbstractArray, SC::AbstractArray, data::DataFrame, target_col::Union{String, Symbol}, batch_size::Int64)\n eval_SC_loose(SChat, SC, k)\n eval_SC_loose(SChat, SC, k, data, target_col)\n eval_manual(res, data, i2f)\n eval_acc(res, gold_inds::Array)\n eval_acc(res, cue_obj::Cue_Matrix_Struct)\n eval_acc_loose(res, gold_inds)\n extract_gpi(gpi, threshold=0.1, tolerance=(-1000.0))","category":"page"},{"location":"man/eval/#JudiLing.Comp_Acc_Struct","page":"Evaluation","title":"JudiLing.Comp_Acc_Struct","text":"A structure that stores information about comprehension accuracy.\n\n\n\n\n\n","category":"type"},{"location":"man/eval/#JudiLing.eval_SC","page":"Evaluation","title":"JudiLing.eval_SC","text":"Assess model accuracy on the basis of the correlations of row vectors of Chat and C or Shat and S. Ideally, the target words have the highest correlations on the diagonal of the pertinent correlation matrices. Support for homophones is implemented.\n\n\n\n\n\n","category":"function"},{"location":"man/eval/#JudiLing.eval_SC_loose","page":"Evaluation","title":"JudiLing.eval_SC_loose","text":"Assess model accuracy on the basis of the correlations of row vectors of Chat and C or Shat and S. Count it as correct if one of the top k candidates is correct. 
Support for homophones is implemented.\n\n\n\n\n\n","category":"function"},
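A minimal sketch contrasting strict and loose evaluation, assuming predicted and gold-standard semantic matrices as in the eval_SC examples below; with k = 5 a prediction counts as correct if the target is among the five most correlated candidates:

acc_strict = JudiLing.eval_SC(Shat_val, S_val)
acc_loose = JudiLing.eval_SC_loose(Shat_val, S_val, 5)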
See below for more information.\n\nObligatory Arguments\n\nS_val::Matrix: the (gold standard) S matrix of the validation data\nS_train::Matrix: the (gold standard) S matrix of the training data\nShat_val::Matrix: the (predicted) Shat matrix of the validation data\ndata_val::DataFrame: the validation dataset\ndata_train::DataFrame: the training dataset\n\nOptional Arguments\n\ntarget_col::Union{String, Symbol}=:Words: the column name for target strings\nbase::Vector=nothing: base features (typically a lexeme)\ninflections::Union{Nothing, Vector}=nothing: other features (typically in inflectional features)\n\nExamples\n\naccuracy_comprehension(\n S_val,\n S_train,\n Shat_val,\n latin_val,\n latin_train,\n target_col=:Words,\n base=[:Lexeme],\n inflections=[:Person, :Number, :Tense, :Voice, :Mood]\n )\n\nNote\n\nIn case of homophones/homographs in the dataset, the correct/incorrect values for base and inflections may be misleading! Consider the following example: The wordform \"Äpfel\" in German can be nominative plural, genitive plural and accusative plural. Let's assume we have a dataset in which \"Äpfel\" occurs in all three case/number combinations (i.e. there are homographs). If all these wordforms have the same semantic vectors (e.g. because they are derived from word2vec or fasttext which typically have a single vector per unique wordform), the predicted semantic vector of the wordform \"Äpfel\" will be equally correlated with all three case/number combinations in the dataset. In such cases, while the algorithm in this function can unambiguously conclude that the correct surface form \"Äpfel\" was comprehended, which of the three possible rows is the correct one will be picked somewhat non-deterministically (see https://docs.julialang.org/en/v1/base/collections/#Base.argmax). It is thus possible that the algorithm will then use the genitive plural instead of the intended nominative plural as the ground plural, and will report that \"case\" was comprehended incorrectly.\n\n\n\n\n\n","category":"method"},{"location":"man/eval/#JudiLing.eval_SC-Tuple{AbstractArray, AbstractArray}","page":"Evaluation","title":"JudiLing.eval_SC","text":"eval_SC(SChat::AbstractArray, SC::AbstractArray)\n\nAssess model accuracy on the basis of the correlations (or Euclidean distances or Cosine Similarities) of row vectors of Chat and C or Shat and S. Ideally the target words have highest correlations (lowest distance/highest similarity) on the diagonal of the pertinent correlation (distance/similarity) matrices.\n\nIf freq is added, token-based accuracy is computed. Token-based accuracy weighs accuracy values according to words' frequency, i.e. if a word has a frequency of 30 and overall there are 3000 tokens (the frequencies of all types sum to 3000), this token's accuracy will contribute 30/3000.\n\nnote: Note\nIf there are homophones/homographs in the dataset, this evaluation method may be misleading: the predicted vector will be equally correlated with the target vector of both words and the one on the diagonal will not necessarily be selected as the most correlated. 
In such cases, supplying the dataset and target_col is recommended which enables taking into account homophones/homographs.\n\nObligatory Arguments\n\nSChat::Union{SparseMatrixCSC, Matrix}: the Chat or Shat matrix\nSC::Union{SparseMatrixCSC, Matrix}: the C or S matrix\n\nOptional Arguments\n\ndigits: the specified number of digits after the decimal place (or before if negative)\nR::Bool=false: if true, pairwise correlation/distance/similarity matrix R is return\nfreq::Union{Missing, Array{Int64, 1}, Array{Float64,1}}=missing: list of frequencies of the wordforms in X and Y\nmethod::Union{Symbol, String}=:correlation: Method for computing similarities, one of {:correlation, :euclidean, :cosine}.\n\neval_SC(Chat_train, cue_obj_train.C)\neval_SC(Chat_val, cue_obj_val.C)\neval_SC(Shat_train, S_train)\neval_SC(Shat_val, S_val)\n\n\n\n\n\n","category":"method"},{"location":"man/eval/#JudiLing.eval_SC-Tuple{AbstractArray, AbstractArray, AbstractArray}","page":"Evaluation","title":"JudiLing.eval_SC","text":"eval_SC(SChat::AbstractArray, SC::AbstractArray, SC_rest::AbstractArray)\n\nAssess model accuracy on the basis of the correlations (or Euclidean distances or Cosine Similarities) of row vectors of Chat and C or Shat and S. Ideally the target words have highest correlations (lowest distance/highest similarity) on the diagonal of the pertinent correlation (distance/similarity) matrices.\n\nIf freq is added, token-based accuracy is computed. Token-based accuracy weighs accuracy values according to words' frequency, i.e. if a word has a frequency of 30 and overall there are 3000 tokens (the frequencies of all types sum to 3000), this token's accuracy will contribute 30/3000.\n\nnote: Note\nThe order is important. The fist gold standard matrix has to be corresponing to the SChat matrix, such as eval_SC(Shat_train, S_train, S_val) or eval_SC(Shat_val, S_val, S_train)\n\nnote: Note\nIf there are homophones/homographs in the dataset, this evaluation method may be misleading: the predicted vector will be equally correlated with the target vector of both words and the one on the diagonal will not necessarily be selected as the most correlated. 
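{"location":"man/eval/","page":"Evaluation","title":"Evaluation","text":"A sketch of token-based evaluation with eval_SC, assuming a hypothetical Frequency column in the Latin dataset; any vector with one frequency per wordform can be passed as freq. A word with frequency 30 out of 3000 tokens in total then contributes 30/3000 = 0.01 to the overall accuracy.\n\n# token-based accuracy, weighting each wordform by its frequency\nacc_token = JudiLing.eval_SC(Shat_train, S_train, freq = latin.Frequency)","category":"page"},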
{"location":"man/eval/#JudiLing.eval_SC-Tuple{AbstractArray, AbstractArray, AbstractArray}","page":"Evaluation","title":"JudiLing.eval_SC","text":"eval_SC(SChat::AbstractArray, SC::AbstractArray, SC_rest::AbstractArray)\n\nAssess model accuracy on the basis of the correlations (or Euclidean distances or Cosine Similarities) of row vectors of Chat and C or Shat and S. Ideally the target words have highest correlations (lowest distance/highest similarity) on the diagonal of the pertinent correlation (distance/similarity) matrices.\n\nIf freq is added, token-based accuracy is computed. Token-based accuracy weighs accuracy values according to words' frequency, i.e. if a word has a frequency of 30 and overall there are 3000 tokens (the frequencies of all types sum to 3000), this token's accuracy will contribute 30/3000.\n\nnote: Note\nThe order is important. The first gold standard matrix has to correspond to the SChat matrix, such as eval_SC(Shat_train, S_train, S_val) or eval_SC(Shat_val, S_val, S_train)\n\nnote: Note\nIf there are homophones/homographs in the dataset, this evaluation method may be misleading: the predicted vector will be equally correlated with the target vector of both words and the one on the diagonal will not necessarily be selected as the most correlated. In such cases, supplying the dataset and target_col is recommended, which enables taking homophones/homographs into account.\n\nObligatory Arguments\n\nSChat::Union{SparseMatrixCSC, Matrix}: the Chat or Shat matrix\nSC::Union{SparseMatrixCSC, Matrix}: the training/validation C or S matrix\nSC_rest::Union{SparseMatrixCSC, Matrix}: the validation/training C or S matrix\n\nOptional Arguments\n\ndigits: the specified number of digits after the decimal place (or before if negative)\nR::Bool=false: if true, the pairwise correlation/distance/similarity matrix R is returned\nfreq::Union{Missing, Array{Int64, 1}, Array{Float64,1}}=missing: list of frequencies of the wordforms in X and Y\nmethod::Union{Symbol, String}=:correlation: Method for computing similarities, one of {:correlation, :euclidean, :cosine}.\n\neval_SC(Chat_train, cue_obj_train.C, cue_obj_val.C)\neval_SC(Chat_val, cue_obj_val.C, cue_obj_train.C)\neval_SC(Shat_train, S_train, S_val)\neval_SC(Shat_val, S_val, S_train)\n\n\n\n\n\n","category":"method"},{"location":"man/eval/#JudiLing.eval_SC-Tuple{AbstractArray, AbstractArray, DataFrames.DataFrame, Union{String, Symbol}}","page":"Evaluation","title":"JudiLing.eval_SC","text":"eval_SC(SChat::AbstractArray, SC::AbstractArray, data::DataFrame, target_col::Union{String, Symbol})\n\nAssess model accuracy on the basis of the correlations (or Euclidean distances or Cosine Similarities) of row vectors of Chat and C or Shat and S. Ideally the target words have highest correlations (lowest distance/highest similarity) on the diagonal of the pertinent correlation (distance/similarity) matrices. Support for homophones.\n\nIf freq is added, token-based accuracy is computed. Token-based accuracy weighs accuracy values according to words' frequency, i.e. if a word has a frequency of 30 and overall there are 3000 tokens (the frequencies of all types sum to 3000), this token's accuracy will contribute 30/3000.\n\nObligatory Arguments\n\nSChat::Union{SparseMatrixCSC, Matrix}: the Chat or Shat matrix\nSC::Union{SparseMatrixCSC, Matrix}: the C or S matrix\ndata::DataFrame: datasets\ntarget_col::Union{String, Symbol}: target column name\n\nOptional Arguments\n\ndigits: the specified number of digits after the decimal place (or before if negative)\nR::Bool=false: if true, the pairwise correlation/distance/similarity matrix R is returned\nfreq::Union{Missing, Array{Int64, 1}, Array{Float64,1}}=missing: list of frequencies of the wordforms in X and Y\nmethod::Union{Symbol, String}=:correlation: Method for computing similarities, one of {:correlation, :euclidean, :cosine}.\n\neval_SC(Chat_train, cue_obj_train.C, latin, :Word)\neval_SC(Chat_val, cue_obj_val.C, latin, :Word)\neval_SC(Shat_train, S_train, latin, :Word)\neval_SC(Shat_val, S_val, latin, :Word)\n\n\n\n\n\n","category":"method"},{"location":"man/eval/#JudiLing.eval_SC-Tuple{AbstractArray, AbstractArray, AbstractArray, DataFrames.DataFrame, DataFrames.DataFrame, Union{String, Symbol}}","page":"Evaluation","title":"JudiLing.eval_SC","text":"eval_SC(SChat::AbstractArray, SC::AbstractArray, SC_rest::AbstractArray, data::DataFrame, data_rest::DataFrame, target_col::Union{String, Symbol})\n\nAssess model accuracy on the basis of the correlations (or Euclidean distances or Cosine Similarities) of row vectors of Chat and C or Shat and S. Ideally the target words have highest correlations (lowest distance/highest similarity) on the diagonal of the pertinent correlation (distance/similarity) matrices.\n\nIf freq is added, token-based accuracy is computed. Token-based accuracy weighs accuracy values according to words' frequency, i.e. if a word has a frequency of 30 and overall there are 3000 tokens (the frequencies of all types sum to 3000), this token's accuracy will contribute 30/3000.\n\nnote: Note\nThe order is important. The first gold standard matrix has to correspond to the SChat matrix, such as eval_SC(Shat_train, S_train, S_val, latin, :Word) or eval_SC(Shat_val, S_val, S_train, latin, :Word)\n\nObligatory Arguments\n\nSChat::Union{SparseMatrixCSC, Matrix}: the Chat or Shat matrix\nSC::Union{SparseMatrixCSC, Matrix}: the training/validation C or S matrix\nSC_rest::Union{SparseMatrixCSC, Matrix}: the validation/training C or S matrix\ndata::DataFrame: the training/validation datasets\ndata_rest::DataFrame: the validation/training datasets\ntarget_col::Union{String, Symbol}: target column name\n\nOptional Arguments\n\ndigits: the specified number of digits after the decimal place (or before if negative)\nR::Bool=false: if true, the pairwise correlation/distance/similarity matrix R is returned\nfreq::Union{Missing, Array{Int64, 1}, Array{Float64,1}}=missing: list of frequencies of the wordforms in X and Y\nmethod::Union{Symbol, String}=:correlation: Method for computing similarities, one of {:correlation, :euclidean, :cosine}.\n\neval_SC(Chat_train, cue_obj_train.C, cue_obj_val.C, latin, :Word)\neval_SC(Chat_val, cue_obj_val.C, cue_obj_train.C, latin, :Word)\neval_SC(Shat_train, S_train, S_val, latin, :Word)\neval_SC(Shat_val, S_val, S_train, latin, :Word)\n\n\n\n\n\n","category":"method"},{"location":"man/eval/#JudiLing.eval_SC-Tuple{AbstractArray, AbstractArray, Int64}","page":"Evaluation","title":"JudiLing.eval_SC","text":"eval_SC(SChat::AbstractArray, SC::AbstractArray, batch_size::Int64)\n\nAssess model accuracy on the basis of the correlations of row vectors of Chat and C or Shat and S. Ideally the target words have highest correlations on the diagonal of the pertinent correlation matrices. For large datasets, pass batch_size to process evaluation in chunks.\n\nnote: Note\nIf there are homophones/homographs in the dataset, this evaluation method may be misleading: the predicted vector will be equally correlated with the target vector of both words and the one on the diagonal will not necessarily be selected as the most correlated. In such cases, supplying the dataset and target_col is recommended, which enables taking homophones/homographs into account.\n\nnote: Note\nCurrently only available for correlation.\n\nObligatory Arguments\n\nSChat: the Chat or Shat matrix\nSC: the C or S matrix\nbatch_size: batch size\n\nOptional Arguments\n\ndigits: the specified number of digits after the decimal place (or before if negative)\nverbose::Bool=false: if true, more information is printed\n\neval_SC(Chat_train, cue_obj_train.C, 5000)\neval_SC(Chat_val, cue_obj_val.C, 5000)\neval_SC(Shat_train, S_train, 5000)\neval_SC(Shat_val, S_val, 5000)\n\n\n\n\n\n","category":"method"},{"location":"man/eval/#JudiLing.eval_SC-Tuple{AbstractArray, AbstractArray, DataFrames.DataFrame, Union{String, Symbol}, Int64}","page":"Evaluation","title":"JudiLing.eval_SC","text":"eval_SC(SChat::AbstractArray, SC::AbstractArray, data::DataFrame, target_col::Union{String, Symbol}, batch_size::Int64)\n\nAssess model accuracy on the basis of the correlations of row vectors of Chat and C or Shat and S. Ideally the target words have highest correlations on the diagonal of the pertinent correlation matrices. For large datasets, pass batch_size to process evaluation in chunks. Supports homophones.\n\nnote: Note\nCurrently only available for correlation.\n\nObligatory Arguments\n\nSChat::AbstractArray: the Chat or Shat matrix\nSC::AbstractArray: the C or S matrix\ndata::DataFrame: datasets\ntarget_col::Union{String, Symbol}: target column name\nbatch_size::Int64: batch size\n\nOptional Arguments\n\ndigits: the specified number of digits after the decimal place (or before if negative)\nverbose::Bool=false: if true, more information is printed\n\neval_SC(Chat_train, cue_obj_train.C, latin, :Word, 5000)\neval_SC(Chat_val, cue_obj_val.C, latin, :Word, 5000)\neval_SC(Shat_train, S_train, latin, :Word, 5000)\neval_SC(Shat_val, S_val, latin, :Word, 5000)\n\n\n\n\n\n","category":"method"},{"location":"man/eval/#JudiLing.eval_SC_loose-Tuple{Any, Any, Any}","page":"Evaluation","title":"JudiLing.eval_SC_loose","text":"eval_SC_loose(SChat, SC, k)\n\nAssess model accuracy on the basis of the correlations (or Euclidean distances or Cosine Similarities) of row vectors of Chat and C or Shat and S. Ideally the target words have highest correlations (lowest distance/highest similarity) on the diagonal of the pertinent correlation (distance/similarity) matrices. Count it as correct if one of the top k candidates is correct.\n\nnote: Note\nIf there are homophones/homographs in the dataset, this evaluation method may be misleading: the predicted vector will be equally correlated with the target vector of both words and it is not guaranteed that the target on the diagonal will be among the k neighbours. In particular, eval_SC and eval_SC_loose with k=1 are not guaranteed to give the same result. In such cases, supplying the dataset and target_col is recommended, which enables taking homophones/homographs into account.\n\nObligatory Arguments\n\nSChat::Union{SparseMatrixCSC, Matrix}: the Chat or Shat matrix\nSC::Union{SparseMatrixCSC, Matrix}: the C or S matrix\nk: top k candidates\n\nOptional Arguments\n\ndigits: the specified number of digits after the decimal place (or before if negative)\nmethod::Union{Symbol, String}=:correlation: Method for computing similarities, one of {:correlation, :euclidean, :cosine}.\n\neval_SC_loose(Chat, cue_obj.C, k)\neval_SC_loose(Shat, S, k)\n\n\n\n\n\n","category":"method"},
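{"location":"man/eval/","page":"Evaluation","title":"Evaluation","text":"A usage sketch contrasting strict and lenient evaluation, with matrix names following the Latin example above. With k=5 a prediction counts as correct whenever the target is among the five best candidates, so the lenient score is typically at least as high as the strict one (up to the homophone caveat above).\n\nacc_strict = JudiLing.eval_SC(Shat_val, S_val)\nacc_top5 = JudiLing.eval_SC_loose(Shat_val, S_val, 5)","category":"page"},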
{"location":"man/eval/#JudiLing.eval_SC_loose-NTuple{5, Any}","page":"Evaluation","title":"JudiLing.eval_SC_loose","text":"eval_SC_loose(SChat, SC, k, data, target_col)\n\nAssess model accuracy on the basis of the correlations (or Euclidean distances or Cosine Similarities) of row vectors of Chat and C or Shat and S. Ideally the target words have highest correlations (lowest distance/highest similarity) on the diagonal of the pertinent correlation (distance/similarity) matrices. Count it as correct if one of the top k candidates is correct. Support for homophones.\n\nObligatory Arguments\n\nSChat::Union{SparseMatrixCSC, Matrix}: the Chat or Shat matrix\nSC::Union{SparseMatrixCSC, Matrix}: the C or S matrix\nk: top k candidates\ndata: datasets\ntarget_col: target column name\n\nOptional Arguments\n\ndigits: the specified number of digits after the decimal place (or before if negative)\nmethod::Union{Symbol, String}=:correlation: Method for computing similarities, one of {:correlation, :euclidean, :cosine}.\n\neval_SC_loose(Chat, cue_obj.C, k, latin, :Word)\neval_SC_loose(Shat, S, k, latin, :Word)\n\n\n\n\n\n","category":"method"},{"location":"man/eval/#JudiLing.eval_manual-Tuple{Any, Any, Any}","page":"Evaluation","title":"JudiLing.eval_manual","text":"eval_manual(res, data, i2f)\n\nCreate extensive reports for the outputs from build_paths and learn_paths.\n\n\n\n\n\n","category":"method"},{"location":"man/eval/#JudiLing.eval_acc-Tuple{Any, Array}","page":"Evaluation","title":"JudiLing.eval_acc","text":"eval_acc(res, gold_inds::Array)\n\nEvaluate the accuracy of the results from learn_paths or build_paths.\n\nObligatory Arguments\n\nres::Array: the results from learn_paths or build_paths\ngold_inds::Array: the gold paths' indices\n\nOptional Arguments\n\ndigits: the specified number of digits after the decimal place (or before if negative)\nverbose::Bool=false: if true, more information is printed\n\nExamples\n\n# evaluation on training data\nacc_train = JudiLing.eval_acc(\n res_train,\n cue_obj_train.gold_ind,\n verbose=false\n)\n\n# evaluation on validation data\nacc_val = JudiLing.eval_acc(\n res_val,\n cue_obj_val.gold_ind,\n verbose=false\n)\n\n\n\n\n\n","category":"method"},{"location":"man/eval/#JudiLing.eval_acc-Tuple{Any, JudiLing.Cue_Matrix_Struct}","page":"Evaluation","title":"JudiLing.eval_acc","text":"eval_acc(res, cue_obj::Cue_Matrix_Struct)\n\nEvaluate the accuracy of the results from learn_paths or build_paths.\n\nObligatory Arguments\n\nres::Array: the results from learn_paths or build_paths\ncue_obj::Cue_Matrix_Struct: the C matrix object\n\nOptional Arguments\n\ndigits: the specified number of digits after the decimal place (or before if negative)\nverbose::Bool=false: if true, more information is printed\n\nExamples\n\nacc = JudiLing.eval_acc(res, cue_obj)\n\n\n\n\n\n","category":"method"},{"location":"man/eval/#JudiLing.eval_acc_loose-Tuple{Any, Any}","page":"Evaluation","title":"JudiLing.eval_acc_loose","text":"eval_acc_loose(res, gold_inds)\n\nLenient evaluation of the accuracy of the results from learn_paths or build_paths, counting a prediction as correct when the correlation of the predicted and gold standard semantic vectors is among the n top correlations, where n is equal to max_can in the learn_paths or build_paths function.\n\nObligatory Arguments\n\nres::Array: the results from learn_paths or build_paths\ngold_inds::Array: the gold paths' indices\n\nOptional Arguments\n\ndigits: the specified number of digits after the decimal place (or before if negative)\nverbose::Bool=false: if true, more information is printed\n\nExamples\n\n# evaluation on training data\nacc_train_loose = JudiLing.eval_acc_loose(\n res_train,\n cue_obj_train.gold_ind,\n verbose=false\n)\n\n# evaluation on validation data\nacc_val_loose = JudiLing.eval_acc_loose(\n res_val,\n cue_obj_val.gold_ind,\n verbose=false\n)\n\n\n\n\n\n","category":"method"},{"location":"man/eval/#JudiLing.extract_gpi","page":"Evaluation","title":"JudiLing.extract_gpi","text":"extract_gpi(gpi, threshold=0.1, tolerance=(-1000.0))\n\nExtract, using gold paths' information, how many n-grams for a gold path are below the threshold but above the tolerance.\n\n\n\n\n\n","category":"function"},
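{"location":"man/eval/","page":"Evaluation","title":"Evaluation","text":"A sketch of how extract_gpi might be called, assuming gpi_val was obtained from learn_paths with gold_ind supplied and check_gold_path=true (see the Find Paths section):\n\n# how many n-grams of each gold path fall below the threshold 0.1\n# but above the tolerance -1000.0\ngpi_stat = JudiLing.extract_gpi(gpi_val, 0.1, -1000.0)","category":"page"},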
{"location":"man/find_path/","page":"Find Paths","title":"Find Paths","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/find_path/#Find-Paths","page":"Find Paths","title":"Find Paths","text":"","category":"section"},{"location":"man/find_path/#Structures","page":"Find Paths","title":"Structures","text":"","category":"section"},{"location":"man/find_path/","page":"Find Paths","title":"Find Paths","text":" Result_Path_Info_Struct\n Gold_Path_Info_Struct\n Threshold_Stat_Struct","category":"page"},{"location":"man/find_path/#JudiLing.Result_Path_Info_Struct","page":"Find Paths","title":"JudiLing.Result_Path_Info_Struct","text":"Store paths' information built by learn_paths or build_paths\n\n\n\n\n\n","category":"type"},{"location":"man/find_path/#JudiLing.Gold_Path_Info_Struct","page":"Find Paths","title":"JudiLing.Gold_Path_Info_Struct","text":"Store gold paths' information including indices and indices' support and total support. It can be used to evaluate how low the threshold needs to be set in order to find most of the correct paths or if set very low, all of the correct paths.\n\n\n\n\n\n","category":"type"},{"location":"man/find_path/#JudiLing.Threshold_Stat_Struct","page":"Find Paths","title":"JudiLing.Threshold_Stat_Struct","text":"Store threshold and tolerance proportions for each timestep.\n\n\n\n\n\n","category":"type"},{"location":"man/find_path/#Build-paths","page":"Find Paths","title":"Build paths","text":"","category":"section"},{"location":"man/find_path/","page":"Find Paths","title":"Find Paths","text":" build_paths\n build_paths(\n data_val,\n C_train,\n S_val,\n F_train,\n Chat_val,\n A,\n i2f,\n C_train_ind;\n rC = nothing,\n max_t = 15,\n max_can = 10,\n n_neighbors = 10,\n grams = 3,\n tokenized = false,\n sep_token = nothing,\n target_col = :Words,\n start_end_token = \"#\",\n if_pca = false,\n pca_eval_M = nothing,\n ignore_nan = true,\n verbose = false,\n )","category":"page"},{"location":"man/find_path/#JudiLing.build_paths","page":"Find Paths","title":"JudiLing.build_paths","text":"The build_paths function constructs paths by only considering those n-grams that are close to the target. It first takes the predicted c-hat vector and finds the closest n neighbors in the C matrix. Then it selects all n-grams of these neighbors, and constructs all valid paths with those n-grams. The path producing the best correlation with the target semantic vector (through synthesis by analysis) is selected.\n\n\n\n\n\n","category":"function"},{"location":"man/find_path/#JudiLing.build_paths-NTuple{8, Any}","page":"Find Paths","title":"JudiLing.build_paths","text":"build_paths(\n data_val,\n C_train,\n S_val,\n F_train,\n Chat_val,\n A,\n i2f,\n C_train_ind;\n rC = nothing,\n max_t = 15,\n max_can = 10,\n n_neighbors = 10,\n grams = 3,\n tokenized = false,\n sep_token = nothing,\n target_col = :Words,\n start_end_token = \"#\",\n if_pca = false,\n pca_eval_M = nothing,\n ignore_nan = true,\n verbose = false,\n)\n\nThe build_paths function constructs paths by only considering those n-grams that are close to the target. It first takes the predicted c-hat vector and finds the closest n neighbors in the C matrix. Then it selects all n-grams of these neighbors, and constructs all valid paths with those n-grams. The path producing the best correlation with the target semantic vector (through synthesis by analysis) is selected.\n\nObligatory Arguments\n\ndata_val::DataFrame: the validation dataset\nC_train::SparseMatrixCSC: the C matrix for the training dataset\nS_val::Union{SparseMatrixCSC, Matrix}: the S matrix for the validation dataset\nF_train::Union{SparseMatrixCSC, Matrix}: the F matrix for the training dataset\nChat_val::Matrix: the Chat matrix for the validation dataset\nA::SparseMatrixCSC: the adjacency matrix\ni2f::Dict: the dictionary returning features given indices\nC_train_ind::Array: the gold paths' indices for the training dataset\n\nOptional Arguments\n\nrC::Union{Nothing, Matrix}=nothing: correlation Matrix of C and Chat, specify to save computing time\nmax_t::Int64=15: maximum number of timesteps\nmax_can::Int64=10: maximum number of candidates to consider\nn_neighbors::Int64=10: the top n form neighbors to be considered\ngrams::Int64=3: the number n of grams that make up n-grams\ntokenized::Bool=false: if true, the dataset target is tokenized\nsep_token::Union{Nothing, String, Char}=nothing: separator\ntarget_col::Union{String, Symbol}=:Words: the column name for target strings\nif_pca::Bool=false: turn on to enable pca mode\npca_eval_M::Matrix=nothing: pass original F for pca mode\nverbose::Bool=false: if true, more information will be printed\n\nExamples\n\n# training dataset\nJudiLing.build_paths(\n latin_train,\n cue_obj_train.C,\n S_train,\n F_train,\n Chat_train,\n A,\n cue_obj_train.i2f,\n cue_obj_train.gold_ind,\n max_t=max_t,\n n_neighbors=10,\n verbose=false\n )\n\n# validation dataset\nJudiLing.build_paths(\n latin_val,\n cue_obj_train.C,\n S_val,\n F_train,\n Chat_val,\n A,\n cue_obj_train.i2f,\n cue_obj_train.gold_ind,\n max_t=max_t,\n n_neighbors=10,\n verbose=false\n )\n\n# pca mode\nres_build = JudiLing.build_paths(\n korean,\n Array(Cpcat),\n S,\n F,\n ChatPCA,\n A,\n cue_obj.i2f,\n cue_obj.gold_ind,\n max_t=max_t,\n if_pca=true,\n pca_eval_M=Fo,\n n_neighbors=3,\n verbose=true\n )\n\n\n\n\n\n","category":"method"},{"location":"man/find_path/#Learn-paths","page":"Find Paths","title":"Learn paths","text":"","category":"section"},{"location":"man/find_path/","page":"Find Paths","title":"Find Paths","text":" learn_paths\n learn_paths(\n data::DataFrame,\n cue_obj::Cue_Matrix_Struct,\n S_val::Union{SparseMatrixCSC, Matrix},\n F_train,\n Chat_val::Union{SparseMatrixCSC, Matrix};\n Shat_val::Union{Nothing, Matrix} = nothing,\n check_gold_path::Bool = false,\n threshold::Float64 = 0.1,\n is_tolerant::Bool = false,\n tolerance::Float64 = (-1000.0),\n max_tolerance::Int = 3,\n activation::Union{Nothing, Function} = nothing,\n ignore_nan::Bool = true,\n verbose::Bool = true)\n learn_paths(\n data_train::DataFrame,\n data_val::DataFrame,\n C_train::Union{Matrix, SparseMatrixCSC},\n S_val::Union{Matrix, SparseMatrixCSC},\n F_train,\n Chat_val::Union{Matrix, SparseMatrixCSC},\n A::SparseMatrixCSC,\n i2f::Dict,\n f2i::Dict;\n gold_ind::Union{Nothing, Vector} = nothing,\n Shat_val::Union{Nothing, Matrix} = nothing,\n check_gold_path::Bool = false,\n max_t::Int = 15,\n max_can::Int = 10,\n threshold::Float64 = 0.1,\n is_tolerant::Bool = false,\n tolerance::Float64 = (-1000.0),\n max_tolerance::Int = 3,\n grams::Int = 3,\n tokenized::Bool = false,\n sep_token::Union{Nothing, String} = nothing,\n keep_sep::Bool = false,\n target_col::Union{Symbol, String} = \"Words\",\n start_end_token::String = \"#\",\n issparse::Union{Symbol, Bool} = :auto,\n sparse_ratio::Float64 = 0.05,\n if_pca::Bool = false,\n pca_eval_M::Union{Nothing, Matrix} = nothing,\n activation::Union{Nothing, Function} = nothing,\n ignore_nan::Bool = true,\n check_threshold_stat::Bool = false,\n verbose::Bool = false\n )\n learn_paths_rpi(\n data_train::DataFrame,\n data_val::DataFrame,\n C_train::Union{Matrix, SparseMatrixCSC},\n S_val::Union{Matrix, SparseMatrixCSC},\n F_train,\n Chat_val::Union{Matrix, SparseMatrixCSC},\n A::SparseMatrixCSC,\n i2f::Dict,\n f2i::Dict;\n gold_ind::Union{Nothing, Vector} = nothing,\n Shat_val::Union{Nothing, Matrix} = nothing,\n check_gold_path::Bool = false,\n max_t::Int = 15,\n max_can::Int = 10,\n threshold::Float64 = 0.1,\n is_tolerant::Bool = false,\n tolerance::Float64 = (-1000.0),\n max_tolerance::Int = 3,\n grams::Int = 3,\n tokenized::Bool = false,\n sep_token::Union{Nothing, String} = nothing,\n keep_sep::Bool = false,\n target_col::Union{Symbol, String} = \"Words\",\n start_end_token::String = \"#\",\n issparse::Union{Symbol, Bool} = :auto,\n sparse_ratio::Float64 = 0.05,\n if_pca::Bool = false,\n pca_eval_M::Union{Nothing, Matrix} = nothing,\n activation::Union{Nothing, Function} = nothing,\n ignore_nan::Bool = true,\n check_threshold_stat::Bool = false,\n verbose::Bool = false\n )","category":"page"},{"location":"man/find_path/#JudiLing.learn_paths","page":"Find Paths","title":"JudiLing.learn_paths","text":"A sequence finding algorithm using discrimination learning to predict, for a given word, which n-grams are best supported for a given position in the sequence of n-grams.\n\n\n\n\n\n","category":"function"},{"location":"man/find_path/#JudiLing.learn_paths-Tuple{DataFrames.DataFrame, JudiLing.Cue_Matrix_Struct, Union{SparseArrays.SparseMatrixCSC, Matrix}, Any, Union{SparseArrays.SparseMatrixCSC, Matrix}}","page":"Find Paths","title":"JudiLing.learn_paths","text":"learn_paths(\n data::DataFrame,\n cue_obj::Cue_Matrix_Struct,\n S_val::Union{SparseMatrixCSC, Matrix},\n F_train,\n Chat_val::Union{SparseMatrixCSC, Matrix};\n Shat_val::Union{Nothing, Matrix} = nothing,\n check_gold_path::Bool = false,\n threshold::Float64 = 0.1,\n is_tolerant::Bool = false,\n tolerance::Float64 = (-1000.0),\n max_tolerance::Int = 3,\n activation::Union{Nothing, Function} = nothing,\n ignore_nan::Bool = true,\n verbose::Bool = true)\n\nA high-level wrapper function for learn_paths with much less control. It is aimed at users who are new to JudiLing and the learn_paths function.\n\nObligatory Arguments\n\ndata::DataFrame: the training dataset\ncue_obj::Cue_Matrix_Struct: the C matrix object containing all information with C\nS_val::Union{SparseMatrixCSC, Matrix}: the S matrix for the validation dataset\nF_train::Union{SparseMatrixCSC, Matrix, Chain}: either the F matrix for the training dataset, or a deep learning comprehension model trained on the training set\nChat_val::Union{SparseMatrixCSC, Matrix}: the Chat matrix for the validation dataset\n\nOptional Arguments\n\nShat_val::Union{Nothing, Matrix}=nothing: the Shat matrix for the validation dataset\ncheck_gold_path::Bool=false: if true, return a list of support values for the gold path; this information is returned as second output value\nthreshold::Float64=0.1: the value set for the support such that if the support of an n-gram is higher than this value, the n-gram will be taken into consideration\nis_tolerant::Bool=false: if true, select a specified number (given by max_tolerance) of n-grams whose supports are below threshold but above a second tolerance threshold to be added to the path\ntolerance::Float64=(-1000.0): the value set for the second threshold (in tolerant mode) such that if the support for an n-gram is in between this value and the threshold and the max_tolerance number has not been reached, then allow this n-gram to be added to the path\nmax_tolerance::Int64=3: maximum number of below-threshold n-grams allowed in a path\nactivation::Function=nothing: the activation function you want to pass\nignore_nan::Bool=true: whether to ignore NaN when comparing correlations, otherwise NaN will be selected as the max correlation value\nverbose::Bool=true: if true, more information is printed\n\nExamples\n\nres = learn_paths(latin, cue_obj, S, F, Chat)\n\n\n\n\n\n","category":"method"},
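{"location":"man/find_path/","page":"Find Paths","title":"Find Paths","text":"One way the inputs of this wrapper might be assembled for the Latin dataset, sketched under the assumption that the column names follow the examples elsewhere in this manual (make_cue_matrix, make_S_matrix and make_transform_matrix are documented on their own manual pages):\n\ncue_obj = JudiLing.make_cue_matrix(latin, grams=3, target_col=:Word)\nS = JudiLing.make_S_matrix(latin, [\"Lexeme\"], [\"Person\",\"Number\",\"Tense\",\"Voice\",\"Mood\"])\n# comprehension mapping F: C -> S, production mapping G: S -> C\nF = JudiLing.make_transform_matrix(cue_obj.C, S)\nG = JudiLing.make_transform_matrix(S, cue_obj.C)\nChat = S * G\nres = JudiLing.learn_paths(latin, cue_obj, S, F, Chat)","category":"page"},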
{"location":"man/find_path/#JudiLing.learn_paths-Tuple{DataFrames.DataFrame, DataFrames.DataFrame, Union{SparseArrays.SparseMatrixCSC, Matrix}, Union{SparseArrays.SparseMatrixCSC, Matrix}, Any, Union{SparseArrays.SparseMatrixCSC, Matrix}, SparseArrays.SparseMatrixCSC, Dict, Dict}","page":"Find Paths","title":"JudiLing.learn_paths","text":"learn_paths(\n data_train::DataFrame,\n data_val::DataFrame,\n C_train::Union{Matrix, SparseMatrixCSC},\n S_val::Union{Matrix, SparseMatrixCSC},\n F_train,\n Chat_val::Union{Matrix, SparseMatrixCSC},\n A::SparseMatrixCSC,\n i2f::Dict,\n f2i::Dict;\n gold_ind::Union{Nothing, Vector} = nothing,\n Shat_val::Union{Nothing, Matrix} = nothing,\n check_gold_path::Bool = false,\n max_t::Int = 15,\n max_can::Int = 10,\n threshold::Float64 = 0.1,\n is_tolerant::Bool = false,\n tolerance::Float64 = (-1000.0),\n max_tolerance::Int = 3,\n grams::Int = 3,\n tokenized::Bool = false,\n sep_token::Union{Nothing, String} = nothing,\n keep_sep::Bool = false,\n target_col::Union{Symbol, String} = \"Words\",\n start_end_token::String = \"#\",\n issparse::Union{Symbol, Bool} = :auto,\n sparse_ratio::Float64 = 0.05,\n if_pca::Bool = false,\n pca_eval_M::Union{Nothing, Matrix} = nothing,\n activation::Union{Nothing, Function} = nothing,\n ignore_nan::Bool = true,\n check_threshold_stat::Bool = false,\n verbose::Bool = false\n)\n\nA sequence finding algorithm using discrimination learning to predict, for a given word, which n-grams are best supported for a given position in the sequence of n-grams.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\nC_train::Union{SparseMatrixCSC, Matrix}: the C matrix for the training dataset\nS_val::Union{SparseMatrixCSC, Matrix}: the S matrix for the validation dataset\nF_train::Union{SparseMatrixCSC, Matrix, Chain}: the F matrix for the training dataset, or a deep learning comprehension model trained on the training data\nChat_val::Union{SparseMatrixCSC, Matrix}: the Chat matrix for the validation dataset\nA::SparseMatrixCSC: the adjacency matrix\ni2f::Dict: the dictionary returning features given indices\nf2i::Dict: the dictionary returning indices given features\n\nOptional Arguments\n\ngold_ind::Union{Nothing, Vector}=nothing: gold paths' indices\nShat_val::Union{Nothing, Matrix}=nothing: the Shat matrix for the validation dataset\ncheck_gold_path::Bool=false: if true, return a list of support values for the gold path; this information is returned as second output value\nmax_t::Int64=15: maximum timestep\nmax_can::Int64=10: maximum number of candidates to consider\nthreshold::Float64=0.1: the value set for the support such that if the support of an n-gram is higher than this value, the n-gram will be taken into consideration\nis_tolerant::Bool=false: if true, select a specified number (given by max_tolerance) of n-grams whose supports are below threshold but above a second tolerance threshold to be added to the path\ntolerance::Float64=(-1000.0): the value set for the second threshold (in tolerant mode) such that if the support for an n-gram is in between this value and the threshold and the max_tolerance number has not been reached, then allow this n-gram to be added to the path\nmax_tolerance::Int64=3: maximum number of below-threshold n-grams allowed in a path\ngrams::Int64=3: the number n of grams that make up an n-gram\ntokenized::Bool=false: if true, the dataset target is tokenized\nsep_token::Union{Nothing, String, Char}=nothing: separator token\nkeep_sep::Bool=false: if true, keep separators in cues\ntarget_col::Union{String, Symbol}=:Words: the column name for target strings\nstart_end_token::Union{String, Char}=\"#\": start and end token in boundary cues\nissparse::Union{Symbol, Bool}=:auto: control of whether output of Mt matrix is a dense matrix or a sparse matrix\nsparse_ratio::Float64=0.05: the ratio to decide whether a matrix is sparse\nif_pca::Bool=false: turn on to enable pca mode\npca_eval_M::Matrix=nothing: pass original F for pca mode\nactivation::Function=nothing: the activation function you want to pass\nignore_nan::Bool=true: whether to ignore NaN when comparing correlations, otherwise NaN will be selected as the max correlation value\ncheck_threshold_stat::Bool=false: if true, return a threshold and tolerance proportion for each timestep\nverbose::Bool=false: if true, more information is printed\n\nExamples\n\n# basic usage without tokenization\nres = JudiLing.learn_paths(\nlatin,\nlatin,\ncue_obj.C,\nS,\nF,\nChat,\nA,\ncue_obj.i2f,\ncue_obj.f2i,\nmax_t=max_t,\nmax_can=10,\ngrams=3,\nthreshold=0.1,\ntokenized=false,\nkeep_sep=false,\ntarget_col=:Word,\nverbose=true)\n\n# basic usage with tokenization\nres = JudiLing.learn_paths(\nfrench,\nfrench,\ncue_obj.C,\nS,\nF,\nChat,\nA,\ncue_obj.i2f,\ncue_obj.f2i,\nmax_t=max_t,\nmax_can=10,\ngrams=3,\nthreshold=0.1,\ntokenized=true,\nsep_token=\"-\",\nkeep_sep=true,\ntarget_col=:Syllables,\nverbose=true)\n\n# basic usage for validation data\nres_val = JudiLing.learn_paths(\nlatin_train,\nlatin_val,\ncue_obj_train.C,\nS_val,\nF_train,\nChat_val,\nA,\ncue_obj_train.i2f,\ncue_obj_train.f2i,\nmax_t=max_t,\nmax_can=10,\ngrams=3,\nthreshold=0.1,\ntokenized=false,\nkeep_sep=false,\ntarget_col=:Word,\nverbose=true)\n\n# turn on tolerance mode\nres_val = JudiLing.learn_paths(\n...\nthreshold=0.1,\nis_tolerant=true,\ntolerance=-0.1,\nmax_tolerance=4,\n...)\n\n# turn on check gold paths mode\nres_train, gpi_train = JudiLing.learn_paths(\n...\ngold_ind=cue_obj_train.gold_ind,\nShat_val=Shat_train,\ncheck_gold_path=true,\n...)\n\nres_val, gpi_val = JudiLing.learn_paths(\n...\ngold_ind=cue_obj_val.gold_ind,\nShat_val=Shat_val,\ncheck_gold_path=true,\n...)\n\n# control over sparsity\nres_val = JudiLing.learn_paths(\n...\nissparse=:auto,\nsparse_ratio=0.05,\n...)\n\n# pca mode\nres_learn = JudiLing.learn_paths(\nkorean,\nkorean,\nArray(Cpcat),\nS,\nF,\nChatPCA,\nA,\ncue_obj.i2f,\ncue_obj.f2i,\ncheck_gold_path=false,\ngold_ind=cue_obj.gold_ind,\nShat_val=Shat,\nmax_t=max_t,\nmax_can=10,\ngrams=3,\nthreshold=0.1,\ntokenized=true,\nsep_token=\"_\",\nkeep_sep=true,\ntarget_col=:Verb_syll,\nif_pca=true,\npca_eval_M=Fo,\nverbose=true);\n\n\n\n\n\n\n","category":"method"},{"location":"man/find_path/#JudiLing.learn_paths_rpi-Tuple{DataFrames.DataFrame, DataFrames.DataFrame, Union{SparseArrays.SparseMatrixCSC, Matrix}, Union{SparseArrays.SparseMatrixCSC, Matrix}, Any, Union{SparseArrays.SparseMatrixCSC, Matrix}, SparseArrays.SparseMatrixCSC, Dict, Dict}","page":"Find Paths","title":"JudiLing.learn_paths_rpi","text":"learn_paths_rpi(\n data_train::DataFrame,\n data_val::DataFrame,\n C_train::Union{Matrix, SparseMatrixCSC},\n S_val::Union{Matrix, SparseMatrixCSC},\n F_train,\n Chat_val::Union{Matrix, SparseMatrixCSC},\n A::SparseMatrixCSC,\n i2f::Dict,\n f2i::Dict;\n gold_ind::Union{Nothing, Vector} = nothing,\n Shat_val::Union{Nothing, Matrix} = nothing,\n check_gold_path::Bool = false,\n max_t::Int = 15,\n max_can::Int = 10,\n threshold::Float64 = 0.1,\n is_tolerant::Bool = false,\n tolerance::Float64 = (-1000.0),\n max_tolerance::Int = 3,\n grams::Int = 3,\n tokenized::Bool = false,\n sep_token::Union{Nothing, String} = nothing,\n keep_sep::Bool = false,\n target_col::Union{Symbol, String} = \"Words\",\n start_end_token::String = \"#\",\n issparse::Union{Symbol, Bool} = :auto,\n sparse_ratio::Float64 = 0.05,\n if_pca::Bool = false,\n pca_eval_M::Union{Nothing, Matrix} = nothing,\n activation::Union{Nothing, Function} = nothing,\n ignore_nan::Bool = true,\n check_threshold_stat::Bool = false,\n verbose::Bool = false\n)\n\nCalculate learn_paths, returning the supports for the result indices as well.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\nC_train::Union{SparseMatrixCSC, Matrix}: the C matrix for the training dataset\nS_val::Union{SparseMatrixCSC, Matrix}: the S matrix for the validation dataset\nF_train::Union{SparseMatrixCSC, Matrix, Chain}: the F matrix for the training dataset, or a deep learning comprehension model trained on the training data\nChat_val::Union{SparseMatrixCSC, Matrix}: the Chat matrix for the validation dataset\nA::SparseMatrixCSC: the adjacency matrix\ni2f::Dict: the dictionary returning features given indices\nf2i::Dict: the dictionary returning indices given features\n\nOptional Arguments\n\ngold_ind::Union{Nothing, Vector}=nothing: gold paths' indices\nShat_val::Union{Nothing, Matrix}=nothing: the Shat matrix for the validation dataset\ncheck_gold_path::Bool=false: if true, return a list of support values for the gold path; this information is returned as second output value\nmax_t::Int64=15: maximum timestep\nmax_can::Int64=10: maximum number of candidates to consider\nthreshold::Float64=0.1: the value set for the support such that if the support of an n-gram is higher than this value, the n-gram will be taken into consideration\nis_tolerant::Bool=false: if true, select a specified number (given by max_tolerance) of n-grams whose supports are below threshold but above a second tolerance threshold to be added to the path\ntolerance::Float64=(-1000.0): the value set for the second threshold (in tolerant mode) such that if the support for an n-gram is in between this value and the threshold and the max_tolerance number has not been reached, then allow this n-gram to be added to the path\nmax_tolerance::Int64=3: maximum number of below-threshold n-grams allowed in a path\ngrams::Int64=3: the number n of grams that make up an n-gram\ntokenized::Bool=false: if true, the dataset target is tokenized\nsep_token::Union{Nothing, String, Char}=nothing: separator token\nkeep_sep::Bool=false: if true, keep separators in cues\ntarget_col::Union{String, Symbol}=:Words: the column name for target strings\nstart_end_token::Union{String, Char}=\"#\": start and end token in boundary cues\nissparse::Union{Symbol, Bool}=:auto: control of whether output of Mt matrix is a dense matrix or a sparse matrix\nsparse_ratio::Float64=0.05: the ratio to decide whether a matrix is sparse\nif_pca::Bool=false: turn on to enable pca mode\npca_eval_M::Matrix=nothing: pass original F for pca mode\nactivation::Function=nothing: the activation function you want to pass\nignore_nan::Bool=true: whether to ignore NaN when comparing correlations, otherwise NaN will be selected as the max correlation value\ncheck_threshold_stat::Bool=false: if true, return a threshold and tolerance proportion for each timestep\nverbose::Bool=false: if true, more information is printed\n\n\n\n\n\n","category":"method"},
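{"location":"man/find_path/","page":"Find Paths","title":"Find Paths","text":"learn_paths_rpi takes the same arguments as learn_paths; a hypothetical call mirroring the basic learn_paths example above:\n\nres_rpi = JudiLing.learn_paths_rpi(\nlatin,\nlatin,\ncue_obj.C,\nS,\nF,\nChat,\nA,\ncue_obj.i2f,\ncue_obj.f2i,\nmax_t=max_t,\nmax_can=10,\ngrams=3,\nthreshold=0.1,\ntarget_col=:Word,\nverbose=true)","category":"page"},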
{"location":"man/find_path/#Utility-functions","page":"Find Paths","title":"Utility functions","text":"","category":"section"},{"location":"man/find_path/","page":"Find Paths","title":"Find Paths","text":" eval_can(candidates, S, F, i2f, max_can, if_pca, pca_eval_M)\n find_top_feature_indices(rC, C_train_ind)\n make_ngrams_ind(res, n)\n predict_shat(F::Union{Matrix, SparseMatrixCSC},\n ci::Vector{Int})","category":"page"},{"location":"man/find_path/#JudiLing.eval_can-NTuple{7, Any}","page":"Find Paths","title":"JudiLing.eval_can","text":"eval_can(candidates, S, F::Union{Matrix,SparseMatrixCSC, Chain}, i2f, max_can, if_pca, pca_eval_M)\n\nCalculate for each candidate path the correlation between predicted semantic vector and the gold standard semantic vector, and select as target for production the path with the highest correlation.\n\n\n\n\n\n","category":"method"},{"location":"man/find_path/#JudiLing.find_top_feature_indices-Tuple{Any, Any}","page":"Find Paths","title":"JudiLing.find_top_feature_indices","text":"find_top_feature_indices(rC, C_train_ind)\n\nFind all indices for the n-grams of the top n closest neighbors of a given target.\n\n\n\n\n\n","category":"method"},{"location":"man/find_path/#JudiLing.make_ngrams_ind-Tuple{Any, Any}","page":"Find Paths","title":"JudiLing.make_ngrams_ind","text":"make_ngrams_ind(res, n)\n\nConstruct ngrams indices.\n\n\n\n\n\n","category":"method"},{"location":"man/find_path/#JudiLing.predict_shat-Tuple{Union{SparseArrays.SparseMatrixCSC, Matrix}, Vector{Int64}}","page":"Find Paths","title":"JudiLing.predict_shat","text":"predict_shat(F::Union{Matrix, SparseMatrixCSC},\n ci::Vector{Int})\n\nPredicts semantic vector shat given a comprehension matrix F and a list of indices of ngrams ci.\n\nObligatory arguments\n\nF::Union{Matrix, SparseMatrixCSC}: Comprehension matrix F.\nci::Vector{Int}: Vector of indices of ngrams in the c vector. Essentially, this is a vector indicating which ngrams in the c vector are absent and which are present.\n\n\n\n\n\n","category":"method"},
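{"location":"man/find_path/","page":"Find Paths","title":"Find Paths","text":"A minimal sketch of predict_shat; the index vector is made up for illustration. Conceptually, the call corresponds to multiplying a binary c vector that has ones at the positions in ci with F:\n\n# semantic vector supported by the n-grams with indices 3, 17 and 42\nshat = JudiLing.predict_shat(F, [3, 17, 42])","category":"page"},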
{"location":"man/display/","page":"Display","title":"Display","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/display/#Cholesky","page":"Display","title":"Cholesky","text":"","category":"section"},{"location":"man/display/","page":"Display","title":"Display","text":" display_matrix(M, rownames, colnames)\n display_matrix(data, target_col, cue_obj, M, M_type)","category":"page"},{"location":"man/display/#JudiLing.display_matrix-Tuple{Any, Any, Any}","page":"Display","title":"JudiLing.display_matrix","text":"display_matrix(M, rownames, colnames)\n\nDisplay matrix with rownames and colnames.\n\n\n\n\n\n","category":"method"},{"location":"man/display/#JudiLing.display_matrix-NTuple{5, Any}","page":"Display","title":"JudiLing.display_matrix","text":"display_matrix(data, target_col, cue_pS_obj, M, M_type)\n\nDisplay matrix with rownames and colnames.\n\nObligatory Arguments\n\ndata::DataFrame: the dataset\ntarget_col::Union{String, Symbol}: the target column name\ncue_pS_obj::Union{Cue_Matrix_Struct,PS_Matrix_Struct}: the cue matrix or pS matrix structure\nM::Union{SparseMatrixCSC, Matrix}: the matrix\nM_type::Union{String, Symbol}: the type of the matrix; currently supported are :C, :S, :F, :G, :Chat, :Shat, :A, :R and :pS\n\nOptional Arguments\n\nnrow::Int64 = 6: the number of rows to display\nncol::Int64 = 6: the number of columns to display\nreturn_matrix::Bool = false: whether the created dataframe should be returned (and not only displayed)\n\nExamples\n\nJudiLing.display_matrix(latin, :Word, cue_obj, cue_obj.C, :C)\nJudiLing.display_matrix(latin, :Word, cue_obj, S, :S)\nJudiLing.display_matrix(latin, :Word, cue_obj, G, :G)\nJudiLing.display_matrix(latin, :Word, cue_obj, Chat, :Chat)\nJudiLing.display_matrix(latin, :Word, cue_obj, F, :F)\nJudiLing.display_matrix(latin, :Word, cue_obj, Shat, :Shat)\nJudiLing.display_matrix(latin, :Word, cue_obj, A, :A)\nJudiLing.display_matrix(latin, :Word, cue_obj, R, :R)\nJudiLing.display_matrix(latin, :Word, pS_obj, pS_obj.pS, :pS)\n\n\n\n\n\n","category":"method"},{"location":"man/input/","page":"Loading data","title":"Loading data","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/input/#Loading-data","page":"Loading data","title":"Loading data","text":"","category":"section"},{"location":"man/input/","page":"Loading data","title":"Loading data","text":"load_dataset(filepath::String;\n delim::String=\",\",\n kargs...)\nloading_data_randomly_split(\n data_path::String,\n output_dir_path::String,\n data_prefix::String;\n val_sample_size::Int = 0,\n val_ratio::Float64 = 0.0,\n random_seed::Int = 314)\nloading_data_careful_split(\n data_path::String,\n data_prefix::String,\n output_dir_path::String,\n n_features_columns::Union{Vector{Symbol},Vector{String}};\n train_sample_size::Int = 0,\n val_sample_size::Int = 0,\n val_ratio::Float64 = 0.0,\n n_grams_target_col::Union{Symbol, String} = :Word,\n n_grams_tokenized::Bool = false,\n n_grams_sep_token::Union{Nothing, String} = nothing,\n grams::Int = 3,\n n_grams_keep_sep::Bool = false,\n start_end_token::String = \"#\",\n random_seed::Int = 314,\n verbose::Bool = false)","category":"page"},{"location":"man/input/#JudiLing.load_dataset-Tuple{String}","page":"Loading data","title":"JudiLing.load_dataset","text":"load_dataset(filepath::String;\n delim::String=\",\",\n kargs...)\n\nLoad a dataset from file, usually comma- or tab-separated. Returns a DataFrame.\n\nObligatory arguments\n\nfilepath::String: Path to file to be loaded.\n\nOptional arguments\n\ndelim::String=\",\": Delimiter in the file (usually either \",\" or \"\\t\").\nkargs...: Further keyword arguments are passed to CSV.File().\n\nExample\n\nlatin = JudiLing.load_dataset(\"latin.csv\")\nfirst(latin, 10)\n\n\n\n\n\n","category":"method"},{"location":"man/input/#JudiLing.loading_data_randomly_split-Tuple{String, String, String}","page":"Loading data","title":"JudiLing.loading_data_randomly_split","text":"loading_data_randomly_split(\n data_path::String,\n output_dir_path::String,\n data_prefix::String;\n val_sample_size::Int = 0,\n val_ratio::Float64 = 0.0,\n random_seed::Int = 314)\n\nRead in a dataframe, splitting the dataframe into a training and validation dataset. The two are also written to output_dir_path at the same time.\n\nnote: Note\nThe order of data_prefix and output_dir_path is exactly reversed compared to loading_data_careful_split.\n\nObligatory arguments\n\ndata_path::String: Path to where the dataset is stored.\noutput_dir_path::String: Path to where the new dataframes should be stored.\ndata_prefix::String: Prefix of the two new files, will be called data_prefix_train.csv and data_prefix_val.csv.\n\nOptional arguments\n\nval_sample_size::Int = 0: Size of the validation dataset (only val_sample_size or val_ratio may be used).\nval_ratio::Float64 = 0.0: Fraction of the data that should be in the validation dataset (only val_sample_size or val_ratio may be used).\nrandom_seed::Int = 314: Random seed for controlling random split.\n\nExample\n\ndata_train, data_val = JudiLing.loading_data_randomly_split(\n \"latin.csv\",\n \"careful\",\n \"latin\"\n)\n\n\n\n\n\n","category":"method"},{"location":"man/input/#JudiLing.loading_data_careful_split-Tuple{String, String, String, Union{Vector{String}, Vector{Symbol}}}","page":"Loading data","title":"JudiLing.loading_data_careful_split","text":"loading_data_careful_split(\n data_path::String,\n data_prefix::String,\n output_dir_path::String,\n n_features_columns::Union{Vector{Symbol},Vector{String}};\n train_sample_size::Int = 0,\n val_sample_size::Int = 0,\n val_ratio::Float64 = 0.0,\n n_grams_target_col::Union{Symbol, String} = :Word,\n n_grams_tokenized::Bool = false,\n n_grams_sep_token::Union{Nothing, String} = nothing,\n grams::Int = 3,\n n_grams_keep_sep::Bool = false,\n start_end_token::String = \"#\",\n random_seed::Int = 314,\n verbose::Bool = false)\n\nRead in a dataframe, splitting the dataframe into a training and validation dataset. The split is done such that all features in the columns specified in n_features_columns occur both in the training and validation data. It is also ensured that the unique grams resulting from splitting the strings in column n_grams_target_col into grams-grams occur in both datasets. The two are also written to output_dir_path at the same time.\n\nnote: Note\nThe order of data_prefix and output_dir_path is exactly reversed compared to loading_data_randomly_split.\n\nObligatory arguments\n\ndata_path::String: Path to where the dataset is stored.\ndata_prefix::String: Prefix of the two new files, will be called data_prefix_train.csv and data_prefix_val.csv.\noutput_dir_path::String: Path to where the new dataframes should be stored.\nn_features_columns::Vector{Union{Symbol, String}}: Vector with columns whose features have to occur in both the training and validation data.\n\nOptional arguments\n\nval_sample_size::Int = 0: Size of the validation dataset (only val_sample_size or val_ratio may be used).\nval_ratio::Float64 = 0.0: Fraction of the data that should be in the validation dataset (only val_sample_size or val_ratio may be used).\nn_grams_target_col::Union{Symbol, String} = :Word: Column with target words.\nn_grams_tokenized::Bool = false: Whether the words in n_grams_target_col are already tokenized.\nn_grams_sep_token::Union{Nothing, String} = nothing: String with which tokens in n_grams_target_col are separated (only used if n_grams_tokenized=true).\ngrams::Int = 3: Granularity of the n-grams.\nn_grams_keep_sep::Bool = false: Whether the token separators should be kept in the ngrams (this is useful e.g. when working with syllables).\nstart_end_token::String = \"#\": Token with which the start and end of words should be marked.\nrandom_seed::Int = 314: Random seed for controlling random split.\n\nExample\n\ndata_train, data_val = JudiLing.loading_data_careful_split(\n \"latin.csv\",\n \"latin\",\n \"careful\",\n [\"Lexeme\",\"Person\",\"Number\",\"Tense\",\"Voice\",\"Mood\"]\n)\n\n\n\n\n\n","category":"method"},
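{"location":"man/input/","page":"Loading data","title":"Loading data","text":"A side-by-side sketch of the two loaders (file and directory names as in the examples above), highlighting the reversed order of the second and third arguments:\n\ndata_train, data_val = JudiLing.loading_data_randomly_split(\n \"latin.csv\", \"careful\", \"latin\")\ndata_train, data_val = JudiLing.loading_data_careful_split(\n \"latin.csv\", \"latin\", \"careful\",\n [\"Lexeme\",\"Person\",\"Number\",\"Tense\",\"Voice\",\"Mood\"])","category":"page"},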
This function takes as input the results from the learn_paths and build_paths functions, including the information on gold paths that is optionally returned as second output result.\n\n\n\n\n\n","category":"function"},{"location":"man/output/#JudiLing.write_comprehension_eval","page":"Output","title":"JudiLing.write_comprehension_eval","text":"Write comprehension evaluation into a CSV file, include target and predicted ids and indentifiers and their correlations.\n\n\n\n\n\n","category":"function"},{"location":"man/output/#JudiLing.write2csv-NTuple{5, Any}","page":"Output","title":"JudiLing.write2csv","text":"write2csv(res, data, cue_obj_train, cue_obj_val, filename)\n\nWrite results into csv file for the results from learn_paths and build_paths.\n\nObligatory Arguments\n\nres::Array{Array{Result_Path_Info_Struct,1},1}: the results from learn_paths or build_paths\ndata::DataFrame: the dataset\ncue_obj_train::Cue_Matrix_Struct: the cue object for training dataset\ncue_obj_val::Cue_Matrix_Struct: the cue object for validation dataset\nfilename::String: the filename\n\nOptional Arguments\n\ngrams::Int64=3: the number n in n-gram cues\ntokenized::Bool=false: if true, the dataset target is tokenized\nsep_token::Union{Nothing, String, Char}=nothing: separator\nstart_end_token::Union{String, Char}=\"#\": start and end token in boundary cues\noutput_sep_token::Union{String, Char}=\"\": output separator\npath_sep_token::Union{String, Char}=\":\": path separator\ntarget_col::Union{String, Symbol}=:Words: the column name for target strings\nroot_dir::String=\".\": dir path for project root dir\noutput_dir::String=\".\": output dir inside root dir\n\nExamples\n\n# writing results for training data\nJudiLing.write2csv(\n res_train,\n latin_train,\n cue_obj_train,\n cue_obj_train,\n \"res_latin_train.csv\",\n grams=3,\n tokenized=false,\n sep_token=nothing,\n start_end_token=\"#\",\n output_sep_token=\"\",\n path_sep_token=\":\",\n target_col=:Word,\n root_dir=\".\",\n output_dir=\"test_out\")\n\n# writing results for validation data\nJudiLing.write2csv(\n res_val,\n latin_val,\n cue_obj_train,\n cue_obj_val,\n \"res_latin_val.csv\",\n grams=3,\n tokenized=false,\n sep_token=nothing,\n start_end_token=\"#\",\n output_sep_token=\"\",\n path_sep_token=\":\",\n target_col=:Word,\n root_dir=\".\",\n output_dir=\"test_out\")\n\n\n\n\n\n","category":"method"},{"location":"man/output/#JudiLing.write2csv-Tuple{Vector{JudiLing.Gold_Path_Info_Struct}, Any}","page":"Output","title":"JudiLing.write2csv","text":"write2csv(gpi::Vector{Gold_Path_Info_Struct}, filename)\n\nWrite results into csv file for the gold paths' information optionally returned by learn_paths and build_paths.\n\nObligatory Arguments\n\ngpi::Vector{Gold_Path_Info_Struct}: the gold paths' information\nfilename::String: the filename\n\nOptional Arguments\n\nroot_dir::String=\".\": dir path for project root dir\noutput_dir::String=\".\": output dir inside root dir\n\nExamples\n\n# write gold standard paths to csv for training data\nJudiLing.write2csv(\n gpi_train,\n \"gpi_latin_train.csv\",\n root_dir=\".\",\n output_dir=\"test_out\"\n )\n\n# write gold standard paths to csv for validation data\nJudiLing.write2csv(\n gpi_val,\n \"gpi_latin_val.csv\",\n root_dir=\".\",\n output_dir=\"test_out\"\n )\n\n\n\n\n\n","category":"method"},{"location":"man/output/#JudiLing.write2csv-Tuple{JudiLing.Threshold_Stat_Struct, Any}","page":"Output","title":"JudiLing.write2csv","text":"write2csv(ts::Threshold_Stat_Struct, filename)\n\nWrite results into csv file for 
threshold and tolerance proportion for each timestep.\n\nObligatory Arguments\n\ngpi::Vector{Gold_Path_Info_Struct}: the gold paths' information\nfilename::String: the filename\n\nOptional Arguments\n\nroot_dir::String=\".\": dir path for project root dir\noutput_dir::String=\".\": output dir inside root dir\n\nExamples\n\nJudiLing.write2csv(ts, \"ts.csv\", root_dir = @__DIR__, output_dir=\"out\")\n\n\n\n\n\n","category":"method"},{"location":"man/output/#JudiLing.write2df-NTuple{4, Any}","page":"Output","title":"JudiLing.write2df","text":"write2df(res, data, cue_obj_train, cue_obj_val)\n\nReformat results into a dataframe for the results form learn_paths and build_paths functions.\n\nObligatory Arguments\n\nres: output of learn_paths or build_paths\ndata::DataFrame: the dataset\ncue_obj_train: cue object of the training data set\ncue_obj_val: cue object of the validation data set\n\nOptional Arguments\n\ngrams::Int64=3: the number n in n-gram cues\ntokenized::Bool=false: if true, the dataset target is tokenized\nsep_token::Union{Nothing, String, Char}=nothing: separator\nstart_end_token::Union{String, Char}=\"#\": start and end token in boundary cues\noutput_sep_token::Union{String, Char}=\"\": output separator\npath_sep_token::Union{String, Char}=\":\": path separator\ntarget_col::Union{String, Symbol}=:Words: the column name for target strings\n\nExamples\n\n# writing results for training data\nJudiLing.write2df(\n res_train,\n latin_train,\n cue_obj_train,\n cue_obj_train,\n grams=3,\n tokenized=false,\n sep_token=nothing,\n start_end_token=\"#\",\n output_sep_token=\"\",\n path_sep_token=\":\",\n target_col=:Word)\n\n# writing results for validation data\nJudiLing.write2df(\n res_val,\n latin_val,\n cue_obj_train,\n cue_obj_val,\n grams=3,\n tokenized=false,\n sep_token=nothing,\n start_end_token=\"#\",\n output_sep_token=\"\",\n path_sep_token=\":\",\n target_col=:Word)\n\n\n\n\n\n","category":"method"},{"location":"man/output/#JudiLing.write2df-Tuple{Vector{JudiLing.Gold_Path_Info_Struct}}","page":"Output","title":"JudiLing.write2df","text":"write2df(gpi::Vector{Gold_Path_Info_Struct})\n\nWrite results into a dataframe for the gold paths' information optionally returned by learn_paths and build_paths.\n\nObligatory Arguments\n\ngpi::Vector{Gold_Path_Info_Struct}: the gold paths' information\n\nExamples\n\n# write gold standard paths to df for training data\nJudiLing.write2csv(gpi_train)\n\n# write gold standard paths to df for validation data\nJudiLing.write2csv(gpi_val)\n\n\n\n\n\n","category":"method"},{"location":"man/output/#JudiLing.write2df-Tuple{JudiLing.Threshold_Stat_Struct}","page":"Output","title":"JudiLing.write2df","text":"write2df(ts::Threshold_Stat_Struct)\n\nWrite results into a dataframe for threshold and tolerance proportion for each timestep.\n\nObligatory Arguments\n\nts::Threshold_Stat_Struct: the threshold and tolerance proportion\n\nExamples\n\nJudiLing.write2df(ts)\n\n\n\n\n\n","category":"method"},{"location":"man/output/#JudiLing.write_comprehension_eval-NTuple{5, Any}","page":"Output","title":"JudiLing.write_comprehension_eval","text":"write_comprehension_eval(SChat, SC, data, target_col, filename)\n\nWrite comprehension evaluation into a CSV file, include target and predicted ids and indentifiers and their correlations.\n\nObligatory Arguments\n\nSChat::Matrix: the Shat/Chat matrix\nSC::Matrix: the S/C matrix\ndata::DataFrame: the data\ntarget_col::Symbol: the name of target column\nfilename::String: the filename/filepath\n\nOptional Arguments\n\nk: top k 
candidates\nroot_dir::String=\".\": dir path for project root dir\noutput_dir::String=\".\": output dir inside root dir\n\nExamples\n\nJudiLing.write_comprehension_eval(Chat, cue_obj.C, latin, :Word, \"output.csv\",\n k=10, root_dir=@__DIR__, output_dir=\"out\")\n\n\n\n\n\n","category":"method"},{"location":"man/output/#JudiLing.write_comprehension_eval-NTuple{7, Any}","page":"Output","title":"JudiLing.write_comprehension_eval","text":"write_comprehension_eval(SChat, SC, SC_rest, data, data_rest, target_col, filename)\n\nWrite the comprehension evaluation into a CSV file for both training and validation datasets, including target and predicted ids and identifiers and their correlations.\n\nObligatory Arguments\n\nSChat::Matrix: the Shat/Chat matrix\nSC::Matrix: the S/C matrix\nSC_rest::Matrix: the rest S/C matrix\ndata::DataFrame: the data\ndata_rest::DataFrame: the rest data\ntarget_col::Symbol: the name of target column\nfilename::String: the filename/filepath\n\nOptional Arguments\n\nk: top k candidates\nroot_dir::String=\".\": dir path for project root dir\noutput_dir::String=\".\": output dir inside root dir\n\nExamples\n\nJudiLing.write_comprehension_eval(Shat_val, S_val, S_train, latin_val, latin_train,\n :Word, \"all_output.csv\", k=10, root_dir=@__DIR__, output_dir=\"out\")\n\n\n\n\n\n","category":"method"},{"location":"man/output/#JudiLing.save_L_matrix-Tuple{Any, Any}","page":"Output","title":"JudiLing.save_L_matrix","text":"save_L_matrix(L, filename)\n\nSave the lexome matrix into a csv file.\n\nObligatory Arguments\n\nL::L_Matrix_Struct: the lexome matrix struct\nfilename::String: the filename/filepath\n\nExamples\n\nJudiLing.save_L_matrix(L, joinpath(@__DIR__, \"L.csv\"))\n\n\n\n\n\n","category":"method"},{"location":"man/output/#JudiLing.load_L_matrix-Tuple{Any}","page":"Output","title":"JudiLing.load_L_matrix","text":"load_L_matrix(filename)\n\nLoad the lexome matrix from a csv file.\n\nObligatory Arguments\n\nfilename::String: the filename/filepath\n\nOptional Arguments\n\nheader::Bool=false: header in csv\n\nExamples\n\nL_load = JudiLing.load_L_matrix(joinpath(@__DIR__, \"L.csv\"))\n\n\n\n\n\n","category":"method"},{"location":"man/output/#JudiLing.save_S_matrix-NTuple{4, Any}","page":"Output","title":"JudiLing.save_S_matrix","text":"save_S_matrix(S, filename, data, target_col)\n\nSave the S matrix into a csv file.\n\nObligatory Arguments\n\nS::Matrix: the S matrix\nfilename::String: the filename/filepath\ndata::DataFrame: the data\ntarget_col::Symbol: the name of target column\n\nOptional Arguments\n\nsep::String=\" \": separator in CSV file\n\nExamples\n\nJudiLing.save_S_matrix(S, joinpath(@__DIR__, \"S.csv\"), latin, :Word)\n\n\n\n\n\n","category":"method"},{"location":"man/output/#JudiLing.load_S_matrix-Tuple{Any}","page":"Output","title":"JudiLing.load_S_matrix","text":"load_S_matrix(filename)\n\nLoad the S matrix from a csv file.\n\nObligatory Arguments\n\nfilename::String: the filename/filepath\n\nOptional Arguments\n\nheader::Bool=false: header in csv\nsep::String=\" \": separator in CSV file\n\nExamples\n\nJudiLing.load_S_matrix(joinpath(@__DIR__, \"S.csv\"))\n\n\n\n\n\n","category":"method"},{"location":"man/make_yt_matrix/","page":"Make Yt Matrix","title":"Make Yt Matrix","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/make_yt_matrix/#Make-Yt-Matrix","page":"Make Yt Matrix","title":"Make Yt Matrix","text":"","category":"section"},{"location":"man/make_yt_matrix/","page":"Make Yt Matrix","title":"Make Yt Matrix","text":" make_Yt_matrix\n make_Yt_matrix(t, data, 
f2i)","category":"page"},{"location":"man/make_yt_matrix/#JudiLing.make_Yt_matrix","page":"Make Yt Matrix","title":"JudiLing.make_Yt_matrix","text":"Make Yt matrix for timestep t.\n\n\n\n\n\n","category":"function"},{"location":"man/make_yt_matrix/#JudiLing.make_Yt_matrix-Tuple{Any, Any, Any}","page":"Make Yt Matrix","title":"JudiLing.make_Yt_matrix","text":"make_Yt_matrix(t, data, f2i)\n\nMake Yt matrix for timestep t. A given column of the Yt matrix specifies the support for the corresponding n-gram predicted for timestep t for each of the observations (rows of Yt).\n\nObligatory Arguments\n\nt::Int64: the timestep t\ndata::DataFrame: the dataset\nf2i::Dict: the dictionary returning indices given features\n\nOptional Arguments\n\ntokenized::Bool=false: if true, the dataset target is assumed to be tokenized\nsep_token::Union{Nothing, String, Char}=nothing: separator token\nverbose::Bool=false: if verbose, more information will be printed\n\nExamples\n\nlatin = DataFrame(CSV.File(joinpath(\"data\", \"latin_mini.csv\")))\nJudiLing.make_Yt_matrix(2, latin)\n\n\n\n\n\n","category":"method"},{"location":"man/preprocess/","page":"Preprocess","title":"Preprocess","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/preprocess/#Preprocess","page":"Preprocess","title":"Preprocess","text":"","category":"section"},{"location":"man/preprocess/","page":"Preprocess","title":"Preprocess","text":" SplitDataException\n lpo_cv_split(p, data_path)\n loo_cv_split(data_path)\n train_val_random_split(data_path, output_dir_path, data_prefix)\n train_val_careful_split(data_path, output_dir_path, data_prefix, n_features_columns)","category":"page"},{"location":"man/preprocess/#JudiLing.SplitDataException","page":"Preprocess","title":"JudiLing.SplitDataException","text":"Split Data Exception\n\n\n\n\n\n","category":"type"},{"location":"man/preprocess/#JudiLing.lpo_cv_split-Tuple{Any, Any}","page":"Preprocess","title":"JudiLing.lpo_cv_split","text":"lpo_cv_split(p, data_path)\n\nLeave p out cross-validation.\n\n\n\n\n\n","category":"method"},{"location":"man/preprocess/#JudiLing.loo_cv_split-Tuple{Any}","page":"Preprocess","title":"JudiLing.loo_cv_split","text":"loo_cv_split(data_path)\n\nLeave one out cross-validation.\n\n\n\n\n\n","category":"method"},{"location":"man/preprocess/#JudiLing.train_val_random_split-Tuple{Any, Any, Any}","page":"Preprocess","title":"JudiLing.train_val_random_split","text":"train_val_random_split(data_path, output_dir_path, data_prefix)\n\nRandomly split dataset.\n\n\n\n\n\n","category":"method"},{"location":"man/preprocess/#JudiLing.train_val_careful_split-NTuple{4, Any}","page":"Preprocess","title":"JudiLing.train_val_careful_split","text":"train_val_careful_split(data_path, output_dir_path, data_prefix, n_features_columns)\n\nCarefully split dataset.\n\n\n\n\n\n","category":"method"},{"location":"man/test_combo/","page":"Test Combo","title":"Test Combo","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/test_combo/#Test-Combo","page":"Test Combo","title":"Test Combo","text":"","category":"section"},{"location":"man/test_combo/","page":"Test Combo","title":"Test Combo","text":" test_combo(test_mode;kwargs...)","category":"page"},{"location":"man/test_combo/#JudiLing.test_combo-Tuple{Any}","page":"Test Combo","title":"JudiLing.test_combo","text":"test_combo(test_mode;kwargs...)\n\nA wrapper function for a full model for a specific combination of parameters. 
A detailed introduction is in the Test Combo Introduction\n\nObligatory Arguments\n\ntest_mode::Symbol: which test mode, currently supports :train_only, :pre_split, :careful_split and :random_split.\n\nOptional Arguments\n\ntrain_sample_size::Int64=0: the desired number of training data\nval_sample_size::Int64=0: the desired number of validation data\nval_ratio::Float64=0.0: the desired proportion of validation data; it takes effect only if val_sample_size is 0\nextension::String=\".csv\": the extension of the data files\nn_grams_target_col::Union{String, Symbol}=:Word: the column name for target strings\nn_grams_tokenized::Bool=false: if true, the dataset target is assumed to be tokenized\nn_grams_sep_token::Union{Nothing, String}=nothing: separator\ngrams::Int64=3: the number of grams for cues\nn_grams_keep_sep::Bool=false: if true, keep separators in cues\nstart_end_token::String=\":\": start and end token in boundary cues\npath_sep_token::String=\":\": path separator in the assembled path\nrandom_seed::Int64=314: the random seed\nsd_base_mean::Int64=1: the sd of the means of base features\nsd_inflection_mean::Int64=1: the sd of the means of inflectional features\nsd_base::Int64=4: the sd of base features\nsd_inflection::Int64=4: the sd of inflectional features\nisdeep::Bool=true: if true, the mean of each feature is also randomized\nadd_noise::Bool=true: if true, add additional Gaussian noise\nsd_noise::Int64=1: the sd of the Gaussian noise\nnormalized::Bool=false: if true, most of the values range between -1 and 1; they may slightly exceed these bounds depending on the sd\nif_combined::Bool=false: if true, features are created from the training and validation data combined\nlearn_mode::Symbol=:cholesky: which learning mode, currently supports :cholesky and :wh\nmethod::Symbol=:additive: whether :additive or :multiplicative decomposition is required\nshift::Float64=0.02: shift value for :additive decomposition\nmultiplier::Float64=1.01: multiplier value for :multiplicative decomposition\noutput_format::Symbol=:auto: force the output format to dense (:dense) or sparse (:sparse), or leave it at :auto to let the program decide\nsparse_ratio::Float64=0.05: the ratio to decide whether a matrix is sparse\nwh_freq::Vector=nothing: the learning sequence\ninit_weights::Matrix=nothing: the initial weights\neta::Float64=0.1: the learning rate\nn_epochs::Int64=1: the number of epochs to be trained\nmax_t::Int64=0: the maximum timestep\nA::Matrix=nothing: the adjacency matrix\nA_mode::Symbol=:combined: the adjacency matrix mode, currently supports :combined or :train_only\nmax_can::Int64=10: the max number of candidate paths to keep in the output\nthreshold_train::Float64=0.1: the value set for the support such that if the support of an n-gram is higher than this value, the n-gram will be taken into consideration for training data\nis_tolerant_train::Bool=false: if true, select a specified number (given by max_tolerance) of n-grams whose supports are below threshold but above a second tolerance threshold to be added to the path for training data\ntolerance_train::Float64=-0.1: the value set for the second threshold (in tolerant mode) such that if the support for an n-gram is in between this value and the threshold and the max_tolerance number has not been reached, then allow this n-gram to be added to the path for training data\nmax_tolerance_train::Int64=2: maximum number of below-threshold n-grams allowed in a path for training data\nthreshold_val::Float64=0.1: the value set for the support such that if the support of 
an n-gram is higher than this value, the n-gram will be taken into consideration for validation data\nis_tolerant_val::Bool=false: if true, select a specified number (given by max_tolerance) of n-grams whose supports are below threshold but above a second tolerance threshold to be added to the path for validation data\ntolerance_val::Float64=-0.1: the value set for the second threshold (in tolerant mode) such that if the support for an n-gram is in between this value and the threshold and the max_tolerance number has not been reached, then allow this n-gram to be added to the path for validation data\nmax_tolerance_val::Int64=2: maximum number of below-threshold n-grams allowed in a path for validation data\nn_neighbors_train::Int64=10: the top n form neighbors to be considered for training data\nn_neighbors_val::Int64=20: the top n form neighbors to be considered for validation data\nissparse::Bool=false: if true, keep sparse matrix format when learning paths\noutput_dir::String=\"out\": the output directory\nverbose::Bool=false: if true, more information will be printed\n\n\n\n\n\n","category":"method"},{"location":"#JudiLing","page":"Home","title":"JudiLing","text":"","category":"section"},{"location":"","page":"Home","title":"Home","text":"JudiLing: An implementation for Linear Discriminative Learning in Julia","category":"page"},{"location":"","page":"Home","title":"Home","text":"Maintainer: Maria Heitmeier @MariaHei\nOriginal codebase: Xuefeng Luo @MegamindHenry","category":"page"},{"location":"#Installation","page":"Home","title":"Installation","text":"","category":"section"},{"location":"","page":"Home","title":"Home","text":"You can install JudiLing with the following commands:","category":"page"},{"location":"","page":"Home","title":"Home","text":"using Pkg\nPkg.add(\"JudiLing\")","category":"page"},{"location":"","page":"Home","title":"Home","text":"For brave adventurers, install the test version of JudiLing with:","category":"page"},{"location":"","page":"Home","title":"Home","text":"julia> Pkg.add(url=\"https://github.com/quantling/JudiLing.jl.git\")","category":"page"},{"location":"","page":"Home","title":"Home","text":"Or from the Julia REPL, type ] to enter the Pkg REPL mode and run","category":"page"},{"location":"","page":"Home","title":"Home","text":"pkg> add https://github.com/quantling/JudiLing.jl.git","category":"page"},{"location":"#Running-Julia-with-multiple-threads","page":"Home","title":"Running Julia with multiple threads","text":"","category":"section"},{"location":"","page":"Home","title":"Home","text":"JudiLing supports the use of multiple threads. Simply start up Julia in your terminal as follows:","category":"page"},{"location":"","page":"Home","title":"Home","text":"$ julia -t your_num_of_threads","category":"page"},{"location":"","page":"Home","title":"Home","text":"For detailed information on using Julia with threads, see this link.","category":"page"},{"location":"#Include-packages","page":"Home","title":"Include packages","text":"","category":"section"},{"location":"","page":"Home","title":"Home","text":"Before we start, we first need to load the JudiLing package:","category":"page"},{"location":"","page":"Home","title":"Home","text":"using JudiLing","category":"page"},{"location":"","page":"Home","title":"Home","text":"Note: As of JudiLing 0.8.0, PyCall and Flux have become optional dependencies. 
This means that all code in JudiLing which requires calls to Python is only available if PyCall is loaded first, like this:","category":"page"},{"location":"","page":"Home","title":"Home","text":"using PyCall\nusing JudiLing","category":"page"},{"location":"","page":"Home","title":"Home","text":"Likewise, the code involving deep learning is only available if Julia's deep learning library Flux is loaded first, like this:","category":"page"},{"location":"","page":"Home","title":"Home","text":"using Flux\nusing JudiLing","category":"page"},{"location":"","page":"Home","title":"Home","text":"Note that Flux and PyCall have to be installed separately, and the newest version of Flux requires at least Julia 1.9. If you want to run deep learning on a GPU, make sure to also install and import CUDA.","category":"page"},{"location":"#Quick-start-example","page":"Home","title":"Quick start example","text":"","category":"section"},{"location":"","page":"Home","title":"Home","text":"The Latin dataset latin.csv contains lexemes and inflectional features for 672 inflected Latin verb forms for 8 lexemes from 4 conjugation classes. Word forms are inflected for person, number, tense, voice and mood.","category":"page"},{"location":"","page":"Home","title":"Home","text":"\"\",\"Word\",\"Lexeme\",\"Person\",\"Number\",\"Tense\",\"Voice\",\"Mood\"\n\"1\",\"vocoo\",\"vocare\",\"p1\",\"sg\",\"present\",\"active\",\"ind\"\n\"2\",\"vocaas\",\"vocare\",\"p2\",\"sg\",\"present\",\"active\",\"ind\"\n\"3\",\"vocat\",\"vocare\",\"p3\",\"sg\",\"present\",\"active\",\"ind\"\n\"4\",\"vocaamus\",\"vocare\",\"p1\",\"pl\",\"present\",\"active\",\"ind\"\n\"5\",\"vocaatis\",\"vocare\",\"p2\",\"pl\",\"present\",\"active\",\"ind\"\n\"6\",\"vocant\",\"vocare\",\"p3\",\"pl\",\"present\",\"active\",\"ind\"","category":"page"},{"location":"","page":"Home","title":"Home","text":"We first download and read the csv file into Julia:","category":"page"},{"location":"","page":"Home","title":"Home","text":"download(\"https://osf.io/2ejfu/download\", \"latin.csv\")\n\nlatin = JudiLing.load_dataset(\"latin.csv\");","category":"page"},{"location":"","page":"Home","title":"Home","text":"and we can inspect the latin dataframe:","category":"page"},{"location":"","page":"Home","title":"Home","text":"display(latin)","category":"page"},{"location":"","page":"Home","title":"Home","text":"672×8 DataFrame. 
Omitted printing of 2 columns\n│ Row │ Column1 │ Word │ Lexeme │ Person │ Number │ Tense │\n│ │ Int64 │ String │ String │ String │ String │ String │\n├─────┼─────────┼────────────────┼─────────┼────────┼────────┼────────────┤\n│ 1 │ 1 │ vocoo │ vocare │ p1 │ sg │ present │\n│ 2 │ 2 │ vocaas │ vocare │ p2 │ sg │ present │\n│ 3 │ 3 │ vocat │ vocare │ p3 │ sg │ present │\n│ 4 │ 4 │ vocaamus │ vocare │ p1 │ pl │ present │\n│ 5 │ 5 │ vocaatis │ vocare │ p2 │ pl │ present │\n│ 6 │ 6 │ vocant │ vocare │ p3 │ pl │ present │\n│ 7 │ 7 │ clamoo │ clamare │ p1 │ sg │ present │\n│ 8 │ 8 │ clamaas │ clamare │ p2 │ sg │ present │\n⋮\n│ 664 │ 664 │ carpsisseemus │ carpere │ p1 │ pl │ pluperfect │\n│ 665 │ 665 │ carpsisseetis │ carpere │ p2 │ pl │ pluperfect │\n│ 666 │ 666 │ carpsissent │ carpere │ p3 │ pl │ pluperfect │\n│ 667 │ 667 │ cuccurissem │ currere │ p1 │ sg │ pluperfect │\n│ 668 │ 668 │ cuccurissees │ currere │ p2 │ sg │ pluperfect │\n│ 669 │ 669 │ cuccurisset │ currere │ p3 │ sg │ pluperfect │\n│ 670 │ 670 │ cuccurisseemus │ currere │ p1 │ pl │ pluperfect │\n│ 671 │ 671 │ cuccurisseetis │ currere │ p2 │ pl │ pluperfect │\n│ 672 │ 672 │ cuccurissent │ currere │ p3 │ pl │ pluperfect │","category":"page"},{"location":"","page":"Home","title":"Home","text":"For the production model, we want to predict correct forms given their lexemes and inflectional features. For example, given the lexeme vocare and its inflectional features p1, sg, present, active and ind, the model should produce the form vocoo. On the other hand, the comprehension model takes forms as input and tries to predict their lexemes and inflectional features.","category":"page"},{"location":"","page":"Home","title":"Home","text":"We use letter trigrams to encode our forms. For the word vocoo, for example, we use the trigrams #vo, voc, oco, coo and oo#. Here, # is used as a start/end token to encode the initial and final trigram of a word. The row vectors of the C matrix specify for each word which of the trigrams are realized in that word.","category":"page"},{"location":"","page":"Home","title":"Home","text":"To make the C matrix, we use the make_cue_matrix function:","category":"page"},{"location":"","page":"Home","title":"Home","text":"cue_obj = JudiLing.make_cue_matrix(\n latin,\n grams=3,\n target_col=:Word,\n tokenized=false,\n keep_sep=false\n )","category":"page"},{"location":"","page":"Home","title":"Home","text":"Next, we simulate the semantic matrix S using the make_S_matrix function:","category":"page"},{"location":"","page":"Home","title":"Home","text":"n_features = size(cue_obj.C, 2)\nS = JudiLing.make_S_matrix(\n latin,\n [\"Lexeme\"],\n [\"Person\",\"Number\",\"Tense\",\"Voice\",\"Mood\"],\n ncol=n_features)","category":"page"},{"location":"","page":"Home","title":"Home","text":"For this simulation, first random vectors are assigned to every lexeme and inflectional feature, and next the vectors of those features are summed up to obtain the semantic vector of the inflected form. Similar dimensions for C and S work best. Therefore, we retrieve the number of columns from the C matrix and pass it to make_S_matrix when constructing S.","category":"page"},{"location":"","page":"Home","title":"Home","text":"The next step is to calculate a mapping from S to C by solving the equation C = SG. 
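In the least-squares sense, the solution is G = inv(S'S) * (S'C); a minimal sketch of this idea in plain Julia (not JudiLing's internal implementation, which additionally supports regularized variants):\n\nusing LinearAlgebra\n# normal equations for C = S * G; S'S is symmetric positive (semi-)definite,\n# which is exactly the structure a Cholesky-based solver exploits\nG_ls = (S' * S) \\ (S' * Matrix(cue_obj.C))\n\n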
We use Cholesky decomposition to solve this equation:","category":"page"},{"location":"","page":"Home","title":"Home","text":"G = JudiLing.make_transform_matrix(S, cue_obj.C)","category":"page"},{"location":"","page":"Home","title":"Home","text":"Then, we can make our predicted C matrix Chat:","category":"page"},{"location":"","page":"Home","title":"Home","text":"Chat = S * G","category":"page"},{"location":"","page":"Home","title":"Home","text":"and evaluate the model's prediction accuracy:","category":"page"},{"location":"","page":"Home","title":"Home","text":"@show JudiLing.eval_SC(Chat, cue_obj.C)","category":"page"},{"location":"","page":"Home","title":"Home","text":"Output:","category":"page"},{"location":"","page":"Home","title":"Home","text":"JudiLing.eval_SC(Chat, cue_obj.C) = 0.9926","category":"page"},{"location":"","page":"Home","title":"Home","text":"NOTE: Accuracy may be different depending on the simulated semantic matrix.","category":"page"},{"location":"","page":"Home","title":"Home","text":"Similar to G and Chat, we can solve S = CF:","category":"page"},{"location":"","page":"Home","title":"Home","text":"F = JudiLing.make_transform_matrix(cue_obj.C, S)","category":"page"},{"location":"","page":"Home","title":"Home","text":"and we then calculate the Shat matrix and evaluate comprehension accuracy:","category":"page"},{"location":"","page":"Home","title":"Home","text":"Shat = cue_obj.C * F\n@show JudiLing.eval_SC(Shat, S)","category":"page"},{"location":"","page":"Home","title":"Home","text":"Output:","category":"page"},{"location":"","page":"Home","title":"Home","text":"JudiLing.eval_SC(Shat, S) = 0.9911","category":"page"},{"location":"","page":"Home","title":"Home","text":"NOTE: Accuracy may be different depending on the simulated semantic matrix.","category":"page"},{"location":"","page":"Home","title":"Home","text":"To model speech production, the proper triphones have to be selected and put into the right order. We have two algorithms that accomplish this. Both algorithms construct paths in a triphone space that start with word-initial triphones and end with word-final triphones.","category":"page"},{"location":"","page":"Home","title":"Home","text":"The first step is to construct an adjacency matrix that specifies which triphones can follow each other. In this example, we use the adjacency matrix constructed by make_cue_matrix, but we can also make use of an independently constructed adjacency matrix if required.","category":"page"},{"location":"","page":"Home","title":"Home","text":"A = cue_obj.A","category":"page"},{"location":"","page":"Home","title":"Home","text":"For our sequencing algorithms, we calculate the number of timesteps they need. For the Latin dataset, the max timestep is equal to the length of the longest word. The argument :Word specifies the column in the Latin dataset that lists the words' forms.","category":"page"},{"location":"","page":"Home","title":"Home","text":"max_t = JudiLing.cal_max_timestep(latin, :Word)","category":"page"},{"location":"","page":"Home","title":"Home","text":"One sequence-finding algorithm uses discriminative learning for the position of triphones. 
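This algorithm is implemented in the learn_paths function. 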
This function returns two lists, one with candidate triphone paths and their positional learning support (res) and one with the semantic supports for the gold paths (gpi).","category":"page"},{"location":"","page":"Home","title":"Home","text":"res_learn, gpi_learn = JudiLing.learn_paths(\n latin,\n latin,\n cue_obj.C,\n S,\n F,\n Chat,\n A,\n cue_obj.i2f,\n cue_obj.f2i, # api changed in 0.3.1\n check_gold_path = true,\n gold_ind = cue_obj.gold_ind,\n Shat_val = Shat,\n max_t = max_t,\n max_can = 10,\n grams = 3,\n threshold = 0.05,\n tokenized = false,\n keep_sep = false,\n target_col = :Word,\n verbose = true\n)","category":"page"},{"location":"","page":"Home","title":"Home","text":"We evaluate the accuracy on the training data as follows:","category":"page"},{"location":"","page":"Home","title":"Home","text":"acc_learn = JudiLing.eval_acc(res_learn, cue_obj.gold_ind, verbose = false)\n\nprintln(\"Acc for learn: $acc_learn\")","category":"page"},{"location":"","page":"Home","title":"Home","text":"Acc for learn: 0.9985","category":"page"},{"location":"","page":"Home","title":"Home","text":"The second sequence-finding algorithm is usually faster than the first, but does not provide positional learnability estimates.","category":"page"},{"location":"","page":"Home","title":"Home","text":"res_build = JudiLing.build_paths(\n latin,\n cue_obj.C,\n S,\n F,\n Chat,\n A,\n cue_obj.i2f,\n cue_obj.gold_ind,\n max_t=max_t,\n n_neighbors=3,\n verbose=true\n )\n\nacc_build = JudiLing.eval_acc(\n res_build,\n cue_obj.gold_ind,\n verbose=false\n)","category":"page"},{"location":"","page":"Home","title":"Home","text":"Acc for build: 0.9955","category":"page"},{"location":"","page":"Home","title":"Home","text":"After having obtained results from the sequencing functions learn_paths or build_paths, we can save them either to a CSV file or to a dataframe; the dataframe can be loaded into R with the rput command of the RCall package.","category":"page"},{"location":"","page":"Home","title":"Home","text":"JudiLing.write2csv(\n res_learn,\n latin,\n cue_obj,\n cue_obj,\n \"latin_learn_res.csv\",\n grams = 3,\n tokenized = false,\n sep_token = nothing,\n start_end_token = \"#\",\n output_sep_token = \"\",\n path_sep_token = \":\",\n target_col = :Word,\n root_dir = @__DIR__,\n output_dir = \"latin_out\"\n)\n\ndf_learn = JudiLing.write2df(\n res_learn,\n latin,\n cue_obj,\n cue_obj,\n grams = 3,\n tokenized = false,\n sep_token = nothing,\n start_end_token = \"#\",\n output_sep_token = \"\",\n path_sep_token = \":\",\n target_col = :Word\n)\n\nJudiLing.write2csv(\n res_build,\n latin,\n cue_obj,\n cue_obj,\n \"latin_build_res.csv\",\n grams = 3,\n tokenized = false,\n sep_token = nothing,\n start_end_token = \"#\",\n output_sep_token = \"\",\n path_sep_token = \":\",\n target_col = :Word,\n root_dir = @__DIR__,\n output_dir = \"latin_out\"\n)\n\ndf_build = JudiLing.write2df(\n res_build,\n latin,\n cue_obj,\n cue_obj,\n grams = 3,\n tokenized = false,\n sep_token = nothing,\n start_end_token = \"#\",\n output_sep_token = \"\",\n path_sep_token = \":\",\n target_col = :Word\n)\n\ndisplay(df_learn)\ndisplay(df_build)","category":"page"},{"location":"","page":"Home","title":"Home","text":"3805×9 DataFrame. Omitted printing of 5 columns\n│ Row │ utterance │ identifier │ path │ pred │\n│ │ Int64? │ String? │ Union{Missing, String} │ String? 
│\n├──────┼───────────┼────────────────┼─────────────────────────────────────────────────────────┼────────────────┤\n│ 1 │ 1 │ vocoo │ #vo:voc:oco:coo:oo# │ vocoo │\n│ 2 │ 2 │ vocaas │ #vo:voc:oca:caa:aas:as# │ vocaas │\n│ 3 │ 2 │ vocaas │ #vo:voc:oca:caa:aab:aba:baa:aas:as# │ vocaabaas │\n│ 4 │ 2 │ vocaas │ #vo:voc:oca:caa:aat:ati:tis:is# │ vocaatis │\n│ 5 │ 2 │ vocaas │ #vo:voc:oca:caa:aav:avi:vis:ist:sti:tis:is# │ vocaavistis │\n│ 6 │ 2 │ vocaas │ #vo:voc:oca:caa:aam:amu:mus:us# │ vocaamus │\n│ 7 │ 2 │ vocaas │ #vo:voc:oca:caa:aab:abi:bit:it# │ vocaabit │\n│ 8 │ 2 │ vocaas │ #vo:voc:oca:caa:aam:amu:mur:ur# │ vocaamur │\n│ 9 │ 2 │ vocaas │ #vo:voc:oca:caa:aar:are:ret:et# │ vocaaret │\n⋮\n│ 3796 │ 671 │ cuccurisseetis │ #cu:cuc:ucc:ccu:cur:ure:ree:eet:eti:tis:is# │ cuccureetis │\n│ 3797 │ 671 │ cuccurisseetis │ #cu:cuc:ucc:ccu:cur:uri:ris:ist:sti:tis:is# │ cuccuristis │\n│ 3798 │ 671 │ cuccurisseetis │ #cu:cuc:ucc:ccu:cur:uri:ris:iss:sse:set:et# │ cuccurisset │\n│ 3799 │ 671 │ cuccurisseetis │ #cu:cur:urr:rri:rim:imi:min:ini:nii:ii# │ curriminii │\n│ 3800 │ 672 │ cuccurissent │ #cu:cuc:ucc:ccu:cur:uri:ris:iss:sse:sen:ent:nt# │ cuccurissent │\n│ 3801 │ 672 │ cuccurissent │ #cu:cur:urr:rre:rer:ere:ren:ent:nt# │ currerent │\n│ 3802 │ 672 │ cuccurissent │ #cu:cuc:ucc:ccu:cur:uri:ris:iss:sse:see:eem:emu:mus:us# │ cuccurisseemus │\n│ 3803 │ 672 │ cuccurissent │ #cu:cuc:ucc:ccu:cur:uri:ris:iss:sse:see:eet:eti:tis:is# │ cuccurisseetis │\n│ 3804 │ 672 │ cuccurissent │ #cu:cur:urr:rre:rer:ere:ren:ent:ntu:tur:ur# │ currerentur │\n│ 3805 │ 672 │ cuccurissent │ #cu:cuc:ucc:ccu:cur:uri:ris:iss:sse:see:ees:es# │ cuccurissees │\n2519×9 DataFrame. Omitted printing of 4 columns\n│ Row │ utterance │ identifier │ path │ pred │ num_tolerance │\n│ │ Int64? │ String? │ Union{Missing, String} │ String? │ Int64? 
│\n├──────┼───────────┼────────────────┼─────────────────────────────────────────────────┼──────────────┼───────────────┤\n│ 1 │ 1 │ vocoo │ #vo:voc:oco:coo:oo# │ vocoo │ 0 │\n│ 2 │ 1 │ vocoo │ #vo:voc:oca:caa:aab:abo:boo:oo# │ vocaaboo │ 0 │\n│ 3 │ 1 │ vocoo │ #vo:voc:oca:caa:aab:aba:bam:am# │ vocaabam │ 0 │\n│ 4 │ 2 │ vocaas │ #vo:voc:oca:caa:aas:as# │ vocaas │ 0 │\n│ 5 │ 2 │ vocaas │ #vo:voc:oca:caa:aab:abi:bis:is# │ vocaabis │ 0 │\n│ 6 │ 2 │ vocaas │ #vo:voc:oca:caa:aat:ati:tis:is# │ vocaatis │ 0 │\n│ 7 │ 3 │ vocat │ #vo:voc:oca:cat:at# │ vocat │ 0 │\n│ 8 │ 3 │ vocat │ #vo:voc:oca:caa:aab:aba:bat:at# │ vocaabat │ 0 │\n│ 9 │ 3 │ vocat │ #vo:voc:oca:caa:aas:as# │ vocaas │ 0 │\n⋮\n│ 2510 │ 671 │ cuccurisseetis │ #cu:cur:uri:ris:iss:sse:see:ees:es# │ curissees │ 0 │\n│ 2511 │ 671 │ cuccurisseetis │ #cu:cur:uri:ris:iss:sse:see:eem:emu:mus:us# │ curisseemus │ 0 │\n│ 2512 │ 671 │ cuccurisseetis │ #cu:cur:uri:ris:is# │ curis │ 0 │\n│ 2513 │ 671 │ cuccurisseetis │ #cu:cuc:ucc:ccu:cur:uri:ris:is# │ cuccuris │ 0 │\n│ 2514 │ 672 │ cuccurissent │ #cu:cuc:ucc:ccu:cur:uri:ris:iss:sse:sen:ent:nt# │ cuccurissent │ 0 │\n│ 2515 │ 672 │ cuccurissent │ #cu:cur:uri:ris:iss:sse:sen:ent:nt# │ curissent │ 0 │\n│ 2516 │ 672 │ cuccurissent │ #cu:cuc:ucc:ccu:cur:uri:ris:iss:sse:set:et# │ cuccurisset │ 0 │\n│ 2517 │ 672 │ cuccurissent │ #cu:cur:uri:ris:iss:sse:set:et# │ curisset │ 0 │\n│ 2518 │ 672 │ cuccurissent │ #cu:cuc:ucc:ccu:cur:uri:ris:iss:sse:sem:em# │ cuccurissem │ 0 │\n│ 2519 │ 672 │ cuccurissent │ #cu:cur:uri:ris:iss:sse:sem:em# │ curissem │ 0 │","category":"page"},{"location":"#Cross-validation","page":"Home","title":"Cross-validation","text":"","category":"section"},{"location":"","page":"Home","title":"Home","text":"The model also provides functionality for cross-validation. Here, we first split the dataset randomly into 90% training and 10% validation data:","category":"page"},{"location":"","page":"Home","title":"Home","text":"latin_train, latin_val = JudiLing.loading_data_randomly_split(\"latin.csv\",\n \"data\",\n \"latin\",\n val_ratio=0.1,\n random_seed=42)","category":"page"},{"location":"","page":"Home","title":"Home","text":"Then, we make the C matrix by passing both training and validation datasets to the make_combined_cue_matrix function which ensures that the C matrix contains columns for both training and validation data.","category":"page"},{"location":"","page":"Home","title":"Home","text":"cue_obj_train, cue_obj_val = JudiLing.make_combined_cue_matrix(\n latin_train,\n latin_val,\n grams = 3,\n target_col = :Word,\n tokenized = false,\n keep_sep = false\n)","category":"page"},{"location":"","page":"Home","title":"Home","text":"Next, we simulate semantic vectors, again for both the training and validation data, using make_combined_S_matrix:","category":"page"},{"location":"","page":"Home","title":"Home","text":"n_features = size(cue_obj_train.C, 2)\nS_train, S_val = JudiLing.make_combined_S_matrix(\n latin_train,\n latin_val,\n [\"Lexeme\"],\n [\"Person\", \"Number\", \"Tense\", \"Voice\", \"Mood\"],\n ncol = n_features\n)","category":"page"},{"location":"","page":"Home","title":"Home","text":"After that, we make the transformation matrices, but this time we only use the training dataset. 
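This mirrors a real generalization test: the validation words must be predicted with matrices estimated from the training data alone. 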
We use these transformation matrices to predict the validation dataset.","category":"page"},{"location":"","page":"Home","title":"Home","text":"G_train = JudiLing.make_transform_matrix(S_train, cue_obj_train.C)\nF_train = JudiLing.make_transform_matrix(cue_obj_train.C, S_train)\n\nChat_train = S_train * G_train\nChat_val = S_val * G_train\nShat_train = cue_obj_train.C * F_train\nShat_val = cue_obj_val.C * F_train\n\n@show JudiLing.eval_SC(Chat_train, cue_obj_train.C)\n@show JudiLing.eval_SC(Chat_val, cue_obj_val.C)\n@show JudiLing.eval_SC(Shat_train, S_train)\n@show JudiLing.eval_SC(Shat_val, S_val)","category":"page"},{"location":"","page":"Home","title":"Home","text":"Output:","category":"page"},{"location":"","page":"Home","title":"Home","text":"JudiLing.eval_SC(Chat_train, cue_obj_train.C) = 0.995\nJudiLing.eval_SC(Chat_val, cue_obj_val.C) = 0.403\nJudiLing.eval_SC(Shat_train, S_train) = 0.9917\nJudiLing.eval_SC(Shat_val, S_val) = 1.0","category":"page"},{"location":"","page":"Home","title":"Home","text":"Finally, we can find possible paths through build_paths or learn_paths. Since validation datasets are harder to predict, we turn on tolerant mode, which allows the algorithms to find more paths, but at the cost of more computation time.","category":"page"},{"location":"","page":"Home","title":"Home","text":"A = cue_obj_train.A\nmax_t = JudiLing.cal_max_timestep(latin_train, latin_val, :Word)\n\nres_learn_train, gpi_learn_train = JudiLing.learn_paths(\n latin_train,\n latin_train,\n cue_obj_train.C,\n S_train,\n F_train,\n Chat_train,\n A,\n cue_obj_train.i2f,\n cue_obj_train.f2i, # api changed in 0.3.1\n gold_ind = cue_obj_train.gold_ind,\n Shat_val = Shat_train,\n check_gold_path = true,\n max_t = max_t,\n max_can = 10,\n grams = 3,\n threshold = 0.05,\n tokenized = false,\n sep_token = \"_\",\n keep_sep = false,\n target_col = :Word,\n issparse = :dense,\n verbose = true,\n)\n\nres_learn_val, gpi_learn_val = JudiLing.learn_paths(\n latin_train,\n latin_val,\n cue_obj_train.C,\n S_val,\n F_train,\n Chat_val,\n A,\n cue_obj_train.i2f,\n cue_obj_train.f2i, # api changed in 0.3.1\n gold_ind = cue_obj_val.gold_ind,\n Shat_val = Shat_val,\n check_gold_path = true,\n max_t = max_t,\n max_can = 10,\n grams = 3,\n threshold = 0.05,\n is_tolerant = true,\n tolerance = -0.1,\n max_tolerance = 2,\n tokenized = false,\n sep_token = \"-\",\n keep_sep = false,\n target_col = :Word,\n issparse = :dense,\n verbose = true,\n)\n\nacc_learn_train =\n JudiLing.eval_acc(res_learn_train, cue_obj_train.gold_ind, verbose = false)\nacc_learn_val = JudiLing.eval_acc(res_learn_val, cue_obj_val.gold_ind, verbose = false)\n\nres_build_train = JudiLing.build_paths(\n latin_train,\n cue_obj_train.C,\n S_train,\n F_train,\n Chat_train,\n A,\n cue_obj_train.i2f,\n cue_obj_train.gold_ind,\n max_t = max_t,\n n_neighbors = 3,\n verbose = true,\n)\n\nres_build_val = JudiLing.build_paths(\n latin_val,\n cue_obj_train.C,\n S_val,\n F_train,\n Chat_val,\n A,\n cue_obj_train.i2f,\n cue_obj_train.gold_ind,\n max_t = max_t,\n n_neighbors = 20,\n verbose = true,\n)\n\nacc_build_train =\n JudiLing.eval_acc(res_build_train, cue_obj_train.gold_ind, verbose = false)\nacc_build_val = JudiLing.eval_acc(res_build_val, cue_obj_val.gold_ind, verbose = false)\n\n@show acc_learn_train\n@show acc_learn_val\n@show acc_build_train\n@show acc_build_val","category":"page"},{"location":"","page":"Home","title":"Home","text":"Output:","category":"page"},{"location":"","page":"Home","title":"Home","text":"acc_learn_train = 0.9983\nacc_learn_val = 
0.6866\nacc_build_train = 1.0\nacc_build_val = 0.3284","category":"page"},{"location":"","page":"Home","title":"Home","text":"Alternatively, we provide a wrapper function incorporating all of the above functionality. With this function, you can quickly explore datasets with different parameter settings. More details can be found in the Test Combo Introduction.","category":"page"},{"location":"#Supports","page":"Home","title":"Supports","text":"","category":"section"},{"location":"","page":"Home","title":"Home","text":"There are two types of support in the output: an utterance-level support and a set of supports for each cue. The former is also called \"synthesis-by-analysis\" support; it is calculated from the predicted and original S vectors and is used to select the best paths. Cue-level supports are slices of the Yt matrices at each timestep; they are used to determine whether a cue is eligible for constructing paths.","category":"page"},{"location":"#Acknowledgments","page":"Home","title":"Acknowledgments","text":"","category":"section"},{"location":"","page":"Home","title":"Home","text":"This project was supported by the ERC advanced grant WIDE-742545 and by the Deutsche Forschungsgemeinschaft (DFG, German Research Foundation) under Germany’s Excellence Strategy - EXC number 2064/1 - Project number 390727645.","category":"page"},{"location":"#Citation","page":"Home","title":"Citation","text":"","category":"section"},{"location":"","page":"Home","title":"Home","text":"If you find this package helpful, please cite it as follows:","category":"page"},{"location":"","page":"Home","title":"Home","text":"Luo, X., Heitmeier, M., Chuang, Y. Y., Baayen, R. H. JudiLing: an implementation of the Discriminative Lexicon Model in Julia. Eberhard Karls Universität Tübingen, Seminar für Sprachwissenschaft.","category":"page"},{"location":"","page":"Home","title":"Home","text":"The following studies made use of several algorithms that are now implemented in JudiLing rather than in WpmWithLdl:","category":"page"},{"location":"","page":"Home","title":"Home","text":"Baayen, R. H., Chuang, Y. Y., Shafaei-Bajestan, E., and Blevins, J. P. (2019). The discriminative lexicon: A unified computational model for the lexicon and lexical processing in comprehension and production grounded not in (de)composition but in linear discriminative learning. Complexity, 2019, 1-39.\nBaayen, R. H., Chuang, Y. Y., and Blevins, J. P. (2018). Inflectional morphology with linear mappings. The Mental Lexicon, 13 (2), 232-270.\nChuang, Y.-Y., Lõo, K., Blevins, J. P., and Baayen, R. H. (2020). Estonian case inflection made simple. A case study in Word and Paradigm morphology with Linear Discriminative Learning. In Körtvélyessy, L., and Štekauer, P. (Eds.) Complex Words: Advances in Morphology, 1-19.\nChuang, Y-Y., Bell, M. J., Banke, I., and Baayen, R. H. (2020). Bilingual and multilingual mental lexicon: a modeling study with Linear Discriminative Learning. Language Learning, 1-55.\nHeitmeier, M., Chuang, Y-Y., Baayen, R. H. (2021). Modeling morphology with Linear Discriminative Learning: considerations and design choices. 
Frontiers in Psychology, 12, 4929.\nDenistia, K., and Baayen, R. H. (2022). The morphology of Indonesian: Data and quantitative modeling. In Shei, C., and Li, S. (Eds.) The Routledge Handbook of Asian Linguistics, (pp. 605-634). Routledge, London.\nHeitmeier, M., Chuang, Y.-Y., and Baayen, R. H. (2023). How trial-to-trial learning shapes mappings in the mental lexicon: Modelling lexical decision with linear discriminative learning. Cognitive Psychology, 1-30.\nChuang, Y. Y., Kang, M., Luo, X. F. and Baayen, R. H. (2023). Vector Space Morphology with Linear Discriminative Learning. In Crepaldi, D. (Ed.) Linguistic morphology in the mind and brain.\nHeitmeier, M., Chuang, Y. Y., Axen, S. D., & Baayen, R. H. (2024). Frequency effects in linear discriminative learning. Frontiers in Human Neuroscience, 17, 1242720.\nPlag, I., Heitmeier, M. & Domahs, F. (to appear). German nominal number interpretation in an impaired mental lexicon: A naive discriminative learning perspective. The Mental Lexicon.","category":"page"},{"location":"man/make_cue_matrix/","page":"Make Cue Matrix","title":"Make Cue Matrix","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/make_cue_matrix/#Make-Cue-Matrix","page":"Make Cue Matrix","title":"Make Cue Matrix","text":"","category":"section"},{"location":"man/make_cue_matrix/","page":"Make Cue Matrix","title":"Make Cue Matrix","text":" Cue_Matrix_Struct\n make_cue_matrix\n make_combined_cue_matrix\n make_ngrams\n make_cue_matrix(data::DataFrame)\n make_cue_matrix(data::DataFrame, cue_obj::Cue_Matrix_Struct)\n make_cue_matrix(data_train::DataFrame, data_val::DataFrame)\n make_combined_cue_matrix(data_train, data_val)\n make_cue_matrix_from_CFBS(features::Vector{Vector{T}};\n pad_val::T = 0.,\n ncol::Union{Missing,Int}=missing) where {T}\n make_combined_cue_matrix_from_CFBS(features_train::Vector{Vector{T}},\n features_test::Vector{Vector{T}};\n pad_val::T = 0.,\n ncol::Union{Missing,Int}=missing) where {T}\n make_ngrams(tokens, grams, keep_sep, sep_token, start_end_token)","category":"page"},{"location":"man/make_cue_matrix/#JudiLing.Cue_Matrix_Struct","page":"Make Cue Matrix","title":"JudiLing.Cue_Matrix_Struct","text":"A structure that stores information created by make_cue_matrix: C is the cue matrix; f2i is a dictionary returning the indices for features; i2f is a dictionary returning the features for indices; gold_ind is a list of indices of gold paths; A is the adjacency matrix; grams is the number of grams for cues; target_col is the column name for target strings; tokenized is whether the dataset target is tokenized; sep_token is the separator; keep_sep is whether to keep separators in cues; start_end_token is the start and end token in boundary cues.\n\n\n\n\n\n","category":"type"},{"location":"man/make_cue_matrix/#JudiLing.make_cue_matrix","page":"Make Cue Matrix","title":"JudiLing.make_cue_matrix","text":"Construct the cue matrix.\n\n\n\n\n\n","category":"function"},{"location":"man/make_cue_matrix/#JudiLing.make_combined_cue_matrix","page":"Make Cue Matrix","title":"JudiLing.make_combined_cue_matrix","text":"Construct the cue matrix, combining features and adjacencies for both training and validation datasets.\n\n\n\n\n\n","category":"function"},{"location":"man/make_cue_matrix/#JudiLing.make_ngrams","page":"Make Cue Matrix","title":"JudiLing.make_ngrams","text":"Given a list of string tokens, extract their 
n-grams.\n\n\n\n\n\n","category":"function"},{"location":"man/make_cue_matrix/#JudiLing.make_cue_matrix-Tuple{DataFrames.DataFrame}","page":"Make Cue Matrix","title":"JudiLing.make_cue_matrix","text":"make_cue_matrix(data::DataFrame)\n\nMake the cue matrix for training datasets and corresponding indices as well as the adjacency matrix and gold paths given a dataset in a form of dataframe.\n\nObligatory Arguments\n\ndata::DataFrame: the dataset\n\nOptional Arguments\n\ngrams::Int64=3: the number of grams for cues\ntarget_col::Union{String, Symbol}=:Words: the column name for target strings\ntokenized::Bool=false:if true, the dataset target is assumed to be tokenized\nsep_token::Union{Nothing, String, Char}=nothing: separator\nkeep_sep::Bool=false: if true, keep separators in cues\nstart_end_token::Union{String, Char}=\"#\": start and end token in boundary cues\nverbose::Bool=false: if true, more information is printed\n\nExamples\n\n# make cue matrix without tokenization\ncue_obj_train = JudiLing.make_cue_matrix(\n latin_train,\n grams=3,\n target_col=:Word,\n tokenized=false,\n sep_token=\"-\",\n start_end_token=\"#\",\n keep_sep=false,\n verbose=false\n )\n\n# make cue matrix with tokenization\ncue_obj_train = JudiLing.make_cue_matrix(\n french_train,\n grams=3,\n target_col=:Syllables,\n tokenized=true,\n sep_token=\"-\",\n start_end_token=\"#\",\n keep_sep=true,\n verbose=false\n )\n\n\n\n\n\n","category":"method"},{"location":"man/make_cue_matrix/#JudiLing.make_cue_matrix-Tuple{DataFrames.DataFrame, JudiLing.Cue_Matrix_Struct}","page":"Make Cue Matrix","title":"JudiLing.make_cue_matrix","text":"make_cue_matrix(data::DataFrame, cue_obj::Cue_Matrix_Struct)\n\nMake the cue matrix for validation datasets and corresponding indices as well as the adjacency matrix and gold paths given a dataset in a form of dataframe.\n\nObligatory Arguments\n\ndata::DataFrame: the dataset\ncue_obj::Cue_Matrix_Struct: training cue object\n\nOptional Arguments\n\ngrams::Int64=3: the number of grams for cues\ntarget_col::Union{String, Symbol}=:Words: the column name for target strings\ntokenized::Bool=false:if true, the dataset target is assumed to be tokenized\nsep_token::Union{Nothing, String, Char}=nothing: separator\nkeep_sep::Bool=false: if true, keep separators in cues\nstart_end_token::Union{String, Char}=\"#\": start and end token in boundary cues\nverbose::Bool=false: if true, more information is printed\n\nExamples\n\n# make cue matrix without tokenization\ncue_obj_val = JudiLing.make_cue_matrix(\n latin_val,\n cue_obj_train,\n grams=3,\n target_col=:Word,\n tokenized=false,\n sep_token=\"-\",\n keep_sep=false,\n start_end_token=\"#\",\n verbose=false\n )\n\n# make cue matrix with tokenization\ncue_obj_val = JudiLing.make_cue_matrix(\n french_val,\n cue_obj_train,\n grams=3,\n target_col=:Syllables,\n tokenized=true,\n sep_token=\"-\",\n keep_sep=true,\n start_end_token=\"#\",\n verbose=false\n )\n\n\n\n\n\n","category":"method"},{"location":"man/make_cue_matrix/#JudiLing.make_cue_matrix-Tuple{DataFrames.DataFrame, DataFrames.DataFrame}","page":"Make Cue Matrix","title":"JudiLing.make_cue_matrix","text":"make_cue_matrix(data_train::DataFrame, data_val::DataFrame)\n\nMake the cue matrix for traiing and validation datasets at the same time.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\n\nOptional Arguments\n\ngrams::Int64=3: the number of grams for cues\ntarget_col::Union{String, Symbol}=:Words: the column name for target 
strings\ntokenized::Bool=false: if true, the dataset target is assumed to be tokenized\nsep_token::Union{Nothing, String, Char}=nothing: separator\nkeep_sep::Bool=false: if true, keep separators in cues\nstart_end_token::Union{String, Char}=\"#\": start and end token in boundary cues\nverbose::Bool=false: if true, more information is printed\n\nExamples\n\n# make cue matrix without tokenization\ncue_obj_train, cue_obj_val = JudiLing.make_cue_matrix(\n latin_train,\n latin_val,\n grams=3,\n target_col=:Word,\n tokenized=false,\n keep_sep=false\n )\n\n# make cue matrix with tokenization\ncue_obj_train, cue_obj_val = JudiLing.make_cue_matrix(\n french_train,\n french_val,\n grams=3,\n target_col=:Syllables,\n tokenized=true,\n sep_token=\"-\",\n keep_sep=true,\n start_end_token=\"#\",\n verbose=false\n )\n\n\n\n\n\n","category":"method"},{"location":"man/make_cue_matrix/#JudiLing.make_combined_cue_matrix-Tuple{Any, Any}","page":"Make Cue Matrix","title":"JudiLing.make_combined_cue_matrix","text":"make_combined_cue_matrix(data_train, data_val)\n\nMake the cue matrix for training and validation datasets at the same time, where the features and adjacencies are combined.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\n\nOptional Arguments\n\ngrams::Int64=3: the number of grams for cues\ntarget_col::Union{String, Symbol}=:Words: the column name for target strings\ntokenized::Bool=false: if true, the dataset target is assumed to be tokenized\nsep_token::Union{Nothing, String, Char}=nothing: separator\nkeep_sep::Bool=false: if true, keep separators in cues\nstart_end_token::Union{String, Char}=\"#\": start and end token in boundary cues\nverbose::Bool=false: if true, more information is printed\n\nExamples\n\n# make cue matrix without tokenization\ncue_obj_train, cue_obj_val = JudiLing.make_combined_cue_matrix(\n latin_train,\n latin_val,\n grams=3,\n target_col=:Word,\n tokenized=false,\n keep_sep=false\n )\n\n# make cue matrix with tokenization\ncue_obj_train, cue_obj_val = JudiLing.make_combined_cue_matrix(\n french_train,\n french_val,\n grams=3,\n target_col=:Syllables,\n tokenized=true,\n sep_token=\"-\",\n keep_sep=true,\n start_end_token=\"#\",\n verbose=false\n )\n\n\n\n\n\n","category":"method"},{"location":"man/make_cue_matrix/#JudiLing.make_cue_matrix_from_CFBS-Union{Tuple{Array{Vector{T}, 1}}, Tuple{T}} where T","page":"Make Cue Matrix","title":"JudiLing.make_cue_matrix_from_CFBS","text":"make_cue_matrix_from_CFBS(features::Vector{Vector{T}};\n pad_val::T = 0.,\n ncol::Union{Missing,Int}=missing) where {T}\n\nCreate a cue matrix from a vector of feature vectors (usually CFBS vectors). The vectors may (and typically do) have varying lengths; they are consequently padded on the right with the provided pad_val.\n\nObligatory arguments\n\nfeatures::Vector{Vector{T}}: vector of vectors containing C-FBS features\n\nOptional arguments\n\npad_val::T = 0.: Value with which the feature vectors will be padded\nncol::Union{Missing,Int}=missing: Number of columns of the C matrix. 
If not set, it will be set to the maximum number of features\n\nExamples\n\nC = JudiLing.make_cue_matrix_from_CFBS(features)\n\n\n\n\n\n","category":"method"},{"location":"man/make_cue_matrix/#JudiLing.make_combined_cue_matrix_from_CFBS-Union{Tuple{T}, Tuple{Array{Vector{T}, 1}, Array{Vector{T}, 1}}} where T","page":"Make Cue Matrix","title":"JudiLing.make_combined_cue_matrix_from_CFBS","text":"make_combined_cue_matrix_from_CFBS(features_train::Vector{Vector{T}},\n features_test::Vector{Vector{T}};\n pad_val::T = 0.,\n ncol::Union{Missing,Int}=missing) where {T}\n\nCreate cue matrices from two vectors of feature vectors (usually CFBS vectors). The vectors may (and typically do) have varying lengths; they are consequently padded on the right with the provided pad_val. The cue matrices are set to the size of the maximum number of feature values in features_train and features_test.\n\nObligatory arguments\n\nfeatures_train::Vector{Vector{T}}: vector of vectors containing C-FBS features\nfeatures_test::Vector{Vector{T}}: vector of vectors containing C-FBS features\n\nOptional arguments\n\npad_val::T = 0.: Value with which the feature vectors will be padded\nncol::Union{Missing,Int}=missing: Number of columns of the C matrices. If not set, it will be set to the maximum number of features in features_train and features_test\n\nExamples\n\nC_train, C_test = JudiLing.make_combined_cue_matrix_from_CFBS(features_train, features_test)\n\n\n\n\n\n","category":"method"},{"location":"man/make_cue_matrix/#JudiLing.make_ngrams-NTuple{5, Any}","page":"Make Cue Matrix","title":"JudiLing.make_ngrams","text":"make_ngrams(tokens, grams, keep_sep, sep_token, start_end_token)\n\nGiven a list of string tokens, return a list of all n-grams for these tokens.\n\n\n\n\n\n","category":"method"}]
+[{"location":"man/deep_learning/","page":"Deep learning","title":"Deep learning","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/deep_learning/#Deep-learning-in-JudiLing","page":"Deep learning","title":"Deep learning in JudiLing","text":"","category":"section"},{"location":"man/deep_learning/","page":"Deep learning","title":"Deep learning","text":"predict_from_deep_model(model::Flux.Chain,\n X::Union{SparseMatrixCSC,Matrix})\npredict_shat(model::Flux.Chain,\n ci::Vector{Int})\nget_and_train_model(X_train::Union{SparseMatrixCSC,Matrix},\n Y_train::Union{SparseMatrixCSC,Matrix},\n X_val::Union{SparseMatrixCSC,Matrix,Missing},\n Y_val::Union{SparseMatrixCSC,Matrix,Missing},\n data_train::Union{DataFrame,Missing},\n data_val::Union{DataFrame,Missing},\n target_col::Union{Symbol, String,Missing},\n model_outpath::String;\n hidden_dim::Int=1000,\n n_epochs::Int=100,\n batchsize::Int=64,\n loss_func::Function=Flux.mse,\n optimizer=Flux.Adam(0.001),\n model::Union{Missing, Flux.Chain} = missing,\n early_stopping::Union{Missing, Int}=missing,\n optimise_for_acc::Bool=false,\n return_losses::Bool=false,\n verbose::Bool=true,\n measures_func::Union{Missing, Function}=missing,\n return_train_acc::Bool=false,\n kargs...)\nget_and_train_model(X_train::Union{SparseMatrixCSC,Matrix},\n Y_train::Union{SparseMatrixCSC,Matrix},\n model_outpath::String;\n data_train::Union{Missing, DataFrame}=missing,\n target_col::Union{Missing, Symbol, String}=missing,\n hidden_dim::Int=1000,\n n_epochs::Int=100,\n batchsize::Int=64,\n loss_func::Function=Flux.mse,\n optimizer=Flux.Adam(0.001),\n model::Union{Missing, Flux.Chain} = missing,\n return_losses::Bool=false,\n verbose::Bool=true,\n 
measures_func::Union{Missing, Function}=missing,\n return_train_acc::Bool=false,\n kargs...)\nfiddl(X_train::Union{SparseMatrixCSC,Matrix},\n Y_train::Union{SparseMatrixCSC,Matrix},\n learn_seq::Vector,\n data::DataFrame,\n target_col::Union{Symbol, String},\n model_outpath::String;\n hidden_dim::Int=1000,\n batchsize::Int=64,\n loss_func::Function=Flux.mse,\n optimizer=Flux.Adam(0.001),\n model::Union{Missing, Chain} = missing,\n return_losses::Bool=false,\n verbose::Bool=true,\n n_batch_eval::Int=100,\n measures_func::Union{Function, Missing}=missing,\n kargs...)\n","category":"page"},{"location":"man/deep_learning/#JudiLing.predict_from_deep_model-Tuple{Chain, Union{SparseArrays.SparseMatrixCSC, Matrix}}","page":"Deep learning","title":"JudiLing.predict_from_deep_model","text":"predict_from_deep_model(model::Chain,\n X::Union{SparseMatrixCSC,Matrix})\n\nGenerates the output of a model given input X.\n\nObligatory arguments\n\nmodel::Chain: Model of type Flux.Chain, as generated by get_and_train_model\nX::Union{SparseMatrixCSC,Matrix}: Input matrix of size (number_of_samples, inp_dim) where inp_dim is the input dimension of model\n\n\n\n\n\n","category":"method"},{"location":"man/deep_learning/#JudiLing.predict_shat-Tuple{Chain, Vector{Int64}}","page":"Deep learning","title":"JudiLing.predict_shat","text":"predict_shat(model::Chain,\n ci::Vector{Int})\n\nPredicts the semantic vector shat given a deep learning comprehension model model and a list of indices of ngrams ci.\n\nObligatory arguments\n\nmodel::Chain: Deep learning comprehension model as generated by get_and_train_model\nci::Vector{Int}: Vector of indices of ngrams in c vector. Essentially, this is a vector indicating which ngrams in a c vector are absent and which are present.\n\n\n\n\n\n","category":"method"},{"location":"man/deep_learning/#JudiLing.get_and_train_model-Tuple{Union{SparseArrays.SparseMatrixCSC, Matrix}, Union{SparseArrays.SparseMatrixCSC, Matrix}, Union{Missing, SparseArrays.SparseMatrixCSC, Matrix}, Union{Missing, SparseArrays.SparseMatrixCSC, Matrix}, Union{Missing, DataFrames.DataFrame}, Union{Missing, DataFrames.DataFrame}, Union{Missing, String, Symbol}, String}","page":"Deep learning","title":"JudiLing.get_and_train_model","text":"get_and_train_model(X_train::Union{SparseMatrixCSC,Matrix},\n Y_train::Union{SparseMatrixCSC,Matrix},\n X_val::Union{SparseMatrixCSC,Matrix,Missing},\n Y_val::Union{SparseMatrixCSC,Matrix,Missing},\n data_train::Union{DataFrame,Missing},\n data_val::Union{DataFrame,Missing},\n target_col::Union{Symbol,String,Missing},\n model_outpath::String;\n hidden_dim::Int=1000,\n n_epochs::Int=100,\n batchsize::Int=64,\n loss_func::Function=Flux.mse,\n optimizer=Flux.Adam(0.001),\n model::Union{Missing, Chain}=missing,\n early_stopping::Union{Missing, Int}=missing,\n optimise_for_acc::Bool=false,\n return_losses::Bool=false,\n verbose::Bool=true,\n measures_func::Union{Missing, Function}=missing,\n return_train_acc::Bool=false,\n kargs...\n )\n\nTrains a deep learning model from X_train to Y_train, saving the model with either the highest validation accuracy or lowest validation loss (depending on optimise_for_acc) to model_outpath.\n\nThe default model looks like this:\n\ninp_dim = size(X_train, 2)\nout_dim = size(Y_train, 2)\nChain(Dense(inp_dim => hidden_dim, relu), Dense(hidden_dim => out_dim))\n\nAny other model with the same input and output dimensions can be provided to the function with the model argument. 
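For example, a deeper network with two hidden layers could be passed in via the model argument (a hypothetical sketch; the layer sizes are illustrative, only the input and output dimensions are fixed):\n\nusing Flux\ninp_dim = size(X_train, 2)\nout_dim = size(Y_train, 2)\n# any Chain works as long as it maps inp_dim inputs to out_dim outputs\ncustom_model = Chain(Dense(inp_dim => 500, relu),\n Dense(500 => 500, relu),\n Dense(500 => out_dim))\n\n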
The default loss function is mean squared error, but any other loss function can be provided, as long as it fits with the model architecture.\n\nBy default, the Adam optimizer (Kingma and Ba, 2015) with learning rate 0.001 is used. You can provide any other optimizer. If you want to use a different learning rate, e.g. 0.01, provide optimizer=Flux.Adam(0.01). If you do not want to use an optimizer at all, and simply use normal gradient descent, provide optimizer=Descent(0.001), again replacing the learning rate with the learning rate of your preference.\n\nReturns a named tuple with the following values:\n\nmodel: the trained model\ndata_train: the training data, including any measures if computed by measures_func\ndata_val: the validation data, including any measures if computed by measures_func\nlosses_train: The losses of the training data for each epoch.\nlosses_val: The losses of the validation data after each epoch.\naccs_train: The accuracies of the training data after each epoch, if return_train_acc=true.\naccs_val: The accuracies of the validation data after each epoch.\n\nObligatory arguments\n\nX_train::Union{SparseMatrixCSC,Matrix}: training input matrix of dimension m x n\nY_train::Union{SparseMatrixCSC,Matrix}: training output/target matrix of dimension m x k\nX_val::Union{SparseMatrixCSC,Matrix}: validation input matrix of dimension l x n\nY_val::Union{SparseMatrixCSC,Matrix}: validation output/target matrix of dimension l x k\ndata_train::DataFrame: training data\ndata_val::DataFrame: validation data\ntarget_col::Union{Symbol, String}: column with target word forms in data_train and data_val\nmodel_outpath::String: filepath to where final model should be stored (in .bson format)\n\nOptional arguments\n\nhidden_dim::Int=1000: hidden dimension of the model\nn_epochs::Int=100: number of epochs for which the model should be trained\nbatchsize::Int=64: batchsize during training\nloss_func::Function=Flux.mse: Loss function. Per default this is the mse loss, but other options might be a crossentropy loss (Flux.crossentropy). Make sure the model makes sense with the loss function!\noptimizer=Flux.Adam(0.001): optimizer to use for training\nmodel::Union{Missing, Chain} = missing: A custom model can be provided for training. It must correspond to the input and output size of the training and validation data\nearly_stopping::Union{Missing, Int}=missing: If missing, no early stopping is used. Otherwise early_stopping indicates how many epochs have to pass without improvement in validation accuracy before the training is stopped.\noptimise_for_acc::Bool=false: if true, keep model with highest validation accuracy. If false, keep model with lowest validation loss.\nreturn_losses::Bool=false: whether, in addition to the model, per-epoch losses for the training and test data as well as per-epoch accuracy on the validation data should be returned\nverbose::Bool=true: Turn on verbose mode\nmeasures_func::Union{Missing, Function}=missing: A measures function which is run at the end of every epoch. For more information see The measures_func argument. 
If a measure is tagged for each epoch, the one tagged with \"final\" refers to the model that is finally returned.\nreturn_train_acc::Bool=false: If true, a vector with training accuracies is returned at the end of the training.\nkargs...: any additional keyword arguments are passed to the measures_func\n\n\n\n\n\n","category":"method"},{"location":"man/deep_learning/#JudiLing.get_and_train_model-Tuple{Union{SparseArrays.SparseMatrixCSC, Matrix}, Union{SparseArrays.SparseMatrixCSC, Matrix}, String}","page":"Deep learning","title":"JudiLing.get_and_train_model","text":"get_and_train_model(X_train::Union{SparseMatrixCSC,Matrix},\n Y_train::Union{SparseMatrixCSC,Matrix},\n model_outpath::String;\n data_train::Union{Missing, DataFrame}=missing,\n target_col::Union{Missing, Symbol, String}=missing,\n hidden_dim::Int=1000,\n n_epochs::Int=100,\n batchsize::Int=64,\n loss_func::Function=Flux.mse,\n optimizer=Flux.Adam(0.001),\n model::Union{Missing, Chain} = missing,\n return_losses::Bool=false,\n verbose::Bool=true,\n measures_func::Union{Missing, Function}=missing,\n return_train_acc::Bool=false,\n kargs...)\n\nTrains a deep learning model from X_train to Y_train, saving the model after n_epochs epochs. The default model looks like this:\n\ninp_dim = size(X_train, 2)\nout_dim = size(Y_train, 2)\nChain(Dense(inp_dim => hidden_dim, relu), Dense(hidden_dim => out_dim))\n\nAny other model with the same input and output dimensions can be provided to the function with the model argument. The default loss function is mean squared error, but any other loss function can be provided, as long as it fits with the model architecture.\n\nBy default, the Adam optimizer (Kingma and Ba, 2015) with learning rate 0.001 is used. You can provide any other optimizer. If you want to use a different learning rate, e.g. 0.01, provide optimizer=Flux.Adam(0.01). If you do not want to use an optimizer at all, and simply use normal gradient descent, provide optimizer=Descent(0.001), again replacing the learning rate with the learning rate of your preference.\n\nReturns a named tuple with the following values:\n\nmodel: the trained model\ndata_train: the data, including any measures if computed by measures_func\ndata_val: missing for this function\nlosses_train: The losses of the training data for each epoch.\nlosses_val: missing for this function\naccs_train: The accuracies of the training data after each epoch, if return_train_acc=true.\naccs_val: missing for this function\n\nObligatory arguments\n\nX_train::Union{SparseMatrixCSC,Matrix}: training input matrix of dimension m x n\nY_train::Union{SparseMatrixCSC,Matrix}: training output/target matrix of dimension m x k\nmodel_outpath::String: filepath to where final model should be stored (in .bson format)\n\nOptional arguments\n\ndata_train::Union{Missing, DataFrame}=missing: The training data. Only necessary if a measures_func is included or return_train_acc=true.\ntarget_col::Union{Missing, Symbol, String}=missing: The column with target word forms in the training data. Only necessary if a measures_func is included or return_train_acc=true.\nhidden_dim::Int=1000: hidden dimension of the model\nn_epochs::Int=100: number of epochs for which the model should be trained\nbatchsize::Int=64: batch size during training\nloss_func::Function=Flux.mse: Loss function. Per default this is the mse loss, but other options might be a crossentropy loss (Flux.crossentropy). 
Make sure the model makes sense with the loss function!\noptimizer=Flux.Adam(0.001): optimizer to use for training\nmodel::Union{Missing, Chain} = missing: A custom model can be provided for training. It has to correspond to the input and output sizes of the training data\nreturn_losses::Bool=false: whether, in addition to the model, the per-epoch losses for the training data should be returned\nverbose::Bool=true: Turn on verbose mode\nmeasures_func::Union{Missing, Function}=missing: A measures function which is run at the end of every epoch. For more information see The measures_func argument.\nreturn_train_acc::Bool=false: If true, a vector with training accuracies is returned at the end of the training.\nkargs...: any additional keyword arguments are passed to the measures_func\n\n\n\n\n\n","category":"method"},{"location":"man/deep_learning/#JudiLing.fiddl-Tuple{Union{SparseArrays.SparseMatrixCSC, Matrix}, Union{SparseArrays.SparseMatrixCSC, Matrix}, Vector, DataFrames.DataFrame, Union{String, Symbol}, String}","page":"Deep learning","title":"JudiLing.fiddl","text":"fiddl(X_train::Union{SparseMatrixCSC,Matrix},\n Y_train::Union{SparseMatrixCSC,Matrix},\n learn_seq::Vector,\n data::DataFrame,\n target_col::Union{Symbol, String},\n model_outpath::String;\n hidden_dim::Int=1000,\n batchsize::Int=64,\n loss_func::Function=Flux.mse,\n optimizer=Flux.Adam(0.001),\n model::Union{Missing, Chain} = missing,\n return_losses::Bool=false,\n verbose::Bool=true,\n n_batch_eval::Int=100,\n compute_accuracy::Bool=true,\n measures_func::Union{Function, Missing}=missing,\n kargs...)\n\nTrains a deep learning model using the FIDDL method (frequency-informed deep discriminative learning). Optionally, after every n_batch_eval batches measures_func can be run to compute any measures which are then added to the data.\n\nnote: Note\nIf you get an OutOfMemory error, chances are that this is due to the eval_SC function being evaluated after every n_batch_eval batches. Setting compute_accuracy=false disables computing the mapping accuracy.\n\nReturns a named tuple with the following values:\n\nmodel: the trained model\ndata: the data, including any measures if computed by measures_func\nlosses_train: The losses of the data the model is trained on, computed over each window of n_batch_eval batches.\nlosses: The losses of the full dataset after every n_batch_eval batches.\naccs: The accuracies of the full dataset after every n_batch_eval batches.\n\nObligatory arguments\n\nX_train::Union{SparseMatrixCSC,Matrix}: training input matrix of dimension m x n\nY_train::Union{SparseMatrixCSC,Matrix}: training output/target matrix of dimension m x k\nlearn_seq::Vector: List of indices in the order that the vectors in X_train and Y_train should be presented to the model for training.\ndata::DataFrame: The full data.\ntarget_col::Union{Symbol, String}: The column with target word forms in the data.\nmodel_outpath::String: filepath to where final model should be stored (in .bson format)\n\nOptional arguments\n\nhidden_dim::Int=1000: hidden dimension of the model\nbatchsize::Int=64: batch size during training\nloss_func::Function=Flux.mse: Loss function. Per default this is the mse loss, but other options might be a crossentropy loss (Flux.crossentropy). 
Make sure the model makes sense with the loss function!\noptimizer=Flux.Adam(0.001): optimizer to use for training\nmodel::Union{Missing, Chain} = missing: A custom model can be provided for training. It has to correspond to the input and output sizes of the training data\nreturn_losses::Bool=false: whether, in addition to the model, the losses and accuracies computed every n_batch_eval batches should be returned\nverbose::Bool=true: Turn on verbose mode\nn_batch_eval::Int=100: Loss, accuracy and measures_func are evaluated every n_batch_eval batches.\ncompute_accuracy::Bool=true: Whether accuracy should be computed every n_batch_eval batches.\nmeasures_func::Union{Missing, Function}=missing: A measures function which is run every n_batch_eval batches. For more information see The measures_func argument.\n\n\n\n\n\n","category":"method"},
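A minimal usage sketch for fiddl (assuming a cue matrix C, a semantic matrix S and a dataset data with a frequency column, as in the quick start; the output path "latin_fiddl.bson" is illustrative):

learn_seq = JudiLing.make_learn_seq(data.frequency)
res = JudiLing.fiddl(C, S, learn_seq, data, :Word, "latin_fiddl.bson",
                     n_batch_eval=50, compute_accuracy=true)

Here make_learn_seq (see Widrow-Hoff Learning) turns token frequencies into the frequency-informed learning sequence that fiddl expects; the call above trains a comprehension mapping from C to S.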
{"location":"man/pickle/","page":"Pickle","title":"Pickle","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/pickle/#Utils","page":"Pickle","title":"Utils","text":"","category":"section"},{"location":"man/pickle/","page":"Pickle","title":"Pickle","text":" save_pickle\n load_pickle","category":"page"},{"location":"man/pickle/#JudiLing.save_pickle","page":"Pickle","title":"JudiLing.save_pickle","text":"Save an object to a python pickle file.\n\n\n\n\n\n","category":"function"},{"location":"man/pickle/#JudiLing.load_pickle","page":"Pickle","title":"JudiLing.load_pickle","text":"Load an object from a python pickle file.\n\n\n\n\n\n","category":"function"},{"location":"man/measures_func/#The-measures_func-argument","page":"Measures function","title":"The measures_func argument","text":"","category":"section"},{"location":"man/measures_func/","page":"Measures function","title":"Measures function","text":"The deep learning functions get_and_train_model and fiddl take a measures_func as one of their arguments. This allows measures to be computed during training. For this to work, the measures_func has to conform to the following format.","category":"page"},{"location":"man/measures_func/#For-get_and_train_model","page":"Measures function","title":"For get_and_train_model","text":"","category":"section"},{"location":"man/measures_func/","page":"Measures function","title":"Measures function","text":"data_train, data_val = measures_func(X_train,\n Y_train,\n X_val,\n Y_val,\n Yhat_train,\n Yhat_val,\n data_train,\n data_val,\n target_col,\n model,\n epoch;\n kargs...)\n\n## Input\n\n- `X_train`: The input training matrix.\n- `Y_train`: The target training matrix.\n- `X_val`: The input validation matrix.\n- `Y_val`: The target validation matrix.\n- `Yhat_train`: The predicted training matrix.\n- `Yhat_val`: The predicted validation matrix.\n- `data_train`: The training dataset.\n- `data_val`: The validation dataset.\n- `target_col`: The name of the column with the target wordforms in the datasets.\n- `model`: The trained model.\n- `epoch`: The epoch the training is currently in.\n- `kargs...`: Any other keyword arguments that should be passed to the function.\n\nNote: the `kargs` are just keyword arguments that are passed on from the parameters of `get_and_train_model` to the `measures_func`. For example, this could be a suffix that should be added to each added column in `measures_func`.\n\n## Output\nThe function has to return the training and validation dataframes.","category":"page"},{"location":"man/measures_func/#Example","page":"Measures function","title":"Example","text":"","category":"section"},{"location":"man/measures_func/","page":"Measures function","title":"Measures function","text":"Define a measures_func. This one computes target correlations for both training and validation datasets.","category":"page"},{"location":"man/measures_func/","page":"Measures function","title":"Measures function","text":"function compute_target_corr(X_train, Y_train, X_val, Y_val,\n Yhat_train, Yhat_val, data_train,\n data_val, target_col, model, epoch)\n _, corr = JudiLing.eval_SC(Yhat_train, Y_train, R=true)\n data_train[!, string(\"target_corr_\", epoch)] = diag(corr)\n _, corr = JudiLing.eval_SC(Yhat_val, Y_val, R=true)\n data_val[!, string(\"target_corr_\", epoch)] = diag(corr)\n return(data_train, data_val)\nend","category":"page"},{"location":"man/measures_func/","page":"Measures function","title":"Measures function","text":"Train a model for 100 epochs, calling compute_target_corr after each epoch.","category":"page"},{"location":"man/measures_func/","page":"Measures function","title":"Measures function","text":"res = JudiLing.get_and_train_model(cue_obj_train.C,\n S_train,\n cue_obj_val.C,\n S_val,\n train, val,\n :Word,\n \"test.bson\",\n return_losses=true,\n batchsize=3,\n measures_func=compute_target_corr)\n","category":"page"},{"location":"man/measures_func/#For-fiddl","page":"Measures function","title":"For fiddl","text":"","category":"section"},{"location":"man/measures_func/","page":"Measures function","title":"Measures function","text":"data = measures_func(X_train,\n Y_train,\n Yhat_train,\n data,\n target_col,\n model,\n step;\n kargs...)\n\n## Input\n\n- `X_train`: The input matrix of the full dataset.\n- `Y_train`: The target matrix of the full dataset.\n- `Yhat_train`: The predicted matrix of the full dataset at the current step.\n- `data`: The full dataset.\n- `target_col`: The name of the column with the target wordforms in the dataset.\n- `model`: The trained model.\n- `step`: The step the training is currently in.\n- `kargs...`: Any other keyword arguments that should be passed to the function.\n\nNote: the `kargs` are just keyword arguments that are passed on from the parameters of `fiddl` to the `measures_func`. For example, this could be a suffix that should be added to each added column in `measures_func`.\n\n## Output\nThe function has to return the dataset.","category":"page"},
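By analogy with the compute_target_corr example above, a measures_func for fiddl could look like this (a sketch following the signature just shown; the column name is illustrative):

function compute_target_corr_fiddl(X_train, Y_train, Yhat_train, data,
                                   target_col, model, step; kargs...)
    # correlation of each predicted row with its target row
    _, corr = JudiLing.eval_SC(Yhat_train, Y_train, R=true)
    data[!, string("target_corr_", step)] = diag(corr)
    return data
end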
{"location":"man/pyndl/","page":"Pyndl","title":"Pyndl","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/pyndl/","page":"Pyndl","title":"Pyndl","text":"JudiLing is able to call the python package pyndl internally to compute NDL models. pyndl uses event files to compute the mapping matrices, which have to be generated manually or by using pyndl in Python, see the documentation here. The advantage of calling pyndl from JudiLing is that the resulting weights, cue and semantic matrices can be directly translated into JudiLing format and further processing can be done in JudiLing.","category":"page"},{"location":"man/pyndl/","page":"Pyndl","title":"Pyndl","text":"note: Note\nFor pyndl to be available in JudiLing, PyCall has to be imported before JudiLing:\nusing PyCall\nusing JudiLing","category":"page"},{"location":"man/pyndl/#Calling-pyndl-from-JudiLing","page":"Pyndl","title":"Calling pyndl from JudiLing","text":"","category":"section"},{"location":"man/pyndl/","page":"Pyndl","title":"Pyndl","text":" Pyndl_Weight_Struct\n pyndl(\n data_path::String;\n alpha::Float64 = 0.1,\n betas::Tuple{Float64,Float64} = (0.1, 0.1),\n method::String = \"openmp\"\n )","category":"page"},{"location":"man/pyndl/#JudiLing.Pyndl_Weight_Struct","page":"Pyndl","title":"JudiLing.Pyndl_Weight_Struct","text":"Pyndl_Weight_Struct\n cues::Vector{String}\n outcomes::Vector{String}\n weight::Matrix{Float64}\n\ncues::Vector{String}: Vector of cues, in the order that they appear in the weight matrix.\noutcomes::Vector{String}: Vector of outcomes, in the order that they appear in the weight matrix.\nweight::Matrix{Float64}: Weight matrix.\n\n\n\n\n\n","category":"type"},{"location":"man/pyndl/#JudiLing.pyndl-Tuple{String}","page":"Pyndl","title":"JudiLing.pyndl","text":"pyndl(\n data_path::String;\n alpha::Float64 = 0.1,\n betas::Tuple{Float64,Float64} = (0.1, 0.1),\n method::String = \"openmp\"\n)\n\nCompute weights using pyndl. See the documentation of pyndl for more information: https://pyndl.readthedocs.io/en/latest/\n\nObligatory arguments\n\ndata_path::String: Path to an events file as generated by pyndl's preprocess.create_event_file\n\nOptional arguments\n\nalpha::Float64 = 0.1: α learning rate.\nbetas::Tuple{Float64,Float64} = (0.1, 0.1): β1 and β2 learning rates.\nmethod::String = \"openmp\": One of {\"openmp\", \"threading\"}. 
\"openmp\" only works on Linux.\n\nExample\n\nweights = JudiLing.pyndl(\"data/latin_train_events.tab.gz\")\n\n\n\n\n\n","category":"method"},{"location":"man/pyndl/#Translating-output-of-pyndl-to-cue-and-semantic-matrices-in-JudiLing","page":"Pyndl","title":"Translating output of pyndl to cue and semantic matrices in JudiLing","text":"","category":"section"},{"location":"man/pyndl/","page":"Pyndl","title":"Pyndl","text":"With the weights in hand, the cue and semantic matrices can be computed:","category":"page"},{"location":"man/pyndl/","page":"Pyndl","title":"Pyndl","text":" make_cue_matrix(\n data::DataFrame,\n pyndl_weights::Pyndl_Weight_Struct;\n grams = 3,\n target_col = \"Words\",\n tokenized = false,\n sep_token = nothing,\n keep_sep = false,\n start_end_token = \"#\",\n verbose = false,\n )\n make_S_matrix(\n data::DataFrame,\n pyndl_weights::Pyndl_Weight_Struct,\n n_features_columns::Vector;\n tokenized::Bool=false,\n sep_token::String=\"_\"\n )\n make_S_matrix(\n data_train::DataFrame,\n data_val::DataFrame,\n pyndl_weights::Pyndl_Weight_Struct,\n n_features_columns::Vector;\n tokenized::Bool=false,\n sep_token::String=\"_\"\n )","category":"page"},{"location":"man/pyndl/#JudiLing.make_cue_matrix-Tuple{DataFrames.DataFrame, JudiLing.Pyndl_Weight_Struct}","page":"Pyndl","title":"JudiLing.make_cue_matrix","text":"make_cue_matrix(\n data::DataFrame,\n pyndl_weights::Pyndl_Weight_Struct;\n grams = 3,\n target_col = \"Words\",\n tokenized = false,\n sep_token = nothing,\n keep_sep = false,\n start_end_token = \"#\",\n verbose = false,\n)\n\nMake the cue matrix based on a dataframe and weights computed with pyndl. Practically this means that the cues are extracted from the weights object and translated to the JudiLing format.\n\nObligatory arguments\n\ndata::DataFrame: Dataset with all the word types on which the weights were trained.\npyndl_weights::Pyndl_Weight_Struct: Weights trained with JudiLing.pyndl\n\nOptional argyments\n\ngrams = 3: N-gram size (has to match the n-gram granularity of the cues on which the weights were trained).\ntarget_col = \"Words\": Column with target words.\ntokenized = false: Whether the target words are already tokenized\nsep_token = nothing: The string separating the tokens (only used if tokenized=true).\nkeep_sep = false: Whether the sep_token should be retained in the cues.\nstart_end_token = \"#\": The string with which to mark word boundaries.\nverbose = false: Verbose mode.\n\nExample\n\nweights = JudiLing.pyndl(\"data/latin_train_events.tab.gz\")\ncue_obj = JudiLing.make_cue_matrix(\"latin_train.csv\", weights,\n grams = 3,\n target_col = \"Word\")\n\n\n\n\n\n","category":"method"},{"location":"man/pyndl/#JudiLing.make_S_matrix-Tuple{DataFrames.DataFrame, JudiLing.Pyndl_Weight_Struct, Vector}","page":"Pyndl","title":"JudiLing.make_S_matrix","text":"make_S_matrix(\n data::DataFrame,\n pyndl_weights::Pyndl_Weight_Struct,\n n_features_columns::Vector;\n tokenized::Bool=false,\n sep_token::String=\"_\"\n)\n\nCreate semantic matrix based on a dataframe and weights computed with pyndl. Practically this means that the semantic features are extracted from the weights object and translated to the JudiLing format.\n\nObligatory arguments\n\ndata::DataFrame: The dataset with word types.\npyndl_weights::Pyndl_Weight_Struct: Weights trained with JudiLing.pyndl.\nn_features_columns::Vector: Vector of columns with the features in the dataset.\n\nOptional arguments\n\ntokenized=false: Whether the features in n_features_columns columns are already tokenized (e.g. 
\"feature1_feature2_feature3\")\nsep_token=\"_\": The string with which the features are separated (only used if tokenized=false).\n\nExample\n\nweights = JudiLing.pyndl(\"data/latin_train_events.tab.gz\")\nS = JudiLing.make_S_matrix(data,\n weights_latin,\n [\"Lexeme\", \"Person\", \"Number\", \"Tense\", \"Voice\", \"Mood\"],\n tokenized=false)\n\n\n\n\n\n","category":"method"},{"location":"man/pyndl/#JudiLing.make_S_matrix-Tuple{DataFrames.DataFrame, DataFrames.DataFrame, JudiLing.Pyndl_Weight_Struct, Vector}","page":"Pyndl","title":"JudiLing.make_S_matrix","text":"make_S_matrix(\n data_train::DataFrame,\n data_val::DataFrame,\n pyndl_weights::Pyndl_Weight_Struct,\n n_features_columns::Vector;\n tokenized::Bool=false,\n sep_token::String=\"_\"\n)\n\nCreate semantic matrix based on a training and validation dataframe and weights computed with pyndl. Practically this means that the semantic features are extracted from the weights object and translated to the JudiLing format.\n\nObligatory arguments\n\ndata_train::DataFrame: The training dataset.\ndata_val::DataFrame: The validation dataset.\npyndl_weights::Pyndl_Weight_Struct: Weights trained with JudiLing.pyndl.\nn_features_columns::Vector: Vector of columns with the features in the training and validation datasets.\n\nOptional arguments\n\ntokenized=false: Whether the features in n_features_columns columns are already tokenized (e.g. \"feature1_feature2_feature3\")\nsep_token=\"_\": The string with which the features are separated (only used if tokenized=false).\n\nExample\n\nweights = JudiLing.pyndl(\"data/latin_train_events.tab.gz\")\nS_train, S_val = JudiLing.make_S_matrix(train,\n val,\n weights_latin,\n [\"Lexeme\", \"Person\", \"Number\", \"Tense\", \"Voice\", \"Mood\"],\n tokenized=false)\n\n\n\n\n\n","category":"method"},{"location":"man/wh/","page":"Widrow-Hoff Learning","title":"Widrow-Hoff Learning","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/wh/#Utils","page":"Widrow-Hoff Learning","title":"Utils","text":"","category":"section"},{"location":"man/wh/","page":"Widrow-Hoff Learning","title":"Widrow-Hoff Learning","text":" wh_learn(\n X,\n Y;\n eta = 0.01,\n n_epochs = 1,\n weights = nothing,\n learn_seq = nothing,\n save_history = false,\n history_cols = nothing,\n history_rows = nothing,\n verbose = false,\n )\n make_learn_seq(freq; random_seed = 314)","category":"page"},{"location":"man/wh/#JudiLing.wh_learn-Tuple{Any, Any}","page":"Widrow-Hoff Learning","title":"JudiLing.wh_learn","text":"wh_learn(\n X,\n Y;\n eta = 0.01,\n n_epochs = 1,\n weights = nothing,\n learn_seq = nothing,\n save_history = false,\n history_cols = nothing,\n history_rows = nothing,\n verbose = false,\n )\n\nWidrow-Hoff Learning.\n\nObligatory Arguments\n\ntest_mode::Symbol: which test mode, currently supports :trainonly, :presplit, :carefulsplit and :randomsplit.\n\nOptional Arguments\n\neta::Float64=0.1: the learning rate\nn_epochs::Int64=1: the number of epochs to be trained\nweights::Matrix=nothing: the initial weights\nlearn_seq::Vector=nothing: the learning sequence\nsave_history::Bool=false: if true, a partical training history will be saved\nhistory_cols::Vector=nothing: the list of column indices you want to saved in history, e.g. [1,32,42] or [2]\nhistory_rows::Vector=nothing: the list of row indices you want to saved in history, e.g. 
{"location":"man/wh/","page":"Widrow-Hoff Learning","title":"Widrow-Hoff Learning","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/wh/#Utils","page":"Widrow-Hoff Learning","title":"Utils","text":"","category":"section"},{"location":"man/wh/","page":"Widrow-Hoff Learning","title":"Widrow-Hoff Learning","text":" wh_learn(\n X,\n Y;\n eta = 0.01,\n n_epochs = 1,\n weights = nothing,\n learn_seq = nothing,\n save_history = false,\n history_cols = nothing,\n history_rows = nothing,\n verbose = false,\n )\n make_learn_seq(freq; random_seed = 314)","category":"page"},{"location":"man/wh/#JudiLing.wh_learn-Tuple{Any, Any}","page":"Widrow-Hoff Learning","title":"JudiLing.wh_learn","text":"wh_learn(\n X,\n Y;\n eta = 0.01,\n n_epochs = 1,\n weights = nothing,\n learn_seq = nothing,\n save_history = false,\n history_cols = nothing,\n history_rows = nothing,\n verbose = false,\n )\n\nWidrow-Hoff Learning.\n\nObligatory Arguments\n\nX: the input matrix\nY: the output/target matrix\n\nOptional Arguments\n\neta::Float64=0.01: the learning rate\nn_epochs::Int64=1: the number of epochs to be trained\nweights::Matrix=nothing: the initial weights\nlearn_seq::Vector=nothing: the learning sequence\nsave_history::Bool=false: if true, a partial training history will be saved\nhistory_cols::Vector=nothing: the list of column indices you want to save in history, e.g. [1,32,42] or [2]\nhistory_rows::Vector=nothing: the list of row indices you want to save in history, e.g. [1,32,42] or [2]\nverbose::Bool = false: if true, more information will be printed out\n\n\n\n\n\n","category":"method"},
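A minimal sketch of frequency-informed Widrow-Hoff learning (C, S and data.frequency as in earlier examples; it is assumed here that wh_learn returns the learned mapping matrix):

learn_seq = JudiLing.make_learn_seq(data.frequency)
F = JudiLing.wh_learn(C, S,
                      eta = 0.01,
                      n_epochs = 1,
                      learn_seq = learn_seq)

make_learn_seq, documented directly below, creates the frequency-informed ordering of learning events.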
{"location":"man/wh/#JudiLing.make_learn_seq-Tuple{Any}","page":"Widrow-Hoff Learning","title":"JudiLing.make_learn_seq","text":"make_learn_seq(freq; random_seed = 314)\n\nMake Widrow-Hoff learning sequence from frequencies. Creates a randomly ordered sequence of indices in which each index appears according to its frequency.\n\nObligatory arguments\n\nfreq: Vector with frequencies.\n\nOptional arguments\n\nrandom_seed = 314: Random seed to control randomness.\n\nExample\n\nlearn_seq = JudiLing.make_learn_seq(data.frequency)\n\n\n\n\n\n","category":"method"},{"location":"man/utils/","page":"Utils","title":"Utils","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/utils/#Utils","page":"Utils","title":"Utils","text":"","category":"section"},{"location":"man/utils/","page":"Utils","title":"Utils","text":" iscorrect\n display_pred\n translate\n translate_path\n is_truly_sparse\n isattachable\n iscomplete\n isstart\n isnovel\n check_used_token\n cal_max_timestep","category":"page"},{"location":"man/utils/#JudiLing.iscorrect","page":"Utils","title":"JudiLing.iscorrect","text":"Check whether the predictions are correct.\n\n\n\n\n\n","category":"function"},{"location":"man/utils/#JudiLing.display_pred","page":"Utils","title":"JudiLing.display_pred","text":"Display prediction nicely.\n\n\n\n\n\n","category":"function"},{"location":"man/utils/#JudiLing.translate","page":"Utils","title":"JudiLing.translate","text":"Translate indices into words or utterances.\n\n\n\n\n\n","category":"function"},{"location":"man/utils/#JudiLing.translate_path","page":"Utils","title":"JudiLing.translate_path","text":"Append indices together to form a path.\n\n\n\n\n\n","category":"function"},{"location":"man/utils/#JudiLing.is_truly_sparse","page":"Utils","title":"JudiLing.is_truly_sparse","text":"Check whether a matrix is truly sparse regardless of its format, where M is originally a sparse matrix format.\n\n\n\n\n\nCheck whether a matrix is truly sparse regardless of its format, where M is originally a dense matrix format.\n\n\n\n\n\n","category":"function"},{"location":"man/utils/#JudiLing.isattachable","page":"Utils","title":"JudiLing.isattachable","text":"Check whether a gram can attach to another gram.\n\n\n\n\n\nCheck whether a gram can attach to another gram.\n\n\n\n\n\n","category":"function"},{"location":"man/utils/#JudiLing.iscomplete","page":"Utils","title":"JudiLing.iscomplete","text":"Check whether a path is complete.\n\n\n\n\n\n","category":"function"},{"location":"man/utils/#JudiLing.isstart","page":"Utils","title":"JudiLing.isstart","text":"Check whether a gram can start a path.\n\n\n\n\n\n","category":"function"},{"location":"man/utils/#JudiLing.isnovel","page":"Utils","title":"JudiLing.isnovel","text":"Check whether a predicted path is novel, i.e. not seen in the training data.\n\n\n\n\n\n","category":"function"},{"location":"man/utils/#JudiLing.check_used_token","page":"Utils","title":"JudiLing.check_used_token","text":"Check whether there are tokens already used in dataset as n-gram components.\n\n\n\n\n\n","category":"function"},{"location":"man/utils/#JudiLing.cal_max_timestep","page":"Utils","title":"JudiLing.cal_max_timestep","text":"function cal_max_timestep(\n data_train::DataFrame,\n data_val::DataFrame,\n target_col::Union{String, Symbol};\n tokenized::Bool = false,\n sep_token::Union{Nothing, String, Char} = \"\",\n)\n\nCalculate the max timestep given training and validation datasets.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\ntarget_col::Union{String, Symbol}: the column with the target word forms\n\nOptional Arguments\n\ntokenized::Bool = false: Whether the word forms in the target_col are already tokenized\nsep_token::Union{Nothing, String, Char} = \"\": The token with which the word forms are tokenized\n\nExamples\n\nJudiLing.cal_max_timestep(latin_train, latin_val, :Word)\n\n\n\n\n\nfunction cal_max_timestep(\n data::DataFrame,\n target_col::Union{String, Symbol};\n tokenized::Bool = false,\n sep_token::Union{Nothing, String, Char} = \"\",\n)\n\nCalculate the max timestep given a training dataset.\n\nObligatory Arguments\n\ndata::DataFrame: the dataset\ntarget_col::Union{String, Symbol}: the column with the target word forms\n\nOptional Arguments\n\ntokenized::Bool = false: Whether the word forms in the target_col are already tokenized\nsep_token::Union{Nothing, String, Char} = \"\": The token with which the word forms are tokenized\n\nExamples\n\nJudiLing.cal_max_timestep(latin, :Word)\n\n\n\n\n\n","category":"function"},{"location":"man/make_adjacency_matrix/","page":"Make Adjacency Matrix","title":"Make Adjacency Matrix","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/make_adjacency_matrix/#Make-Adjacency-Matrix","page":"Make Adjacency Matrix","title":"Make Adjacency Matrix","text":"","category":"section"},{"location":"man/make_adjacency_matrix/","page":"Make Adjacency Matrix","title":"Make Adjacency Matrix","text":" make_full_adjacency_matrix\n make_full_adjacency_matrix(i2f)\n make_combined_adjacency_matrix(data_train, data_val)","category":"page"},{"location":"man/make_adjacency_matrix/#JudiLing.make_full_adjacency_matrix","page":"Make Adjacency Matrix","title":"JudiLing.make_full_adjacency_matrix","text":"make_adjacency_matrix(i2f)\n\nMake full adjacency matrix based only on the form of n-grams regardless of whether they are seen in the training data. This usually takes hours for large datasets, as all possible combinations are considered.\n\nObligatory Arguments\n\ni2f::Dict: the dictionary returning features given indices\n\nOptional Arguments\n\ntokenized::Bool=false: if true, the dataset target is assumed to be tokenized\nsep_token::Union{Nothing, String, Char}=nothing: separator token\nverbose::Bool=false: if true, more information will be printed\n\nExamples\n\n# without tokenization\ni2f = Dict([(1, \"#ab\"), (2, \"abc\"), (3, \"bc#\"), (4, \"#bc\"), (5, \"ab#\")])\nJudiLing.make_adjacency_matrix(i2f)\n\n# with tokenization\ni2f = Dict([(1, \"#-a-b\"), (2, \"a-b-c\"), (3, \"b-c-#\"), (4, \"#-b-c\"), (5, \"a-b-#\")])\nJudiLing.make_adjacency_matrix(\n i2f,\n tokenized=true,\n sep_token=\"-\")\n\n\n\n\n\n","category":"function"},{"location":"man/make_adjacency_matrix/#JudiLing.make_full_adjacency_matrix-Tuple{Any}","page":"Make Adjacency Matrix","title":"JudiLing.make_full_adjacency_matrix","text":"make_adjacency_matrix(i2f)\n\nMake full adjacency matrix based only on the form of n-grams regardless of whether they are seen in the training data. 
This usually takes hours for large datasets, as all possible combinations are considered.\n\nObligatory Arguments\n\ni2f::Dict: the dictionary returning features given indices\n\nOptional Arguments\n\ntokenized::Bool=false: if true, the dataset target is assumed to be tokenized\nsep_token::Union{Nothing, String, Char}=nothing: separator token\nverbose::Bool=false: if true, more information will be printed\n\nExamples\n\n# without tokenization\ni2f = Dict([(1, \"#ab\"), (2, \"abc\"), (3, \"bc#\"), (4, \"#bc\"), (5, \"ab#\")])\nJudiLing.make_adjacency_matrix(i2f)\n\n# with tokenization\ni2f = Dict([(1, \"#-a-b\"), (2, \"a-b-c\"), (3, \"b-c-#\"), (4, \"#-b-c\"), (5, \"a-b-#\")])\nJudiLing.make_adjacency_matrix(\n i2f,\n tokenized=true,\n sep_token=\"-\")\n\n\n\n\n\n","category":"method"},{"location":"man/make_adjacency_matrix/#JudiLing.make_combined_adjacency_matrix-Tuple{Any, Any}","page":"Make Adjacency Matrix","title":"JudiLing.make_combined_adjacency_matrix","text":"make_combined_adjacency_matrix(data_train, data_val)\n\nMake combined adjacency matrix.\n\nObligatory Arguments\n\ndata_train::DataFrame: training dataset\ndata_val::DataFrame: validation dataset\n\nOptional Arguments\n\ngrams=3: the number of grams for cues\ntarget_col=:Words: the column name for target strings\ntokenized=false: if true, the dataset target is assumed to be tokenized\nsep_token=nothing: separator\nkeep_sep=false: if true, keep separators in cues\nstart_end_token=\"#\": start and end token in boundary cues\nverbose=false: if true, more information is printed\n\nExamples\n\nJudiLing.make_combined_adjacency_matrix(\n latin_train,\n latin_val,\n grams=3,\n target_col=:Word,\n tokenized=false,\n keep_sep=false\n )\n\n\n\n\n\n","category":"method"},{"location":"man/cholesky/","page":"Cholesky","title":"Cholesky","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/cholesky/#Cholesky","page":"Cholesky","title":"Cholesky","text":"","category":"section"},{"location":"man/cholesky/","page":"Cholesky","title":"Cholesky","text":" make_transform_fac\n make_transform_matrix\n make_transform_fac(X::SparseMatrixCSC)\n make_transform_fac(X::Matrix)\n make_transform_matrix(fac::Union{LinearAlgebra.Cholesky, SuiteSparse.CHOLMOD.Factor}, X::Union{SparseMatrixCSC, Matrix}, Y::Union{SparseMatrixCSC, Matrix})\n make_transform_matrix(X::SparseMatrixCSC, Y::Matrix)\n make_transform_matrix(X::Matrix, Y::Union{SparseMatrixCSC, Matrix})\n make_transform_matrix(X::SparseMatrixCSC, Y::SparseMatrixCSC)\n format_matrix(M::Union{SparseMatrixCSC, Matrix}, output_format=:auto)","category":"page"},{"location":"man/cholesky/#JudiLing.make_transform_fac","page":"Cholesky","title":"JudiLing.make_transform_fac","text":"The first part of make_transform_matrix, usually used by the learn_paths function to save time and computing resources.\n\n\n\n\n\n","category":"function"},{"location":"man/cholesky/#JudiLing.make_transform_matrix","page":"Cholesky","title":"JudiLing.make_transform_matrix","text":"Using Cholesky decomposition to calculate the transformation matrix from S to C or from C to S.\n\n\n\n\n\n","category":"function"},{"location":"man/cholesky/#JudiLing.make_transform_fac-Tuple{SparseArrays.SparseMatrixCSC}","page":"Cholesky","title":"JudiLing.make_transform_fac","text":"make_transform_fac(X::SparseMatrixCSC)\n\nCalculate the first step of Cholesky decomposition for sparse 
matrices.\n\n\n\n\n\n","category":"method"},{"location":"man/cholesky/#JudiLing.make_transform_fac-Tuple{Matrix}","page":"Cholesky","title":"JudiLing.make_transform_fac","text":"make_transform_fac(X::Matrix)\n\nCalculate the first step of Cholesky decomposition for dense matrices.\n\n\n\n\n\n","category":"method"},{"location":"man/cholesky/#JudiLing.make_transform_matrix-Tuple{Union{SparseArrays.CHOLMOD.Factor, LinearAlgebra.Cholesky}, Union{SparseArrays.SparseMatrixCSC, Matrix}, Union{SparseArrays.SparseMatrixCSC, Matrix}}","page":"Cholesky","title":"JudiLing.make_transform_matrix","text":"make_transform_matrix(fac::Union{LinearAlgebra.Cholesky, SuiteSparse.CHOLMOD.Factor}, X::Union{SparseMatrixCSC, Matrix}, Y::Union{SparseMatrixCSC, Matrix})\n\nSecond step in calculating the Cholesky decomposition for the transformation matrix.\n\n\n\n\n\n","category":"method"},
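A short sketch of this two-step use (C and S as cue and semantic matrices from the quick start; the factorization can be reused across several solves, which is what learn_paths does to save time and computing resources):

fac = JudiLing.make_transform_fac(C)
F = JudiLing.make_transform_matrix(fac, C, S)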
{"location":"man/cholesky/#JudiLing.make_transform_matrix-Tuple{SparseArrays.SparseMatrixCSC, Matrix}","page":"Cholesky","title":"JudiLing.make_transform_matrix","text":"make_transform_matrix(X::SparseMatrixCSC, Y::Matrix)\n\nUse Cholesky decomposition to calculate the transformation matrix from X to Y, where X is a sparse matrix and Y is a dense matrix.\n\nObligatory Arguments\n\nX::SparseMatrixCSC: the X matrix, where X is a sparse matrix\nY::Matrix: the Y matrix, where Y is a dense matrix\n\nOptional Arguments\n\nmethod::Symbol = :additive: whether :additive or :multiplicative decomposition is required\nshift::Float64 = 0.02: shift value for :additive decomposition\nmultiplier::Float64 = 1.01: multiplier value for :multiplicative decomposition\noutput_format::Symbol = :auto: force the output format to dense (:dense) or sparse (:sparse), or leave it as :auto to let the program decide\nsparse_ratio::Float64 = 0.05: the ratio to decide whether a matrix is sparse\nverbose::Bool = false: if true, more information will be printed out\n\nExamples\n\n# additive mode\nJudiLing.make_transform_matrix(\n C,\n S,\n method = :additive,\n shift = 0.02,\n verbose = false)\n\n# multiplicative mode\nJudiLing.make_transform_matrix(\n C,\n S,\n method = :multiplicative,\n multiplier = 1.01,\n verbose = false)\n\n# further control of sparsity ratio\nJudiLing.make_transform_matrix(\n ...\n output_format = :auto,\n sparse_ratio = 0.05,\n ...)\n\n\n\n\n\n","category":"method"},{"location":"man/cholesky/#JudiLing.make_transform_matrix-Tuple{Matrix, Union{SparseArrays.SparseMatrixCSC, Matrix}}","page":"Cholesky","title":"JudiLing.make_transform_matrix","text":"make_transform_matrix(X::Matrix, Y::Union{SparseMatrixCSC, Matrix})\n\nUse the Cholesky decomposition to calculate the transformation matrix from X to Y, where X is a dense matrix and Y is either a dense matrix or a sparse matrix.\n\nObligatory Arguments\n\nX::Matrix: the X matrix, where X is a dense matrix\nY::Union{SparseMatrixCSC, Matrix}: the Y matrix, where Y is either a sparse or a dense matrix\n\nOptional Arguments\n\nmethod::Symbol = :additive: whether :additive or :multiplicative decomposition is required\nshift::Float64 = 0.02: shift value for :additive decomposition\nmultiplier::Float64 = 1.01: multiplier value for :multiplicative decomposition\noutput_format::Symbol = :auto: force the output format to dense (:dense) or sparse (:sparse), or leave it as :auto to let the program decide\nsparse_ratio::Float64 = 0.05: the ratio to decide whether a matrix is sparse\nverbose::Bool = false: if true, more information will be printed out\n\nExamples\n\n# additive mode\nJudiLing.make_transform_matrix(\n C,\n S,\n method = :additive,\n shift = 0.02,\n verbose = false)\n\n# multiplicative mode\nJudiLing.make_transform_matrix(\n C,\n S,\n method = :multiplicative,\n multiplier = 1.01,\n verbose = false)\n\n# further control of sparsity ratio\nJudiLing.make_transform_matrix(\n ...\n output_format = :auto,\n sparse_ratio = 0.05,\n ...)\n\n\n\n\n\n","category":"method"},{"location":"man/cholesky/#JudiLing.make_transform_matrix-Tuple{SparseArrays.SparseMatrixCSC, SparseArrays.SparseMatrixCSC}","page":"Cholesky","title":"JudiLing.make_transform_matrix","text":"make_transform_matrix(X::SparseMatrixCSC, Y::SparseMatrixCSC)\n\nUse the Cholesky decomposition to calculate the transformation matrix from X to Y, where X is a sparse matrix and Y is a sparse matrix.\n\nObligatory Arguments\n\nX::SparseMatrixCSC: the X matrix, where X is a sparse matrix\nY::SparseMatrixCSC: the Y matrix, where Y is a sparse matrix\n\nOptional Arguments\n\nmethod::Symbol = :additive: whether :additive or :multiplicative decomposition is required\nshift::Float64 = 0.02: shift value for :additive decomposition\nmultiplier::Float64 = 1.01: multiplier value for :multiplicative decomposition\noutput_format::Symbol = :auto: force the output format to dense (:dense) or sparse (:sparse), or leave it as :auto to let the program decide\nsparse_ratio::Float64 = 0.05: the ratio to decide whether a matrix is sparse\nverbose::Bool = false: if true, more information will be printed out\n\nExamples\n\n# additive mode\nJudiLing.make_transform_matrix(\n C,\n S,\n method = :additive,\n shift = 0.02,\n verbose = false)\n\n# multiplicative mode\nJudiLing.make_transform_matrix(\n C,\n S,\n method = :multiplicative,\n multiplier = 1.01,\n verbose = false)\n\n# further control of sparsity ratio\nJudiLing.make_transform_matrix(\n ...\n output_format = :auto,\n sparse_ratio = 0.05,\n ...)\n\n\n\n\n\n","category":"method"},{"location":"man/cholesky/#JudiLing.format_matrix","page":"Cholesky","title":"JudiLing.format_matrix","text":"format_matrix(M::Union{SparseMatrixCSC, Matrix}, output_format=:auto)\n\nConvert output matrix format to either a dense matrix or a sparse matrix.\n\n\n\n\n\n","category":"function"},{"location":"man/make_semantic_matrix/","page":"Make Semantic Matrix","title":"Make Semantic Matrix","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/make_semantic_matrix/#Make-Semantic-Matrix","page":"Make Semantic Matrix","title":"Make Semantic Matrix","text":"","category":"section"},{"location":"man/make_semantic_matrix/#Make-binary-semantic-vectors","page":"Make Semantic Matrix","title":"Make binary semantic vectors","text":"","category":"section"},{"location":"man/make_semantic_matrix/","page":"Make Semantic Matrix","title":"Make Semantic Matrix","text":" PS_Matrix_Struct\n make_pS_matrix\n make_pS_matrix(data)\n make_pS_matrix(data_val, pS_obj)\n make_combined_pS_matrix(\n data_train,\n data_val;\n features_col = :CommunicativeIntention,\n sep_token = \"_\",\n )","category":"page"},{"location":"man/make_semantic_matrix/#JudiLing.PS_Matrix_Struct","page":"Make Semantic Matrix","title":"JudiLing.PS_Matrix_Struct","text":"A structure that stores the discrete semantic vectors: pS is the discrete semantic matrix; f2i is a dictionary returning the indices for features; i2f is a dictionary returning the features for indices.\n\n\n\n\n\n","category":"type"},{"location":"man/make_semantic_matrix/#JudiLing.make_pS_matrix","page":"Make Semantic 
Matrix","title":"JudiLing.make_pS_matrix","text":"Make discrete semantic matrix.\n\n\n\n\n\n","category":"function"},{"location":"man/make_semantic_matrix/#JudiLing.make_pS_matrix-Tuple{Any}","page":"Make Semantic Matrix","title":"JudiLing.make_pS_matrix","text":"make_pS_matrix(data)\n\nCreate a discrete semantic matrix given a dataframe.\n\nObligatory Arguments\n\ndata::DataFrame: the dataset\n\nOptional Arguments\n\nfeatures_col::Symbol=:CommunicativeIntention: the column name for target\nsep_token::String=\"_\": separator\n\nExamples\n\ns_obj_train = JudiLing.make_pS_matrix(\n utterance,\n features_col=:CommunicativeIntention,\n sep_token=\"_\")\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_pS_matrix-Tuple{Any, Any}","page":"Make Semantic Matrix","title":"JudiLing.make_pS_matrix","text":"make_pS_matrix(data_val, pS_obj)\n\nConstruct discrete semantic matrix for the validation datasets given by the exemplar in the dataframe, and given the S matrix for the training datasets.\n\nObligatory Arguments\n\ndata_val::DataFrame: the dataset\npS_obj::PS_Matrix_Struct: training PS object\n\nOptional Arguments\n\nfeatures_col::Symbol=:CommunicativeIntention: the column name for target\nsep_token::String=\"_\": separator\n\nExamples\n\ns_obj_val = JudiLing.make_pS_matrix(\n data_val,\n s_obj_train,\n features_col=:CommunicativeIntention,\n sep_token=\"_\")\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_combined_pS_matrix-Tuple{Any, Any}","page":"Make Semantic Matrix","title":"JudiLing.make_combined_pS_matrix","text":"make_combined_pS_matrix(\n data_train,\n data_val;\n features_col = :CommunicativeIntention,\n sep_token = \"_\",\n)\n\nCreate discrete semantic matrices for a train and validation dataframe.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\n\nOptional Arguments\n\nfeatures_col::Symbol=:CommunicativeIntention: the column name for target\nsep_token::String=\"_\": separator\n\nExamples\n\ns_obj_train, s_obj_val = JudiLing.make_combined_pS_matrix(\n data_train,\n data_val,\n features_col=:CommunicativeIntention,\n sep_token=\"_\")\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#Simulate-semantic-vectors","page":"Make Semantic Matrix","title":"Simulate semantic vectors","text":"","category":"section"},{"location":"man/make_semantic_matrix/","page":"Make Semantic Matrix","title":"Make Semantic Matrix","text":" L_Matrix_Struct\n make_S_matrix\n make_L_matrix\n make_combined_S_matrix\n make_combined_L_matrix\n make_S_matrix(data::DataFrame, base::Vector, inflections::Vector)\n make_S_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector, inflections::Vector)\n make_S_matrix(data::DataFrame, base::Vector)\n make_S_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector)\n make_S_matrix(data_train::DataFrame, base::Vector, inflections::Vector, L::L_Matrix_Struct)\n make_S_matrix(data_train::DataFrame, data_val::Union{DataFrame, Nothing}, base::Vector, L::L_Matrix_Struct)\n make_S_matrix(data::DataFrame, base::Vector, L::L_Matrix_Struct)\n make_S_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector, inflections::Vector, L::L_Matrix_Struct)\n make_L_matrix(data::DataFrame, base::Vector)\n make_combined_S_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector, inflections::Vector, L::L_Matrix_Struct)\n make_combined_S_matrix(data_train::DataFrame, data_val::Union{DataFrame, Nothing}, 
base::Vector, L::L_Matrix_Struct)\n make_combined_S_matrix( data_train::DataFrame, data_val::DataFrame, base::Vector, inflections::Vector)\n make_combined_S_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector)\n make_combined_L_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector, inflections::Vector)\n make_combined_L_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector)\n L_Matrix_Struct(L, sd_base, sd_base_mean, sd_inflection, sd_inflection_mean, base_f, infl_f, base_f2i, infl_f2i, n_base_f, n_infl_f, ncol)\n L_Matrix_Struct(L, sd_base, sd_inflection, base_f, infl_f, base_f2i, infl_f2i, n_base_f, n_infl_f, ncol)","category":"page"},{"location":"man/make_semantic_matrix/#JudiLing.L_Matrix_Struct","page":"Make Semantic Matrix","title":"JudiLing.L_Matrix_Struct","text":"A structure that stores Lexome semantic vectors: L is the Lexome semantic matrix; f2i is a dictionary returning the indices for features; i2f is a dictionary returning the features for indices.\n\n\n\n\n\n","category":"type"},{"location":"man/make_semantic_matrix/#JudiLing.make_S_matrix","page":"Make Semantic Matrix","title":"JudiLing.make_S_matrix","text":"Make simulated semantic matrix.\n\n\n\n\n\n","category":"function"},{"location":"man/make_semantic_matrix/#JudiLing.make_L_matrix","page":"Make Semantic Matrix","title":"JudiLing.make_L_matrix","text":"Make simulated lexome matrix.\n\n\n\n\n\n","category":"function"},{"location":"man/make_semantic_matrix/#JudiLing.make_combined_S_matrix","page":"Make Semantic Matrix","title":"JudiLing.make_combined_S_matrix","text":"Make combined simulated S matrices, where features are combined from both the training and validation datasets.\n\n\n\n\n\n","category":"function"},{"location":"man/make_semantic_matrix/#JudiLing.make_combined_L_matrix","page":"Make Semantic Matrix","title":"JudiLing.make_combined_L_matrix","text":"Make a combined simulated Lexome matrix, where features are combined from both the training and validation datasets.\n\n\n\n\n\n","category":"function"},{"location":"man/make_semantic_matrix/#JudiLing.make_S_matrix-Tuple{DataFrames.DataFrame, Vector, Vector}","page":"Make Semantic Matrix","title":"JudiLing.make_S_matrix","text":"make_S_matrix(data::DataFrame, base::Vector, inflections::Vector)\n\nCreate a simulated semantic matrix for the training dataset, given the input data, a vector specifying the context lexemes and a vector specifying the grammatical lexemes. 
The semantic vector of a word form is constructed by summing the semantic vectors of its context and grammatical lexemes.\n\nObligatory Arguments\n\ndata::DataFrame: the dataset\nbase::Vector: context lexemes\ninflections::Vector: grammatical lexemes\n\nOptional Arguments\n\nncol::Int64=200: dimension of semantic vectors, usually the same as that of cue vectors\nsd_base_mean::Int64=1: the sd mean of base features\nsd_inflection_mean::Int64=1: the sd mean of inflectional features\nsd_base::Int64=4: the sd of base features\nsd_inflection::Int64=4: the sd of inflectional features\nseed::Int64=314: the random seed\nisdeep::Bool=true: if true, the mean of each feature is also randomized\nadd_noise::Bool=true: if true, add additional Gaussian noise\nsd_noise::Int64=1: the sd of the Gaussian noise\nnormalized::Bool=false: if true, most of the values range between -1 and 1; they may slightly exceed this range depending on the sd\n\nExamples\n\n# basic usage\nS_train = JudiLing.make_S_matrix(\n french,\n [\"Lexeme\"],\n [\"Tense\",\"Aspect\",\"Person\",\"Number\",\"Gender\",\"Class\",\"Mood\"],\n ncol=200)\n\n# deep mode\nS_train = JudiLing.make_S_matrix(\n ...\n sd_base_mean=1,\n sd_inflection_mean=1,\n isdeep=true,\n ...)\n\n# non-deep mode\nS_train = JudiLing.make_S_matrix(\n ...\n isdeep=false,\n ...)\n\n# add additional Gaussian noise\nS_train = JudiLing.make_S_matrix(\n ...\n add_noise=true,\n sd_noise=1,\n ...)\n\n# further control of means and standard deviations\nS_train = JudiLing.make_S_matrix(\n ...\n sd_base_mean=1,\n sd_inflection_mean=1,\n sd_base=4,\n sd_inflection=4,\n sd_noise=1,\n ...)\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_S_matrix-Tuple{DataFrames.DataFrame, DataFrames.DataFrame, Vector, Vector}","page":"Make Semantic Matrix","title":"JudiLing.make_S_matrix","text":"make_S_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector, inflections::Vector)\n\nCreate simulated semantic matrices for the training and validation datasets, given the input data, a vector specifying the context lexemes and a vector specifying the grammatical lexemes. 
The semantic vector of a word form is constructed by summing the semantic vectors of its context and grammatical lexemes.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\nbase::Vector: context lexemes\ninflections::Vector: grammatical lexemes\n\nOptional Arguments\n\nncol::Int64=200: dimension of semantic vectors, usually the same as that of cue vectors\nsd_base_mean::Int64=1: the sd mean of base features\nsd_inflection_mean::Int64=1: the sd mean of inflectional features\nsd_base::Int64=4: the sd of base features\nsd_inflection::Int64=4: the sd of inflectional features\nseed::Int64=314: the random seed\nisdeep::Bool=true: if true, the mean of each feature is also randomized\nadd_noise::Bool=true: if true, add additional Gaussian noise\nsd_noise::Int64=1: the sd of the Gaussian noise\nnormalized::Bool=false: if true, most of the values range between -1 and 1; they may slightly exceed this range depending on the sd\n\nExamples\n\n# basic usage\nS_train, S_val = JudiLing.make_S_matrix(\n french,\n french_val,\n [\"Lexeme\"],\n [\"Tense\",\"Aspect\",\"Person\",\"Number\",\"Gender\",\"Class\",\"Mood\"],\n ncol=200)\n\n# deep mode\nS_train, S_val = JudiLing.make_S_matrix(\n ...\n sd_base_mean=1,\n sd_inflection_mean=1,\n isdeep=true,\n ...)\n\n# non-deep mode\nS_train, S_val = JudiLing.make_S_matrix(\n ...\n isdeep=false,\n ...)\n\n# add additional Gaussian noise\nS_train, S_val = JudiLing.make_S_matrix(\n ...\n add_noise=true,\n sd_noise=1,\n ...)\n\n# further control of means and standard deviations\nS_train, S_val = JudiLing.make_S_matrix(\n ...\n sd_base_mean=1,\n sd_inflection_mean=1,\n sd_base=4,\n sd_inflection=4,\n sd_noise=1,\n ...)\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_S_matrix-Tuple{DataFrames.DataFrame, Vector}","page":"Make Semantic Matrix","title":"JudiLing.make_S_matrix","text":"make_S_matrix(data::DataFrame, base::Vector)\n\nCreate a simulated semantic matrix for the training dataset with only base features, given the input data and a vector specifying the context lexemes. 
The semantic vector of a word form is constructed by summing the semantic vectors of its context lexemes.\n\nObligatory Arguments\n\ndata::DataFrame: the dataset\nbase::Vector: context lexemes\n\nOptional Arguments\n\nncol::Int64=200: dimension of semantic vectors, usually the same as that of cue vectors\nsd_base_mean::Int64=1: the sd mean of base features\nsd_base::Int64=4: the sd of base features\nseed::Int64=314: the random seed\nisdeep::Bool=true: if true, the mean of each feature is also randomized\nadd_noise::Bool=true: if true, add additional Gaussian noise\nsd_noise::Int64=1: the sd of the Gaussian noise\nnormalized::Bool=false: if true, most of the values range between -1 and 1; they may slightly exceed this range depending on the sd\n\nExamples\n\n# basic usage\nS_train = JudiLing.make_S_matrix(\n french,\n [\"Lexeme\"],\n ncol=200)\n\n# deep mode\nS_train = JudiLing.make_S_matrix(\n ...\n sd_base_mean=1,\n sd_inflection_mean=1,\n isdeep=true,\n ...)\n\n# non-deep mode\nS_train = JudiLing.make_S_matrix(\n ...\n isdeep=false,\n ...)\n\n# add additional Gaussian noise\nS_train = JudiLing.make_S_matrix(\n ...\n add_noise=true,\n sd_noise=1,\n ...)\n\n# further control of means and standard deviations\nS_train = JudiLing.make_S_matrix(\n ...\n sd_base_mean=1,\n sd_inflection_mean=1,\n sd_base=4,\n sd_inflection=4,\n sd_noise=1,\n ...)\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_S_matrix-Tuple{DataFrames.DataFrame, DataFrames.DataFrame, Vector}","page":"Make Semantic Matrix","title":"JudiLing.make_S_matrix","text":"make_S_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector)\n\nCreate simulated semantic matrices for the training and validation datasets with only base features, given the input data and a vector specifying the context lexemes. 
The semantic vector of a word form is constructed by summing the semantic vectors of its context lexemes.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\nbase::Vector: context lexemes\n\nOptional Arguments\n\nncol::Int64=200: dimension of semantic vectors, usually the same as that of cue vectors\nsd_base_mean::Int64=1: the sd mean of base features\nsd_base::Int64=4: the sd of base features\nseed::Int64=314: the random seed\nisdeep::Bool=true: if true, the mean of each feature is also randomized\nadd_noise::Bool=true: if true, add additional Gaussian noise\nsd_noise::Int64=1: the sd of the Gaussian noise\nnormalized::Bool=false: if true, most of the values range between -1 and 1; they may slightly exceed this range depending on the sd\n\nExamples\n\n# basic usage\nS_train, S_val = JudiLing.make_S_matrix(\n french,\n french_val,\n [\"Lexeme\"],\n ncol=200)\n\n# deep mode\nS_train, S_val = JudiLing.make_S_matrix(\n ...\n sd_base_mean=1,\n sd_inflection_mean=1,\n isdeep=true,\n ...)\n\n# non-deep mode\nS_train, S_val = JudiLing.make_S_matrix(\n ...\n isdeep=false,\n ...)\n\n# add additional Gaussian noise\nS_train, S_val = JudiLing.make_S_matrix(\n ...\n add_noise=true,\n sd_noise=1,\n ...)\n\n# further control of means and standard deviations\nS_train, S_val = JudiLing.make_S_matrix(\n ...\n sd_base_mean=1,\n sd_inflection_mean=1,\n sd_base=4,\n sd_inflection=4,\n sd_noise=1,\n ...)\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_S_matrix-Tuple{DataFrames.DataFrame, Vector, Vector, JudiLing.L_Matrix_Struct}","page":"Make Semantic Matrix","title":"JudiLing.make_S_matrix","text":"make_S_matrix(data_train::DataFrame, base::Vector, inflections::Vector, L::L_Matrix_Struct)\n\nCreate a simulated semantic matrix where a lexome matrix is available.\n\nObligatory Arguments\n\ndata_train::DataFrame: the dataset\nbase::Vector: context lexemes\ninflections::Vector: grammatical lexemes\nL::L_Matrix_Struct: the lexome matrix\n\nOptional Arguments\n\nadd_noise::Bool=true: if true, add additional Gaussian noise\nsd_noise::Int64=1: the sd of the Gaussian noise\nnormalized::Bool=false: if true, most of the values range between -1 and 1; they may slightly exceed this range depending on the sd\n\nExamples\n\n# basic usage\nS1 = JudiLing.make_S_matrix(\n latin,\n [\"Lexeme\"],\n [\"Person\",\"Number\",\"Tense\",\"Voice\",\"Mood\"],\n L1,\n add_noise=true,\n sd_noise=1,\n normalized=false\n )\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_S_matrix-Tuple{DataFrames.DataFrame, Union{Nothing, DataFrames.DataFrame}, Vector, JudiLing.L_Matrix_Struct}","page":"Make Semantic Matrix","title":"JudiLing.make_S_matrix","text":"make_S_matrix(data_train::DataFrame, data_val::Union{DataFrame, Nothing}, base::Vector, L::L_Matrix_Struct)\n\nCreate simulated semantic matrices where a lexome matrix is available.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\nbase::Vector: context lexemes\nL::L_Matrix_Struct: the lexome matrix\n\nOptional Arguments\n\nadd_noise::Bool=true: if true, add additional Gaussian noise\nsd_noise::Int64=1: the sd of the Gaussian noise\nnormalized::Bool=false: if true, most of the values range between -1 and 1; they may slightly exceed this range depending on the sd\n\nExamples\n\n# basic usage\nS1, S2 = JudiLing.make_S_matrix(\n latin,\n latin_val,\n [\"Lexeme\"],\n L1,\n add_noise=true,\n sd_noise=1,\n 
normalized=false\n )\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_S_matrix-Tuple{DataFrames.DataFrame, Vector, JudiLing.L_Matrix_Struct}","page":"Make Semantic Matrix","title":"JudiLing.make_S_matrix","text":"make_S_matrix(data::DataFrame, base::Vector, L::L_Matrix_Struct)\n\nCreate a simulated semantic matrix where a lexome matrix is available.\n\nObligatory Arguments\n\ndata::DataFrame: the dataset\nbase::Vector: context lexemes\nL::L_Matrix_Struct: the lexome matrix\n\nOptional Arguments\n\nadd_noise::Bool=true: if true, add additional Gaussian noise\nsd_noise::Int64=1: the sd of the Gaussian noise\nnormalized::Bool=false: if true, most of the values range between -1 and 1; they may slightly exceed this range depending on the sd\n\nExamples\n\n# basic usage\nS1 = JudiLing.make_S_matrix(\n latin,\n [\"Lexeme\"],\n L1,\n add_noise=true,\n sd_noise=1,\n normalized=false\n )\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_S_matrix-Tuple{DataFrames.DataFrame, DataFrames.DataFrame, Vector, Vector, JudiLing.L_Matrix_Struct}","page":"Make Semantic Matrix","title":"JudiLing.make_S_matrix","text":"make_S_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector, inflections::Vector, L::L_Matrix_Struct)\n\nCreate simulated semantic matrices where a lexome matrix is available.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\nbase::Vector: context lexemes\ninflections::Vector: grammatical lexemes\nL::L_Matrix_Struct: the lexome matrix\n\nOptional Arguments\n\nadd_noise::Bool=true: if true, add additional Gaussian noise\nsd_noise::Int64=1: the sd of the Gaussian noise\nnormalized::Bool=false: if true, most of the values range between -1 and 1; they may slightly exceed this range depending on the sd\n\nExamples\n\n# basic usage\nS1, S2 = JudiLing.make_S_matrix(\n latin,\n latin_val,\n [\"Lexeme\"],\n [\"Person\",\"Number\",\"Tense\",\"Voice\",\"Mood\"],\n L1,\n add_noise=true,\n sd_noise=1,\n normalized=false\n )\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_L_matrix-Tuple{DataFrames.DataFrame, Vector}","page":"Make Semantic Matrix","title":"JudiLing.make_L_matrix","text":"make_L_matrix(data::DataFrame, base::Vector)\n\nCreate a Lexome Matrix with simulated semantic vectors where there are only base features.\n\nObligatory Arguments\n\ndata::DataFrame: the dataset\nbase::Vector: context lexemes\n\nOptional Arguments\n\nncol::Int64=200: dimension of semantic vectors, usually the same as that of cue vectors\nsd_base_mean::Int64=1: the sd mean of base features\nsd_base::Int64=4: the sd of base features\nseed::Int64=314: the random seed\nisdeep::Bool=true: if true, the mean of each feature is also randomized\n\nExamples\n\n# basic usage\nL = JudiLing.make_L_matrix(\n latin,\n [\"Lexeme\"],\n ncol=200)\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_combined_S_matrix-Tuple{DataFrames.DataFrame, DataFrames.DataFrame, Vector, Vector, JudiLing.L_Matrix_Struct}","page":"Make Semantic Matrix","title":"JudiLing.make_combined_S_matrix","text":"make_combined_S_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector, inflections::Vector, L::L_Matrix_Struct)\n\nCreate simulated semantic matrices for the training and validation datasets with an existing Lexome matrix, where features are combined from both the training and validation datasets.\n\nObligatory 
Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\nbase::Vector: context lexemes\ninflections::Vector: grammatical lexemes\nL::L_Matrix_Struct: the lexome matrix\n\nOptional Arguments\n\nadd_noise::Bool=true: if true, add additional Gaussian noise\nsd_noise::Int64=1: the sd of the Gaussian noise\nnormalized::Bool=false: if true, most of the values range between -1 and 1; they may slightly exceed -1 or 1 depending on the sd\n\nExamples\n\n# basic usage\nS_train, S_val = JudiLing.make_combined_S_matrix(\n    latin_train,\n    latin_val,\n    [\"Lexeme\"],\n    [\"Person\",\"Number\",\"Tense\",\"Voice\",\"Mood\"],\n    L)\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_combined_S_matrix-Tuple{DataFrames.DataFrame, Union{Nothing, DataFrames.DataFrame}, Vector, JudiLing.L_Matrix_Struct}","page":"Make Semantic Matrix","title":"JudiLing.make_combined_S_matrix","text":"make_combined_S_matrix(data_train::DataFrame, data_val::Union{DataFrame, Nothing}, base::Vector, L::L_Matrix_Struct)\n\nCreate simulated semantic matrices for the training and validation datasets from an existing lexome matrix, where features are combined from both the training and validation datasets.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\nbase::Vector: context lexemes\nL::L_Matrix_Struct: the lexome matrix\n\nOptional Arguments\n\nadd_noise::Bool=true: if true, add additional Gaussian noise\nsd_noise::Int64=1: the sd of the Gaussian noise\nnormalized::Bool=false: if true, most of the values range between -1 and 1; they may slightly exceed -1 or 1 depending on the sd\n\nExamples\n\n# basic usage\nS_train, S_val = JudiLing.make_combined_S_matrix(\n    latin_train,\n    latin_val,\n    [\"Lexeme\"],\n    [\"Person\",\"Number\",\"Tense\",\"Voice\",\"Mood\"],\n    L)\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_combined_S_matrix-Tuple{DataFrames.DataFrame, DataFrames.DataFrame, Vector, Vector}","page":"Make Semantic Matrix","title":"JudiLing.make_combined_S_matrix","text":"make_combined_S_matrix( data_train::DataFrame, data_val::DataFrame, base::Vector, inflections::Vector)\n\nCreate simulated semantic matrices for the training and validation datasets, where features are combined from both the training and validation datasets.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\nbase::Vector: context lexemes\ninflections::Vector: grammatical lexemes\n\nOptional Arguments\n\nncol::Int64=200: dimension of semantic vectors, usually the same as that of cue vectors\nsd_base_mean::Int64=1: the sd of the means of base features\nsd_inflection_mean::Int64=1: the sd of the means of inflectional features\nsd_base::Int64=4: the sd of base features\nsd_inflection::Int64=4: the sd of inflectional features\nseed::Int64=314: the random seed\nisdeep::Bool=true: if true, the mean of each feature is also randomized\nadd_noise::Bool=true: if true, add additional Gaussian noise\nsd_noise::Int64=1: the sd of the Gaussian noise\nnormalized::Bool=false: if true, most of the values range between -1 and 1; they may slightly exceed -1 or 1 depending on the sd\n\nExamples\n\n# basic usage\nS_train, S_val = JudiLing.make_combined_S_matrix(\n    latin_train,\n    latin_val,\n    [\"Lexeme\"],\n    [\"Person\",\"Number\",\"Tense\",\"Voice\",\"Mood\"],\n    
ncol=n_features)\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_combined_S_matrix-Tuple{DataFrames.DataFrame, DataFrames.DataFrame, Vector}","page":"Make Semantic Matrix","title":"JudiLing.make_combined_S_matrix","text":"make_combined_S_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector)\n\nCreate simulated semantic matrices for the training and validation datasets, where features are combined from both the training and validation datasets.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\nbase::Vector: context lexemes\n\nOptional Arguments\n\nncol::Int64=200: dimension of semantic vectors, usually the same as that of cue vectors\nsd_base_mean::Int64=1: the sd of the means of base features\nsd_inflection_mean::Int64=1: the sd of the means of inflectional features\nsd_base::Int64=4: the sd of base features\nsd_inflection::Int64=4: the sd of inflectional features\nseed::Int64=314: the random seed\nisdeep::Bool=true: if true, the mean of each feature is also randomized\nadd_noise::Bool=true: if true, add additional Gaussian noise\nsd_noise::Int64=1: the sd of the Gaussian noise\nnormalized::Bool=false: if true, most of the values range between -1 and 1; they may slightly exceed -1 or 1 depending on the sd\n\nExamples\n\n# basic usage\nS_train, S_val = JudiLing.make_combined_S_matrix(\n    latin_train,\n    latin_val,\n    [\"Lexeme\"],\n    [\"Person\",\"Number\",\"Tense\",\"Voice\",\"Mood\"],\n    ncol=n_features)\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_combined_L_matrix-Tuple{DataFrames.DataFrame, DataFrames.DataFrame, Vector, Vector}","page":"Make Semantic Matrix","title":"JudiLing.make_combined_L_matrix","text":"make_combined_L_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector, inflections::Vector)\n\nCreate a lexome matrix with simulated semantic vectors, where features are combined from both the training and validation datasets.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\nbase::Vector: context lexemes\ninflections::Vector: grammatical lexemes\n\nOptional Arguments\n\nncol::Int64=200: dimension of semantic vectors, usually the same as that of cue vectors\nsd_base_mean::Int64=1: the sd of the means of base features\nsd_inflection_mean::Int64=1: the sd of the means of inflectional features\nsd_base::Int64=4: the sd of base features\nsd_inflection::Int64=4: the sd of inflectional features\nseed::Int64=314: the random seed\nisdeep::Bool=true: if true, the mean of each feature is also randomized\n\nExamples\n\n# basic usage\nL = JudiLing.make_combined_L_matrix(\n    latin_train,\n    latin_val,\n    [\"Lexeme\"],\n    [\"Person\",\"Number\",\"Tense\",\"Voice\",\"Mood\"],\n    ncol=n_features)\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_combined_L_matrix-Tuple{DataFrames.DataFrame, DataFrames.DataFrame, Vector}","page":"Make Semantic Matrix","title":"JudiLing.make_combined_L_matrix","text":"make_combined_L_matrix(data_train::DataFrame, data_val::DataFrame, base::Vector)\n\nCreate a lexome matrix with simulated semantic vectors, where features are combined from both the training and validation datasets.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\nbase::Vector: context lexemes\n\nOptional Arguments\n\nncol::Int64=200: dimension of semantic vectors, usually the same as that of cue 
vectors\nsd_base_mean::Int64=1: the sd of the means of base features\nsd_inflection_mean::Int64=1: the sd of the means of inflectional features\nsd_base::Int64=4: the sd of base features\nsd_inflection::Int64=4: the sd of inflectional features\nseed::Int64=314: the random seed\nisdeep::Bool=true: if true, the mean of each feature is also randomized\n\nExamples\n\n# basic usage\nL = JudiLing.make_combined_L_matrix(\n    latin_train,\n    latin_val,\n    [\"Lexeme\"],\n    ncol=n_features)\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.L_Matrix_Struct-NTuple{12, Any}","page":"Make Semantic Matrix","title":"JudiLing.L_Matrix_Struct","text":"L_Matrix_Struct(L, sd_base, sd_base_mean, sd_inflection, sd_inflection_mean, base_f, infl_f, base_f2i, infl_f2i, n_base_f, n_infl_f, ncol)\n\nConstruct L_Matrix_Struct with deep mode.\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.L_Matrix_Struct-NTuple{10, Any}","page":"Make Semantic Matrix","title":"JudiLing.L_Matrix_Struct","text":"L_Matrix_Struct(L, sd_base, sd_inflection, base_f, infl_f, base_f2i, infl_f2i, n_base_f, n_infl_f, ncol)\n\nConstruct L_Matrix_Struct without deep mode.\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#Load-from-word2vec,-fasttext-or-similar","page":"Make Semantic Matrix","title":"Load from word2vec, fasttext or similar","text":"","category":"section"},{"location":"man/make_semantic_matrix/","page":"Make Semantic Matrix","title":"Make Semantic Matrix","text":"load_S_matrix_from_fasttext(data::DataFrame,\n                            language::Symbol;\n                            target_col=:Word,\n                            default_file::Int=1)\n load_S_matrix_from_fasttext(data_train::DataFrame,\n                            data_val::DataFrame,\n                            language::Symbol;\n                            target_col=:Word,\n                            default_file::Int=1)\n load_S_matrix_from_word2vec_file(data::DataFrame,\n                            filepath::String;\n                            target_col=:Word)\n load_S_matrix_from_word2vec_file(data_train::DataFrame,\n                            data_val::DataFrame,\n                            filepath::String;\n                            target_col=:Word)\n load_S_matrix_from_fasttext_file(data::DataFrame,\n                            filepath::String;\n                            target_col=:Word)\n load_S_matrix_from_fasttext_file(data_train::DataFrame,\n                            data_val::DataFrame,\n                            filepath::String;\n                            target_col=:Word)","category":"page"},{"location":"man/make_semantic_matrix/#JudiLing.load_S_matrix_from_fasttext-Tuple{DataFrames.DataFrame, Symbol}","page":"Make Semantic Matrix","title":"JudiLing.load_S_matrix_from_fasttext","text":"load_S_matrix_from_fasttext(data::DataFrame,\n                            language::Symbol;\n                            target_col=:Word,\n                            default_file::Int=1)\n\nLoad semantic matrix from fasttext, loaded using the Embeddings.jl package. Subset fasttext vectors to include only words in target_col of data, and subset data to only include words in target_col for which a semantic vector is available.\n\nThe last parameter, default_file, specifies which vectors are loaded. To learn about all available vectors, use the following commands:\n\nusing Embeddings\nlanguage_files(FastText_Text{:nl})\n\nreplacing the language code (here :nl) with the language you are interested in. In general, for all languages other than English, these files are available:\n\ndefault_file=1 loads from https://fasttext.cc/docs/en/crawl-vectors.html, paper: E. Grave, P. Bojanowski, P. Gupta, A. Joulin, T. Mikolov, Learning Word Vectors for 157 Languages. License: CC BY-SA 3.0 https://creativecommons.org/licenses/by-sa/3.0/\ndefault_file=2 loads from https://fasttext.cc/docs/en/pretrained-vectors.html, paper: P. Bojanowski, E. Grave, A. Joulin, T. 
Mikolov, Enriching Word Vectors with Subword Information. License: CC BY-SA 3.0 https://creativecommons.org/licenses/by-sa/3.0/\n\nObligatory Arguments\n\ndata::DataFrame: the dataset\nlanguage::Symbol: the language of the words in the dataset, officially ISO 639-2 (see https://github.com/JuliaText/Embeddings.jl/issues/34#issuecomment-782604523), but in practice it behaves more like ISO 639-1, with ISO 639-2 only being used if ISO 639-1 isn't available (see https://en.wikipedia.org/wiki/List_of_ISO_639-2_codes)\n\nOptional Arguments\n\ntarget_col=:Word: column with orthographic representation of words in data\ndefault_file::Int=1: source of vectors, for more information see above and here: https://github.com/JuliaText/Embeddings.jl#loading-different-embeddings\n\nExamples\n\n# basic usage\nlatin_small, S = JudiLing.load_S_matrix_from_fasttext(latin, :la, target_col=:Word)\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.load_S_matrix_from_fasttext-Tuple{DataFrames.DataFrame, DataFrames.DataFrame, Symbol}","page":"Make Semantic Matrix","title":"JudiLing.load_S_matrix_from_fasttext","text":"load_S_matrix_from_fasttext(data_train::DataFrame,\n                            data_val::DataFrame,\n                            language::Symbol;\n                            target_col=:Word,\n                            default_file::Int=1)\n\nLoad semantic matrix from fasttext, loaded using the Embeddings.jl package. Subset fasttext vectors to include only words in target_col of data_train and data_val, and subset the data to only include words in target_col for which a semantic vector is available. Returns the subsetted train and val data and the train and val semantic matrices.\n\nThe last parameter, default_file, specifies which vectors are loaded. To learn about all available vectors, use the following commands:\n\nusing Embeddings\nlanguage_files(FastText_Text{:nl})\n\nreplacing the language code (here :nl) with the language you are interested in. In general, for all languages other than English, these files are available:\n\ndefault_file=1 loads from https://fasttext.cc/docs/en/crawl-vectors.html, paper: E. Grave, P. Bojanowski, P. Gupta, A. Joulin, T. Mikolov, Learning Word Vectors for 157 Languages. License: CC BY-SA 3.0 https://creativecommons.org/licenses/by-sa/3.0/\ndefault_file=2 loads from https://fasttext.cc/docs/en/pretrained-vectors.html, paper: P. Bojanowski, E. Grave, A. Joulin, T. 
Mikolov, Enriching Word Vectors with Subword Information. License: CC BY-SA 3.0 https://creativecommons.org/licenses/by-sa/3.0/\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\nlanguage::Symbol: the language of the words in the dataset, officially ISO 639-2 (see https://github.com/JuliaText/Embeddings.jl/issues/34#issuecomment-782604523), but in practice it behaves more like ISO 639-1, with ISO 639-2 only being used if ISO 639-1 isn't available (see https://en.wikipedia.org/wiki/List_of_ISO_639-2_codes)\n\nOptional Arguments\n\ntarget_col=:Word: column with orthographic representation of words in data\ndefault_file::Int=1: source of vectors, for more information see above and here: https://github.com/JuliaText/Embeddings.jl#loading-different-embeddings\n\nExamples\n\n# basic usage\nlatin_small_train, latin_small_val, S_train, S_val = JudiLing.load_S_matrix_from_fasttext(latin_train,\n        latin_val,\n        :la,\n        target_col=:Word)\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.load_S_matrix_from_word2vec_file-Tuple{DataFrames.DataFrame, String}","page":"Make Semantic Matrix","title":"JudiLing.load_S_matrix_from_word2vec_file","text":"load_S_matrix_from_word2vec_file(data::DataFrame,\n                            filepath::String;\n                            target_col=:Word)\n\nLoad semantic matrix from word2vec filepath. Subset word2vec vectors to include only words in target_col of data, and subset data to only include words in target_col for which a semantic vector is available. Returns the subsetted data and semantic matrix.\n\nObligatory Arguments\n\ndata::DataFrame: the dataset\nfilepath::String: path to file with word2vec vectors in .txt (not compressed in any way)\n\nOptional Arguments\n\ntarget_col=:Word: column with orthographic representation of words in data\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.load_S_matrix_from_word2vec_file-Tuple{DataFrames.DataFrame, DataFrames.DataFrame, String}","page":"Make Semantic Matrix","title":"JudiLing.load_S_matrix_from_word2vec_file","text":"load_S_matrix_from_word2vec_file(data_train::DataFrame,\n                            data_val::DataFrame,\n                            filepath::String;\n                            target_col=:Word)\n\nLoad semantic matrix from word2vec filepath. Subset word2vec vectors to include only words in target_col of data_train and data_val, and subset the data to only include words in target_col for which a semantic vector is available. Returns the subsetted train and val data and the train and val semantic matrices.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\nfilepath::String: path to file with word2vec vectors in .txt (not compressed in any way)\n\nOptional Arguments\n\ntarget_col=:Word: column with orthographic representation of words in data\n\n\n\n\n\n","category":"method"},
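All of the file-based loaders above follow the same pattern: they drop dataset rows without a vector and drop vectors without a dataset row, so the returned objects stay row-aligned. A minimal hedged sketch of that round trip; the CSV path, the vector file embeddings/la_vectors.txt and the :Word column are placeholders, not files shipped with JudiLing:

```julia
using JudiLing, CSV, DataFrames

# hypothetical inputs; substitute your own dataset and (uncompressed) vector file
latin = DataFrame(CSV.File(joinpath("data", "latin.csv")))

# returns the dataset restricted to words that have a vector, plus the
# matching semantic matrix (row i of S belongs to row i of latin_small)
latin_small, S = JudiLing.load_S_matrix_from_word2vec_file(
    latin,
    joinpath("embeddings", "la_vectors.txt"),
    target_col = :Word,
)

@assert size(S, 1) == nrow(latin_small)  # one semantic vector per remaining row
```

The train/val variants behave the same way but subset both datasets jointly, so the training and validation rows remain aligned with their respective matrices.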
{"location":"man/make_semantic_matrix/#JudiLing.load_S_matrix_from_fasttext_file-Tuple{DataFrames.DataFrame, String}","page":"Make Semantic Matrix","title":"JudiLing.load_S_matrix_from_fasttext_file","text":"load_S_matrix_from_fasttext_file(data::DataFrame,\n                            filepath::String;\n                            target_col=:Word)\n\nLoad semantic matrix from fasttext filepath. Subset fasttext vectors to include only words in target_col of data, and subset data to only include words in target_col for which a semantic vector is available. Returns the subsetted data and semantic matrix.\n\nObligatory Arguments\n\ndata::DataFrame: the dataset\nfilepath::String: path to file with fasttext vectors in .txt or .vec (not compressed in any way)\n\nOptional Arguments\n\ntarget_col=:Word: column with orthographic representation of words in data\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.load_S_matrix_from_fasttext_file-Tuple{DataFrames.DataFrame, DataFrames.DataFrame, String}","page":"Make Semantic Matrix","title":"JudiLing.load_S_matrix_from_fasttext_file","text":"load_S_matrix_from_fasttext_file(data_train::DataFrame,\n                            data_val::DataFrame,\n                            filepath::String;\n                            target_col=:Word)\n\nLoad semantic matrix from fasttext filepath. Subset fasttext vectors to include only words in target_col of data_train and data_val, and subset the data to only include words in target_col for which a semantic vector is available. Returns the subsetted train and val data and the train and val semantic matrices.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\nfilepath::String: path to file with fasttext vectors in .txt (not compressed in any way)\n\nOptional Arguments\n\ntarget_col=:Word: column with orthographic representation of words in data\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#Utility-functions","page":"Make Semantic Matrix","title":"Utility functions","text":"","category":"section"},{"location":"man/make_semantic_matrix/","page":"Make Semantic Matrix","title":"Make Semantic Matrix","text":" process_features(data, feature_cols)\n comp_f_M!(L, sd, sd_mean, n_f, ncol, n_b)\n comp_f_M!(L, sd, n_f, ncol, n_b)\n merge_f2i(base_f2i, infl_f2i, n_base_f, n_infl_f)\n lexome_sum(L, features)\n make_St(L, n, data, base, inflections)\n make_St(L, n, data, base)\n add_St_noise!(St, sd_noise)\n normalize_St!(St, n_base, n_infl)\n normalize_St!(St, n_base)","category":"page"},{"location":"man/make_semantic_matrix/#JudiLing.process_features-Tuple{Any, Any}","page":"Make Semantic Matrix","title":"JudiLing.process_features","text":"process_features(data, feature_cols)\n\nCollect all features given datasets and feature column names.\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.comp_f_M!-NTuple{6, Any}","page":"Make Semantic Matrix","title":"JudiLing.comp_f_M!","text":"comp_f_M!(L, sd, sd_mean, n_f, ncol, n_b)\n\nCompose the feature matrix with deep mode.\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.comp_f_M!-NTuple{5, Any}","page":"Make Semantic Matrix","title":"JudiLing.comp_f_M!","text":"comp_f_M!(L, sd, n_f, ncol, n_b)\n\nCompose the feature matrix without deep mode.\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.merge_f2i-NTuple{4, Any}","page":"Make Semantic Matrix","title":"JudiLing.merge_f2i","text":"merge_f2i(base_f2i, infl_f2i, n_base_f, n_infl_f)\n\nMerge the base f2i dictionary and the inflectional f2i dictionary.\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.lexome_sum-Tuple{Any, Any}","page":"Make Semantic Matrix","title":"JudiLing.lexome_sum","text":"lexome_sum(L, features)\n\nSum up the semantic vector, given a lexome vector.\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_St-NTuple{5, Any}","page":"Make Semantic Matrix","title":"JudiLing.make_St","text":"make_St(L, n, data, base, inflections)\n\nMake the S transpose matrix with 
inflections.\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.make_St-NTuple{4, Any}","page":"Make Semantic Matrix","title":"JudiLing.make_St","text":"make_St(L, n, data, base)\n\nMake the S transpose matrix without inflections.\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.add_St_noise!-Tuple{Any, Any}","page":"Make Semantic Matrix","title":"JudiLing.add_St_noise!","text":"add_St_noise!(St, sd_noise)\n\nAdd Gaussian noise to the S transpose matrix.\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.normalize_St!-Tuple{Any, Any, Any}","page":"Make Semantic Matrix","title":"JudiLing.normalize_St!","text":"normalize_St!(St, n_base, n_infl)\n\nNormalize the S transpose matrix with inflections.\n\n\n\n\n\n","category":"method"},{"location":"man/make_semantic_matrix/#JudiLing.normalize_St!-Tuple{Any, Any}","page":"Make Semantic Matrix","title":"JudiLing.normalize_St!","text":"normalize_St!(St, n_base)\n\nNormalize the S transpose matrix without inflections.\n\n\n\n\n\n","category":"method"},{"location":"man/eval/","page":"Evaluation","title":"Evaluation","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/eval/#Evaluation","page":"Evaluation","title":"Evaluation","text":"","category":"section"},{"location":"man/eval/","page":"Evaluation","title":"Evaluation","text":" Comp_Acc_Struct\n eval_SC\n eval_SC_loose\n accuracy_comprehension(S, Shat, data)\n accuracy_comprehension(\n    S_val,\n    S_train,\n    Shat_val,\n    data_val,\n    data_train;\n    target_col = :Words,\n    base = nothing,\n    inflections = nothing,\n )\n eval_SC(SChat::AbstractArray, SC::AbstractArray)\n eval_SC(SChat::AbstractArray, SC::AbstractArray, SC_rest::AbstractArray)\n eval_SC(SChat::AbstractArray, SC::AbstractArray, data::DataFrame, target_col::Union{String, Symbol})\n eval_SC(SChat::AbstractArray, SC::AbstractArray, SC_rest::AbstractArray, data::DataFrame, data_rest::DataFrame, target_col::Union{String, Symbol})\n eval_SC(SChat::AbstractArray, SC::AbstractArray, batch_size::Int64)\n eval_SC(SChat::AbstractArray, SC::AbstractArray, data::DataFrame, target_col::Union{String, Symbol}, batch_size::Int64)\n eval_SC_loose(SChat, SC, k)\n eval_SC_loose(SChat, SC, k, data, target_col)\n eval_manual(res, data, i2f)\n eval_acc(res, gold_inds::Array)\n eval_acc(res, cue_obj::Cue_Matrix_Struct)\n eval_acc_loose(res, gold_inds)\n extract_gpi(gpi, threshold=0.1, tolerance=(-1000.0))","category":"page"},{"location":"man/eval/#JudiLing.Comp_Acc_Struct","page":"Evaluation","title":"JudiLing.Comp_Acc_Struct","text":"A structure that stores information about comprehension accuracy.\n\n\n\n\n\n","category":"type"},{"location":"man/eval/#JudiLing.eval_SC","page":"Evaluation","title":"JudiLing.eval_SC","text":"Assess model accuracy on the basis of the correlations of row vectors of Chat and C or Shat and S. Ideally the target words have the highest correlations on the diagonal of the pertinent correlation matrices. A homophone-support option is implemented.\n\n\n\n\n\n","category":"function"},{"location":"man/eval/#JudiLing.eval_SC_loose","page":"Evaluation","title":"JudiLing.eval_SC_loose","text":"Assess model accuracy on the basis of the correlations of row vectors of Chat and C or Shat and S. Count it as correct if one of the top k candidates is correct. A homophone-support option is implemented.\n\n\n\n\n\n","category":"function"},
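The contrast between the strict and the loose evaluator is easiest to see on toy data. A hedged sketch with random matrices (names and sizes are arbitrary; both functions accept plain matrices, as per the method signatures documented below):

```julia
using JudiLing, Random

Random.seed!(314)
S    = randn(10, 20)              # toy gold-standard semantic matrix
Shat = S .+ 0.5 .* randn(10, 20)  # noisy "predicted" counterpart

acc_strict = JudiLing.eval_SC(Shat, S)          # correct only if the target ranks first
acc_top3   = JudiLing.eval_SC_loose(Shat, S, 3) # correct if the target is in the top 3

# barring homophone edge cases (see the notes below), acc_strict <= acc_top3
@show acc_strict acc_top3
```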
{"location":"man/eval/#JudiLing.accuracy_comprehension-Tuple{Any, Any, Any}","page":"Evaluation","title":"JudiLing.accuracy_comprehension","text":"accuracy_comprehension(S, Shat, data)\n\nEvaluate comprehension accuracy for training data.\n\nnote: Note\nIn case of homophones/homographs in the dataset, the correct/incorrect values for base and inflections may be misleading! See below for more information.\n\nObligatory Arguments\n\nS::Matrix: the (gold standard) S matrix\nShat::Matrix: the (predicted) Shat matrix\ndata::DataFrame: the dataset\n\nOptional Arguments\n\ntarget_col::Union{String, Symbol}=:Words: the column name for target strings\nbase::Vector=nothing: base features (typically a lexeme)\ninflections::Union{Nothing, Vector}=nothing: other features (typically inflectional features)\n\nExamples\n\naccuracy_comprehension(\n    S_train,\n    Shat_train,\n    latin_train,\n    target_col=:Words,\n    base=[:Lexeme],\n    inflections=[:Person, :Number, :Tense, :Voice, :Mood]\n    )\n\nNote\n\nIn case of homophones/homographs in the dataset, the correct/incorrect values for base and inflections may be misleading! Consider the following example: The wordform \"Äpfel\" in German can be nominative plural, genitive plural and accusative plural. Let's assume we have a dataset in which \"Äpfel\" occurs in all three case/number combinations (i.e. there are homographs). If all these wordforms have the same semantic vectors (e.g. because they are derived from word2vec or fasttext, which typically have a single vector per unique wordform), the predicted semantic vector of the wordform \"Äpfel\" will be equally correlated with all three case/number combinations in the dataset. In such cases, while the algorithm in this function can unambiguously conclude that the correct surface form \"Äpfel\" was comprehended, which of the three possible rows is the correct one will be picked somewhat non-deterministically (see https://docs.julialang.org/en/v1/base/collections/#Base.argmax). It is thus possible that the algorithm will then use the genitive plural instead of the intended nominative plural as the ground truth, and will report that \"case\" was comprehended incorrectly.\n\n\n\n\n\n","category":"method"},{"location":"man/eval/#JudiLing.accuracy_comprehension-NTuple{5, Any}","page":"Evaluation","title":"JudiLing.accuracy_comprehension","text":"accuracy_comprehension(\n    S_val,\n    S_train,\n    Shat_val,\n    data_val,\n    data_train;\n    target_col = :Words,\n    base = nothing,\n    inflections = nothing,\n)\n\nEvaluate comprehension accuracy for validation data.\n\nnote: Note\nIn case of homophones/homographs in the dataset, the correct/incorrect values for base and inflections may be misleading! 
See below for more information.\n\nObligatory Arguments\n\nS_val::Matrix: the (gold standard) S matrix of the validation data\nS_train::Matrix: the (gold standard) S matrix of the training data\nShat_val::Matrix: the (predicted) Shat matrix of the validation data\ndata_val::DataFrame: the validation dataset\ndata_train::DataFrame: the training dataset\n\nOptional Arguments\n\ntarget_col::Union{String, Symbol}=:Words: the column name for target strings\nbase::Vector=nothing: base features (typically a lexeme)\ninflections::Union{Nothing, Vector}=nothing: other features (typically inflectional features)\n\nExamples\n\naccuracy_comprehension(\n    S_val,\n    S_train,\n    Shat_val,\n    latin_val,\n    latin_train,\n    target_col=:Words,\n    base=[:Lexeme],\n    inflections=[:Person, :Number, :Tense, :Voice, :Mood]\n    )\n\nNote\n\nIn case of homophones/homographs in the dataset, the correct/incorrect values for base and inflections may be misleading! Consider the following example: The wordform \"Äpfel\" in German can be nominative plural, genitive plural and accusative plural. Let's assume we have a dataset in which \"Äpfel\" occurs in all three case/number combinations (i.e. there are homographs). If all these wordforms have the same semantic vectors (e.g. because they are derived from word2vec or fasttext, which typically have a single vector per unique wordform), the predicted semantic vector of the wordform \"Äpfel\" will be equally correlated with all three case/number combinations in the dataset. In such cases, while the algorithm in this function can unambiguously conclude that the correct surface form \"Äpfel\" was comprehended, which of the three possible rows is the correct one will be picked somewhat non-deterministically (see https://docs.julialang.org/en/v1/base/collections/#Base.argmax). It is thus possible that the algorithm will then use the genitive plural instead of the intended nominative plural as the ground truth, and will report that \"case\" was comprehended incorrectly.\n\n\n\n\n\n","category":"method"},{"location":"man/eval/#JudiLing.eval_SC-Tuple{AbstractArray, AbstractArray}","page":"Evaluation","title":"JudiLing.eval_SC","text":"eval_SC(SChat::AbstractArray, SC::AbstractArray)\n\nAssess model accuracy on the basis of the correlations (or Euclidean distances or cosine similarities) of row vectors of Chat and C or Shat and S. Ideally the target words have the highest correlations (lowest distance/highest similarity) on the diagonal of the pertinent correlation (distance/similarity) matrices.\n\nIf freq is added, token-based accuracy is computed. Token-based accuracy weights accuracy values according to the words' frequencies, i.e. if a word has a frequency of 30 and overall there are 3000 tokens (the frequencies of all types sum to 3000), this word's accuracy will contribute 30/3000.\n\nnote: Note\nIf there are homophones/homographs in the dataset, this evaluation method may be misleading: the predicted vector will be equally correlated with the target vector of both words and the one on the diagonal will not necessarily be selected as the most correlated. 
In such cases, supplying the dataset and target_col is recommended, which enables taking homophones/homographs into account.\n\nObligatory Arguments\n\nSChat::Union{SparseMatrixCSC, Matrix}: the Chat or Shat matrix\nSC::Union{SparseMatrixCSC, Matrix}: the C or S matrix\n\nOptional Arguments\n\ndigits: the specified number of digits after the decimal place (or before if negative)\nR::Bool=false: if true, the pairwise correlation/distance/similarity matrix R is returned\nfreq::Union{Missing, Array{Int64, 1}, Array{Float64,1}}=missing: list of frequencies of the wordforms in X and Y\nmethod::Union{Symbol, String}=:correlation: method for computing similarities, one of {:correlation, :euclidean, :cosine}.\n\neval_SC(Chat_train, cue_obj_train.C)\neval_SC(Chat_val, cue_obj_val.C)\neval_SC(Shat_train, S_train)\neval_SC(Shat_val, S_val)\n\n\n\n\n\n","category":"method"},{"location":"man/eval/#JudiLing.eval_SC-Tuple{AbstractArray, AbstractArray, AbstractArray}","page":"Evaluation","title":"JudiLing.eval_SC","text":"eval_SC(SChat::AbstractArray, SC::AbstractArray, SC_rest::AbstractArray)\n\nAssess model accuracy on the basis of the correlations (or Euclidean distances or cosine similarities) of row vectors of Chat and C or Shat and S. Ideally the target words have the highest correlations (lowest distance/highest similarity) on the diagonal of the pertinent correlation (distance/similarity) matrices.\n\nIf freq is added, token-based accuracy is computed. Token-based accuracy weights accuracy values according to the words' frequencies, i.e. if a word has a frequency of 30 and overall there are 3000 tokens (the frequencies of all types sum to 3000), this word's accuracy will contribute 30/3000.\n\nnote: Note\nThe order is important. The first gold standard matrix has to correspond to the SChat matrix, as in eval_SC(Shat_train, S_train, S_val) or eval_SC(Shat_val, S_val, S_train)\n\nnote: Note\nIf there are homophones/homographs in the dataset, this evaluation method may be misleading: the predicted vector will be equally correlated with the target vector of both words and the one on the diagonal will not necessarily be selected as the most correlated. 
In such cases, supplying the dataset and target_col is recommended, which enables taking homophones/homographs into account.\n\nObligatory Arguments\n\nSChat::Union{SparseMatrixCSC, Matrix}: the Chat or Shat matrix\nSC::Union{SparseMatrixCSC, Matrix}: the training/validation C or S matrix\nSC_rest::Union{SparseMatrixCSC, Matrix}: the validation/training C or S matrix\n\nOptional Arguments\n\ndigits: the specified number of digits after the decimal place (or before if negative)\nR::Bool=false: if true, the pairwise correlation/distance/similarity matrix R is returned\nfreq::Union{Missing, Array{Int64, 1}, Array{Float64,1}}=missing: list of frequencies of the wordforms in X and Y\nmethod::Union{Symbol, String}=:correlation: method for computing similarities, one of {:correlation, :euclidean, :cosine}.\n\neval_SC(Chat_train, cue_obj_train.C, cue_obj_val.C)\neval_SC(Chat_val, cue_obj_val.C, cue_obj_train.C)\neval_SC(Shat_train, S_train, S_val)\neval_SC(Shat_val, S_val, S_train)\n\n\n\n\n\n","category":"method"},{"location":"man/eval/#JudiLing.eval_SC-Tuple{AbstractArray, AbstractArray, DataFrames.DataFrame, Union{String, Symbol}}","page":"Evaluation","title":"JudiLing.eval_SC","text":"eval_SC(SChat::AbstractArray, SC::AbstractArray, data::DataFrame, target_col::Union{String, Symbol})\n\nAssess model accuracy on the basis of the correlations (or Euclidean distances or cosine similarities) of row vectors of Chat and C or Shat and S. Ideally the target words have the highest correlations (lowest distance/highest similarity) on the diagonal of the pertinent correlation (distance/similarity) matrices. Supports homophones.\n\nIf freq is added, token-based accuracy is computed. Token-based accuracy weights accuracy values according to the words' frequencies, i.e. if a word has a frequency of 30 and overall there are 3000 tokens (the frequencies of all types sum to 3000), this word's accuracy will contribute 30/3000.\n\nObligatory Arguments\n\nSChat::Union{SparseMatrixCSC, Matrix}: the Chat or Shat matrix\nSC::Union{SparseMatrixCSC, Matrix}: the C or S matrix\ndata::DataFrame: the dataset\ntarget_col::Union{String, Symbol}: target column name\n\nOptional Arguments\n\ndigits: the specified number of digits after the decimal place (or before if negative)\nR::Bool=false: if true, the pairwise correlation/distance/similarity matrix R is returned\nfreq::Union{Missing, Array{Int64, 1}, Array{Float64,1}}=missing: list of frequencies of the wordforms in X and Y\nmethod::Union{Symbol, String}=:correlation: method for computing similarities, one of {:correlation, :euclidean, :cosine}.\n\neval_SC(Chat_train, cue_obj_train.C, latin, :Word)\neval_SC(Chat_val, cue_obj_val.C, latin, :Word)\neval_SC(Shat_train, S_train, latin, :Word)\neval_SC(Shat_val, S_val, latin, :Word)\n\n\n\n\n\n","category":"method"},
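To make the freq keyword concrete, a small hedged sketch; the frequencies are invented, and the weighting follows the 30/3000 description above:

```julia
using JudiLing, Random

Random.seed!(314)
S    = randn(6, 12)
Shat = S .+ 0.3 .* randn(6, 12)

# hypothetical token frequencies, one per row of S
freq = [30, 5, 5, 100, 10, 50]

acc_type  = JudiLing.eval_SC(Shat, S)               # every word counts equally
acc_token = JudiLing.eval_SC(Shat, S, freq = freq)  # word i weighted by freq[i]/sum(freq)
@show acc_type acc_token
```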
{"location":"man/eval/#JudiLing.eval_SC-Tuple{AbstractArray, AbstractArray, AbstractArray, DataFrames.DataFrame, DataFrames.DataFrame, Union{String, Symbol}}","page":"Evaluation","title":"JudiLing.eval_SC","text":"eval_SC(SChat::AbstractArray, SC::AbstractArray, SC_rest::AbstractArray, data::DataFrame, data_rest::DataFrame, target_col::Union{String, Symbol})\n\nAssess model accuracy on the basis of the correlations (or Euclidean distances or cosine similarities) of row vectors of Chat and C or Shat and S. Ideally the target words have the highest correlations (lowest distance/highest similarity) on the diagonal of the pertinent correlation (distance/similarity) matrices.\n\nIf freq is added, token-based accuracy is computed. Token-based accuracy weights accuracy values according to the words' frequencies, i.e. if a word has a frequency of 30 and overall there are 3000 tokens (the frequencies of all types sum to 3000), this word's accuracy will contribute 30/3000.\n\nnote: Note\nThe order is important. The first gold standard matrix has to correspond to the SChat matrix, as in eval_SC(Shat_train, S_train, S_val, latin, :Word) or eval_SC(Shat_val, S_val, S_train, latin, :Word)\n\nObligatory Arguments\n\nSChat::Union{SparseMatrixCSC, Matrix}: the Chat or Shat matrix\nSC::Union{SparseMatrixCSC, Matrix}: the training/validation C or S matrix\nSC_rest::Union{SparseMatrixCSC, Matrix}: the validation/training C or S matrix\ndata::DataFrame: the training/validation dataset\ndata_rest::DataFrame: the validation/training dataset\ntarget_col::Union{String, Symbol}: target column name\n\nOptional Arguments\n\ndigits: the specified number of digits after the decimal place (or before if negative)\nR::Bool=false: if true, the pairwise correlation/distance/similarity matrix R is returned\nfreq::Union{Missing, Array{Int64, 1}, Array{Float64,1}}=missing: list of frequencies of the wordforms in X and Y\nmethod::Union{Symbol, String}=:correlation: method for computing similarities, one of {:correlation, :euclidean, :cosine}.\n\neval_SC(Chat_train, cue_obj_train.C, cue_obj_val.C, latin, :Word)\neval_SC(Chat_val, cue_obj_val.C, cue_obj_train.C, latin, :Word)\neval_SC(Shat_train, S_train, S_val, latin, :Word)\neval_SC(Shat_val, S_val, S_train, latin, :Word)\n\n\n\n\n\n","category":"method"},{"location":"man/eval/#JudiLing.eval_SC-Tuple{AbstractArray, AbstractArray, Int64}","page":"Evaluation","title":"JudiLing.eval_SC","text":"eval_SC(SChat::AbstractArray, SC::AbstractArray, batch_size::Int64)\n\nAssess model accuracy on the basis of the correlations of row vectors of Chat and C or Shat and S. Ideally the target words have the highest correlations on the diagonal of the pertinent correlation matrices. For large datasets, pass batch_size to process the evaluation in chunks.\n\nnote: Note\nIf there are homophones/homographs in the dataset, this evaluation method may be misleading: the predicted vector will be equally correlated with the target vector of both words and the one on the diagonal will not necessarily be selected as the most correlated. In such cases, supplying the dataset and target_col is recommended, which enables taking homophones/homographs into account.\n\nnote: Note\nCurrently only available for correlation.\n\nObligatory Arguments\n\nSChat: the Chat or Shat matrix\nSC: the C or S matrix\nbatch_size: batch size\n\nOptional Arguments\n\ndigits: the specified number of digits after the decimal place (or before if negative)\nverbose::Bool=false: if true, more information is printed\n\neval_SC(Chat_train, cue_obj_train.C, 5000)\neval_SC(Chat_val, cue_obj_val.C, 5000)\neval_SC(Shat_train, S_train, 5000)\neval_SC(Shat_val, S_val, 5000)\n\n\n\n\n\n","category":"method"},{"location":"man/eval/#JudiLing.eval_SC-Tuple{AbstractArray, AbstractArray, DataFrames.DataFrame, Union{String, Symbol}, Int64}","page":"Evaluation","title":"JudiLing.eval_SC","text":"eval_SC(SChat::AbstractArray, SC::AbstractArray, data::DataFrame, target_col::Union{String, Symbol}, batch_size::Int64)\n\nAssess model accuracy on the basis of the correlations of row vectors of Chat and C or Shat and S. 
Ideally the target words have the highest correlations on the diagonal of the pertinent correlation matrices. For large datasets, pass batch_size to process the evaluation in chunks. Supports homophones.\n\nnote: Note\nCurrently only available for correlation.\n\nObligatory Arguments\n\nSChat::AbstractArray: the Chat or Shat matrix\nSC::AbstractArray: the C or S matrix\ndata::DataFrame: the dataset\ntarget_col::Union{String, Symbol}: target column name\nbatch_size::Int64: batch size\n\nOptional Arguments\n\ndigits: the specified number of digits after the decimal place (or before if negative)\nverbose::Bool=false: if true, more information is printed\n\neval_SC(Chat_train, cue_obj_train.C, latin, :Word, 5000)\neval_SC(Chat_val, cue_obj_val.C, latin, :Word, 5000)\neval_SC(Shat_train, S_train, latin, :Word, 5000)\neval_SC(Shat_val, S_val, latin, :Word, 5000)\n\n\n\n\n\n","category":"method"},{"location":"man/eval/#JudiLing.eval_SC_loose-Tuple{Any, Any, Any}","page":"Evaluation","title":"JudiLing.eval_SC_loose","text":"eval_SC_loose(SChat, SC, k)\n\nAssess model accuracy on the basis of the correlations (or Euclidean distances or cosine similarities) of row vectors of Chat and C or Shat and S. Ideally the target words have the highest correlations (lowest distance/highest similarity) on the diagonal of the pertinent correlation (distance/similarity) matrices. Count it as correct if one of the top k candidates is correct.\n\nnote: Note\nIf there are homophones/homographs in the dataset, this evaluation method may be misleading: the predicted vector will be equally correlated with the target vector of both words and it is not guaranteed that the target on the diagonal will be among the k neighbours. In particular, eval_SC and eval_SC_loose with k=1 are not guaranteed to give the same result. In such cases, supplying the dataset and target_col is recommended, which enables taking homophones/homographs into account.\n\nObligatory Arguments\n\nSChat::Union{SparseMatrixCSC, Matrix}: the Chat or Shat matrix\nSC::Union{SparseMatrixCSC, Matrix}: the C or S matrix\nk: top k candidates\n\nOptional Arguments\n\ndigits: the specified number of digits after the decimal place (or before if negative)\nmethod::Union{Symbol, String}=:correlation: method for computing similarities, one of {:correlation, :euclidean, :cosine}.\n\neval_SC_loose(Chat, cue_obj.C, k)\neval_SC_loose(Shat, S, k)\n\n\n\n\n\n","category":"method"},
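The homograph caveat above can be made concrete. In this hedged sketch, two rows share a wordform and a gold vector; supplying the dataset and target column lets either row count as correct. The final, batched call only demonstrates the signature documented above; a batch size this small is pointless in practice:

```julia
using JudiLing, DataFrames, Random

Random.seed!(314)
data = DataFrame(Word = ["vis", "vis", "canis", "equus"])  # "vis" is a homograph

S = randn(4, 10)
S[2, :] = S[1, :]               # identical gold vectors for the two "vis" rows
Shat = S .+ 0.1 .* randn(4, 10)

acc_plain = JudiLing.eval_SC(Shat, S)               # row 2 may "lose" to row 1
acc_homog = JudiLing.eval_SC(Shat, S, data, :Word)  # homographs counted as correct
acc_top2  = JudiLing.eval_SC_loose(Shat, S, 2, data, :Word)
acc_batch = JudiLing.eval_SC(Shat, S, data, :Word, 2)  # same, evaluated in chunks of 2
@show acc_plain acc_homog acc_top2 acc_batch
```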
{"location":"man/eval/#JudiLing.eval_SC_loose-NTuple{5, Any}","page":"Evaluation","title":"JudiLing.eval_SC_loose","text":"eval_SC_loose(SChat, SC, k, data, target_col)\n\nAssess model accuracy on the basis of the correlations (or Euclidean distances or cosine similarities) of row vectors of Chat and C or Shat and S. Ideally the target words have the highest correlations (lowest distance/highest similarity) on the diagonal of the pertinent correlation (distance/similarity) matrices. Count it as correct if one of the top k candidates is correct. Supports homophones.\n\nObligatory Arguments\n\nSChat::Union{SparseMatrixCSC, Matrix}: the Chat or Shat matrix\nSC::Union{SparseMatrixCSC, Matrix}: the C or S matrix\nk: top k candidates\ndata: the dataset\ntarget_col: target column name\n\nOptional Arguments\n\ndigits: the specified number of digits after the decimal place (or before if negative)\nmethod::Union{Symbol, String}=:correlation: method for computing similarities, one of {:correlation, :euclidean, :cosine}.\n\neval_SC_loose(Chat, cue_obj.C, k, latin, :Word)\neval_SC_loose(Shat, S, k, latin, :Word)\n\n\n\n\n\n","category":"method"},{"location":"man/eval/#JudiLing.eval_manual-Tuple{Any, Any, Any}","page":"Evaluation","title":"JudiLing.eval_manual","text":"eval_manual(res, data, i2f)\n\nCreate extensive reports for the outputs from build_paths and learn_paths.\n\n\n\n\n\n","category":"method"},{"location":"man/eval/#JudiLing.eval_acc-Tuple{Any, Array}","page":"Evaluation","title":"JudiLing.eval_acc","text":"eval_acc(res, gold_inds::Array)\n\nEvaluate the accuracy of the results from learn_paths or build_paths.\n\nObligatory Arguments\n\nres::Array: the results from learn_paths or build_paths\ngold_inds::Array: the gold paths' indices\n\nOptional Arguments\n\ndigits: the specified number of digits after the decimal place (or before if negative)\nverbose::Bool=false: if true, more information is printed\n\nExamples\n\n# evaluation on training data\nacc_train = JudiLing.eval_acc(\n    res_train,\n    cue_obj_train.gold_ind,\n    verbose=false\n)\n\n# evaluation on validation data\nacc_val = JudiLing.eval_acc(\n    res_val,\n    cue_obj_val.gold_ind,\n    verbose=false\n)\n\n\n\n\n\n","category":"method"},{"location":"man/eval/#JudiLing.eval_acc-Tuple{Any, JudiLing.Cue_Matrix_Struct}","page":"Evaluation","title":"JudiLing.eval_acc","text":"eval_acc(res, cue_obj::Cue_Matrix_Struct)\n\nEvaluate the accuracy of the results from learn_paths or build_paths.\n\nObligatory Arguments\n\nres::Array: the results from learn_paths or build_paths\ncue_obj::Cue_Matrix_Struct: the C matrix object\n\nOptional Arguments\n\ndigits: the specified number of digits after the decimal place (or before if negative)\nverbose::Bool=false: if true, more information is printed\n\nExamples\n\nacc = JudiLing.eval_acc(res, cue_obj)\n\n\n\n\n\n","category":"method"},{"location":"man/eval/#JudiLing.eval_acc_loose-Tuple{Any, Any}","page":"Evaluation","title":"JudiLing.eval_acc_loose","text":"eval_acc_loose(res, gold_inds)\n\nLenient evaluation of the accuracy of the results from learn_paths or build_paths, counting a prediction as correct when the correlation of the predicted and gold standard semantic vectors is among the n top correlations, where n is equal to max_can in the learn_paths or build_paths function.\n\nObligatory Arguments\n\nres::Array: the results from learn_paths or build_paths\ngold_inds::Array: the gold paths' indices\n\nOptional Arguments\n\ndigits: the specified number of digits after the decimal place (or before if negative)\nverbose::Bool=false: if true, more information is printed\n\nExamples\n\n# evaluation on training data\nacc_train_loose = JudiLing.eval_acc_loose(\n    res_train,\n    cue_obj_train.gold_ind,\n    verbose=false\n)\n\n# evaluation on validation data\nacc_val_loose = JudiLing.eval_acc_loose(\n    res_val,\n    cue_obj_val.gold_ind,\n    verbose=false\n)\n\n\n\n\n\n","category":"method"},{"location":"man/eval/#JudiLing.extract_gpi","page":"Evaluation","title":"JudiLing.extract_gpi","text":"extract_gpi(gpi, threshold=0.1, tolerance=(-1000.0))\n\nExtract, using 
gold paths' information, how many n-grams for a gold path are below the threshold but above the tolerance.\n\n\n\n\n\n","category":"function"},{"location":"man/find_path/","page":"Find Paths","title":"Find Paths","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/find_path/#Find-Paths","page":"Find Paths","title":"Find Paths","text":"","category":"section"},{"location":"man/find_path/#Structures","page":"Find Paths","title":"Structures","text":"","category":"section"},{"location":"man/find_path/","page":"Find Paths","title":"Find Paths","text":" Result_Path_Info_Struct\n Gold_Path_Info_Struct\n Threshold_Stat_Struct","category":"page"},{"location":"man/find_path/#JudiLing.Result_Path_Info_Struct","page":"Find Paths","title":"JudiLing.Result_Path_Info_Struct","text":"Store paths' information built by learn_paths or build_paths.\n\n\n\n\n\n","category":"type"},{"location":"man/find_path/#JudiLing.Gold_Path_Info_Struct","page":"Find Paths","title":"JudiLing.Gold_Path_Info_Struct","text":"Store gold paths' information including indices and indices' support and total support. It can be used to evaluate how low the threshold needs to be set in order to find most of the correct paths or, if set very low, all of the correct paths.\n\n\n\n\n\n","category":"type"},{"location":"man/find_path/#JudiLing.Threshold_Stat_Struct","page":"Find Paths","title":"JudiLing.Threshold_Stat_Struct","text":"Store the threshold and tolerance proportions for each timestep.\n\n\n\n\n\n","category":"type"},{"location":"man/find_path/#Build-paths","page":"Find Paths","title":"Build paths","text":"","category":"section"},{"location":"man/find_path/","page":"Find Paths","title":"Find Paths","text":" build_paths\n build_paths(\n    data_val,\n    C_train,\n    S_val,\n    F_train,\n    Chat_val,\n    A,\n    i2f,\n    C_train_ind;\n    rC = nothing,\n    max_t = 15,\n    max_can = 10,\n    n_neighbors = 10,\n    grams = 3,\n    tokenized = false,\n    sep_token = nothing,\n    target_col = :Words,\n    start_end_token = \"#\",\n    if_pca = false,\n    pca_eval_M = nothing,\n    ignore_nan = true,\n    verbose = false,\n )","category":"page"},{"location":"man/find_path/#JudiLing.build_paths","page":"Find Paths","title":"JudiLing.build_paths","text":"The build_paths function constructs paths by only considering those n-grams that are close to the target. It first takes the predicted c-hat vector and finds the closest n neighbors in the C matrix. Then it selects all n-grams of these neighbors, and constructs all valid paths with those n-grams. The path producing the best correlation with the target semantic vector (through synthesis by analysis) is selected.\n\n\n\n\n\n","category":"function"},
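A hedged sketch of the pipeline this function presupposes, using make_cue_matrix, make_S_matrix and make_transform_matrix as elsewhere in this manual. The CSV path is a placeholder, and cue_obj.A is assumed to hold the adjacency matrix built alongside the cue matrix; if you construct the adjacency matrix separately, pass that instead:

```julia
using JudiLing, CSV, DataFrames

latin = DataFrame(CSV.File(joinpath("data", "latin.csv")))  # placeholder path

cue_obj = JudiLing.make_cue_matrix(latin, grams = 3, target_col = :Word)
S = JudiLing.make_S_matrix(latin, ["Lexeme"],
    ["Person", "Number", "Tense", "Voice", "Mood"], ncol = 200)

F = JudiLing.make_transform_matrix(cue_obj.C, S)  # comprehension: C -> S
G = JudiLing.make_transform_matrix(S, cue_obj.C)  # production:    S -> C
Chat = S * G                                      # predicted cue vectors

res = JudiLing.build_paths(
    latin, cue_obj.C, S, F, Chat,
    cue_obj.A,                         # assumed adjacency-matrix field
    cue_obj.i2f, cue_obj.gold_ind,
    max_t = 15, n_neighbors = 10, verbose = false)

acc = JudiLing.eval_acc(res, cue_obj.gold_ind)
```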
{"location":"man/find_path/#JudiLing.build_paths-NTuple{8, Any}","page":"Find Paths","title":"JudiLing.build_paths","text":"build_paths(\n    data_val,\n    C_train,\n    S_val,\n    F_train,\n    Chat_val,\n    A,\n    i2f,\n    C_train_ind;\n    rC = nothing,\n    max_t = 15,\n    max_can = 10,\n    n_neighbors = 10,\n    grams = 3,\n    tokenized = false,\n    sep_token = nothing,\n    target_col = :Words,\n    start_end_token = \"#\",\n    if_pca = false,\n    pca_eval_M = nothing,\n    ignore_nan = true,\n    verbose = false,\n)\n\nThe build_paths function constructs paths by only considering those n-grams that are close to the target. It first takes the predicted c-hat vector and finds the closest n neighbors in the C matrix. Then it selects all n-grams of these neighbors, and constructs all valid paths with those n-grams. The path producing the best correlation with the target semantic vector (through synthesis by analysis) is selected.\n\nObligatory Arguments\n\ndata_val::DataFrame: the validation dataset\nC_train::SparseMatrixCSC: the C matrix for the training dataset\nS_val::Union{SparseMatrixCSC, Matrix}: the S matrix for the validation dataset\nF_train::Union{SparseMatrixCSC, Matrix}: the F matrix for the training dataset\nChat_val::Matrix: the Chat matrix for the validation dataset\nA::SparseMatrixCSC: the adjacency matrix\ni2f::Dict: the dictionary returning features given indices\nC_train_ind::Array: the gold paths' indices for the training dataset\n\nOptional Arguments\n\nrC::Union{Nothing, Matrix}=nothing: the correlation matrix of C and Chat, specify to save computing time\nmax_t::Int64=15: maximum number of timesteps\nmax_can::Int64=10: maximum number of candidates to consider\nn_neighbors::Int64=10: the top n form neighbors to be considered\ngrams::Int64=3: the number n of grams that make up n-grams\ntokenized::Bool=false: if true, the dataset target is tokenized\nsep_token::Union{Nothing, String, Char}=nothing: separator\ntarget_col::Union{String, Symbol}=:Words: the column name for target strings\nif_pca::Bool=false: turn on to enable pca mode\npca_eval_M::Matrix=nothing: pass the original F for pca mode\nverbose::Bool=false: if true, more information will be printed\n\nExamples\n\n# training dataset\nJudiLing.build_paths(\n    latin_train,\n    cue_obj_train.C,\n    S_train,\n    F_train,\n    Chat_train,\n    A,\n    cue_obj_train.i2f,\n    cue_obj_train.gold_ind,\n    max_t=max_t,\n    n_neighbors=10,\n    verbose=false\n    )\n\n# validation dataset\nJudiLing.build_paths(\n    latin_val,\n    cue_obj_train.C,\n    S_val,\n    F_train,\n    Chat_val,\n    A,\n    cue_obj_train.i2f,\n    cue_obj_train.gold_ind,\n    max_t=max_t,\n    n_neighbors=10,\n    verbose=false\n    )\n\n# pca mode\nres_build = JudiLing.build_paths(\n    korean,\n    Array(Cpcat),\n    S,\n    F,\n    ChatPCA,\n    A,\n    cue_obj.i2f,\n    cue_obj.gold_ind,\n    max_t=max_t,\n    if_pca=true,\n    pca_eval_M=Fo,\n    n_neighbors=3,\n    verbose=true\n    )\n\n\n\n\n\n","category":"method"},{"location":"man/find_path/#Learn-paths","page":"Find Paths","title":"Learn paths","text":"","category":"section"},{"location":"man/find_path/","page":"Find Paths","title":"Find Paths","text":" learn_paths\n learn_paths(\n    data::DataFrame,\n    cue_obj::Cue_Matrix_Struct,\n    S_val::Union{SparseMatrixCSC, Matrix},\n    F_train,\n    Chat_val::Union{SparseMatrixCSC, Matrix};\n    Shat_val::Union{Nothing, Matrix} = nothing,\n    check_gold_path::Bool = false,\n    threshold::Float64 = 0.1,\n    is_tolerant::Bool = false,\n    tolerance::Float64 = (-1000.0),\n    max_tolerance::Int = 3,\n    activation::Union{Nothing, Function} = nothing,\n    ignore_nan::Bool = true,\n    verbose::Bool = true)\n learn_paths(\n    data_train::DataFrame,\n    data_val::DataFrame,\n    C_train::Union{Matrix, SparseMatrixCSC},\n    S_val::Union{Matrix, SparseMatrixCSC},\n    F_train,\n    Chat_val::Union{Matrix, SparseMatrixCSC},\n    A::SparseMatrixCSC,\n    i2f::Dict,\n    f2i::Dict;\n    gold_ind::Union{Nothing, Vector} = nothing,\n    Shat_val::Union{Nothing, Matrix} = nothing,\n    check_gold_path::Bool = false,\n    max_t::Int = 15,\n    max_can::Int = 10,\n    threshold::Float64 = 0.1,\n    is_tolerant::Bool = false,\n    tolerance::Float64 = (-1000.0),\n    max_tolerance::Int = 3,\n    grams::Int = 3,\n    tokenized::Bool = false,\n    sep_token::Union{Nothing, String} = nothing,\n    keep_sep::Bool = false,\n    target_col::Union{Symbol, String} = \"Words\",\n    start_end_token::String = \"#\",\n    issparse::Union{Symbol, Bool} = 
:auto,\n sparse_ratio::Float64 = 0.05,\n if_pca::Bool = false,\n pca_eval_M::Union{Nothing, Matrix} = nothing,\n activation::Union{Nothing, Function} = nothing,\n ignore_nan::Bool = true,\n check_threshold_stat::Bool = false,\n verbose::Bool = false\n )\n learn_paths_rpi(\n data_train::DataFrame,\n data_val::DataFrame,\n C_train::Union{Matrix, SparseMatrixCSC},\n S_val::Union{Matrix, SparseMatrixCSC},\n F_train,\n Chat_val::Union{Matrix, SparseMatrixCSC},\n A::SparseMatrixCSC,\n i2f::Dict,\n f2i::Dict;\n gold_ind::Union{Nothing, Vector} = nothing,\n Shat_val::Union{Nothing, Matrix} = nothing,\n check_gold_path::Bool = false,\n max_t::Int = 15,\n max_can::Int = 10,\n threshold::Float64 = 0.1,\n is_tolerant::Bool = false,\n tolerance::Float64 = (-1000.0),\n max_tolerance::Int = 3,\n grams::Int = 3,\n tokenized::Bool = false,\n sep_token::Union{Nothing, String} = nothing,\n keep_sep::Bool = false,\n target_col::Union{Symbol, String} = \"Words\",\n start_end_token::String = \"#\",\n issparse::Union{Symbol, Bool} = :auto,\n sparse_ratio::Float64 = 0.05,\n if_pca::Bool = false,\n pca_eval_M::Union{Nothing, Matrix} = nothing,\n activation::Union{Nothing, Function} = nothing,\n ignore_nan::Bool = true,\n check_threshold_stat::Bool = false,\n verbose::Bool = false\n )","category":"page"},{"location":"man/find_path/#JudiLing.learn_paths","page":"Find Paths","title":"JudiLing.learn_paths","text":"A sequence finding algorithm using discrimination learning to predict, for a given word, which n-grams are best supported for a given position in the sequence of n-grams.\n\n\n\n\n\n","category":"function"},{"location":"man/find_path/#JudiLing.learn_paths-Tuple{DataFrames.DataFrame, JudiLing.Cue_Matrix_Struct, Union{SparseArrays.SparseMatrixCSC, Matrix}, Any, Union{SparseArrays.SparseMatrixCSC, Matrix}}","page":"Find Paths","title":"JudiLing.learn_paths","text":"learn_paths(\n data::DataFrame,\n cue_obj::Cue_Matrix_Struct,\n S_val::Union{SparseMatrixCSC, Matrix},\n F_train,\n Chat_val::Union{SparseMatrixCSC, Matrix};\n Shat_val::Union{Nothing, Matrix} = nothing,\n check_gold_path::Bool = false,\n threshold::Float64 = 0.1,\n is_tolerant::Bool = false,\n tolerance::Float64 = (-1000.0),\n max_tolerance::Int = 3,\n activation::Union{Nothing, Function} = nothing,\n ignore_nan::Bool = true,\n verbose::Bool = true)\n\nA high-level wrapper function for learn_paths with much less control. 
It is aimed at users who are new to JudiLing and the learn_paths function.\n\nObligatory Arguments\n\ndata::DataFrame: the training dataset\ncue_obj::Cue_Matrix_Struct: the C matrix object containing all information with C\nS_val::Union{SparseMatrixCSC, Matrix}: the S matrix for the validation dataset\nF_train::Union{SparseMatrixCSC, Matrix, Chain}: either the F matrix for the training dataset, or a deep learning comprehension model trained on the training set\nChat_val::Union{SparseMatrixCSC, Matrix}: the Chat matrix for the validation dataset\n\nOptional Arguments\n\nShat_val::Union{Nothing, Matrix}=nothing: the Shat matrix for the validation dataset\ncheck_gold_path::Bool=false: if true, return a list of support values for the gold path; this information is returned as second output value\nthreshold::Float64=0.1: the value set for the support such that if the support of an n-gram is higher than this value, the n-gram will be taken into consideration\nis_tolerant::Bool=false: if true, select a specified number (given by max_tolerance) of n-grams whose supports are below threshold but above a second tolerance threshold to be added to the path\ntolerance::Float64=(-1000.0): the value set for the second threshold (in tolerant mode) such that if the support for an n-gram is in between this value and the threshold and the max_tolerance number has not been reached, then allow this n-gram to be added to the path\nmax_tolerance::Int64=3: maximum number of n-grams with support below threshold allowed in a path\nactivation::Union{Nothing, Function}=nothing: the activation function you want to pass\nignore_nan::Bool=true: whether to ignore NaN when comparing correlations, otherwise NaN will be selected as the max correlation value\nverbose::Bool=true: if true, more information is printed\n\nExamples\n\nres = learn_paths(latin, cue_obj, S, F, Chat)\n\n\n\n\n\n","category":"method"},{"location":"man/find_path/#JudiLing.learn_paths-Tuple{DataFrames.DataFrame, DataFrames.DataFrame, Union{SparseArrays.SparseMatrixCSC, Matrix}, Union{SparseArrays.SparseMatrixCSC, Matrix}, Any, Union{SparseArrays.SparseMatrixCSC, Matrix}, SparseArrays.SparseMatrixCSC, Dict, Dict}","page":"Find Paths","title":"JudiLing.learn_paths","text":"learn_paths(\n    data_train::DataFrame,\n    data_val::DataFrame,\n    C_train::Union{Matrix, SparseMatrixCSC},\n    S_val::Union{Matrix, SparseMatrixCSC},\n    F_train,\n    Chat_val::Union{Matrix, SparseMatrixCSC},\n    A::SparseMatrixCSC,\n    i2f::Dict,\n    f2i::Dict;\n    gold_ind::Union{Nothing, Vector} = nothing,\n    Shat_val::Union{Nothing, Matrix} = nothing,\n    check_gold_path::Bool = false,\n    max_t::Int = 15,\n    max_can::Int = 10,\n    threshold::Float64 = 0.1,\n    is_tolerant::Bool = false,\n    tolerance::Float64 = (-1000.0),\n    max_tolerance::Int = 3,\n    grams::Int = 3,\n    tokenized::Bool = false,\n    sep_token::Union{Nothing, String} = nothing,\n    keep_sep::Bool = false,\n    target_col::Union{Symbol, String} = \"Words\",\n    start_end_token::String = \"#\",\n    issparse::Union{Symbol, Bool} = :auto,\n    sparse_ratio::Float64 = 0.05,\n    if_pca::Bool = false,\n    pca_eval_M::Union{Nothing, Matrix} = nothing,\n    activation::Union{Nothing, Function} = nothing,\n    ignore_nan::Bool = true,\n    check_threshold_stat::Bool = false,\n    verbose::Bool = false\n)\n\nA sequence finding algorithm using discrimination learning to predict, for a given word, which n-grams are best supported for a given position in the sequence of n-grams.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\nC_train::Union{SparseMatrixCSC, Matrix}: the C matrix for the 
training dataset\nS_val::Union{SparseMatrixCSC, Matrix}: the S matrix for validation dataset\nF_train::Union{SparseMatrixCSC, Matrix, Chain}: the F matrix for training dataset, or a deep learning comprehension model trained on the training data\nChat_val::Union{SparseMatrixCSC, Matrix}: the Chat matrix for validation dataset\nA::SparseMatrixCSC: the adjacency matrix\ni2f::Dict: the dictionary returning features given indices\nf2i::Dict: the dictionary returning indices given features\n\nOptional Arguments\n\ngold_ind::Union{Nothing, Vector}=nothing: gold paths' indices\nShat_val::Union{Nothing, Matrix}=nothing: the Shat matrix for the validation dataset\ncheck_gold_path::Bool=false: if true, return a list of support values for the gold path; this information is returned as the second output value\nmax_t::Int64=15: maximum timestep\nmax_can::Int64=10: maximum number of candidates to consider\nthreshold::Float64=0.1: the value set for the support such that if the support of an n-gram is higher than this value, the n-gram will be taken into consideration\nis_tolerant::Bool=false: if true, select a specified number (given by max_tolerance) of n-grams whose supports are below threshold but above a second tolerance threshold to be added to the path\ntolerance::Float64=(-1000.0): the value set for the second threshold (in tolerant mode) such that if the support for an n-gram is in between this value and the threshold and the max_tolerance number has not been reached, then allow this n-gram to be added to the path\nmax_tolerance::Int64=3: maximum number of n-grams allowed in a path\ngrams::Int64=3: the number n of grams that make up an n-gram\ntokenized::Bool=false: if true, the dataset target is tokenized\nsep_token::Union{Nothing, String, Char}=nothing: separator token\nkeep_sep::Bool=false: if true, keep separators in cues\ntarget_col::Union{String, Symbol}=:Words: the column name for target strings\nstart_end_token::Union{String, Char}=\"#\": start and end token in boundary cues\nissparse::Union{Symbol, Bool}=:auto: controls whether the output Mt matrix is a dense matrix or a sparse matrix\nsparse_ratio::Float64=0.05: the ratio to decide whether a matrix is sparse\nif_pca::Bool=false: turn on to enable pca mode\npca_eval_M::Matrix=nothing: pass the original F for pca mode\nactivation::Function=nothing: the activation function you want to pass\nignore_nan::Bool=true: whether to ignore NaN when comparing correlations, otherwise NaN will be selected as the max correlation value\ncheck_threshold_stat::Bool=false: if true, return the threshold and tolerance proportions for each timestep\nverbose::Bool=false: if true, more information is printed\n\nExamples\n\n# basic usage without tokenization\nres = JudiLing.learn_paths(\nlatin,\nlatin,\ncue_obj.C,\nS,\nF,\nChat,\nA,\ncue_obj.i2f,\ncue_obj.f2i,\nmax_t=max_t,\nmax_can=10,\ngrams=3,\nthreshold=0.1,\ntokenized=false,\nkeep_sep=false,\ntarget_col=:Word,\nverbose=true)\n\n# basic usage with tokenization\nres = JudiLing.learn_paths(\nfrench,\nfrench,\ncue_obj.C,\nS,\nF,\nChat,\nA,\ncue_obj.i2f,\ncue_obj.f2i,\nmax_t=max_t,\nmax_can=10,\ngrams=3,\nthreshold=0.1,\ntokenized=true,\nsep_token=\"-\",\nkeep_sep=true,\ntarget_col=:Syllables,\nverbose=true)\n\n# basic usage for validation data\nres_val = JudiLing.learn_paths(\nlatin_train,\nlatin_val,\ncue_obj_train.C,\nS_val,\nF_train,\nChat_val,\nA,\ncue_obj_train.i2f,\ncue_obj_train.f2i,\nmax_t=max_t,\nmax_can=10,\ngrams=3,\nthreshold=0.1,\ntokenized=false,\nkeep_sep=false,\ntarget_col=:Word,\nverbose=true)\n\n# turn on tolerance mode\nres_val = 
JudiLing.learn_paths(\n...\nthreshold=0.1,\nis_tolerant=true,\ntolerance=-0.1,\nmax_tolerance=4,\n...)\n\n# turn on check gold paths mode\nres_train, gpi_train = JudiLing.learn_paths(\n...\ngold_ind=cue_obj_train.gold_ind,\nShat_val=Shat_train,\ncheck_gold_path=true,\n...)\n\nres_val, gpi_val = JudiLing.learn_paths(\n...\ngold_ind=cue_obj_val.gold_ind,\nShat_val=Shat_val,\ncheck_gold_path=true,\n...)\n\n# control over sparsity\nres_val = JudiLing.learn_paths(\n...\nissparse=:auto,\nsparse_ratio=0.05,\n...)\n\n# pca mode\nres_learn = JudiLing.learn_paths(\nkorean,\nkorean,\nArray(Cpcat),\nS,\nF,\nChatPCA,\nA,\ncue_obj.i2f,\ncue_obj.f2i,\ncheck_gold_path=false,\ngold_ind=cue_obj.gold_ind,\nShat_val=Shat,\nmax_t=max_t,\nmax_can=10,\ngrams=3,\nthreshold=0.1,\ntokenized=true,\nsep_token=\"_\",\nkeep_sep=true,\ntarget_col=:Verb_syll,\nif_pca=true,\npca_eval_M=Fo,\nverbose=true);\n\n\n\n\n\n\n","category":"method"},{"location":"man/find_path/#JudiLing.learn_paths_rpi-Tuple{DataFrames.DataFrame, DataFrames.DataFrame, Union{SparseArrays.SparseMatrixCSC, Matrix}, Union{SparseArrays.SparseMatrixCSC, Matrix}, Any, Union{SparseArrays.SparseMatrixCSC, Matrix}, SparseArrays.SparseMatrixCSC, Dict, Dict}","page":"Find Paths","title":"JudiLing.learn_paths_rpi","text":"learn_paths_rpi(\n data_train::DataFrame,\n data_val::DataFrame,\n C_train::Union{Matrix, SparseMatrixCSC},\n S_val::Union{Matrix, SparseMatrixCSC},\n F_train,\n Chat_val::Union{Matrix, SparseMatrixCSC},\n A::SparseMatrixCSC,\n i2f::Dict,\n f2i::Dict;\n gold_ind::Union{Nothing, Vector} = nothing,\n Shat_val::Union{Nothing, Matrix} = nothing,\n check_gold_path::Bool = false,\n max_t::Int = 15,\n max_can::Int = 10,\n threshold::Float64 = 0.1,\n is_tolerant::Bool = false,\n tolerance::Float64 = (-1000.0),\n max_tolerance::Int = 3,\n grams::Int = 3,\n tokenized::Bool = false,\n sep_token::Union{Nothing, String} = nothing,\n keep_sep::Bool = false,\n target_col::Union{Symbol, String} = \"Words\",\n start_end_token::String = \"#\",\n issparse::Union{Symbol, Bool} = :auto,\n sparse_ratio::Float64 = 0.05,\n if_pca::Bool = false,\n pca_eval_M::Union{Nothing, Matrix} = nothing,\n activation::Union{Nothing, Function} = nothing,\n ignore_nan::Bool = true,\n check_threshold_stat::Bool = false,\n verbose::Bool = false\n)\n\nCalculate learn_paths, additionally returning the indices and supports of the results.\n\nObligatory Arguments\n\ndata::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\nC_train::Union{SparseMatrixCSC, Matrix}: the C matrix for training dataset\nS_val::Union{SparseMatrixCSC, Matrix}: the S matrix for validation dataset\nF_train::Union{SparseMatrixCSC, Matrix, Chain}: the F matrix for training dataset, or a deep learning comprehension model trained on the training data\nChat_val::Union{SparseMatrixCSC, Matrix}: the Chat matrix for validation dataset\nA::SparseMatrixCSC: the adjacency matrix\ni2f::Dict: the dictionary returning features given indices\nf2i::Dict: the dictionary returning indices given features\n\nOptional Arguments\n\ngold_ind::Union{Nothing, Vector}=nothing: gold paths' indices\nShat_val::Union{Nothing, Matrix}=nothing: the Shat matrix for the validation dataset\ncheck_gold_path::Bool=false: if true, return a list of support values for the gold path; this information is returned as the second output value\nmax_t::Int64=15: maximum timestep\nmax_can::Int64=10: maximum number of candidates to consider\nthreshold::Float64=0.1: the value set for the support such that if the support of an n-gram is higher than this value, the 
n-gram will be taken into consideration\nis_tolerant::Bool=false: if true, select a specified number (given by max_tolerance) of n-grams whose supports are below threshold but above a second tolerance threshold to be added to the path\ntolerance::Float64=(-1000.0): the value set for the second threshold (in tolerant mode) such that if the support for an n-gram is in between this value and the threshold and the max_tolerance number has not been reached, then allow this n-gram to be added to the path\nmax_tolerance::Int64=3: maximum number of n-grams allowed in a path\ngrams::Int64=3: the number n of grams that make up an n-gram\ntokenized::Bool=false: if true, the dataset target is tokenized\nsep_token::Union{Nothing, String, Char}=nothing: separator token\nkeep_sep::Bool=false: if true, keep separators in cues\ntarget_col::Union{String, Symbol}=:Words: the column name for target strings\nstart_end_token::Union{String, Char}=\"#\": start and end token in boundary cues\nissparse::Union{Symbol, Bool}=:auto: controls whether the output Mt matrix is a dense matrix or a sparse matrix\nsparse_ratio::Float64=0.05: the ratio to decide whether a matrix is sparse\nif_pca::Bool=false: turn on to enable pca mode\npca_eval_M::Matrix=nothing: pass the original F for pca mode\nactivation::Function=nothing: the activation function you want to pass\nignore_nan::Bool=true: whether to ignore NaN when comparing correlations, otherwise NaN will be selected as the max correlation value\ncheck_threshold_stat::Bool=false: if true, return the threshold and tolerance proportions for each timestep\nverbose::Bool=false: if true, more information is printed\n\n\n\n\n\n","category":"method"},{"location":"man/find_path/#Utility-functions","page":"Find Paths","title":"Utility functions","text":"","category":"section"},{"location":"man/find_path/","page":"Find Paths","title":"Find Paths","text":" eval_can(candidates, S, F, i2f, max_can, if_pca, pca_eval_M)\n find_top_feature_indices(rC, C_train_ind)\n make_ngrams_ind(res, n)\n predict_shat(F::Union{Matrix, SparseMatrixCSC},\n ci::Vector{Int})","category":"page"},{"location":"man/find_path/#JudiLing.eval_can-NTuple{7, Any}","page":"Find Paths","title":"JudiLing.eval_can","text":"eval_can(candidates, S, F::Union{Matrix,SparseMatrixCSC, Chain}, i2f, max_can, if_pca, pca_eval_M)\n\nCalculate for each candidate path the correlation between predicted semantic vector and the gold standard semantic vector, and select as target for production the path with the highest correlation.\n\n\n\n\n\n","category":"method"},{"location":"man/find_path/#JudiLing.find_top_feature_indices-Tuple{Any, Any}","page":"Find Paths","title":"JudiLing.find_top_feature_indices","text":"find_top_feature_indices(rC, C_train_ind)\n\nFind all indices for the n-grams of the top n closest neighbors of a given target.\n\n\n\n\n\n","category":"method"},{"location":"man/find_path/#JudiLing.make_ngrams_ind-Tuple{Any, Any}","page":"Find Paths","title":"JudiLing.make_ngrams_ind","text":"make_ngrams_ind(res, n)\n\nConstruct ngrams indices.\n\n\n\n\n\n","category":"method"},{"location":"man/find_path/#JudiLing.predict_shat-Tuple{Union{SparseArrays.SparseMatrixCSC, Matrix}, Vector{Int64}}","page":"Find Paths","title":"JudiLing.predict_shat","text":"predict_shat(F::Union{Matrix, SparseMatrixCSC},\n ci::Vector{Int})\n\nPredicts the semantic vector shat given a comprehension matrix F and a list of indices of ngrams ci.\n\nObligatory arguments\n\nF::Union{Matrix, SparseMatrixCSC}: Comprehension matrix F.\nci::Vector{Int}: Vector of 
indices of ngrams in the c vector. Essentially, this vector indicates which ngrams in a c vector are present and which are absent.\n\n\n\n\n\n","category":"method"},{"location":"man/display/","page":"Display","title":"Display","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/display/#Cholesky","page":"Display","title":"Cholesky","text":"","category":"section"},{"location":"man/display/","page":"Display","title":"Display","text":" display_matrix(M, rownames, colnames)\n display_matrix(data, target_col, cue_obj, M, M_type)","category":"page"},{"location":"man/display/#JudiLing.display_matrix-Tuple{Any, Any, Any}","page":"Display","title":"JudiLing.display_matrix","text":"display_matrix(M, rownames, colnames)\n\nDisplay a matrix with rownames and colnames.\n\n\n\n\n\n","category":"method"},{"location":"man/display/#JudiLing.display_matrix-NTuple{5, Any}","page":"Display","title":"JudiLing.display_matrix","text":"display_matrix(data, target_col, cue_pS_obj, M, M_type)\n\nDisplay a matrix with rownames and colnames.\n\nObligatory Arguments\n\ndata::DataFrame: the dataset\ntarget_col::Union{String, Symbol}: the target column name\ncue_pS_obj::Union{Cue_Matrix_Struct,PS_Matrix_Struct}: the cue matrix or pS matrix structure\nM::Union{SparseMatrixCSC, Matrix}: the matrix\nM_type::Union{String, Symbol}: the type of the matrix; currently supported are :C, :S, :F, :G, :Chat, :Shat, :A, :R and :pS\n\nOptional Arguments\n\nnrow::Int64 = 6: the number of rows to display\nncol::Int64 = 6: the number of columns to display\nreturn_matrix::Bool = false: whether the created dataframe should be returned (and not only displayed)\n\nExamples\n\nJudiLing.display_matrix(latin, :Word, cue_obj, cue_obj.C, :C)\nJudiLing.display_matrix(latin, :Word, cue_obj, S, :S)\nJudiLing.display_matrix(latin, :Word, cue_obj, G, :G)\nJudiLing.display_matrix(latin, :Word, cue_obj, Chat, :Chat)\nJudiLing.display_matrix(latin, :Word, cue_obj, F, :F)\nJudiLing.display_matrix(latin, :Word, cue_obj, Shat, :Shat)\nJudiLing.display_matrix(latin, :Word, cue_obj, A, :A)\nJudiLing.display_matrix(latin, :Word, cue_obj, R, :R)\nJudiLing.display_matrix(latin, :Word, pS_obj, pS_obj.pS, :pS)\n\n\n\n\n\n","category":"method"},{"location":"man/input/","page":"Loading data","title":"Loading data","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/input/#Loading-data","page":"Loading data","title":"Loading data","text":"","category":"section"},{"location":"man/input/","page":"Loading data","title":"Loading data","text":"load_dataset(filepath::String;\n delim::String=\",\",\n kargs...)\nloading_data_randomly_split(\n data_path::String,\n output_dir_path::String,\n data_prefix::String;\n val_sample_size::Int = 0,\n val_ratio::Float64 = 0.0,\n random_seed::Int = 314)\nloading_data_careful_split(\n data_path::String,\n data_prefix::String,\n output_dir_path::String,\n n_features_columns::Union{Vector{Symbol},Vector{String}};\n train_sample_size::Int = 0,\n val_sample_size::Int = 0,\n val_ratio::Float64 = 0.0,\n n_grams_target_col::Union{Symbol, String} = :Word,\n n_grams_tokenized::Bool = false,\n n_grams_sep_token::Union{Nothing, String} = nothing,\n grams::Int = 3,\n n_grams_keep_sep::Bool = false,\n start_end_token::String = \"#\",\n random_seed::Int = 314,\n verbose::Bool = false)","category":"page"},{"location":"man/input/#JudiLing.load_dataset-Tuple{String}","page":"Loading data","title":"JudiLing.load_dataset","text":"load_dataset(filepath::String;\n delim::String=\",\",\n kargs...)\n\nLoad a dataset from file, usually 
comma- or tab-separated. Returns a DataFrame.\n\nObligatory arguments\n\nfilepath::String: Path to file to be loaded.\n\nOptional arguments\n\ndelim::String=\",\": Delimiter in the file (usually either \",\" or \"\\t\").\nkargs...: Further keyword arguments are passed to CSV.File().\n\nExample\n\nlatin = JudiLing.load_dataset(\"latin.csv\")\nfirst(latin, 10)\n\n\n\n\n\n","category":"method"},{"location":"man/input/#JudiLing.loading_data_randomly_split-Tuple{String, String, String}","page":"Loading data","title":"JudiLing.loading_data_randomly_split","text":"loading_data_randomly_split(\n data_path::String,\n output_dir_path::String,\n data_prefix::String;\n val_sample_size::Int = 0,\n val_ratio::Float64 = 0.0,\n random_seed::Int = 314)\n\nRead in a dataset and split it into a training and a validation dataset. The two are also written to output_dir_path at the same time.\n\nnote: Note\nThe order of data_prefix and output_dir_path is exactly reversed compared to loading_data_careful_split.\n\nObligatory arguments\n\ndata_path::String: Path to where the dataset is stored.\noutput_dir_path::String: Path to where the new dataframes should be stored.\ndata_prefix::String: Prefix of the two new files, which will be called data_prefix_train.csv and data_prefix_val.csv.\n\nOptional arguments\n\nval_sample_size::Int = 0: Size of the validation dataset (only val_sample_size or val_ratio may be used).\nval_ratio::Float64 = 0.0: Fraction of the data that should be in the validation dataset (only val_sample_size or val_ratio may be used).\nrandom_seed::Int = 314: Random seed for controlling the random split.\n\nExample\n\ndata_train, data_val = JudiLing.loading_data_randomly_split(\n \"latin.csv\",\n \"data\",\n \"latin\",\n val_ratio=0.1,\n random_seed=42\n)\n\n\n\n\n\n","category":"method"},{"location":"man/input/#JudiLing.loading_data_careful_split-Tuple{String, String, String, Union{Vector{String}, Vector{Symbol}}}","page":"Loading data","title":"JudiLing.loading_data_careful_split","text":"loading_data_careful_split(\n data_path::String,\n data_prefix::String,\n output_dir_path::String,\n n_features_columns::Union{Vector{Symbol},Vector{String}};\n train_sample_size::Int = 0,\n val_sample_size::Int = 0,\n val_ratio::Float64 = 0.0,\n n_grams_target_col::Union{Symbol, String} = :Word,\n n_grams_tokenized::Bool = false,\n n_grams_sep_token::Union{Nothing, String} = nothing,\n grams::Int = 3,\n n_grams_keep_sep::Bool = false,\n start_end_token::String = \"#\",\n random_seed::Int = 314,\n verbose::Bool = false)\n\nRead in a dataset and split it into a training and a validation dataset. The split is done such that all features in the columns specified in n_features_columns occur both in the training and validation data. It is also ensured that the unique grams resulting from splitting the strings in column n_grams_target_col into n-grams of size grams occur in both datasets (the sketch below illustrates this guarantee). 
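To see the guarantee in action, one can check after the split that every feature value attested in the validation data also occurs in the training data (a minimal sketch, assuming latin.csv and the argument order of the example further below):

```julia
using JudiLing
using DataFrames

data_train, data_val = JudiLing.loading_data_careful_split(
    "latin.csv", "latin", "careful",
    ["Lexeme","Person","Number","Tense","Voice","Mood"])

# every feature value in the validation data must also occur in the training data
for col in ["Lexeme","Person","Number","Tense","Voice","Mood"]
    @assert issubset(Set(data_val[!, col]), Set(data_train[!, col]))
end
```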
The two are also written to output_dir_path at the same time.\n\nnote: Note\nThe order of data_prefix and output_dir_path is exactly reversed compared to loading_data_randomly_split.\n\nObligatory arguments\n\ndata_path::String: Path to where the dataset is stored.\noutput_dir_path::String: Path to where the new dataframes should be stored.\ndata_prefix::String: Prefix of the two new files, which will be called data_prefix_train.csv and data_prefix_val.csv.\nn_features_columns::Vector{Union{Symbol, String}}: Vector with columns whose features have to occur in both the training and validation data.\n\nOptional arguments\n\nval_sample_size::Int = 0: Size of the validation dataset (only val_sample_size or val_ratio may be used).\nval_ratio::Float64 = 0.0: Fraction of the data that should be in the validation dataset (only val_sample_size or val_ratio may be used).\nn_grams_target_col::Union{Symbol, String} = :Word: Column with target words.\nn_grams_tokenized::Bool = false: Whether the words in n_grams_target_col are already tokenized.\nn_grams_sep_token::Union{Nothing, String} = nothing: String with which tokens in n_grams_target_col are separated (only used if n_grams_tokenized=true).\ngrams::Int = 3: Granularity of the n-grams.\nn_grams_keep_sep::Bool = false: Whether the token separators should be kept in the ngrams (this is useful e.g. when working with syllables).\nstart_end_token::String = \"#\": Token with which the start and end of words should be marked.\nrandom_seed::Int = 314: Random seed for controlling the random split.\n\nExample\n\ndata_train, data_val = JudiLing.loading_data_careful_split(\n \"latin.csv\",\n \"latin\",\n \"careful\",\n [\"Lexeme\",\"Person\",\"Number\",\"Tense\",\"Voice\",\"Mood\"]\n)\n\n\n\n\n\n","category":"method"},{"location":"man/all_manual/","page":"All Manual index","title":"All Manual index","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/all_manual/","page":"All Manual index","title":"All Manual index","text":"","category":"page"},{"location":"man/output/","page":"Output","title":"Output","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/output/#Output","page":"Output","title":"Output","text":"","category":"section"},{"location":"man/output/","page":"Output","title":"Output","text":" write2csv\n write2df\n write_comprehension_eval\n write2csv(res, data, cue_obj_train, cue_obj_val, filename)\n write2csv(gpi::Vector{Gold_Path_Info_Struct}, filename)\n write2csv(ts::Threshold_Stat_Struct, filename)\n write2df(res, data, cue_obj_train, cue_obj_val)\n write2df(gpi::Vector{Gold_Path_Info_Struct})\n write2df(ts::Threshold_Stat_Struct)\n write_comprehension_eval(SChat, SC, data, target_col, filename)\n write_comprehension_eval(SChat, SC, SC_rest, data, data_rest, target_col, filename)\n save_L_matrix(L, filename)\n load_L_matrix(filename)\n save_S_matrix(S, filename, data, target_col)\n load_S_matrix(filename)","category":"page"},{"location":"man/output/#JudiLing.write2csv","page":"Output","title":"JudiLing.write2csv","text":"Write results into a csv file. This function takes as input the results from the learn_paths and build_paths functions, including the information on gold paths that is optionally returned as a second output.\n\n\n\n\n\n","category":"function"},{"location":"man/output/#JudiLing.write2df","page":"Output","title":"JudiLing.write2df","text":"Reformat results into a dataframe. 
This function takes as input the results from the learn_paths and build_paths functions, including the information on gold paths that is optionally returned as a second output.\n\n\n\n\n\n","category":"function"},{"location":"man/output/#JudiLing.write_comprehension_eval","page":"Output","title":"JudiLing.write_comprehension_eval","text":"Write comprehension evaluation into a CSV file, including target and predicted ids and identifiers and their correlations.\n\n\n\n\n\n","category":"function"},{"location":"man/output/#JudiLing.write2csv-NTuple{5, Any}","page":"Output","title":"JudiLing.write2csv","text":"write2csv(res, data, cue_obj_train, cue_obj_val, filename)\n\nWrite results into a csv file for the results from learn_paths and build_paths.\n\nObligatory Arguments\n\nres::Array{Array{Result_Path_Info_Struct,1},1}: the results from learn_paths or build_paths\ndata::DataFrame: the dataset\ncue_obj_train::Cue_Matrix_Struct: the cue object for training dataset\ncue_obj_val::Cue_Matrix_Struct: the cue object for validation dataset\nfilename::String: the filename\n\nOptional Arguments\n\ngrams::Int64=3: the number n in n-gram cues\ntokenized::Bool=false: if true, the dataset target is tokenized\nsep_token::Union{Nothing, String, Char}=nothing: separator\nstart_end_token::Union{String, Char}=\"#\": start and end token in boundary cues\noutput_sep_token::Union{String, Char}=\"\": output separator\npath_sep_token::Union{String, Char}=\":\": path separator\ntarget_col::Union{String, Symbol}=:Words: the column name for target strings\nroot_dir::String=\".\": dir path for project root dir\noutput_dir::String=\".\": output dir inside root dir\n\nExamples\n\n# writing results for training data\nJudiLing.write2csv(\n res_train,\n latin_train,\n cue_obj_train,\n cue_obj_train,\n \"res_latin_train.csv\",\n grams=3,\n tokenized=false,\n sep_token=nothing,\n start_end_token=\"#\",\n output_sep_token=\"\",\n path_sep_token=\":\",\n target_col=:Word,\n root_dir=\".\",\n output_dir=\"test_out\")\n\n# writing results for validation data\nJudiLing.write2csv(\n res_val,\n latin_val,\n cue_obj_train,\n cue_obj_val,\n \"res_latin_val.csv\",\n grams=3,\n tokenized=false,\n sep_token=nothing,\n start_end_token=\"#\",\n output_sep_token=\"\",\n path_sep_token=\":\",\n target_col=:Word,\n root_dir=\".\",\n output_dir=\"test_out\")\n\n\n\n\n\n","category":"method"},{"location":"man/output/#JudiLing.write2csv-Tuple{Vector{JudiLing.Gold_Path_Info_Struct}, Any}","page":"Output","title":"JudiLing.write2csv","text":"write2csv(gpi::Vector{Gold_Path_Info_Struct}, filename)\n\nWrite results into a csv file for the gold paths' information optionally returned by learn_paths and build_paths.\n\nObligatory Arguments\n\ngpi::Vector{Gold_Path_Info_Struct}: the gold paths' information\nfilename::String: the filename\n\nOptional Arguments\n\nroot_dir::String=\".\": dir path for project root dir\noutput_dir::String=\".\": output dir inside root dir\n\nExamples\n\n# write gold standard paths to csv for training data\nJudiLing.write2csv(\n gpi_train,\n \"gpi_latin_train.csv\",\n root_dir=\".\",\n output_dir=\"test_out\"\n )\n\n# write gold standard paths to csv for validation data\nJudiLing.write2csv(\n gpi_val,\n \"gpi_latin_val.csv\",\n root_dir=\".\",\n output_dir=\"test_out\"\n )\n\n\n\n\n\n","category":"method"},{"location":"man/output/#JudiLing.write2csv-Tuple{JudiLing.Threshold_Stat_Struct, Any}","page":"Output","title":"JudiLing.write2csv","text":"write2csv(ts::Threshold_Stat_Struct, filename)\n\nWrite results into a csv file for 
the threshold and tolerance proportions for each timestep.\n\nObligatory Arguments\n\nts::Threshold_Stat_Struct: the threshold and tolerance proportions\nfilename::String: the filename\n\nOptional Arguments\n\nroot_dir::String=\".\": dir path for project root dir\noutput_dir::String=\".\": output dir inside root dir\n\nExamples\n\nJudiLing.write2csv(ts, \"ts.csv\", root_dir = @__DIR__, output_dir=\"out\")\n\n\n\n\n\n","category":"method"},{"location":"man/output/#JudiLing.write2df-NTuple{4, Any}","page":"Output","title":"JudiLing.write2df","text":"write2df(res, data, cue_obj_train, cue_obj_val)\n\nReformat results into a dataframe for the results from the learn_paths and build_paths functions.\n\nObligatory Arguments\n\nres: output of learn_paths or build_paths\ndata::DataFrame: the dataset\ncue_obj_train: cue object of the training data set\ncue_obj_val: cue object of the validation data set\n\nOptional Arguments\n\ngrams::Int64=3: the number n in n-gram cues\ntokenized::Bool=false: if true, the dataset target is tokenized\nsep_token::Union{Nothing, String, Char}=nothing: separator\nstart_end_token::Union{String, Char}=\"#\": start and end token in boundary cues\noutput_sep_token::Union{String, Char}=\"\": output separator\npath_sep_token::Union{String, Char}=\":\": path separator\ntarget_col::Union{String, Symbol}=:Words: the column name for target strings\n\nExamples\n\n# writing results for training data\nJudiLing.write2df(\n res_train,\n latin_train,\n cue_obj_train,\n cue_obj_train,\n grams=3,\n tokenized=false,\n sep_token=nothing,\n start_end_token=\"#\",\n output_sep_token=\"\",\n path_sep_token=\":\",\n target_col=:Word)\n\n# writing results for validation data\nJudiLing.write2df(\n res_val,\n latin_val,\n cue_obj_train,\n cue_obj_val,\n grams=3,\n tokenized=false,\n sep_token=nothing,\n start_end_token=\"#\",\n output_sep_token=\"\",\n path_sep_token=\":\",\n target_col=:Word)\n\n\n\n\n\n","category":"method"},{"location":"man/output/#JudiLing.write2df-Tuple{Vector{JudiLing.Gold_Path_Info_Struct}}","page":"Output","title":"JudiLing.write2df","text":"write2df(gpi::Vector{Gold_Path_Info_Struct})\n\nWrite results into a dataframe for the gold paths' information optionally returned by learn_paths and build_paths.\n\nObligatory Arguments\n\ngpi::Vector{Gold_Path_Info_Struct}: the gold paths' information\n\nExamples\n\n# write gold standard paths to df for training data\nJudiLing.write2df(gpi_train)\n\n# write gold standard paths to df for validation data\nJudiLing.write2df(gpi_val)\n\n\n\n\n\n","category":"method"},{"location":"man/output/#JudiLing.write2df-Tuple{JudiLing.Threshold_Stat_Struct}","page":"Output","title":"JudiLing.write2df","text":"write2df(ts::Threshold_Stat_Struct)\n\nWrite results into a dataframe for the threshold and tolerance proportions for each timestep.\n\nObligatory Arguments\n\nts::Threshold_Stat_Struct: the threshold and tolerance proportions\n\nExamples\n\nJudiLing.write2df(ts)\n\n\n\n\n\n","category":"method"},{"location":"man/output/#JudiLing.write_comprehension_eval-NTuple{5, Any}","page":"Output","title":"JudiLing.write_comprehension_eval","text":"write_comprehension_eval(SChat, SC, data, target_col, filename)\n\nWrite comprehension evaluation into a CSV file, including target and predicted ids and identifiers and their correlations.\n\nObligatory Arguments\n\nSChat::Matrix: the Shat/Chat matrix\nSC::Matrix: the S/C matrix\ndata::DataFrame: the data\ntarget_col::Symbol: the name of target column\nfilename::String: the filename/filepath\n\nOptional Arguments\n\nk: top k 
candidates\nroot_dir::String=\".\": dir path for project root dir\noutput_dir::String=\".\": output dir inside root dir\n\nExamples\n\nJudiLing.write_comprehension_eval(Chat, cue_obj.C, latin, :Word, \"output.csv\",\n k=10, root_dir=@__DIR__, output_dir=\"out\")\n\n\n\n\n\n","category":"method"},{"location":"man/output/#JudiLing.write_comprehension_eval-NTuple{7, Any}","page":"Output","title":"JudiLing.write_comprehension_eval","text":"write_comprehension_eval(SChat, SC, SC_rest, data, data_rest, target_col, filename)\n\nWrite comprehension evaluation into a CSV file for both training and validation datasets, including target and predicted ids and identifiers and their correlations.\n\nObligatory Arguments\n\nSChat::Matrix: the Shat/Chat matrix\nSC::Matrix: the S/C matrix\nSC_rest::Matrix: the rest S/C matrix\ndata::DataFrame: the data\ndata_rest::DataFrame: the rest data\ntarget_col::Symbol: the name of target column\nfilename::String: the filename/filepath\n\nOptional Arguments\n\nk: top k candidates\nroot_dir::String=\".\": dir path for project root dir\noutput_dir::String=\".\": output dir inside root dir\n\nExamples\n\nJudiLing.write_comprehension_eval(Shat_val, S_val, S_train, latin_val, latin_train,\n :Word, \"all_output.csv\", k=10, root_dir=@__DIR__, output_dir=\"out\")\n\n\n\n\n\n","category":"method"},{"location":"man/output/#JudiLing.save_L_matrix-Tuple{Any, Any}","page":"Output","title":"JudiLing.save_L_matrix","text":"save_L_matrix(L, filename)\n\nSave the lexome matrix into a csv file.\n\nObligatory Arguments\n\nL::L_Matrix_Struct: the lexome matrix struct\nfilename::String: the filename/filepath\n\nExamples\n\nJudiLing.save_L_matrix(L, joinpath(@__DIR__, \"L.csv\"))\n\n\n\n\n\n","category":"method"},{"location":"man/output/#JudiLing.load_L_matrix-Tuple{Any}","page":"Output","title":"JudiLing.load_L_matrix","text":"load_L_matrix(filename)\n\nLoad the lexome matrix from a csv file.\n\nObligatory Arguments\n\nfilename::String: the filename/filepath\n\nOptional Arguments\n\nheader::Bool=false: header in csv\n\nExamples\n\nL_load = JudiLing.load_L_matrix(joinpath(@__DIR__, \"L.csv\"))\n\n\n\n\n\n","category":"method"},{"location":"man/output/#JudiLing.save_S_matrix-NTuple{4, Any}","page":"Output","title":"JudiLing.save_S_matrix","text":"save_S_matrix(S, filename, data, target_col)\n\nSave the S matrix into a csv file.\n\nObligatory Arguments\n\nS::Matrix: the S matrix\nfilename::String: the filename/filepath\ndata::DataFrame: the data\ntarget_col::Symbol: the name of target column\n\nOptional Arguments\n\nsep::String=\" \": separator in the CSV file\n\nExamples\n\nJudiLing.save_S_matrix(S, joinpath(@__DIR__, \"S.csv\"), latin, :Word)\n\n\n\n\n\n","category":"method"},{"location":"man/output/#JudiLing.load_S_matrix-Tuple{Any}","page":"Output","title":"JudiLing.load_S_matrix","text":"load_S_matrix(filename)\n\nLoad the S matrix from a csv file.\n\nObligatory Arguments\n\nfilename::String: the filename/filepath\n\nOptional Arguments\n\nheader::Bool=false: header in csv\nsep::String=\" \": separator in the CSV file\n\nExamples\n\nJudiLing.load_S_matrix(joinpath(@__DIR__, \"S.csv\"))\n\n\n\n\n\n","category":"method"},{"location":"man/make_yt_matrix/","page":"Make Yt Matrix","title":"Make Yt Matrix","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/make_yt_matrix/#Make-Yt-Matrix","page":"Make Yt Matrix","title":"Make Yt Matrix","text":"","category":"section"},{"location":"man/make_yt_matrix/","page":"Make Yt Matrix","title":"Make Yt Matrix","text":" make_Yt_matrix\n make_Yt_matrix(t, data, 
f2i)","category":"page"},{"location":"man/make_yt_matrix/#JudiLing.make_Yt_matrix","page":"Make Yt Matrix","title":"JudiLing.make_Yt_matrix","text":"Make Yt matrix for timestep t.\n\n\n\n\n\n","category":"function"},{"location":"man/make_yt_matrix/#JudiLing.make_Yt_matrix-Tuple{Any, Any, Any}","page":"Make Yt Matrix","title":"JudiLing.make_Yt_matrix","text":"make_Yt_matrix(t, data, f2i)\n\nMake Yt matrix for timestep t. A given column of the Yt matrix specifies the support for the corresponding n-gram predicted for timestep t for each of the observations (rows of Yt).\n\nObligatory Arguments\n\nt::Int64: the timestep t\ndata::DataFrame: the dataset\nf2i::Dict: the dictionary returning indices given features\n\nOptional Arguments\n\ntokenized::Bool=false: if true, the dataset target is assumed to be tokenized\nsep_token::Union{Nothing, String, Char}=nothing: separator token\nverbose::Bool=false: if verbose, more information will be printed\n\nExamples\n\nlatin = DataFrame(CSV.File(joinpath(\"data\", \"latin_mini.csv\")))\nJudiLing.make_Yt_matrix(2, latin)\n\n\n\n\n\n","category":"method"},{"location":"man/preprocess/","page":"Preprocess","title":"Preprocess","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/preprocess/#Preprocess","page":"Preprocess","title":"Preprocess","text":"","category":"section"},{"location":"man/preprocess/","page":"Preprocess","title":"Preprocess","text":" SplitDataException\n lpo_cv_split(p, data_path)\n loo_cv_split(data_path)\n train_val_random_split(data_path, output_dir_path, data_prefix)\n train_val_careful_split(data_path, output_dir_path, data_prefix, n_features_columns)","category":"page"},{"location":"man/preprocess/#JudiLing.SplitDataException","page":"Preprocess","title":"JudiLing.SplitDataException","text":"Split Data Exception\n\n\n\n\n\n","category":"type"},{"location":"man/preprocess/#JudiLing.lpo_cv_split-Tuple{Any, Any}","page":"Preprocess","title":"JudiLing.lpo_cv_split","text":"lpo_cv_split(p, data_path)\n\nLeave p out cross-validation.\n\n\n\n\n\n","category":"method"},{"location":"man/preprocess/#JudiLing.loo_cv_split-Tuple{Any}","page":"Preprocess","title":"JudiLing.loo_cv_split","text":"loo_cv_split(data_path)\n\nLeave one out cross-validation.\n\n\n\n\n\n","category":"method"},{"location":"man/preprocess/#JudiLing.train_val_random_split-Tuple{Any, Any, Any}","page":"Preprocess","title":"JudiLing.train_val_random_split","text":"train_val_random_split(data_path, output_dir_path, data_prefix)\n\nRandomly split dataset.\n\n\n\n\n\n","category":"method"},{"location":"man/preprocess/#JudiLing.train_val_careful_split-NTuple{4, Any}","page":"Preprocess","title":"JudiLing.train_val_careful_split","text":"train_val_careful_split(data_path, output_dir_path, data_prefix, n_features_columns)\n\nCarefully split dataset.\n\n\n\n\n\n","category":"method"},{"location":"man/test_combo/","page":"Test Combo","title":"Test Combo","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/test_combo/#Test-Combo","page":"Test Combo","title":"Test Combo","text":"","category":"section"},{"location":"man/test_combo/","page":"Test Combo","title":"Test Combo","text":" test_combo(test_mode;kwargs...)","category":"page"},{"location":"man/test_combo/#JudiLing.test_combo-Tuple{Any}","page":"Test Combo","title":"JudiLing.test_combo","text":"test_combo(test_mode;kwargs...)\n\nA wrapper function for a full model for a specific combination of parameters. 
A detailed introduction can be found in the Test Combo Introduction.\n\nnote: Note\ntest_combo is deprecated. While it will remain in the package, it is no longer actively maintained.\n\nObligatory Arguments\n\ntest_mode::Symbol: which test mode, currently supports :train_only, :pre_split, :careful_split and :random_split.\n\nOptional Arguments\n\ntrain_sample_size::Int64=0: the desired number of training data\nval_sample_size::Int64=0: the desired number of validation data\nval_ratio::Float64=0.0: the desired proportion of validation data; this only takes effect if val_sample_size is 0\nextension::String=\".csv\": the extension for data files\nn_grams_target_col::Union{String, Symbol}=:Word: the column name for target strings\nn_grams_tokenized::Bool=false: if true, the dataset target is assumed to be tokenized\nn_grams_sep_token::String=nothing: separator\ngrams::Int64=3: the number of grams for cues\nn_grams_keep_sep::Bool=false: if true, keep separators in cues\nstart_end_token::String=\":\": start and end token in boundary cues\npath_sep_token::String=\":\": path separator in the assembled path\nrandom_seed::Int64=314: the random seed\nsd_base_mean::Int64=1: the sd mean of base features\nsd_inflection_mean::Int64=1: the sd mean of inflectional features\nsd_base::Int64=4: the sd of base features\nsd_inflection::Int64=4: the sd of inflectional features\nisdeep::Bool=true: if true, the mean of each feature is also randomized\nadd_noise::Bool=true: if true, add additional Gaussian noise\nsd_noise::Int64=1: the sd of the Gaussian noise\nnormalized::Bool=false: if true, most of the values range between 1 and -1; they may slightly exceed 1 or -1 depending on the sd\nif_combined::Bool=false: if true, then features are combined with both training and validation data\nlearn_mode::Symbol=:cholesky: which learning mode, currently supports :cholesky and :wh\nmethod::Symbol=:additive: whether :additive or :multiplicative decomposition is required\nshift::Float64=0.02: shift value for :additive decomposition\nmultiplier::Float64=1.01: multiplier value for :multiplicative decomposition\noutput_format::Symbol=:auto: force the output format to dense (:dense) or sparse (:sparse), or leave it as :auto to let the program decide\nsparse_ratio::Float64=0.05: the ratio to decide whether a matrix is sparse\nwh_freq::Vector=nothing: the learning sequence\ninit_weights::Matrix=nothing: the initial weights\neta::Float64=0.1: the learning rate\nn_epochs::Int64=1: the number of epochs to be trained\nmax_t::Int64=0: the maximum timestep\nA::Matrix=nothing: the adjacency matrix\nA_mode::Symbol=:combined: the adjacency matrix mode, currently supports :combined or :train_only\nmax_can::Int64=10: the max number of candidate paths to keep in the output\nthreshold_train::Float64=0.1: the value set for the support such that if the support of an n-gram is higher than this value, the n-gram will be taken into consideration for training data\nis_tolerant_train::Bool=false: if true, select a specified number (given by max_tolerance) of n-grams whose supports are below threshold but above a second tolerance threshold to be added to the path for training data\ntolerance_train::Float64=-0.1: the value set for the second threshold (in tolerant mode) such that if the support for an n-gram is in between this value and the threshold and the max_tolerance number has not been reached, then allow this n-gram to be added to the path for training data\nmax_tolerance_train::Int64=2: maximum number of 
n-grams allowed in a path for training data\nthreshold_val::Float64=0.1: the value set for the support such that if the support of an n-gram is higher than this value, the n-gram will be taken into consideration for validation data\nis_tolerant_val::Bool=false: if true, select a specified number (given by max_tolerance) of n-grams whose supports are below threshold but above a second tolerance threshold to be added to the path for validation data\ntolerance_val::Float64=-0.1: the value set for the second threshold (in tolerant mode) such that if the support for an n-gram is in between this value and the threshold and the max_tolerance number has not been reached, then allow this n-gram to be added to the path for validation data\nmax_tolerance_val::Int64=2: maximum number of n-grams allowed in a path for validation data\nn_neighbors_train::Int64=10: the top n form neighbors to be considered for training data\nn_neighbors_val::Int64=20: the top n form neighbors to be considered for validation data\nissparse::Bool=false: if true, keep sparse matrix format when learning paths\noutput_dir::String=\"out\": the output directory\nverbose::Bool=false: if true, more information will be printed\n\n\n\n\n\n","category":"method"},{"location":"#JudiLing","page":"Home","title":"JudiLing","text":"","category":"section"},{"location":"","page":"Home","title":"Home","text":"JudiLing: An implementation for Linear Discriminative Learning in Julia","category":"page"},{"location":"","page":"Home","title":"Home","text":"Maintainer: Maria Heitmeier @MariaHei\nOriginal codebase: Xuefeng Luo @MegamindHenry","category":"page"},{"location":"#Installation","page":"Home","title":"Installation","text":"","category":"section"},{"location":"","page":"Home","title":"Home","text":"You can install JudiLing by the following commands:","category":"page"},{"location":"","page":"Home","title":"Home","text":"using Pkg\nPkg.add(\"JudiLing\")","category":"page"},{"location":"","page":"Home","title":"Home","text":"For brave adventurers, install the test version of JudiLing by:","category":"page"},{"location":"","page":"Home","title":"Home","text":"julia> Pkg.add(url=\"https://github.com/quantling/JudiLing.jl.git\")","category":"page"},{"location":"","page":"Home","title":"Home","text":"Or from the Julia REPL, type ] to enter the Pkg REPL mode and run","category":"page"},{"location":"","page":"Home","title":"Home","text":"pkg> add https://github.com/quantling/JudiLing.jl.git","category":"page"},{"location":"#Running-Julia-with-multiple-threads","page":"Home","title":"Running Julia with multiple threads","text":"","category":"section"},{"location":"","page":"Home","title":"Home","text":"JudiLing supports the use of multiple threads. Simply start up Julia in your terminal as follows:","category":"page"},{"location":"","page":"Home","title":"Home","text":"$ julia -t your_num_of_threads","category":"page"},{"location":"","page":"Home","title":"Home","text":"For detailed information on using Julia with threads, see this link.","category":"page"},{"location":"#Include-packages","page":"Home","title":"Include packages","text":"","category":"section"},{"location":"","page":"Home","title":"Home","text":"Before we start, we first need to load the JudiLing package:","category":"page"},{"location":"","page":"Home","title":"Home","text":"using JudiLing","category":"page"},{"location":"","page":"Home","title":"Home","text":"Note: As of JudiLing 0.8.0, PyCall and Flux have become optional dependencies. 
This means that all code in JudiLing which requires calls to python is only available if PyCall is loaded first, like this:","category":"page"},{"location":"","page":"Home","title":"Home","text":"using PyCall\nusing JudiLing","category":"page"},{"location":"","page":"Home","title":"Home","text":"Likewise, the code involving deep learning is only available if Julia's deep learning library Flux is loaded first, like this:","category":"page"},{"location":"","page":"Home","title":"Home","text":"using Flux\nusing JudiLing","category":"page"},{"location":"","page":"Home","title":"Home","text":"Note that Flux and PyCall have to be installed separately, and the newest version of Flux requires at least Julia 1.9. If you want to run deep learning on a GPU, make sure to also install and import CUDA.","category":"page"},{"location":"#Quick-start-example","page":"Home","title":"Quick start example","text":"","category":"section"},{"location":"","page":"Home","title":"Home","text":"The Latin dataset latin.csv contains lexemes and inflectional features for 672 inflected Latin verb forms for 8 lexemes from 4 conjugation classes. Word forms are inflected for person, number, tense, voice and mood.","category":"page"},{"location":"","page":"Home","title":"Home","text":"\"\",\"Word\",\"Lexeme\",\"Person\",\"Number\",\"Tense\",\"Voice\",\"Mood\"\n\"1\",\"vocoo\",\"vocare\",\"p1\",\"sg\",\"present\",\"active\",\"ind\"\n\"2\",\"vocaas\",\"vocare\",\"p2\",\"sg\",\"present\",\"active\",\"ind\"\n\"3\",\"vocat\",\"vocare\",\"p3\",\"sg\",\"present\",\"active\",\"ind\"\n\"4\",\"vocaamus\",\"vocare\",\"p1\",\"pl\",\"present\",\"active\",\"ind\"\n\"5\",\"vocaatis\",\"vocare\",\"p2\",\"pl\",\"present\",\"active\",\"ind\"\n\"6\",\"vocant\",\"vocare\",\"p3\",\"pl\",\"present\",\"active\",\"ind\"","category":"page"},{"location":"","page":"Home","title":"Home","text":"We first download and read the csv file into Julia:","category":"page"},{"location":"","page":"Home","title":"Home","text":"download(\"https://osf.io/2ejfu/download\", \"latin.csv\")\n\nlatin = JudiLing.load_dataset(\"latin.csv\");","category":"page"},{"location":"","page":"Home","title":"Home","text":"and we can inspect the latin dataframe:","category":"page"},{"location":"","page":"Home","title":"Home","text":"display(latin)","category":"page"},{"location":"","page":"Home","title":"Home","text":"672×8 DataFrame. 
Omitted printing of 2 columns\n│ Row │ Column1 │ Word │ Lexeme │ Person │ Number │ Tense │\n│ │ Int64 │ String │ String │ String │ String │ String │\n├─────┼─────────┼────────────────┼─────────┼────────┼────────┼────────────┤\n│ 1 │ 1 │ vocoo │ vocare │ p1 │ sg │ present │\n│ 2 │ 2 │ vocaas │ vocare │ p2 │ sg │ present │\n│ 3 │ 3 │ vocat │ vocare │ p3 │ sg │ present │\n│ 4 │ 4 │ vocaamus │ vocare │ p1 │ pl │ present │\n│ 5 │ 5 │ vocaatis │ vocare │ p2 │ pl │ present │\n│ 6 │ 6 │ vocant │ vocare │ p3 │ pl │ present │\n│ 7 │ 7 │ clamoo │ clamare │ p1 │ sg │ present │\n│ 8 │ 8 │ clamaas │ clamare │ p2 │ sg │ present │\n⋮\n│ 664 │ 664 │ carpsisseemus │ carpere │ p1 │ pl │ pluperfect │\n│ 665 │ 665 │ carpsisseetis │ carpere │ p2 │ pl │ pluperfect │\n│ 666 │ 666 │ carpsissent │ carpere │ p3 │ pl │ pluperfect │\n│ 667 │ 667 │ cuccurissem │ currere │ p1 │ sg │ pluperfect │\n│ 668 │ 668 │ cuccurissees │ currere │ p2 │ sg │ pluperfect │\n│ 669 │ 669 │ cuccurisset │ currere │ p3 │ sg │ pluperfect │\n│ 670 │ 670 │ cuccurisseemus │ currere │ p1 │ pl │ pluperfect │\n│ 671 │ 671 │ cuccurisseetis │ currere │ p2 │ pl │ pluperfect │\n│ 672 │ 672 │ cuccurissent │ currere │ p3 │ pl │ pluperfect │","category":"page"},{"location":"","page":"Home","title":"Home","text":"For the production model, we want to predict correct forms given their lexemes and inflectional features. For example, given the lexeme vocare and its inflectional features p1, sg, present, active and ind, the model should produce the form vocoo. On the other hand, the comprehension model takes forms as input and tries to predict their lexemes and inflectional features.","category":"page"},{"location":"","page":"Home","title":"Home","text":"We use letter trigrams to encode our forms. For the word vocoo, for example, we use the trigrams #vo, voc, oco, coo and oo#. Here, # is used as start/end token to encode the initial and final trigrams of a word. The row vectors of the C matrix specify for each word which of the trigrams are realized in that word.","category":"page"},{"location":"","page":"Home","title":"Home","text":"To make the C matrix, we use the make_cue_matrix function:","category":"page"},{"location":"","page":"Home","title":"Home","text":"cue_obj = JudiLing.make_cue_matrix(\n latin,\n grams=3,\n target_col=:Word,\n tokenized=false,\n keep_sep=false\n )","category":"page"},{"location":"","page":"Home","title":"Home","text":"Next, we simulate the semantic matrix S using the make_S_matrix function:","category":"page"},{"location":"","page":"Home","title":"Home","text":"n_features = size(cue_obj.C, 2)\nS = JudiLing.make_S_matrix(\n latin,\n [\"Lexeme\"],\n [\"Person\",\"Number\",\"Tense\",\"Voice\",\"Mood\"],\n ncol=n_features)","category":"page"},{"location":"","page":"Home","title":"Home","text":"For this simulation, first random vectors are assigned to every lexeme and inflectional feature, and next the vectors of those features are summed up to obtain the semantic vector of the inflected form. Similar dimensions for C and S work best. Therefore, we retrieve the number of columns from the C matrix and pass it to make_S_matrix when constructing S.","category":"page"},{"location":"","page":"Home","title":"Home","text":"Then, the next step is to calculate a mapping from S to C by solving the equation C = SG. 
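Written out, the production mapping G is the familiar least-squares solution of C = SG (a standard identity, stated here for orientation; the Cholesky-based solver below computes an equivalent solution via the normal equations):

```math
G = (S^\top S)^{-1} S^\top C, \qquad \hat{C} = S G
```

Production accuracy then amounts to comparing the rows of the predicted matrix Chat with those of C, which is what eval_SC reports further below.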
We use Cholesky decomposition to solve this equation:","category":"page"},{"location":"","page":"Home","title":"Home","text":"G = JudiLing.make_transform_matrix(S, cue_obj.C)","category":"page"},{"location":"","page":"Home","title":"Home","text":"Then, we can make our predicted C matrix Chat:","category":"page"},{"location":"","page":"Home","title":"Home","text":"Chat = S * G","category":"page"},{"location":"","page":"Home","title":"Home","text":"and evaluate the model's prediction accuracy:","category":"page"},{"location":"","page":"Home","title":"Home","text":"@show JudiLing.eval_SC(Chat, cue_obj.C)","category":"page"},{"location":"","page":"Home","title":"Home","text":"Output:","category":"page"},{"location":"","page":"Home","title":"Home","text":"JudiLing.eval_SC(Chat, cue_obj.C) = 0.9926","category":"page"},{"location":"","page":"Home","title":"Home","text":"NOTE: Accuracy may be different depending on the simulated semantic matrix.","category":"page"},{"location":"","page":"Home","title":"Home","text":"Similar to G and Chat, we can solve S = CF:","category":"page"},{"location":"","page":"Home","title":"Home","text":"F = JudiLing.make_transform_matrix(cue_obj.C, S)","category":"page"},{"location":"","page":"Home","title":"Home","text":"and we then calculate the Shat matrix and evaluate comprehension accuracy:","category":"page"},{"location":"","page":"Home","title":"Home","text":"Shat = cue_obj.C * F\n@show JudiLing.eval_SC(Shat, S)","category":"page"},{"location":"","page":"Home","title":"Home","text":"Output:","category":"page"},{"location":"","page":"Home","title":"Home","text":"JudiLing.eval_SC(Shat, S) = 0.9911","category":"page"},{"location":"","page":"Home","title":"Home","text":"NOTE: Accuracy may be different depending on the simulated semantic matrix.","category":"page"},{"location":"","page":"Home","title":"Home","text":"To model speech production, the proper triphones have to be selected and put into the right order. We have two algorithms that accomplish this. Both algorithms construct paths in a triphone space that start with word-initial triphones and end with word-final triphones.","category":"page"},{"location":"","page":"Home","title":"Home","text":"The first step is to construct an adjacency matrix that specifies which triphones can follow each other. In this example, we use the adjacency matrix constructed by make_cue_matrix, but we can also make use of an independently constructed adjacency matrix if required.","category":"page"},{"location":"","page":"Home","title":"Home","text":"A = cue_obj.A","category":"page"},{"location":"","page":"Home","title":"Home","text":"For our sequencing algorithms, we calculate the number of timesteps needed. For the Latin dataset, the max timestep is equal to the length of the longest word. The argument :Word specifies the column in the Latin dataset that lists the words' forms.","category":"page"},{"location":"","page":"Home","title":"Home","text":"max_t = JudiLing.cal_max_timestep(latin, :Word)","category":"page"},{"location":"","page":"Home","title":"Home","text":"One sequence finding algorithm uses discrimination learning for the position of triphones. 
This function returns two lists, one with candidate triphone paths and their positional learning support (res) and one with the semantic supports for the gold paths (gpi).","category":"page"},{"location":"","page":"Home","title":"Home","text":"res_learn, gpi_learn = JudiLing.learn_paths(\n latin,\n latin,\n cue_obj.C,\n S,\n F,\n Chat,\n A,\n cue_obj.i2f,\n cue_obj.f2i, # api changed in 0.3.1\n check_gold_path = true,\n gold_ind = cue_obj.gold_ind,\n Shat_val = Shat,\n max_t = max_t,\n max_can = 10,\n grams = 3,\n threshold = 0.05,\n tokenized = false,\n keep_sep = false,\n target_col = :Word,\n verbose = true\n)","category":"page"},{"location":"","page":"Home","title":"Home","text":"We evaluate the accuracy on the training data as follows:","category":"page"},{"location":"","page":"Home","title":"Home","text":"acc_learn = JudiLing.eval_acc(res_learn, cue_obj.gold_ind, verbose = false)\n\nprintln(\"Acc for learn: $acc_learn\")","category":"page"},{"location":"","page":"Home","title":"Home","text":"Acc for learn: 0.9985","category":"page"},{"location":"","page":"Home","title":"Home","text":"The second sequence finding algorithm is usually faster than the first, but does not provide positional learnability estimates.","category":"page"},{"location":"","page":"Home","title":"Home","text":"res_build = JudiLing.build_paths(\n latin,\n cue_obj.C,\n S,\n F,\n Chat,\n A,\n cue_obj.i2f,\n cue_obj.gold_ind,\n max_t=max_t,\n n_neighbors=3,\n verbose=true\n )\n\nacc_build = JudiLing.eval_acc(\n res_build,\n cue_obj.gold_ind,\n verbose=false\n)","category":"page"},{"location":"","page":"Home","title":"Home","text":"Acc for build: 0.9955","category":"page"},{"location":"","page":"Home","title":"Home","text":"After having obtained the results from the sequence functions learn_paths or build_paths, we can save the results either into a csv file or into a dataframe; the dataframe can be loaded into R with the rput command of the RCall package.","category":"page"},{"location":"","page":"Home","title":"Home","text":"JudiLing.write2csv(\n res_learn,\n latin,\n cue_obj,\n cue_obj,\n \"latin_learn_res.csv\",\n grams = 3,\n tokenized = false,\n sep_token = nothing,\n start_end_token = \"#\",\n output_sep_token = \"\",\n path_sep_token = \":\",\n target_col = :Word,\n root_dir = @__DIR__,\n output_dir = \"latin_out\"\n)\n\ndf_learn = JudiLing.write2df(\n res_learn,\n latin,\n cue_obj,\n cue_obj,\n grams = 3,\n tokenized = false,\n sep_token = nothing,\n start_end_token = \"#\",\n output_sep_token = \"\",\n path_sep_token = \":\",\n target_col = :Word\n)\n\nJudiLing.write2csv(\n res_build,\n latin,\n cue_obj,\n cue_obj,\n \"latin_build_res.csv\",\n grams = 3,\n tokenized = false,\n sep_token = nothing,\n start_end_token = \"#\",\n output_sep_token = \"\",\n path_sep_token = \":\",\n target_col = :Word,\n root_dir = @__DIR__,\n output_dir = \"latin_out\"\n)\n\ndf_build = JudiLing.write2df(\n res_build,\n latin,\n cue_obj,\n cue_obj,\n grams = 3,\n tokenized = false,\n sep_token = nothing,\n start_end_token = \"#\",\n output_sep_token = \"\",\n path_sep_token = \":\",\n target_col = :Word\n)\n\ndisplay(df_learn)\ndisplay(df_build)","category":"page"},{"location":"","page":"Home","title":"Home","text":"3805×9 DataFrame. Omitted printing of 5 columns\n│ Row │ utterance │ identifier │ path │ pred │\n│ │ Int64? │ String? │ Union{Missing, String} │ String? 
│\n├──────┼───────────┼────────────────┼─────────────────────────────────────────────────────────┼────────────────┤\n│ 1 │ 1 │ vocoo │ #vo:voc:oco:coo:oo# │ vocoo │\n│ 2 │ 2 │ vocaas │ #vo:voc:oca:caa:aas:as# │ vocaas │\n│ 3 │ 2 │ vocaas │ #vo:voc:oca:caa:aab:aba:baa:aas:as# │ vocaabaas │\n│ 4 │ 2 │ vocaas │ #vo:voc:oca:caa:aat:ati:tis:is# │ vocaatis │\n│ 5 │ 2 │ vocaas │ #vo:voc:oca:caa:aav:avi:vis:ist:sti:tis:is# │ vocaavistis │\n│ 6 │ 2 │ vocaas │ #vo:voc:oca:caa:aam:amu:mus:us# │ vocaamus │\n│ 7 │ 2 │ vocaas │ #vo:voc:oca:caa:aab:abi:bit:it# │ vocaabit │\n│ 8 │ 2 │ vocaas │ #vo:voc:oca:caa:aam:amu:mur:ur# │ vocaamur │\n│ 9 │ 2 │ vocaas │ #vo:voc:oca:caa:aar:are:ret:et# │ vocaaret │\n⋮\n│ 3796 │ 671 │ cuccurisseetis │ #cu:cuc:ucc:ccu:cur:ure:ree:eet:eti:tis:is# │ cuccureetis │\n│ 3797 │ 671 │ cuccurisseetis │ #cu:cuc:ucc:ccu:cur:uri:ris:ist:sti:tis:is# │ cuccuristis │\n│ 3798 │ 671 │ cuccurisseetis │ #cu:cuc:ucc:ccu:cur:uri:ris:iss:sse:set:et# │ cuccurisset │\n│ 3799 │ 671 │ cuccurisseetis │ #cu:cur:urr:rri:rim:imi:min:ini:nii:ii# │ curriminii │\n│ 3800 │ 672 │ cuccurissent │ #cu:cuc:ucc:ccu:cur:uri:ris:iss:sse:sen:ent:nt# │ cuccurissent │\n│ 3801 │ 672 │ cuccurissent │ #cu:cur:urr:rre:rer:ere:ren:ent:nt# │ currerent │\n│ 3802 │ 672 │ cuccurissent │ #cu:cuc:ucc:ccu:cur:uri:ris:iss:sse:see:eem:emu:mus:us# │ cuccurisseemus │\n│ 3803 │ 672 │ cuccurissent │ #cu:cuc:ucc:ccu:cur:uri:ris:iss:sse:see:eet:eti:tis:is# │ cuccurisseetis │\n│ 3804 │ 672 │ cuccurissent │ #cu:cur:urr:rre:rer:ere:ren:ent:ntu:tur:ur# │ currerentur │\n│ 3805 │ 672 │ cuccurissent │ #cu:cuc:ucc:ccu:cur:uri:ris:iss:sse:see:ees:es# │ cuccurissees │\n2519×9 DataFrame. Omitted printing of 4 columns\n│ Row │ utterance │ identifier │ path │ pred │ num_tolerance │\n│ │ Int64? │ String? │ Union{Missing, String} │ String? │ Int64? 
│\n├──────┼───────────┼────────────────┼─────────────────────────────────────────────────┼──────────────┼───────────────┤\n│ 1 │ 1 │ vocoo │ #vo:voc:oco:coo:oo# │ vocoo │ 0 │\n│ 2 │ 1 │ vocoo │ #vo:voc:oca:caa:aab:abo:boo:oo# │ vocaaboo │ 0 │\n│ 3 │ 1 │ vocoo │ #vo:voc:oca:caa:aab:aba:bam:am# │ vocaabam │ 0 │\n│ 4 │ 2 │ vocaas │ #vo:voc:oca:caa:aas:as# │ vocaas │ 0 │\n│ 5 │ 2 │ vocaas │ #vo:voc:oca:caa:aab:abi:bis:is# │ vocaabis │ 0 │\n│ 6 │ 2 │ vocaas │ #vo:voc:oca:caa:aat:ati:tis:is# │ vocaatis │ 0 │\n│ 7 │ 3 │ vocat │ #vo:voc:oca:cat:at# │ vocat │ 0 │\n│ 8 │ 3 │ vocat │ #vo:voc:oca:caa:aab:aba:bat:at# │ vocaabat │ 0 │\n│ 9 │ 3 │ vocat │ #vo:voc:oca:caa:aas:as# │ vocaas │ 0 │\n⋮\n│ 2510 │ 671 │ cuccurisseetis │ #cu:cur:uri:ris:iss:sse:see:ees:es# │ curissees │ 0 │\n│ 2511 │ 671 │ cuccurisseetis │ #cu:cur:uri:ris:iss:sse:see:eem:emu:mus:us# │ curisseemus │ 0 │\n│ 2512 │ 671 │ cuccurisseetis │ #cu:cur:uri:ris:is# │ curis │ 0 │\n│ 2513 │ 671 │ cuccurisseetis │ #cu:cuc:ucc:ccu:cur:uri:ris:is# │ cuccuris │ 0 │\n│ 2514 │ 672 │ cuccurissent │ #cu:cuc:ucc:ccu:cur:uri:ris:iss:sse:sen:ent:nt# │ cuccurissent │ 0 │\n│ 2515 │ 672 │ cuccurissent │ #cu:cur:uri:ris:iss:sse:sen:ent:nt# │ curissent │ 0 │\n│ 2516 │ 672 │ cuccurissent │ #cu:cuc:ucc:ccu:cur:uri:ris:iss:sse:set:et# │ cuccurisset │ 0 │\n│ 2517 │ 672 │ cuccurissent │ #cu:cur:uri:ris:iss:sse:set:et# │ curisset │ 0 │\n│ 2518 │ 672 │ cuccurissent │ #cu:cuc:ucc:ccu:cur:uri:ris:iss:sse:sem:em# │ cuccurissem │ 0 │\n│ 2519 │ 672 │ cuccurissent │ #cu:cur:uri:ris:iss:sse:sem:em# │ curissem │ 0 │","category":"page"},{"location":"#Cross-validation","page":"Home","title":"Cross-validation","text":"","category":"section"},{"location":"","page":"Home","title":"Home","text":"The model also provides functionality for cross-validation. Here, we first split the dataset randomly into 90% training and 10% validation data:","category":"page"},{"location":"","page":"Home","title":"Home","text":"latin_train, latin_val = JudiLing.loading_data_randomly_split(\"latin.csv\",\n \"data\",\n \"latin\",\n val_ratio=0.1,\n random_seed=42)","category":"page"},{"location":"","page":"Home","title":"Home","text":"Then, we make the C matrix by passing both training and validation datasets to the make_combined_cue_matrix function which ensures that the C matrix contains columns for both training and validation data.","category":"page"},{"location":"","page":"Home","title":"Home","text":"cue_obj_train, cue_obj_val = JudiLing.make_combined_cue_matrix(\n latin_train,\n latin_val,\n grams = 3,\n target_col = :Word,\n tokenized = false,\n keep_sep = false\n)","category":"page"},{"location":"","page":"Home","title":"Home","text":"Next, we simulate semantic vectors, again for both the training and validation data, using make_combined_S_matrix:","category":"page"},{"location":"","page":"Home","title":"Home","text":"n_features = size(cue_obj_train.C, 2)\nS_train, S_val = JudiLing.make_combined_S_matrix(\n latin_train,\n latin_val,\n [\"Lexeme\"],\n [\"Person\", \"Number\", \"Tense\", \"Voice\", \"Mood\"],\n ncol = n_features\n)","category":"page"},{"location":"","page":"Home","title":"Home","text":"After that, we make the transformation matrices, but this time we only use the training dataset. 
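Note that make_combined_cue_matrix and make_combined_S_matrix construct the training and validation matrices jointly, so both pairs share their column spaces; this is what makes applying the training mappings to the validation data well-defined. A quick sanity check (a sketch, assuming the objects constructed above):

```julia
# cue and semantic dimensions must agree between training and validation data
@assert size(cue_obj_train.C, 2) == size(cue_obj_val.C, 2)
@assert size(S_train, 2) == size(S_val, 2)
```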
We use these transformation matrices to predict the validation dataset.","category":"page"},{"location":"","page":"Home","title":"Home","text":"G_train = JudiLing.make_transform_matrix(S_train, cue_obj_train.C)\nF_train = JudiLing.make_transform_matrix(cue_obj_train.C, S_train)\n\nChat_train = S_train * G_train\nChat_val = S_val * G_train\nShat_train = cue_obj_train.C * F_train\nShat_val = cue_obj_val.C * F_train\n\n@show JudiLing.eval_SC(Chat_train, cue_obj_train.C)\n@show JudiLing.eval_SC(Chat_val, cue_obj_val.C)\n@show JudiLing.eval_SC(Shat_train, S_train)\n@show JudiLing.eval_SC(Shat_val, S_val)","category":"page"},{"location":"","page":"Home","title":"Home","text":"Output:","category":"page"},{"location":"","page":"Home","title":"Home","text":"JudiLing.eval_SC(Chat_train, cue_obj_train.C) = 0.995\nJudiLing.eval_SC(Chat_val, cue_obj_val.C) = 0.403\nJudiLing.eval_SC(Shat_train, S_train) = 0.9917\nJudiLing.eval_SC(Shat_val, S_val) = 1.0","category":"page"},{"location":"","page":"Home","title":"Home","text":"Finally, we can find possible paths through build_paths or learn_paths. Since validation datasets are harder to predict, we turn on tolerant mode, which allows the algorithms to find more paths, at the cost of investing more time.","category":"page"},{"location":"","page":"Home","title":"Home","text":"A = cue_obj_train.A\nmax_t = JudiLing.cal_max_timestep(latin_train, latin_val, :Word)\n\nres_learn_train, gpi_learn_train = JudiLing.learn_paths(\n    latin_train,\n    latin_train,\n    cue_obj_train.C,\n    S_train,\n    F_train,\n    Chat_train,\n    A,\n    cue_obj_train.i2f,\n    cue_obj_train.f2i, # api changed in 0.3.1\n    gold_ind = cue_obj_train.gold_ind,\n    Shat_val = Shat_train,\n    check_gold_path = true,\n    max_t = max_t,\n    max_can = 10,\n    grams = 3,\n    threshold = 0.05,\n    tokenized = false,\n    sep_token = \"_\",\n    keep_sep = false,\n    target_col = :Word,\n    issparse = :dense,\n    verbose = true,\n)\n\nres_learn_val, gpi_learn_val = JudiLing.learn_paths(\n    latin_train,\n    latin_val,\n    cue_obj_train.C,\n    S_val,\n    F_train,\n    Chat_val,\n    A,\n    cue_obj_train.i2f,\n    cue_obj_train.f2i, # api changed in 0.3.1\n    gold_ind = cue_obj_val.gold_ind,\n    Shat_val = Shat_val,\n    check_gold_path = true,\n    max_t = max_t,\n    max_can = 10,\n    grams = 3,\n    threshold = 0.05,\n    is_tolerant = true,\n    tolerance = -0.1,\n    max_tolerance = 2,\n    tokenized = false,\n    sep_token = \"-\",\n    keep_sep = false,\n    target_col = :Word,\n    issparse = :dense,\n    verbose = true,\n)\n\nacc_learn_train =\n    JudiLing.eval_acc(res_learn_train, cue_obj_train.gold_ind, verbose = false)\nacc_learn_val = JudiLing.eval_acc(res_learn_val, cue_obj_val.gold_ind, verbose = false)\n\nres_build_train = JudiLing.build_paths(\n    latin_train,\n    cue_obj_train.C,\n    S_train,\n    F_train,\n    Chat_train,\n    A,\n    cue_obj_train.i2f,\n    cue_obj_train.gold_ind,\n    max_t = max_t,\n    n_neighbors = 3,\n    verbose = true,\n)\n\nres_build_val = JudiLing.build_paths(\n    latin_val,\n    cue_obj_train.C,\n    S_val,\n    F_train,\n    Chat_val,\n    A,\n    cue_obj_train.i2f,\n    cue_obj_train.gold_ind,\n    max_t = max_t,\n    n_neighbors = 20,\n    verbose = true,\n)\n\nacc_build_train =\n    JudiLing.eval_acc(res_build_train, cue_obj_train.gold_ind, verbose = false)\nacc_build_val = JudiLing.eval_acc(res_build_val, cue_obj_val.gold_ind, verbose = false)\n\n@show acc_learn_train\n@show acc_learn_val\n@show acc_build_train\n@show acc_build_val","category":"page"},{"location":"","page":"Home","title":"Home","text":"Output:","category":"page"},{"location":"","page":"Home","title":"Home","text":"acc_learn_train = 0.9983\nacc_learn_val = 
0.6866\nacc_build_train = 1.0\nacc_build_val = 0.3284","category":"page"},{"location":"","page":"Home","title":"Home","text":"Alternatively, we provide a wrapper function that incorporates all of the above functionality. With this function, you can quickly explore datasets under different parameter settings. You can find more details in the Test Combo Introduction.","category":"page"},{"location":"#Supports","page":"Home","title":"Supports","text":"","category":"section"},{"location":"","page":"Home","title":"Home","text":"The outputs contain two types of support: an utterance-level support and a set of supports for each cue. The former is also called \"synthesis-by-analysis\" support. It is calculated from the predicted S vector and the original S vector, and it is used to select the best paths. Cue-level supports are slices of the Yt matrices at each timestep. They are used to determine whether a cue is eligible for constructing paths.","category":"page"},
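{"location":"","page":"Home","title":"Home","text":"To make the utterance-level support concrete, here is a minimal sketch (not part of the JudiLing API): one way to realise a synthesis-by-analysis support is as the correlation between the predicted semantic vector and the semantic vector of a candidate path. The vectors shat and s_candidate below are hypothetical:","category":"page"},{"location":"","page":"Home","title":"Home","text":"using Statistics\n\n# hypothetical predicted semantic vector for one target word\nshat = [0.2, 0.9, 0.1, 0.5]\n# hypothetical semantic vector of one candidate path\ns_candidate = [0.3, 0.8, 0.0, 0.6]\n\n# synthesis-by-analysis support: the higher the correlation,\n# the better the candidate path matches the predicted semantics\nsupport = cor(shat, s_candidate)","category":"page"},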
{"location":"#Acknowledgments","page":"Home","title":"Acknowledgments","text":"","category":"section"},{"location":"","page":"Home","title":"Home","text":"This project was supported by the ERC advanced grant WIDE-742545 and by the Deutsche Forschungsgemeinschaft (DFG, German Research Foundation) under Germany’s Excellence Strategy - EXC number 2064/1 - Project number 390727645.","category":"page"},{"location":"#Citation","page":"Home","title":"Citation","text":"","category":"section"},{"location":"","page":"Home","title":"Home","text":"If you find this package helpful, please cite it as follows:","category":"page"},{"location":"","page":"Home","title":"Home","text":"Luo, X., Heitmeier, M., Chuang, Y. Y., and Baayen, R. H. JudiLing: an implementation of the Discriminative Lexicon Model in Julia. Eberhard Karls Universität Tübingen, Seminar für Sprachwissenschaft.","category":"page"},{"location":"","page":"Home","title":"Home","text":"The following studies have made use of several algorithms now implemented in JudiLing instead of WpmWithLdl:","category":"page"},{"location":"","page":"Home","title":"Home","text":"Baayen, R. H., Chuang, Y. Y., Shafaei-Bajestan, E., and Blevins, J. P. (2019). The discriminative lexicon: A unified computational model for the lexicon and lexical processing in comprehension and production grounded not in (de)composition but in linear discriminative learning. Complexity, 2019, 1-39.\nBaayen, R. H., Chuang, Y. Y., and Blevins, J. P. (2018). Inflectional morphology with linear mappings. The Mental Lexicon, 13 (2), 232-270.\nChuang, Y.-Y., Lõo, K., Blevins, J. P., and Baayen, R. H. (2020). Estonian case inflection made simple. A case study in Word and Paradigm morphology with Linear Discriminative Learning. In Körtvélyessy, L., and Štekauer, P. (Eds.) Complex Words: Advances in Morphology, 1-19.\nChuang, Y.-Y., Bell, M. J., Banke, I., and Baayen, R. H. (2020). Bilingual and multilingual mental lexicon: a modeling study with Linear Discriminative Learning. Language Learning, 1-55.\nHeitmeier, M., Chuang, Y.-Y., and Baayen, R. H. (2021). Modeling morphology with Linear Discriminative Learning: considerations and design choices. Frontiers in Psychology, 12, 4929.\nDenistia, K., and Baayen, R. H. (2022). The morphology of Indonesian: Data and quantitative modeling. In Shei, C., and Li, S. (Eds.) The Routledge Handbook of Asian Linguistics, (pp. 605-634). Routledge, London.\nHeitmeier, M., Chuang, Y.-Y., and Baayen, R. H. (2023). How trial-to-trial learning shapes mappings in the mental lexicon: Modelling lexical decision with linear discriminative learning. Cognitive Psychology, 1-30.\nChuang, Y. Y., Kang, M., Luo, X. F., and Baayen, R. H. (2023). Vector Space Morphology with Linear Discriminative Learning. In Crepaldi, D. (Ed.) Linguistic morphology in the mind and brain.\nHeitmeier, M., Chuang, Y. Y., Axen, S. D., and Baayen, R. H. (2024). Frequency effects in linear discriminative learning. Frontiers in Human Neuroscience, 17, 1242720.\nPlag, I., Heitmeier, M., and Domahs, F. (to appear). German nominal number interpretation in an impaired mental lexicon: A naive discriminative learning perspective. The Mental Lexicon.","category":"page"},{"location":"man/make_cue_matrix/","page":"Make Cue Matrix","title":"Make Cue Matrix","text":"CurrentModule = JudiLing","category":"page"},{"location":"man/make_cue_matrix/#Make-Cue-Matrix","page":"Make Cue Matrix","title":"Make Cue Matrix","text":"","category":"section"},{"location":"man/make_cue_matrix/","page":"Make Cue Matrix","title":"Make Cue Matrix","text":"    Cue_Matrix_Struct\r\n    make_cue_matrix\r\n    make_combined_cue_matrix\r\n    make_ngrams\r\n    make_cue_matrix(data::DataFrame)\r\n    make_cue_matrix(data::DataFrame, cue_obj::Cue_Matrix_Struct)\r\n    make_cue_matrix(data_train::DataFrame, data_val::DataFrame)\r\n    make_combined_cue_matrix(data_train, data_val)\r\n    make_cue_matrix_from_CFBS(features::Vector{Vector{T}};\r\n                              pad_val::T = 0.,\r\n                              ncol::Union{Missing,Int}=missing) where {T}\r\n    make_combined_cue_matrix_from_CFBS(features_train::Vector{Vector{T}},\r\n                                       features_test::Vector{Vector{T}};\r\n                                       pad_val::T = 0.,\r\n                                       ncol::Union{Missing,Int}=missing) where {T}\r\n    make_ngrams(tokens, grams, keep_sep, sep_token, start_end_token)","category":"page"},{"location":"man/make_cue_matrix/#JudiLing.Cue_Matrix_Struct","page":"Make Cue Matrix","title":"JudiLing.Cue_Matrix_Struct","text":"A structure that stores information created by make_cue_matrix: C is the cue matrix; f2i is a dictionary returning the indices for features; i2f is a dictionary returning the features for indices; gold_ind is a list of indices of gold paths; A is the adjacency matrix; grams is the number of grams for cues; target_col is the column name for target strings; tokenized is whether the dataset target is tokenized; sep_token is the separator; keep_sep is whether to keep separators in cues; start_end_token is the start and end token in boundary cues.\n\n\n\n\n\n","category":"type"},
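{"location":"man/make_cue_matrix/","page":"Make Cue Matrix","title":"Make Cue Matrix","text":"For illustration, a small sketch of accessing some of these fields on a cue object built from the Latin data (assuming latin is loaded as in the quick start; the exact cue strings depend on the data):","category":"page"},{"location":"man/make_cue_matrix/","page":"Make Cue Matrix","title":"Make Cue Matrix","text":"cue_obj = JudiLing.make_cue_matrix(latin, grams=3, target_col=:Word)\n\nsize(cue_obj.C)       # (number of word forms, number of distinct cues)\ncue = cue_obj.i2f[1]  # the cue stored at index 1\ncue_obj.f2i[cue]      # 1, mapping the cue back to its index\ncue_obj.grams         # 3","category":"page"},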
{"location":"man/make_cue_matrix/#JudiLing.make_cue_matrix","page":"Make Cue Matrix","title":"JudiLing.make_cue_matrix","text":"Construct cue matrix.\n\n\n\n\n\n","category":"function"},{"location":"man/make_cue_matrix/#JudiLing.make_combined_cue_matrix","page":"Make Cue Matrix","title":"JudiLing.make_combined_cue_matrix","text":"Construct a cue matrix with combined features and adjacencies for both the training and the validation dataset.\n\n\n\n\n\n","category":"function"},{"location":"man/make_cue_matrix/#JudiLing.make_ngrams","page":"Make Cue Matrix","title":"JudiLing.make_ngrams","text":"Given a list of string tokens, extract their n-grams.\n\n\n\n\n\n","category":"function"},{"location":"man/make_cue_matrix/#JudiLing.make_cue_matrix-Tuple{DataFrames.DataFrame}","page":"Make Cue Matrix","title":"JudiLing.make_cue_matrix","text":"make_cue_matrix(data::DataFrame)\n\nMake the cue matrix for a training dataset and the corresponding indices, as well as the adjacency matrix and gold paths, given a dataset in the form of a dataframe.\n\nObligatory Arguments\n\ndata::DataFrame: the dataset\n\nOptional Arguments\n\ngrams::Int64=3: the number of grams for cues\ntarget_col::Union{String, Symbol}=:Words: the column name for target strings\ntokenized::Bool=false: if true, the dataset target is assumed to be tokenized\nsep_token::Union{Nothing, String, Char}=nothing: separator\nkeep_sep::Bool=false: if true, keep separators in cues\nstart_end_token::Union{String, Char}=\"#\": start and end token in boundary cues\nverbose::Bool=false: if true, more information is printed\n\nExamples\n\n# make cue matrix without tokenization\ncue_obj_train = JudiLing.make_cue_matrix(\n     latin_train,\n    grams=3,\n    target_col=:Word,\n    tokenized=false,\n    sep_token=\"-\",\n    start_end_token=\"#\",\n    keep_sep=false,\n    verbose=false\n    )\n\n# make cue matrix with tokenization\ncue_obj_train = JudiLing.make_cue_matrix(\n    french_train,\n    grams=3,\n    target_col=:Syllables,\n    tokenized=true,\n    sep_token=\"-\",\n    start_end_token=\"#\",\n    keep_sep=true,\n    verbose=false\n    )\n\n\n\n\n\n","category":"method"},{"location":"man/make_cue_matrix/#JudiLing.make_cue_matrix-Tuple{DataFrames.DataFrame, JudiLing.Cue_Matrix_Struct}","page":"Make Cue Matrix","title":"JudiLing.make_cue_matrix","text":"make_cue_matrix(data::DataFrame, cue_obj::Cue_Matrix_Struct)\n\nMake the cue matrix for a validation dataset and the corresponding indices, as well as the adjacency matrix and gold paths, given a dataset in the form of a dataframe.\n\nObligatory Arguments\n\ndata::DataFrame: the dataset\ncue_obj::Cue_Matrix_Struct: training cue object\n\nOptional Arguments\n\ngrams::Int64=3: the number of grams for cues\ntarget_col::Union{String, Symbol}=:Words: the column name for target strings\ntokenized::Bool=false: if true, the dataset target is assumed to be tokenized\nsep_token::Union{Nothing, String, Char}=nothing: separator\nkeep_sep::Bool=false: if true, keep separators in cues\nstart_end_token::Union{String, Char}=\"#\": start and end token in boundary cues\nverbose::Bool=false: if true, more information is printed\n\nExamples\n\n# make cue matrix without tokenization\ncue_obj_val = JudiLing.make_cue_matrix(\n    latin_val,\n    cue_obj_train,\n    grams=3,\n    target_col=:Word,\n    tokenized=false,\n    sep_token=\"-\",\n    keep_sep=false,\n    start_end_token=\"#\",\n    verbose=false\n    )\n\n# make cue matrix with tokenization\ncue_obj_val = JudiLing.make_cue_matrix(\n    french_val,\n    cue_obj_train,\n    grams=3,\n    target_col=:Syllables,\n    tokenized=true,\n    sep_token=\"-\",\n    keep_sep=true,\n    start_end_token=\"#\",\n    verbose=false\n    )\n\n\n\n\n\n","category":"method"},{"location":"man/make_cue_matrix/#JudiLing.make_cue_matrix-Tuple{DataFrames.DataFrame, DataFrames.DataFrame}","page":"Make Cue Matrix","title":"JudiLing.make_cue_matrix","text":"make_cue_matrix(data_train::DataFrame, data_val::DataFrame)\n\nMake the cue matrix for training and validation datasets at the same time.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\n\nOptional Arguments\n\ngrams::Int64=3: the number of grams for cues\ntarget_col::Union{String, Symbol}=:Words: the column name for target strings\ntokenized::Bool=false: if true, the dataset target is assumed to be tokenized\nsep_token::Union{Nothing, String, Char}=nothing: separator\nkeep_sep::Bool=false: if true, keep separators in cues\nstart_end_token::Union{String, Char}=\"#\": start and end token in boundary cues\nverbose::Bool=false: if true, more information is printed\n\nExamples\n\n# make cue matrix without tokenization\ncue_obj_train, 
cue_obj_val = JudiLing.make_cue_matrix(\n    latin_train,\n    latin_val,\n    grams=3,\n    target_col=:Word,\n    tokenized=false,\n    keep_sep=false\n    )\n\n# make cue matrix with tokenization\ncue_obj_train, cue_obj_val = JudiLing.make_cue_matrix(\n    french_train,\n    french_val,\n    grams=3,\n    target_col=:Syllables,\n    tokenized=true,\n    sep_token=\"-\",\n    keep_sep=true,\n    start_end_token=\"#\",\n    verbose=false\n    )\n\n\n\n\n\n","category":"method"},{"location":"man/make_cue_matrix/#JudiLing.make_combined_cue_matrix-Tuple{Any, Any}","page":"Make Cue Matrix","title":"JudiLing.make_combined_cue_matrix","text":"make_combined_cue_matrix(data_train, data_val)\n\nMake the cue matrix for training and validation datasets at the same time, where the features and adjacencies are combined.\n\nObligatory Arguments\n\ndata_train::DataFrame: the training dataset\ndata_val::DataFrame: the validation dataset\n\nOptional Arguments\n\ngrams::Int64=3: the number of grams for cues\ntarget_col::Union{String, Symbol}=:Words: the column name for target strings\ntokenized::Bool=false: if true, the dataset target is assumed to be tokenized\nsep_token::Union{Nothing, String, Char}=nothing: separator\nkeep_sep::Bool=false: if true, keep separators in cues\nstart_end_token::Union{String, Char}=\"#\": start and end token in boundary cues\nverbose::Bool=false: if true, more information is printed\n\nExamples\n\n# make cue matrix without tokenization\ncue_obj_train, cue_obj_val = JudiLing.make_combined_cue_matrix(\n    latin_train,\n    latin_val,\n    grams=3,\n    target_col=:Word,\n    tokenized=false,\n    keep_sep=false\n    )\n\n# make cue matrix with tokenization\ncue_obj_train, cue_obj_val = JudiLing.make_combined_cue_matrix(\n    french_train,\n    french_val,\n    grams=3,\n    target_col=:Syllables,\n    tokenized=true,\n    sep_token=\"-\",\n    keep_sep=true,\n    start_end_token=\"#\",\n    verbose=false\n    )\n\n\n\n\n\n","category":"method"},{"location":"man/make_cue_matrix/#JudiLing.make_cue_matrix_from_CFBS-Union{Tuple{Array{Vector{T}, 1}}, Tuple{T}} where T","page":"Make Cue Matrix","title":"JudiLing.make_cue_matrix_from_CFBS","text":"make_cue_matrix_from_CFBS(features::Vector{Vector{T}};\n                          pad_val::T = 0.,\n                          ncol::Union{Missing,Int}=missing) where {T}\n\nCreate a cue matrix from a vector of feature vectors (usually CFBS vectors). The vectors are expected (though of course not required) to have varying lengths; they are consequently padded on the right with the provided pad_val.\n\nObligatory arguments\n\nfeatures::Vector{Vector{T}}: vector of vectors containing C-FBS features\n\nOptional arguments\n\npad_val::T = 0.: value with which the feature vectors will be padded\nncol::Union{Missing,Int}=missing: number of columns of the C matrix. If not set, it will be set to the maximum number of features\n\nExamples\n\nC = JudiLing.make_cue_matrix_from_CFBS(features)\n\n\n\n\n\n","category":"method"},
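{"location":"man/make_cue_matrix/","page":"Make Cue Matrix","title":"Make Cue Matrix","text":"To illustrate the padding behaviour, a minimal sketch with made-up feature vectors (the numbers are hypothetical):","category":"page"},{"location":"man/make_cue_matrix/","page":"Make Cue Matrix","title":"Make Cue Matrix","text":"features = [[0.1, 0.2, 0.3],\n            [0.4, 0.5]]\n\nC = JudiLing.make_cue_matrix_from_CFBS(features)\n# the shorter vector is padded on the right with pad_val (0. by default),\n# so C should correspond to\n# 0.1  0.2  0.3\n# 0.4  0.5  0.0","category":"page"},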
{"location":"man/make_cue_matrix/#JudiLing.make_combined_cue_matrix_from_CFBS-Union{Tuple{T}, Tuple{Array{Vector{T}, 1}, Array{Vector{T}, 1}}} where T","page":"Make Cue Matrix","title":"JudiLing.make_combined_cue_matrix_from_CFBS","text":"make_combined_cue_matrix_from_CFBS(features_train::Vector{Vector{T}},\n                                   features_test::Vector{Vector{T}};\n                                   pad_val::T = 0.,\n                                   ncol::Union{Missing,Int}=missing) where {T}\n\nCreate cue matrices from two vectors of feature vectors (usually CFBS vectors). The vectors are expected (though of course not required) to have varying lengths; they are consequently padded on the right with the provided pad_val. The cue matrices are sized to the maximum number of feature values in features_train and features_test.\n\nObligatory arguments\n\nfeatures_train::Vector{Vector{T}}: vector of vectors containing C-FBS features\nfeatures_test::Vector{Vector{T}}: vector of vectors containing C-FBS features\n\nOptional arguments\n\npad_val::T = 0.: value with which the feature vectors will be padded\nncol::Union{Missing,Int}=missing: number of columns of the C matrices. If not set, it will be set to the maximum number of features in features_train and features_test\n\nExamples\n\nC_train, C_test = JudiLing.make_combined_cue_matrix_from_CFBS(features_train, features_test)\n\n\n\n\n\n","category":"method"},{"location":"man/make_cue_matrix/#JudiLing.make_ngrams-NTuple{5, Any}","page":"Make Cue Matrix","title":"JudiLing.make_ngrams","text":"make_ngrams(tokens, grams, keep_sep, sep_token, start_end_token)\n\nGiven a list of string tokens, return a list of all n-grams for these tokens.\n\n\n\n\n\n","category":"method"},
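{"location":"man/make_cue_matrix/","page":"Make Cue Matrix","title":"Make Cue Matrix","text":"As a sketch of the underlying idea (a toy re-implementation for illustration, not the JudiLing internals), trigrams over the character tokens of #vocat# can be extracted as follows:","category":"page"},{"location":"man/make_cue_matrix/","page":"Make Cue Matrix","title":"Make Cue Matrix","text":"# toy n-gram extraction over a token list: slide a window of length grams\nngrams_sketch(tokens, grams) =\n    [join(tokens[i:i+grams-1]) for i in 1:(length(tokens)-grams+1)]\n\nngrams_sketch([\"#\", \"v\", \"o\", \"c\", \"a\", \"t\", \"#\"], 3)\n# 5-element Vector{String}:\n# \"#vo\", \"voc\", \"oca\", \"cat\", \"at#\"","category":"page"}] }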