
Commit 189a727

Commit message: "update"
1 parent 002e570


55 files changed: +738 −3106 lines

OPM_application_nominal.ipynb (+502)
Large diffs are not rendered by default.

OPM_application_nominal.qmd (+16 −12)

@@ -11,7 +11,11 @@ jupyter: ir

 ```{r}
 source('code/tplotfunctions.R')
-source('code/optimal_predictor_machine-nominal.R')
+source('code/OPM-nominal/buildP.R')
+source('code/OPM-nominal/forecastP.R')
+source('code/OPM-nominal/guessmetadata.R')
+source('code/OPM-nominal/plotFsamples1D.R')
+source('code/OPM-nominal/rF.R')
 ```
 ```{r}
 #| echo: false
@@ -71,7 +75,7 @@ Our agent at the moment doesn't know anything at all, not even about the existen
 Let us give it the basic background information about the population: the variates' names and domains. We do this through the function `finfo()`: it has a `data` argument, which we omit for the moment, and a `metadata` argument. The latter can simply be the name of the file containing the metadata (NB: this file must have a specific format):

 ```{r}
-priorknowledge <- buildK(metadata='datasets/glass_metadata-4_lev.csv')
+priorknowledge <- buildP(metadata='datasets/glass_metadata-4_lev.csv')
 ```

 The agent now possesses this basic background knowledge, encoded in the `priorknowledge` object. The encoding uses a particular mathematical representation which, however, is of no interest to us^[If you're curious you can have a glimpse at it with the command `str(priorknowledge)`, which displays structural information about an object.]. Other representations could also be used, but the knowledge would be the same. Think of this as encoding an image into a `png` or other lossless format: the representation of the image would be different, but the image would be the same.
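A minimal sketch for readers following along, based only on the calls visible in this diff: it builds the prior-knowledge object with the renamed `buildP()` and inspects it with `str()`, as the footnote above suggests. The file paths are the ones used in the commit; `data.table` is assumed to be installed, since `buildP.R` declares it as a requirement.

```r
## Sketch, not part of the commit: build background knowledge from metadata
## and peek at its internal representation (an implementation detail).
library(data.table)                  # required by buildP()
source('code/OPM-nominal/buildP.R')

priorknowledge <- buildP(metadata='datasets/glass_metadata-4_lev.csv')
str(priorknowledge)                  # display the object's structure
```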
@@ -86,7 +90,7 @@ Let's ask the agent: what is the marginal frequency distribution for the variate
 This probability distribution for the $\vType$ variate is calculated by the function `fmarginal()`. It has arguments `finfo`: the agent's information; and `variates`: the names of the variates of which we want the marginal frequencies:

 ```{r}
-priorknowledge_type <- fprobability(K=priorknowledge, marginal='Type', Kout=TRUE)
+priorknowledge_type <- forecastP(P=priorknowledge, marginal='Type', Kout=TRUE)

 ```

@@ -99,7 +103,7 @@ The function `plotsamples1D()` does this kind of visual representation. It has a
 How do you think this probability distribution will look? What kind of marginal frequencies do we expect in the full population?

 ```{r}
-plotsamples1D(K=priorknowledge_type, n=100, predict=FALSE)
+plotsamples1D(P=priorknowledge_type, n=100, predict=FALSE)
 ```

 You see that anything goes: some frequency distributions give frequency almost `1` to a specific value and almost `0` to the others; other frequency distributions spread the frequencies out more evenly, with some peaks here or there.
@@ -120,7 +124,7 @@ Before continuing, ask yourself the same question: which probabilities would you
 The agent's answer this time is a probability distribution over seven values, which we can draw faithfully. The function `plotsamples1D()` can draw this probability as well, if we give the argument `predict=TRUE` (the default):

 ```{r}
-plotsamples1D(K=priorknowledge_type)
+plotsamples1D(P=priorknowledge_type)
 ```

 This plot shows the [probability distribution]{.blue} for the next unit in [blue]{.blue}, together with a sample of 100 possible frequency distributions for the $\vType$ variate over the full population. Note that samples are drawn anew every time, so they can look somewhat different from time to time.^[To have reproducible plots, use `set.seed(314)` (or any integer you like) before calling the plot function.]
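A short sketch of the reproducibility tip from the footnote above, using the renamed `P` argument from this commit (function and object names are taken from the surrounding diff; the seed value is arbitrary):

```r
## Sketch, not part of the commit: fix the random seed so the sampled
## frequency distributions come out identical on every render.
set.seed(314)
plotsamples1D(P=priorknowledge_type)
```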
@@ -139,10 +143,10 @@ Inspect the agent's inferences for other variates.

 ### Learning from the sample data

-Now let's give the agent the data from the sample of 214 glass fragments. This is done again with the `buildK()` function, but providing the `data` argument, which can be the name of the data file:
+Now let's give the agent the data from the sample of 214 glass fragments. This is done again with the `buildP()` function, but providing the `data` argument, which can be the name of the data file:

 ```{r}
-postknowledge <- buildK(data='datasets/glass_data-4_lev.csv', metadata='datasets/glass_metadata-4_lev.csv')
+postknowledge <- buildP(data='datasets/glass_data-4_lev.csv', metadata='datasets/glass_metadata-4_lev.csv')
 ```

 The `postknowledge` object contains the agent's knowledge from the metadata and the sample data. This object can be used in the same way as the object representing the agent's background knowledge.
@@ -154,9 +158,9 @@ Now that the agent has learned from the data, we can ask it again what is the ma
 We calculate the probability for the possible marginal frequency distributions, and then plot it as a set of 100 representative samples:

 ```{r}
-postknowledge_type <- fprobability(K=postknowledge, marginal='Type', Kout=TRUE)
+postknowledge_type <- forecastP(P=postknowledge, marginal='Type', Kout=TRUE)

-plotsamples1D(K=postknowledge_type, predict=FALSE)
+plotsamples1D(P=postknowledge_type, predict=FALSE)
 ```

 This plot shows two important aspects of this probability distribution and of the agent's current state of knowledge:
@@ -185,7 +189,7 @@ Finally we ask the agent what $\vType$ value we should observe in the next glass
 ```{r}
 #| label: fig-unconditional-glass
 #| fig-cap: "[Frequency distributions for full population]{.grey}, and [probability distribution for next unit]{.blue}"
-plotsamples1D(K=postknowledge_type)
+plotsamples1D(P=postknowledge_type)
 ```

@@ -213,7 +217,7 @@ The detectives would like to know what's the possible origin of this fragment, t
 First, the agent can calculate the probability distribution over the *conditional frequencies* ([§ @sec-conditional-freqs]) of the $\vType$ values for the subpopulation ([§ @sec-subpopulations]) of units having the specific variate values above. This calculation is done with the function `fconditional()`, with arguments `finfo`: the agent's current knowledge, and `unitdata`: the partial data obtained from the unit.

 ```{r}
-condknowledge_type <- fprobability(K=postknowledge, marginal='Type', conditional=newfragment, Kout=TRUE)
+condknowledge_type <- forecastP(P=postknowledge, marginal='Type', conditional=newfragment, Kout=TRUE)
 ```

 The `condknowledge` object contains the agent's knowledge conditional on the variates given; this knowledge is about the remaining variates, which in this case are the single variate $\vType$ (so the `fmarginal()` calculation is actually redundant in this case).
@@ -225,7 +229,7 @@ Both inferences can be visualized in the usual way:
 ```{r}
 #| label: fig-conditional-glass
 #| fig-cap: "[Conditional frequency distributions for full population]{.grey}, and [conditional probability distribution for next unit]{.blue}"
-plotsamples1D(K=condknowledge_type)
+plotsamples1D(P=condknowledge_type)
 ```

 The agent thus gives a probability of around $80\%$ to the fragment's being of $\cat{T1}$ type, around $10\%$ to its being of $\cat{T2}$ type, and around $5\%$ to its being of $\cat{T5}$ type. It also shows that further training data could change these probabilities by $\pm 10\%$ or even $\pm 15\%$.
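For readers reproducing the conditional inference in this file, a hedged sketch of the `newfragment` object, which the diff uses but does not show: `forecastP()` matches `names(conditional)` against the variate names, so a named list of observed values is assumed here. The variate names and values below are purely illustrative placeholders, not taken from the actual glass dataset or metadata.

```r
## Sketch, not part of the commit: hypothetical partial data for the new
## fragment; the names must match variate names in the metadata file.
newfragment <- list(RI='high', Na='low')
```

This object is then passed as `conditional=newfragment`, as in the chunk above.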

OPM_application_nominal_files/execute-results/html.json (+11)
Large diffs are not rendered by default.

_quarto.yml (+1 −1)

@@ -107,7 +107,7 @@ book:
     chapters:
       - dirichlet-mixture.qmd
       - prototype_code.qmd
-      - OPM_application_nominal.qmd
+      # - OPM_application_nominal.qmd

   - part: "[**Decision theory**]{.lightblue}"
     chapters:

code/OPM-nominal/buildK.R → code/OPM-nominal/buildP.R (+1 −1)

@@ -1,4 +1,4 @@
-buildK <- function(metadata, data=NULL, alphas=NULL){
+buildP <- function(metadata, data=NULL, alphas=NULL){
     #### Build object encoding background knowledge and learned knowledge
     #### Requires 'data.table'
     ##

code/OPM-nominal/forecastK.R → code/OPM-nominal/forecastP.R (+8 −8)

@@ -1,7 +1,7 @@
-forecastK <- function(K, conditional=NULL){
+forecastP <- function(P, conditional=NULL){
     #### Calculate conditional or unconditional probability
-    variates <- names(dimnames(K[['freqs']]))
-    M <- length(K[['freqs']])
+    variates <- names(dimnames(P[['freqs']]))
+    M <- length(P[['freqs']])
     ## Selection of conditional values
     ## select subarray of freqs corresponding to the conditional values
     if(!is.null(conditional)){
@@ -18,23 +18,23 @@ forecastK <- function(K, conditional=NULL){
         iconditional <- match(names(conditional), variates)
         totake <- as.list(rep(TRUE, length(variates)))
         totake[iconditional] <- conditional
-        freqs <- do.call(`[`, c(list(K[['freqs']]), totake))
+        freqs <- do.call(`[`, c(list(P[['freqs']]), totake))
         if(is.null(dim(freqs))){
             dim(freqs) <- length(freqs)
-            dimnames(freqs) <- dimnames(K[['freqs']])[-iconditional]
+            dimnames(freqs) <- dimnames(P[['freqs']])[-iconditional]
         }
     }else{
-        freqs <- K[['freqs']]
+        freqs <- P[['freqs']]
    }
     ##
     ## create an array of forecast variates and alphas
     freqs <- aperm(
-        sapply(K[['alphas']], function(alpha){
+        sapply(P[['alphas']], function(alpha){
             log(M*alpha + freqs)
         }, simplify='array'),
         c(length(dim(freqs))+1, 1:length(dim(freqs)))
     )
-    freqs <- freqs - max(freqs) + K[['valphas']]
+    freqs <- freqs - max(freqs) + P[['valphas']]
     ##
     temp <- dimnames(freqs)[-1]
     freqs <- colSums(exp(freqs))
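A hedged usage sketch of the renamed function, based only on the signature visible in this file: `P` is an object produced by `buildP()`, and `conditional` is a named list of observed variate values (the names and values below are illustrative placeholders). The `.qmd` calls shown earlier also pass `marginal` and `Kout` arguments, which do not appear in this hunk, so they are omitted here.

```r
## Sketch, not part of the commit.
source('code/OPM-nominal/buildP.R')
source('code/OPM-nominal/forecastP.R')

postknowledge <- buildP(data='datasets/glass_data-4_lev.csv',
                        metadata='datasets/glass_metadata-4_lev.csv')

## Unconditional forecast over all variates.
forecastP(P=postknowledge)

## Forecast conditional on hypothetical observed values
## (names must match variate names from the metadata).
forecastP(P=postknowledge, conditional=list(RI='high', Na='low'))
```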

code/OPM-nominal/plotFsamples1D.R (+4 −4)

@@ -1,10 +1,10 @@
-plotFsamples1D <- function(K, n=100, predict=TRUE, file=NULL){
+plotFsamples1D <- function(P, n=100, predict=TRUE, file=NULL){
     #### Plot samples of full-population freq. distributions for one variate
     #### Requires 'png' to plot png
-    if(length(dim(K[['freqs']])) > 1){
+    if(length(dim(P[['freqs']])) > 1){
         stop('State of knowledge comprises more than one variate.')
     }
-    samples <- rF(n=n, K=K)
+    samples <- rF(n=n, P=P)
     if(!is.null(file)){
         filext <- sub(".*\\.|.*", "", file, perl=TRUE)
         if(filext == 'pdf'){
@@ -21,7 +21,7 @@ plotFsamples1D <- function(K, n=100, predict=TRUE, file=NULL){
          lty=1, lwd=1, pch=16, col=7, alpha=0.5, cex=0.75
     )
     if(predict){
-        fmean <- fprobability(K=K, Kout=F)
+        fmean <- fprobability(P=P, Kout=F)
         tplot(y=fmean, x=1:ncol(samples), type='b',
              lty=1, lwd=4, pch=18, col=1, alpha=0.25, cex=1, add=T
         )
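A hedged usage sketch of the renamed plotting function, based on the signature and the `file` handling visible in this diff. The knowledge object `postknowledge_type` is taken from the `.qmd` above and must describe a single variate, as the `stop()` check enforces; the output file name is an arbitrary placeholder, and the function's header notes that the 'png' package is needed for PNG output.

```r
## Sketch, not part of the commit: plot 100 sampled frequency distributions
## plus the predictive distribution (predict=TRUE is the default) and save
## the figure to a PNG file. The helper scripts it relies on are sourced first.
source('code/tplotfunctions.R')
source('code/OPM-nominal/rF.R')
source('code/OPM-nominal/plotFsamples1D.R')

plotFsamples1D(P=postknowledge_type, n=100, predict=TRUE, file='type_forecast.png')
```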

code/OPM-nominal/rF.R (+6 −6)

@@ -1,10 +1,10 @@
-rF <- function(n=1, K){
+rF <- function(n=1, P){
     #### Return a sample of full-population frequency
     #### Requires 'extraDistr'
-    alphasample <- sample(rep(K[['alphas']],2), size=n, replace=T,
-                          prob=rep(K[['palphas']],2))
-    ff <- extraDistr::rdirichlet(n, alpha=outer(alphasample, c(K[['freqs']]), `+`))
-    dim(ff) <- c(n,dim(K[['freqs']]))
-    dimnames(ff) <- c(list(sample=NULL), dimnames(K[['freqs']]))
+    alphasample <- sample(rep(P[['alphas']],2), size=n, replace=T,
+                          prob=rep(P[['palphas']],2))
+    ff <- extraDistr::rdirichlet(n, alpha=outer(alphasample, c(P[['freqs']]), `+`))
+    dim(ff) <- c(n,dim(P[['freqs']]))
+    dimnames(ff) <- c(list(sample=NULL), dimnames(P[['freqs']]))
     ff
 }
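A hedged sketch of drawing frequency samples directly with the renamed `rF()`, mirroring how `plotFsamples1D()` calls it above. The knowledge object `postknowledge_type` is taken from the `.qmd`; for a single-variate object, each row of the result is one sampled full-population frequency distribution. The 'extraDistr' package is assumed to be installed, as the function's header requires.

```r
## Sketch, not part of the commit: draw 100 full-population frequency
## distributions for the Type variate; rows index samples, columns index
## the variate's values.
source('code/OPM-nominal/rF.R')

samples <- rF(n=100, P=postknowledge_type)
dim(samples)
```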
