From 61570f0c5d68212c60c5518f76005462abe3d444 Mon Sep 17 00:00:00 2001
From: Louis Aslett <louis.aslett@durham.ac.uk>
Date: Mon, 23 Sep 2024 16:51:56 +0100
Subject: [PATCH 01/43] Start work on v2

---
 DESCRIPTION | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/DESCRIPTION b/DESCRIPTION
index c71448f..3a696fd 100644
--- a/DESCRIPTION
+++ b/DESCRIPTION
@@ -1,7 +1,7 @@
 Package: kalis
 Type: Package
 Title: High Performance Li & Stephens Local Ancestry Inference
-Version: 1.0.0
+Version: 2.0.0
 Authors@R: c(person("Louis", "Aslett", role = c("aut", "cre"),
                     email = "louis.aslett@durham.ac.uk"),
              person("Ryan", "Christ", role = "aut",

From 55c3672d33b8a066ec3cd74dd14a4a23e5591f5d Mon Sep 17 00:00:00 2001
From: ryanchrist <ryan.christ7@gmail.com>
Date: Mon, 23 Sep 2024 11:43:39 -0500
Subject: [PATCH 02/43] Introducing O(n) clustering algorithm (blobby) and
 C-core for clade calling and clade matrix construction

---
 src/R_CladeMat.c | 834 +++++++++++++++++++++++++++++++++++++++++++++++
 src/R_CladeMat.h |  20 ++
 2 files changed, 854 insertions(+)
 create mode 100644 src/R_CladeMat.c
 create mode 100644 src/R_CladeMat.h

diff --git a/src/R_CladeMat.c b/src/R_CladeMat.c
new file mode 100644
index 0000000..6c26f30
--- /dev/null
+++ b/src/R_CladeMat.c
@@ -0,0 +1,834 @@
+#include "R_CladeMat.h"
+
+#define _GNU_SOURCE
+#include <pthread.h>
+#include "R_Kalis.h"
+#include "Cache.h"
+
+#define min(X, Y)  ((X) < (Y) ? (X) : (Y))
+// Node of the 1-D clustering ("blobby"): an interval of values that sits in two doubly-linked lists at once.
+typedef struct blob {
+  struct blob* blob;     // blob this one has been merged into; points to itself while it is still a root
+  size_t num_in_blob;    // number of observations counted in this blob
+  double lower;          // lower edge of the interval (inclusive in the membership tests)
+  double upper;          // upper edge of the interval (exclusive in the membership tests)
+  struct blob* next;     // neighbour holding larger values, NULL at the tail
+  struct blob* prev;     // neighbour holding smaller values, NULL at the head
+  struct blob* morepop;  // neighbour towards the head of the population-ordered list, NULL at the head
+  struct blob* lesspop;  // neighbour towards the tail of the population-ordered list, NULL at the tail
+  double c3;             // running total written by the "Col 3 calc" pass of blobby_BB
+} blob;
+
+// Debug helper: print a blob's address, merge target (NULL when it is its own root), count, range and list links.
+void printblob(blob* bobtheblob) {
+  Rprintf("Blob %p (%p): # = %d, range = (%lf, %lf), prv = %p, nxt = %p, lp = %p, mp = %p \n",
+          (void*) bobtheblob,                                             // %p requires a void* argument
+          (void*) (bobtheblob==bobtheblob->blob?NULL:bobtheblob->blob),
+          (int) bobtheblob->num_in_blob,                                  // a size_t must not be passed for %d
+          bobtheblob->lower,
+          bobtheblob->upper,
+          (void*) bobtheblob->prev,
+          (void*) bobtheblob->next,
+          (void*) bobtheblob->lesspop,
+          (void*) bobtheblob->morepop);
+}
+// Restore the population ordering after cur's count changed: swap cur with a neighbour until it is in place.
+void blobby_pop_contest(blob* cur, blob** headpop, blob** tailpop) {
+  if(cur->morepop != NULL && cur->morepop->num_in_blob < cur->num_in_blob) { // cur outgrew its morepop neighbour
+    blob *other;
+    other = cur->morepop;
+
+    if(other->morepop != NULL) {
+      other->morepop->lesspop = cur;
+    }
+    cur->morepop = other->morepop;
+    other->morepop = cur;
+    if(cur->morepop == NULL) { // nothing is more populous than cur any more
+      *headpop = cur;
+    }
+
+    if(cur->lesspop != NULL) {
+      cur->lesspop->morepop = other;
+    }
+    other->lesspop = cur->lesspop;
+    cur->lesspop = other;
+    if(other->lesspop == NULL) { // other is now the last entry of the population list
+      *tailpop = other;
+    }
+
+    blobby_pop_contest(cur, headpop, tailpop); // repeat until neither neighbour is out of order
+  } else if(cur->lesspop != NULL && cur->lesspop->num_in_blob > cur->num_in_blob) { // cur is smaller than its lesspop neighbour
+    blob *other;
+    other = cur->lesspop;
+
+    if(cur->morepop != NULL) {
+      cur->morepop->lesspop = other;
+    }
+    other->morepop = cur->morepop;
+    cur->morepop = other;
+    if(other->morepop == NULL) { // other moved to the front of the population list
+      *headpop = other;
+    }
+
+    if(other->lesspop != NULL) {
+      other->lesspop->morepop = cur;
+    }
+    cur->lesspop = other->lesspop;
+    other->lesspop = cur;
+    if(cur->lesspop == NULL) { // cur is now the last entry of the population list
+      *tailpop = cur;
+    }
+
+    blobby_pop_contest(cur, headpop, tailpop); // repeat until neither neighbour is out of order
+  }
+}
+
+// Follow the merge links from a blob until reaching the blob that points to itself, and return that one.
+blob* hunttheblob(blob* blob) {
+  while(blob->blob != blob)
+    blob = blob->blob;
+  return(blob);
+}
+// Map the product x*z0 to the distance -log(x*z0), substituting a finite maximum when the product is exactly zero.
+double alphabetascaling(double x, double z0) {
+  const double scaled = x * z0;
+  // -log(0) would be infinite; 744.44... is roughly -log(2^-1074), the smallest positive double
+  if(scaled != 0.0) {
+    return(-log(scaled));
+  }
+  return(744.4400719213812180897);
+}
+// Cluster the n distances -log(alpha[i]*beta[i]*z0) (the recipient's own entry is forced to 0) into blobs of half-width thres; fills blobs, x_in_blob and *n_clade and returns the blob holding the smallest values.
+blob* blobby_BB(const double* alpha, const double* beta, const size_t recipient, size_t n, blob* blobs, blob*** x_in_blob, double* n_clade, const double thres, const double maxd, const double unitdist, const int max1var) {
+  double z0 = 0.0;
+  for(size_t i = 0; i<n; i++) {
+    z0 += alpha[i] * beta[i];
+  }
+  z0 = 1/z0; // scaling factor applied to every alpha*beta product
+
+  const double* a_ptr = alpha+1; // a_ptr/b_ptr point at the entry being inserted; entry 0 is handled before the loop
+  const double* b_ptr = beta+1;
+
+  double x, xnext; // x is the value being inserted, xnext the value for the following iteration
+
+  blob *head, *tail, *headpop, *tailpop; // ends of the value-ordered list and of the population-ordered list
+  head = tail = headpop = tailpop = blobs;
+
+  blobs[0].blob = blobs;
+  blobs[0].num_in_blob = 1;
+  if(recipient==0)
+    x = 0.0;
+  else
+    x = alphabetascaling(*alpha * *beta, z0);
+  if(recipient==1)
+    xnext = 0.0;
+  else
+    xnext = alphabetascaling(*a_ptr * *b_ptr, z0);
+  blobs[0].lower = x - thres;
+  blobs[0].upper = x + thres;
+  blobs[0].next = NULL;
+  blobs[0].prev = NULL;
+  blobs[0].morepop = NULL;
+  blobs[0].lesspop = NULL;
+
+  x_in_blob[0] = &(blobs[0].blob); // each x_in_blob entry points at the .blob field of the blob that took the observation
+
+  // What element of blob array is the next new one?
+  size_t next_new_blob = 1;
+
+  const size_t recipientm1 = recipient - 1; // size_t arithmetic: wraps around when recipient is 0
+  blob* cur;
+
+  //Rprintf("Adding obs %lf\n", x);
+
+  for(size_t i = 1; i < n; i++) {
+    x = xnext;
+    if(i<n-1){ // only look ahead while a following entry exists
+      if(recipientm1==i)
+      {
+        xnext = 0.0;
+      }
+      else
+      {
+        xnext = alphabetascaling(*(a_ptr+1) * *(b_ptr+1), z0);
+      }
+    }
+
+    cur = headpop; // search the blobs from most to least populous
+
+    // DETAILED DEBUG
+    // Rprintf("COMPUTED BLOBS (hp = %p, tp = %p): \n", headpop, tailpop);
+    // blob* prt = head;
+    // while(prt != NULL) {
+    //   printblob(prt);
+    //   prt = prt->next;
+    // }
+    // Rprintf("Adding obs: %d = %lf\n", i, x);
+
+    //Rprintf("Adding obs %lf\n", x);
+
+    while(cur != NULL) {
+
+
+      // this observation is between blobs
+      if(cur->prev != NULL && x < cur->lower && x >= cur->prev->upper) { // do we want to check to the right here or just leave to that pointer iteration?
+        blobs[next_new_blob].blob = blobs + next_new_blob;
+        blobs[next_new_blob].num_in_blob = 1;
+        blobs[next_new_blob].lower = x - thres;
+        blobs[next_new_blob].upper = x + thres;
+        blobs[next_new_blob].next = cur;
+        blobs[next_new_blob].prev = cur->prev;
+        blobs[next_new_blob].morepop = tailpop; // a new blob goes to the end of the population list
+        blobs[next_new_blob].lesspop = NULL;
+        cur->prev->next = blobs + next_new_blob;
+        cur->prev = blobs + next_new_blob;
+        tailpop->lesspop = blobs + next_new_blob;
+        tailpop = blobs + next_new_blob;
+        x_in_blob[i] = &(blobs[next_new_blob].blob);
+        next_new_blob++;
+        a_ptr++;
+        b_ptr++;
+        break;
+      }
+
+      // this observation is between and causes blobs to merge (to the right)
+      if(cur->next != NULL && x >= cur->next->lower && x < cur->upper) {
+        cur->next->blob = cur->blob; // the absorbed blob now refers to cur's blob
+        cur->num_in_blob += cur->next->num_in_blob + 1;
+        if(tail == cur->next) {
+          tail = cur->blob;
+        } else {
+          cur->next->next->prev = cur;
+        }
+        if(cur->next == headpop) { // unlink the absorbed blob from the population list
+          headpop = cur->next->lesspop;
+        } else {
+          cur->next->morepop->lesspop = cur->next->lesspop;
+        }
+        if(cur->next == tailpop) {
+          tailpop = cur->next->morepop;
+        } else {
+          cur->next->lesspop->morepop = cur->next->morepop;
+        }
+        cur->upper = cur->next->upper;
+        cur->next = cur->next->next;
+        blobby_pop_contest(cur, &headpop, &tailpop);
+        x_in_blob[i] = &(cur->blob);
+        a_ptr++;
+        b_ptr++;
+        break;
+      }
+
+      // this observation is between and causes blobs to merge (to the left)
+      if(cur->prev != NULL && x >= cur->lower && x < cur->prev->upper) {
+        cur->prev->blob = cur->blob; // the absorbed blob now refers to cur's blob
+        cur->num_in_blob += cur->prev->num_in_blob + 1;
+        if(head == cur->prev) {
+          head = cur->blob;
+        } else {
+          cur->prev->prev->next = cur;
+        }
+        if(cur->prev == headpop) { // unlink the absorbed blob from the population list
+          headpop = cur->prev->lesspop;
+        } else {
+          cur->prev->morepop->lesspop = cur->prev->lesspop;
+        }
+        if(cur->prev == tailpop) {
+          tailpop = cur->prev->morepop;
+        } else {
+          cur->prev->lesspop->morepop = cur->prev->morepop;
+        }
+        cur->lower = cur->prev->lower;
+        cur->prev = cur->prev->prev;
+        blobby_pop_contest(cur, &headpop, &tailpop);
+        x_in_blob[i] = &(cur->blob);
+        a_ptr++;
+        b_ptr++;
+        break;
+      }
+
+      // this observation is in this blob
+      if(x >= cur->lower && x < cur->upper) {
+        (cur->num_in_blob)++;
+        if(x - thres < cur->lower) { // widen the blob so it reaches thres beyond the new observation
+          cur->lower = x - thres;
+        } else if(x + thres > cur->upper) {
+          cur->upper = x + thres;
+        }
+        blobby_pop_contest(cur, &headpop, &tailpop);
+        x_in_blob[i] = &(cur->blob);
+        a_ptr++;
+        b_ptr++;
+        break;
+      }
+
+      cur = cur->lesspop;
+    }
+    // this observation is smaller than any previously seen blob
+    if(cur == NULL && x < head->lower) {
+      blobs[next_new_blob].blob = blobs + next_new_blob;
+      blobs[next_new_blob].num_in_blob = 1;
+      blobs[next_new_blob].lower = x - thres;
+      blobs[next_new_blob].upper = x + thres;
+      blobs[next_new_blob].next = head;
+      blobs[next_new_blob].prev = NULL;
+      blobs[next_new_blob].morepop = tailpop;
+      blobs[next_new_blob].lesspop = NULL;
+      head->prev = blobs + next_new_blob;
+      head = blobs + next_new_blob;
+      tailpop->lesspop = blobs + next_new_blob;
+      tailpop = blobs + next_new_blob;
+      x_in_blob[i] = &(blobs[next_new_blob].blob);
+      next_new_blob++;
+      a_ptr++;
+      b_ptr++;
+      continue;
+    }
+    // this observation is larger than any previously seen blob
+    if(cur == NULL && x >= tail->upper) {
+      // this observation is beyond the end of all blobs
+      blobs[next_new_blob].blob = blobs + next_new_blob;
+      blobs[next_new_blob].num_in_blob = 1;
+      blobs[next_new_blob].lower = x - thres;
+      blobs[next_new_blob].upper = x + thres;
+      blobs[next_new_blob].next = NULL;
+      blobs[next_new_blob].prev = tail;
+      blobs[next_new_blob].morepop = tailpop;
+      blobs[next_new_blob].lesspop = NULL;
+      tail->next = blobs + next_new_blob;
+      tail = blobs + next_new_blob;
+      tailpop->lesspop = blobs + next_new_blob;
+      tailpop = blobs + next_new_blob;
+      x_in_blob[i] = &(blobs[next_new_blob].blob);
+      next_new_blob++;
+      a_ptr++;
+      b_ptr++;
+      continue;
+    }
+  }
+
+  // Chase down pointers
+  // DEBUG
+  // Rprintf("ALL USED BLOBS (pre-parse):\n\n");
+  // for(size_t i = 0; i<next_new_blob; i++) {
+  //   printblob(blobs+i);
+  // }
+
+  for(size_t i = 0; i<next_new_blob; i++) {
+    if(blobs[i].blob == blobs+i || (blobs[i].blob)->blob == blobs[i].blob) // already a root, or already pointing at one
+      continue;
+
+    blobs[i].blob = hunttheblob(blobs[i].blob); // shortcut the chain so .blob points straight at the root
+  }
+
+  // DEBUG
+  // Rprintf("ALL USED BLOBS:\n\n");
+  // for(size_t i = 0; i<next_new_blob; i++) {
+  //   printblob(blobs+i);
+  // }
+
+  // Col 3 calc
+  double j = n, diff = 0.0, temp_n_mut = 0.0;
+  cur = tail; // walk from the largest values down to the head, accumulating the running total in *n_clade
+  cur->c3 = 0.0;
+  int num_surv_blob = 0; // only referenced by the commented-out debug output below
+  *n_clade = 0.0;
+  while(cur->prev != NULL) {
+    num_surv_blob++;
+    j -= cur->num_in_blob; // observations left in the blobs below cur
+    diff = cur->lower - cur->prev->upper + 2*thres; // gap between the two blobs, with the thres padding on each side added back
+    temp_n_mut = diff/unitdist;
+    if(max1var){ // max1var caps each gap's contribution at one unit
+      cur->prev->c3 = *n_clade += min(temp_n_mut,1.0)/j;
+    } else {
+      cur->prev->c3 = *n_clade += temp_n_mut/j;
+    }
+    cur = cur->prev;
+  }
+  // DEBUG
+  // cur = head;
+  // while(cur != NULL) {
+  //   Rprintf("%lf\n", cur->c3);
+  //   cur = cur->next;
+  // }
+
+  //DEBUG
+  // Rprintf("\nCOMPUTED BLOBS:\n\n");
+  // cur = head;
+  // int i=0;
+  // while(cur != NULL) {
+  //   i++;
+  //   printblob(cur);
+  //   cur = cur->next;
+  // }
+  // Rprintf("%d blobs used in total, %d survive.\n", next_new_blob+1, num_surv_blob+1);
+
+  return(head);
+}
+// Cluster a single alpha/beta column with blobby_BB using stack-allocated scratch space; the results are discarded.
+void blobby_B1(double* alpha1, double* beta1, size_t recipient, size_t n, double thres, const double unitdist, const int max1var) {
+  thres *= unitdist;
+  double maxd = 744.4400719213812180897;
+  blob blobs[(int) (maxd/thres+2)];
+  blob** x_in_blob[n];
+  double n_clade = 0.0;  // blobby_BB stores its total through this pointer, so it has to refer to real storage
+  blobby_BB(alpha1, beta1, recipient, n, blobs, x_in_blob, &n_clade, thres, maxd, unitdist, max1var);
+}
+
+// .Call entry point: cluster one ALPHA/BETA column via blobby_B1 (FROMRECIPIENT is 1-based) and return NULL.
+SEXP blobbyB1(SEXP ALPHA, SEXP BETA, SEXP FROMRECIPIENT, SEXP THRES, SEXP UNITDIST, SEXP MAX1VAR) {
+  double* const fwd_col = REAL(ALPHA);
+  double* const bck_col = REAL(BETA);
+  const double* const thres_ptr = REAL(THRES);
+  const double* const unit_ptr = REAL(UNITDIST);
+  const int* const cap_ptr = INTEGER(MAX1VAR);
+  const size_t recipient0 = (size_t) *INTEGER(FROMRECIPIENT) - 1;  // shift to a 0-based index
+  const size_t n_obs = (size_t) Rf_length(ALPHA);
+
+  blobby_B1(fwd_col, bck_col, recipient0, n_obs, *thres_ptr, *unit_ptr, *cap_ptr);
+  return(R_NilValue);
+}
+
+
+
+// Summarise the head blob of one clustering: stores the neighbourhood size and three c3 values, and returns
+// 1 when the head holds a single observation, in which case the blob after it is counted as well.
+static int blobby_head_summary(const blob* head, int* n_neigh, double* similarities) {
+  const int both = !(head->num_in_blob > 1);
+  const blob* second = both ? head->next : head;  // the blob that supplies similarities[1]
+  *n_neigh = both ? 1 + second->num_in_blob : head->num_in_blob;
+  similarities[0] = head->c3;
+  similarities[1] = second->c3;
+  similarities[2] = (second->next != NULL) ? second->next->c3 : 0.0;
+  return(both);
+}
+
+// Is root the head blob or, when both is set, the blob directly after the head?
+static int blobby_in_neighbourhood(const blob* root, const blob* head, int both) {
+  return(root == head || (both && root == head->next));
+}
+
+// Cluster the two columns (alpha1, beta1) and (alpha2, beta2) with blobby_BB and collect the results.
+//   cur_left_recipient      recipient index used for the first column; the second column uses the next one
+//   n                       number of entries per column
+//   thres                   threshold; multiplied by unitdist before it is handed to blobby_BB
+//   unitdist, max1var, maxd forwarded unchanged to blobby_BB
+//   res                     res[i] (i < n/2) receives the summed c3 of entries 2i and 2i+1 under both clusterings
+//   neigh1, neigh2          receive malloc'd arrays of 1-based entry indices per neighbourhood; the caller frees them
+//   n_neigh1, n_neigh2      receive the lengths of those arrays
+//   n_clade1, n_clade2      handed to blobby_BB, which stores its total there
+//   similarities1/2         three values each, taken from the c3 of the leading blobs
+//   x_in_blob1/2, blobs1/2  caller-provided scratch space that blobby_BB fills
+// The malloc results are used without a NULL check.
+void blobby_B2(const double* alpha1, const double* beta1, const double* alpha2, const double* beta2, size_t cur_left_recipient,
+               size_t n, double thres, const double unitdist, const int max1var,
+               double* res,
+               int** neigh1, int** neigh2, int* n_neigh1, int* n_neigh2,
+               double* n_clade1, double* n_clade2,
+               double* similarities1, double* similarities2,
+               blob*** x_in_blob1, blob*** x_in_blob2,
+               const double maxd, blob* blobs1, blob* blobs2) {
+  // Both clusterings use the same scaled threshold
+  const double scaled_thres = thres * unitdist;
+  blob* head1 = blobby_BB(alpha1, beta1, cur_left_recipient, n, blobs1, x_in_blob1, n_clade1, scaled_thres, maxd, unitdist, max1var);
+  blob* head2 = blobby_BB(alpha2, beta2, cur_left_recipient + 1, n, blobs2, x_in_blob2, n_clade2, scaled_thres, maxd, unitdist, max1var);
+
+  // Neighbourhood sizes and similarity triples come from the first blob(s) of each clustering
+  const int both1 = blobby_head_summary(head1, n_neigh1, similarities1);
+  const int both2 = blobby_head_summary(head2, n_neigh2, similarities2);
+
+  // One slot per neighbourhood member
+  *neigh1 = malloc(sizeof(int)* *n_neigh1);
+  *neigh2 = malloc(sizeof(int)* *n_neigh2);
+
+  // Walk the entries two at a time, recording neighbourhood members and the pair's combined score
+  size_t fill1 = 0, fill2 = 0;
+  for(size_t pair = 0; pair < n/2; pair++) {
+    const size_t lo = 2*pair;
+    const size_t hi = lo + 1;
+
+    // Blob that each of the four (entry, clustering) combinations ended up in
+    const blob* root1_lo = (*(x_in_blob1[lo]))->blob;
+    const blob* root1_hi = (*(x_in_blob1[hi]))->blob;
+    const blob* root2_lo = (*(x_in_blob2[lo]))->blob;
+    const blob* root2_hi = (*(x_in_blob2[hi]))->blob;
+
+    if(blobby_in_neighbourhood(root1_lo, head1, both1)) {
+      (*neigh1)[fill1++] = lo+1;
+    }
+    if(blobby_in_neighbourhood(root1_hi, head1, both1)) {
+      (*neigh1)[fill1++] = hi+1;
+    }
+    if(blobby_in_neighbourhood(root2_lo, head2, both2)) {
+      (*neigh2)[fill2++] = lo+1;
+    }
+    if(blobby_in_neighbourhood(root2_hi, head2, both2)) {
+      (*neigh2)[fill2++] = hi+1;
+    }
+
+    res[pair] = root1_lo->c3 + root1_hi->c3 + root2_lo->c3 + root2_hi->c3;
+  }
+}
+// .Call entry point: run blobby_B2 on a two-column ALPHA/BETA pair, writing the per-pair scores into DEDIP; returns NULL.
+SEXP blobbyB2(SEXP ALPHA, SEXP BETA, SEXP FROMRECIPIENT, SEXP THRES, SEXP UNITDIST, SEXP MAX1VAR, SEXP DEDIP) {
+  // ALPHA and BETA must each be a R matrix with two columns
+
+  double* alpha = REAL(ALPHA);
+  double* beta = REAL(BETA);
+  size_t from_recipient = (size_t) Rf_asInteger(FROMRECIPIENT) - 1;
+  double thres = Rf_asReal(THRES);
+  double unitdist = Rf_asReal(UNITDIST);
+  int max1var = Rf_asInteger(MAX1VAR);
+  double* dedip = REAL(DEDIP);
+  size_t n = Rf_nrows(ALPHA);
+
+  if(Rf_ncols(ALPHA) != Rf_ncols(BETA)) {
+    Rf_error("All alphas/betas must have same number of columns");
+  }
+  if(Rf_nrows(ALPHA) != Rf_nrows(BETA)) {
+    Rf_error("All alphas/betas must have same number of rows");
+  }
+  if(Rf_ncols(ALPHA) != 2 || Rf_ncols(BETA) != 2) {
+    Rf_error("alpha and beta must both have two columns");
+  }
+  if(Rf_nrows(ALPHA)/2 != Rf_length(DEDIP)) {
+    Rf_error("Length of DEDIP must equal nrows(alpha)/2.");
+  }
+  // blobby_B2 clusters with threshold thres*unitdist, so that product (not thres alone) bounds the number of blobs
+  const double maxd = 744.4400719213812180897;
+  const double scaled_thres = thres * unitdist;
+  if(n < 2 || !R_FINITE(scaled_thres) || scaled_thres <= 0.0) {
+    Rf_error("alpha must have at least two rows and THRES*UNITDIST must be a positive finite number");
+  }
+  const size_t max_blobs = (size_t) (maxd/scaled_thres + 2);
+  int* neigh1 = NULL;
+  int* neigh2 = NULL;
+  int n_neigh[2];
+  double n_clade[2];  // real storage: blobby_BB stores its totals through the pointers it is given
+  double simi1[3], simi2[3];
+  blob*** x_in_blob1 = malloc(sizeof(blob**)*n);
+  blob*** x_in_blob2 = malloc(sizeof(blob**)*n);
+  blob* blobs1 = malloc(sizeof(blob)*max_blobs);
+  blob* blobs2 = malloc(sizeof(blob)*max_blobs);
+  if(x_in_blob1 == NULL || x_in_blob2 == NULL || blobs1 == NULL || blobs2 == NULL) {
+    free(x_in_blob1); free(x_in_blob2); free(blobs1); free(blobs2);  // Rf_error does not return, so release first
+    Rf_error("Failed allocating working memory for blobbyB2");
+  }
+  blobby_B2(alpha, beta, alpha+n, beta+n, from_recipient, n, thres, unitdist, max1var, dedip,
+            &neigh1, &neigh2, &n_neigh[0], &n_neigh[1], &n_clade[0], &n_clade[1],
+            simi1, simi2, x_in_blob1, x_in_blob2, maxd, blobs1, blobs2);
+
+  free(neigh1); free(neigh2);  // blobby_B2 malloc's the neighbour lists and leaves them to the caller
+  free(x_in_blob1); free(x_in_blob2);
+  free(blobs1); free(blobs2);
+  return(R_NilValue);
+}
+
+
+// Read-only bundle of the arguments of blobby_A; a single instance is shared by every blobby_B invocation.
+struct blobby_core_args {
+  const double* const restrict alpha;   // forward values; blobby_B steps through them n entries per recipient
+  const double* const restrict beta;    // backward values, laid out like alpha
+  double* const restrict dedip;         // output scores; blobby_B advances n/2 entries per pair of recipients
+  const size_t from_recipient;          // recipient index belonging to the first column of alpha/beta
+  const size_t n;                       // number of entries per column
+  const double thres;                   // threshold as supplied by the caller (blobby_B2 multiplies it by unitdist)
+  const double unitdist;                // unit distance forwarded to blobby_B2
+  const int max1var;                    // flag forwarded to blobby_B2
+  int** const neigh;                    // per-recipient neighbour arrays, malloc'd inside blobby_B2
+  int* const n_neigh;                   // per-recipient length of the matching neigh array
+  double* const n_clade;                // per-recipient total written by blobby_BB
+  double* const similarities1;          // per-recipient first similarity value
+  double* const similarities2;          // per-recipient second similarity value
+  double* const similarities3;          // per-recipient third similarity value
+};
+// Work order for one blobby_B call: the shared arguments plus the slice of recipient columns to process.
+struct blobby_args {
+  struct blobby_core_args *core_args;  // shared, read-only inputs and output arrays
+  size_t from;                         // offset of the first recipient column of this slice
+  size_t N;                            // number of recipient columns in this slice; blobby_B handles them two at a time
+};
+// Worker (also used as pthread start routine): run blobby_B2 on every pair of recipient columns in the slice described by args.
+void* blobby_B(void *args) {
+  struct blobby_args *b_args;
+  b_args = (struct blobby_args *) args;
+  const double* restrict alpha = b_args->core_args->alpha;
+  const double* restrict beta = b_args->core_args->beta;
+  double* restrict dedip = b_args->core_args->dedip;
+  size_t from_recipient = b_args->core_args->from_recipient;
+  const size_t n = b_args->core_args->n;
+  const double thres = b_args->core_args->thres;
+  const double unitdist = b_args->core_args->unitdist;
+  const int max1var = b_args->core_args->max1var;
+  int** neigh = b_args->core_args->neigh;
+  int* n_neigh = b_args->core_args->n_neigh;
+  double* n_clade = b_args->core_args->n_clade;
+  double* similarities1 = b_args->core_args->similarities1;
+  double* similarities2 = b_args->core_args->similarities2;
+  double* similarities3 = b_args->core_args->similarities3;
+  size_t from = b_args->from;
+  size_t N = b_args->N;
+
+  alpha += n*from;  // move every input/output pointer to the first column of this slice
+  beta += n*from;
+  dedip += (n/2)*(from/2);
+  from_recipient += from;
+  neigh += from;
+  n_neigh += from;
+  n_clade += from;
+  similarities1 += from;
+  similarities2 += from;
+  similarities3 += from;
+  double simi1[3], simi2[3];
+
+  blob*** x_in_blob1 = malloc(sizeof(blob**)*n);  // NOTE(review): allocations are unchecked; a worker cannot call Rf_error
+  blob*** x_in_blob2 = malloc(sizeof(blob**)*n);
+  // blobby_B2 clusters with threshold thres*unitdist, so size the blob pool from that product (as blobby_B1 does)
+  const double maxd = 744.4400719213812180897;
+  const size_t max_blobs = (size_t) (maxd/(thres*unitdist)+2);
+  blob* blobs1 = malloc(sizeof(blob)*max_blobs);
+  blob* blobs2 = malloc(sizeof(blob)*max_blobs);
+
+  for(size_t i = 0; i < N; i+=2) {
+    blobby_B2(alpha, beta, alpha+n, beta+n, from_recipient, n, thres, unitdist, max1var, dedip,
+              neigh, neigh+1, n_neigh, n_neigh+1, n_clade, n_clade+1,
+              simi1, simi2,
+              x_in_blob1, x_in_blob2,
+              maxd, blobs1, blobs2);
+
+    similarities1[i] = simi1[0];
+    similarities2[i] = simi1[1];
+    similarities3[i] = simi1[2];
+    similarities1[i+1] = simi2[0];
+    similarities2[i+1] = simi2[1];
+    similarities3[i+1] = simi2[2];
+
+    alpha += 2*n;  // advance to the next pair of columns
+    beta += 2*n;
+    dedip += n/2;
+    from_recipient += 2;
+    neigh += 2;
+    n_neigh += 2;
+    n_clade += 2;
+  }
+
+  free(x_in_blob1); free(x_in_blob2);
+  free(blobs1); free(blobs2);
+
+  return(NULL);
+}
+// Run blobby_B over p recipient columns, either directly (nthreads <= 1) or split across nthreads pthreads plus a ragged end.
+void blobby_A(const double* const restrict alpha,
+              const double* const restrict beta,
+              double* const restrict dedip,
+              size_t from_recipient,
+              size_t n,
+              size_t p,
+              double thres,
+              double unitdist,
+              int max1var,
+              int** const neigh,
+              int* const n_neigh,
+              double* const n_clade,
+              double* const similarities1,
+              double* const similarities2,
+              double* const similarities3,
+              size_t nthreads) {
+
+  // Everything the workers share; each worker additionally receives its own from/N slice
+  struct blobby_core_args core_args = {
+    .alpha = alpha,
+    .beta = beta,
+    .dedip = dedip,
+    .from_recipient = from_recipient,
+    .n = n,
+    .thres = thres,
+    .unitdist = unitdist,
+    .max1var = max1var,
+    .neigh = neigh,
+    .n_neigh = n_neigh,
+    .n_clade = n_clade,
+    .similarities1 = similarities1,
+    .similarities2 = similarities2,
+    .similarities3 = similarities3
+  };
+
+  if(nthreads > 1) {
+    pthread_t threads[nthreads];
+    int started[nthreads];   // 1 when threads[i] was really created and therefore has to be joined
+    pthread_attr_t attr;
+
+    pthread_attr_init(&attr);
+    pthread_attr_setdetachstate(&attr, PTHREAD_CREATE_JOINABLE);
+
+    size_t num_perth = (p/2)/nthreads;   // pairs of columns per thread
+    size_t rag_end   = (p/2)%nthreads;   // pairs left over after the even split
+
+    struct blobby_args args[nthreads+1]; // the extra slot describes the ragged end
+    for(size_t i=0; i<nthreads; i++) {
+      args[i].core_args = &core_args;
+      args[i].from = i*2*num_perth;
+      args[i].N = 2*num_perth;
+    }
+
+    for(size_t i=0; i<nthreads; ++i) {
+      started[i] = (pthread_create(&threads[i], &attr, blobby_B, (void*) &args[i]) == 0);
+      if(!started[i]) blobby_B((void*) &args[i]);  // could not spawn: compute this slice on the calling thread
+    }
+    Rprintf("%d threads created (rag end left over = %d)\n", (int) nthreads, (int) rag_end);  // size_t must not be passed for %d
+
+    // Tidy ragged end
+    if(rag_end != 0) {
+      args[nthreads].core_args = &core_args;
+      args[nthreads].from = 2*nthreads*num_perth;
+      args[nthreads].N = 2*rag_end;
+      blobby_B((void*) &args[nthreads]);
+    }
+
+    for(size_t i=0; i<nthreads; i++) {
+      if(started[i]) pthread_join(threads[i], NULL);
+    }
+    pthread_attr_destroy(&attr);
+  } else {
+
+    //Rprintf("\n(not using threading)\n");
+    struct blobby_args args;
+    args.core_args = &core_args;
+    args.from = 0;
+    args.N = p;
+
+    blobby_B((void*) &args);
+
+  }
+}
+
+// .Call entry point: cluster every recipient column of the forward/backward tables (blobby_A receives RM as its output
+// buffer) and return list(list(neighbour offsets, neighbour indices), list(similarities1..3), sum of n_clade).
+SEXP CladeMat(SEXP Rfwd,
+              SEXP Rbck,
+              SEXP RM,
+              SEXP Runitdist,
+              SEXP Rthresh,
+              SEXP Rmax1var,
+              SEXP Rnthreads) {
+
+  // Extract table variables
+  double *alpha, *beta;
+  int *from_rec, *to_rec;
+  KALIS_GET_TABLE(alpha, Rfwd);
+  KALIS_GET_TABLE(beta, Rbck);
+  KALIS_GET_TABLE_FROM(from_rec, Rbck);
+  KALIS_GET_TABLE_TO(to_rec, Rbck);
+
+  double unitdist = Rf_asReal(Runitdist);
+  double thres = Rf_asReal(Rthresh);
+  int max1var = Rf_asInteger(Rmax1var);
+  double* dedip = REAL(RM);
+  size_t n = num_inds; // from Cache.h
+  size_t p = *to_rec - *from_rec + 1;
+  size_t from_recipient = (size_t) *from_rec - 1;
+  size_t nthreads = (size_t) Rf_asInteger(Rnthreads);
+
+  // One similarity vector per column of the result, each with an entry per recipient
+  SEXP SIMILARITIES1 = PROTECT(Rf_allocVector(REALSXP, p));
+  double* similarities1 = REAL(SIMILARITIES1);
+  SEXP SIMILARITIES2 = PROTECT(Rf_allocVector(REALSXP, p));
+  double* similarities2 = REAL(SIMILARITIES2);
+  SEXP SIMILARITIES3 = PROTECT(Rf_allocVector(REALSXP, p));
+  double* similarities3 = REAL(SIMILARITIES3);
+  SEXP RES_SIMI = PROTECT(Rf_allocVector(VECSXP, 3));
+  SET_VECTOR_ELT(RES_SIMI, 0, SIMILARITIES1);
+  SET_VECTOR_ELT(RES_SIMI, 1, SIMILARITIES2);
+  SET_VECTOR_ELT(RES_SIMI, 2, SIMILARITIES3);
+
+  int** neigh;
+  neigh = malloc(sizeof(int*)*p);
+  if(neigh == NULL) {
+    // Report through R instead of printf()/exit(), which would terminate the whole R session
+    Rf_error("Failed allocating neigh!");
+  }
+  SEXP RES_NNEIGH = PROTECT(Rf_allocVector(INTSXP, p+1));
+  int* n_neigh = INTEGER(RES_NNEIGH);
+  *n_neigh = 1; // first 1-based offset; the counts stored behind it become cumulative offsets further down
+
+  SEXP RES_NCLADE = PROTECT(Rf_allocVector(REALSXP, p));
+  double* n_clade = REAL(RES_NCLADE);
+
+  blobby_A(alpha,
+           beta,
+           dedip,
+           from_recipient,
+           n,
+           p,
+           thres,
+           unitdist,
+           max1var,
+           neigh,
+           n_neigh+1,
+           n_clade,
+           similarities1,
+           similarities2,
+           similarities3,
+           nthreads);
+
+  int neigh_sz = 0;
+  for(size_t i=0; i<p; i++) {
+    neigh_sz += n_neigh[i+1];
+  }
+
+  double tot_clade = 0;
+  for(size_t i=0; i<p; i++) {
+    tot_clade += n_clade[i];
+  }
+
+  SEXP RES_TOT_CLADE = PROTECT(Rf_ScalarReal(tot_clade));
+
+  SEXP RES_NEIGH = PROTECT(Rf_allocVector(INTSXP, neigh_sz));
+  int* res_neigh = INTEGER(RES_NEIGH);
+  int* tmp = res_neigh;
+  for(size_t i=0; i<p; i++) {
+    for(int j=0; j<n_neigh[i+1]; j++) { // int counter: avoids comparing a size_t against the int count
+      *(tmp++) = neigh[i][j];
+    }
+    free(neigh[i]); // each list was malloc'd by blobby_B2
+  }
+  free(neigh);
+
+  for(size_t i=0; i<p; i++) {
+    n_neigh[i+1] += n_neigh[i]; // turn the counts into cumulative 1-based offsets into RES_NEIGH
+  }
+
+  SEXP RES_NE = PROTECT(Rf_allocVector(VECSXP, 2));
+  SET_VECTOR_ELT(RES_NE, 0, RES_NNEIGH);
+  SET_VECTOR_ELT(RES_NE, 1, RES_NEIGH);
+  SEXP RES = PROTECT(Rf_allocVector(VECSXP, 3));
+  SET_VECTOR_ELT(RES, 0, RES_NE);
+  SET_VECTOR_ELT(RES, 1, RES_SIMI);
+  SET_VECTOR_ELT(RES, 2, RES_TOT_CLADE);
+
+  // Ten PROTECT calls above: three similarity vectors, RES_SIMI, RES_NNEIGH, RES_NCLADE, RES_TOT_CLADE, RES_NEIGH, RES_NE, RES
+  UNPROTECT(10);
+  return(RES);
+}
+
+
+// Add Rvec[k] to RM[Ridx[k]] (1-based) for every k, in place; every index is checked before anything is written. Returns NULL.
+SEXP UpdateRealInPlace(SEXP RM,
+                       SEXP Ridx,
+                       SEXP Rvec) {
+  double* M = REAL(RM);
+  int* idx = INTEGER(Ridx);
+  double* vec = REAL(Rvec);
+  int p = Rf_length(Ridx);
+
+  if(Rf_length(Rvec) < p) Rf_error("Rvec must have at least as many elements as Ridx");
+  for(int i=0; i<p; i++){
+    if(idx[i] < 1 || idx[i] > Rf_xlength(RM)) {   // also rejects NA_integer_, which is negative
+      Rf_error("Ridx contains an index outside 1..length(RM)");
+    }
+  }
+  for(int i=0; i<p; i++){
+    M[idx[i] - 1] += vec[i];
+  }
+  return(R_NilValue);
+}
diff --git a/src/R_CladeMat.h b/src/R_CladeMat.h
new file mode 100644
index 0000000..ea89cce
--- /dev/null
+++ b/src/R_CladeMat.h
@@ -0,0 +1,20 @@
+#ifndef R_CLADEMAT_H
+#define R_CLADEMAT_H
+
+#define R_NO_REMAP
+#include <R.h>
+#include <Rinternals.h>
+// .Call entry point defined in R_CladeMat.c; parameter names match the definition
+SEXP CladeMat(SEXP Rfwd,
+              SEXP Rbck,
+              SEXP RM,
+              SEXP Runitdist,
+              SEXP Rthresh,
+              SEXP Rmax1var,
+              SEXP Rnthreads);
+// .Call entry point: adds Rvec to the elements of RM selected by the 1-based indices in Ridx, in place
+SEXP UpdateRealInPlace(SEXP RM,
+                       SEXP Ridx,
+                       SEXP Rvec);
+
+#endif

From e0df97fff10f4e424db746d871ea5bcf7add34e1 Mon Sep 17 00:00:00 2001
From: ryanchrist <ryan.christ7@gmail.com>
Date: Mon, 23 Sep 2024 12:08:40 -0500
Subject: [PATCH 03/43] Introducing R interface for Clade/Sprig calling and
 Clade Matrix (generalized eGRM) construction

---
 R/CladeMat.R         |  45 ++++
 R/Clades.R           | 627 +++++++++++++++++++++++++++++++++++++++++++
 R/GoldMasterClades.R |  58 ++++
 3 files changed, 730 insertions(+)
 create mode 100644 R/CladeMat.R
 create mode 100644 R/Clades.R
 create mode 100644 R/GoldMasterClades.R

diff --git a/R/CladeMat.R b/R/CladeMat.R
new file mode 100644
index 0000000..2e1a601
--- /dev/null
+++ b/R/CladeMat.R
@@ -0,0 +1,45 @@
+#' Fast Clade Matrix Construction
+#' @export CladeMat
+CladeMat <- function(fwd, bck, M, unit.dist, thresh = 0.2, max1var = FALSE,
+                    nthreads = min(parallel::detectCores(logical = FALSE), fwd$to_recipient-fwd$from_recipient+1)){
+
+  # input checks
+  #########################
+  input_checks_for_probs_and_dist_mat(fwd,bck)
+
+  if(nrow(fwd$alpha)%%2 !=0 || ncol(fwd$alpha)%%2 !=0 || nrow(bck$beta)%%2 !=0 || ncol(bck$beta)%%2 !=0 ){
+    stop("fwd and bck must both have an even number of recipient haplotypes and an even number of donor haplotypes")
+  }
+
+  if(!is.matrix(M) || !is.double(M) || nrow(M) != nrow(fwd$alpha)/2 || ncol(M) != ncol(fwd$alpha)/2){
+    stop("M must be a matrix of doubles with nrow(fwd$alpha)/2 rows and ncol(fwd$alpha)/2 columns")}
+
+  if(!is.atomic(unit.dist) || length(unit.dist)!=1L || !is.finite(unit.dist) || unit.dist <= 0){
+    stop("unit.dist must be a number greater than 0")}
+
+  if(is.integer(unit.dist)){
+    unit.dist <- as.double(unit.dist)
+  } else {
+    if(!is.double(unit.dist)){stop("unit.dist must be a number greater than 0")}}
+
+  # thresh must be strictly positive: the C code divides by it when sizing its working memory
+  if(!is.atomic(thresh) || length(thresh)!=1L || !is.finite(thresh) || thresh <= 0 || thresh > 1){
+    stop("thresh must be a number in (0,1]")}
+
+  if(is.integer(thresh)){
+    thresh <- as.double(thresh)
+  } else {
+    if(!is.double(thresh)){stop("thresh must be a number in (0,1]")}}
+  # exactly one non-missing logical: logical(0) and NA would both reach the C code as NA
+  if(!is.logical(max1var) || length(max1var) != 1L || is.na(max1var)){
+    stop("max1var must be TRUE or FALSE")}
+
+  nthreads <- as.integer(nthreads)
+  if(!is.integer(nthreads) || length(nthreads)!=1L || !is.finite(nthreads) || nthreads <= 0){
+    stop("nthreads must be a positive integer")}
+
+  if(nthreads > ncol(fwd$alpha)/2){
+    stop("nthreads cannot be greater than the number of recipient haplotypes divided by 2.")
+  }
+
+  invisible(.Call(CCall_CladeMat, fwd, bck, M, unit.dist, thresh, max1var, nthreads))
+}
diff --git a/R/Clades.R b/R/Clades.R
new file mode 100644
index 0000000..398c49a
--- /dev/null
+++ b/R/Clades.R
@@ -0,0 +1,627 @@
+
+
+
+get_neigh <- function(x,i){
+  idx <- x[[1]][c(i,i+1L)] # start offset of neighborhood i and of the one after it
+  x[[2]][idx[1] - 1L + seq_len(idx[2]-idx[1])] # seq_len gives an empty result for an empty neighborhood
+}
+
+get_neigh_seq <- function(x, i, return.lengths = FALSE){
+  # x[[1]] holds start offsets into x[[2]]; neighborhood k spans
+  # x[[1]][k] up to (but excluding) x[[1]][k+1]
+  starts <- x[[1]][i]
+  sizes <- x[[1]][i+1] - starts
+  # concatenated neighborhoods of every index in i, in the order given
+  members <- x[[2]][sequence(sizes,starts)]
+  if(!return.lengths){return(members)}
+  list("seq" = members, "lengths" = sizes)
+}
+
+#' Sprigs: call sprigs (mutually-neighboring groups of haplotypes) from a packed neighborhood structure
+#' @export Sprigs
+Sprigs <- function(x, old.sprigs = FALSE){
+  # x packs all neighborhoods: x[[1]] holds N+1 start offsets into x[[2]], which concatenates the neighbor indices (see get_neigh)
+  N <- length(x[[1]])-1L
+  roster <- rep(NA_integer_,N)
+  label <- 0L
+  done <- neighborhood.is.sprig.ind <- rep(FALSE,N)
+
+  if(old.sprigs){
+    # unpack every neighborhood into a plain list and defer to Sprigs_old
+    xx <- as.list(1:N)
+    for(i in 1:N){xx[[i]] <- get_neigh(x,i)}
+
+    roster <- Sprigs_old(xx, use.forking = FALSE, nthreads = 1L, add.self = FALSE)
+
+    label <- attr(roster,"n.sprigs")
+
+    attributes(roster) <- NULL
+
+    neighborhood.is.sprig.ind <- !is.na(roster)
+
+
+    # for(i in sample.int(N)){
+    #
+    #   if(done[i]){next}
+    #
+    #   C = get_neigh(x,i)
+    #   lC <- length(C)
+    #
+    #   neigh.list <- get_neigh_seq(x, C, return.lengths = TRUE)
+    #
+    #   temp.table <- table(neigh.list[[1]])
+    #   proposed.set <- as.integer(names(temp.table)[which(temp.table == lC)])
+    #
+    #   # in case the neighborhood of i overshoots into previously established cliques, it has a BIG effect in real data
+    #   proposed.set <- proposed.set[!done[proposed.set]]
+    #
+    #   if(length(proposed.set) > 1 && i %in% proposed.set){
+    #
+    #     label <- label + 1L
+    #     # this repeated intersection step has truly a small effect but
+    #     # helps guard us against the case where i might have erroneously added some candidates in its neighborhood that
+    #     # do not belong in the clade and do not include some clade members.  This steps helps us recover those clade members
+    #
+    #     neigh.list <- get_neigh_seq(x, proposed.set, return.lengths = TRUE)
+    #     temp.table <- table(neigh.list[[1]])
+    #     proposed.set <- as.integer(names(temp.table)[which(temp.table == lC)])
+    #     proposed.set <- proposed.set[!done[proposed.set]]
+    #
+    #     roster[proposed.set] <- label
+    #     done[proposed.set] <- TRUE
+    #     neighborhood.is.sprig.ind[proposed.set] <- neigh.list[[2]] == lC # indicator that a haplotype's neighborhood is exactly the proposed sprig
+    #   }
+    # }
+
+
+  } else {
+
+    # haplotypes are visited in index order; the random order (sample.int) used previously is disabled
+    for(i in seq_len(N)){ #sample.int(N)){
+
+      if(done[i]){next}
+
+      C = get_neigh(x,i) # keep simple get_neigh here because about 2x faster than get_neigh_seq when only querying one index
+      C <- C[!done[C]] # we know this will at least include i because of the if(!done[i]) check above and every neighborhood includes self
+
+      lC <- length(C)
+
+      if(lC == 1){ # C is an orphan that could never be a part of another clade because all of its neighbors are already assigned
+        done[i] <- TRUE
+        next}
+
+      neigh.list <- get_neigh_seq(x, C, return.lengths = TRUE)
+      # C is a sprig when each member of C occurs lC times in the concatenated neighborhoods of the members of C
+      if(all(tabulate(factor(neigh.list[[1]],C),nbins = lC)==lC)){
+        label <- label + 1L
+        roster[C] <- label
+        done[C] <- TRUE
+        neighborhood.is.sprig.ind[C] <- neigh.list[[2]] == lC # indicator that a haplotype's neighborhood is exactly the proposed sprig
+      }
+    }
+
+  }
+
+  list("assignments" = roster,
+       "to.prune" = neighborhood.is.sprig.ind,
+       "num.sprigs" = label)
+}
+
+
+
+UpdateMatrixInPlace <- function(M,row.idx,col.idx,x){
+  lin.idx <- as.integer(row.idx + (col.idx-1L)*nrow(M)) # column-major linear index of each (row.idx, col.idx) cell
+  invisible(.Call(getFromNamespace("CCall_UpdateRealInPlace","kalis"), M, lin.idx, x))
+}
+
+# test <- matrix(as.double(1:144),12,12)
+# UpdateMatrixInPlace(test,c(5,12,12),c(1,3,5),as.double(c(100,200,300)))
+
+#' PruneCladeMat: update a dediploided clade matrix in place
+#' @export PruneCladeMat
+PruneCladeMat <- function(M, neigh, sprigs, prune = "singleton.info", from.recipient = 1L){
+  # M is only touched through UpdateMatrixInPlace; the function itself returns invisible(NULL)
+  if(!from.recipient%%2){stop("from.recipient must be odd and encode the index of the first recipient haplotype")}
+
+  N.recipients <- 2 * ncol(M) # two haplotypes per column of M
+
+  if(prune=="singleton.info"){
+    # one value per haplotype, then summed over each (odd, even) haplotype pair
+    v <- neigh[[2]][[2]] - neigh[[2]][[1]]
+    v <- v[seq.int(1,N.recipients,2)] + v[seq.int(2,N.recipients,2)]
+    UpdateMatrixInPlace(M,
+                        seq.int(from = (from.recipient+1L)/2L,length.out = ncol(M)),
+                        seq.int(from = 1, to = ncol(M)),
+                        v)
+
+  } else if(prune=="sprigs"){
+    # neighborhoods of every haplotype flagged in sprigs$to.prune
+    neigh.list <- get_neigh_seq(neigh[[1]], which(sprigs$to.prune), return.lengths = TRUE)
+    # column 1: a neighbor; column 2: the flagged haplotype whose neighborhood it belongs to
+    hap.idx <- cbind(neigh.list[[1]], rep(which(sprigs$to.prune), times = neigh.list[[2]]))
+
+    key <- rep(0L,nrow(hap.idx))
+    # key encodes the parity of the two haplotype indices in each row of hap.idx
+    hap.idx.odd <- hap.idx%%2
+    temp.hap.idx.odd <- hap.idx.odd[,1] + hap.idx.odd[,2]
+    key[temp.hap.idx.odd==2] <- 1L # both indices odd
+    key[temp.hap.idx.odd==0] <- 4L # both indices even
+    temp.hap.idx.odd <- hap.idx.odd[,1] - hap.idx.odd[,2]
+    key[temp.hap.idx.odd==1] <- 3L # column 1 odd, column 2 even
+    key[temp.hap.idx.odd==-1] <- 2L # column 1 even, column 2 odd
+    # one update value per flagged haplotype, repeated for each of its neighbors
+    sim.updates <- rep((neigh[[2]][[3]]-neigh[[2]][[2]])[sprigs$to.prune], times = neigh.list[[2]])
+
+    # if M was not already dediploided:
+    # M[hap.idx] <- M[hap.idx] - sim.updates
+
+    # since M is dediploided, we run
+    # one update per parity class, mapping haplotype index h to pair index (h+1)/2 when h is odd and h/2 when h is even
+    if(!is.na(match(1L,key))){
+      to.fetch <- key==1L
+      UpdateMatrixInPlace(M,
+                          (hap.idx[to.fetch,1L]+1L)/2L,
+                          (hap.idx[to.fetch,2L]+1L)/2L,
+                          sim.updates[to.fetch])}
+
+    if(!is.na(match(2L,key))){
+      to.fetch <- key==2L
+      UpdateMatrixInPlace(M,
+                          hap.idx[to.fetch,1L]/2L,
+                          (hap.idx[to.fetch,2L]+1L)/2L,
+                          sim.updates[to.fetch])}
+
+    if(!is.na(match(3L,key))){
+      to.fetch <- key==3L
+      UpdateMatrixInPlace(M,
+                          (hap.idx[to.fetch,1L]+1L)/2L,
+                          (hap.idx[to.fetch,2L])/2L,
+                          sim.updates[to.fetch])}
+
+    if(!is.na(match(4L,key))){
+      to.fetch <- key==4L
+      UpdateMatrixInPlace(M,
+                          hap.idx[to.fetch,1L]/2L,
+                          hap.idx[to.fetch,2L]/2L,
+                          sim.updates[to.fetch])}
+
+  } else {
+    stop("unrecognized option for prune")
+  }
+  invisible(NULL)
+}
+
+
+
+
+
+
+#' Probabilistic Clades
+#'
+#' Utility for calling probabilistic clades at, in between, or excluding variants.
+#' @param fwd a forward table as returned by \code{\link{MakeForwardTable}}
+#' @param bck a backward table as returned by \code{\link{MakeBackwardTable}}
+#' @param pars a \code{kalisParameters} object, as returned by
+#'   \code{\link{Parameters}}.
+#' @param beta.theta.opts a list; see Details for \code{\link{DistMat}}.
+#' @param safety.checks a logical; if \code{TRUE}, non-finite distances are set to 0 and the diagonal of the distance matrix to \code{NA}.  See \code{\link{DistMat}}.
+#' @param neighbors a logical, should nearest neighbors be pre-calculated?  See \code{\link{Neighbors}}.
+#' @param use.forking a logical, should forked processes be used?
+#' @param forking.chunk.size the maximum number of distance matrix columns processed per chunk (passed to \code{chunk_int})
+#' @param mc.preschedule passed to \code{parallel::mclapply} when \code{use.forking = TRUE}
+#' @param nthreads the number of CPU cores to use; passed to \code{\link{DistMat}} and, when \code{use.forking = TRUE}, to \code{parallel::mclapply} as \code{mc.cores}
+#' @return a \code{kalisClades} object encoding probabilistic clade calls
+#' @export Clades
+Clades <- function(fwd, bck, pars, beta.theta.opts = NULL,
+                   safety.checks = FALSE, neighbors = FALSE,
+                   #use.bettermc = FALSE,
+                   use.forking = FALSE,
+                   forking.chunk.size = 100L,
+                   mc.preschedule = FALSE, # FALSE is more conservative of memory but means many new forked processes need to be launched so it's slower than TRUE
+                   nthreads = 1L){
+  # currently only outputs a list but should eventually also output a matrix of integers and an attribute list of clades
+
+  unit.mut.dist <- -log(pars$pars$mu) # the gaps between sorted distances are divided by this below
+
+  M <- DistMat(fwd, bck, beta.theta.opts = beta.theta.opts, nthreads = nthreads)
+
+  if(safety.checks){
+    M[!is.finite(M)] <- 0
+    diag(M) <- NA_real_
+  }
+  # for each column index in x: rank that column of M and attach the called clades (and optionally neighbors) as attributes
+  rank_donors_func <- function(x, type="linear_20", neighbors = FALSE, mac.range = c(NA,NA)){
+    rank_donors_func_res <- as.list(1:length(x))
+    for(j in 1:length(x)){
+      d.ranks <- data.table::frank(M[,x[j]], na.last = FALSE, ties.method = "first")
+      phi <- c(diff(M[order(d.ranks),x[j]]),0) # gaps between consecutive sorted distances, padded with a trailing 0
+      phi[1] <- 0
+      phi <- phi / unit.mut.dist # an N-long vector
+      if(type == "linear_20"){
+        phi[phi > 1] <- 1 # cap at 1
+        phi[phi < 0.2] <- 0 # drop gaps below 0.2
+      } else if(type == "step_80"){
+        phi[phi < 0.8] <- 0 # gaps below 0.8 become 0 ...
+        phi[phi > 0] <- 1 # ... and every remaining gap becomes 1
+      }
+
+      if(!is.na(mac.range[1])){phi[1:mac.range[1]] <- 0}
+      if(!is.na(mac.range[2])){phi[mac.range[2]:nrow(fwd$alpha)] <- 0}
+
+      i <- which(phi!=0)
+
+      # compress phi
+      clades <- cbind(i,phi[i]) # if i = integer(0) (no clades called), clades will be a 0 x 2 matrix.
+      attr(d.ranks,"clades") <- clades
+
+      if(neighbors){
+        attr(d.ranks,"neighbors") <- if(nrow(clades)){
+          match(2:clades[1,1],d.ranks) # positions holding ranks 2 .. clades[1,1] (the first called clade)
+        } else {
+          NA_integer_
+        }
+      }
+
+      rank_donors_func_res[[j]] <- d.ranks
+    }
+    rank_donors_func_res
+  }
+
+
+  chunks <- chunk_int(ncol(M), chunk.size = forking.chunk.size)
+
+  if(use.forking){
+    # if(use.bettermc){
+    #   rank.list <- bettermc::mclapply(chunks, rank_donors_func, neighbors = neighbors, mc.preschedule = mc.preschedule, mc.cores=nthreads, mc.share.copy = FALSE)
+    # } else {
+      rank.list <- parallel::mclapply(chunks, rank_donors_func, neighbors = neighbors, mc.preschedule = mc.preschedule, mc.cores=nthreads)
+    #}
+  } else {
+    rank.list <- lapply(chunks, rank_donors_func, neighbors = neighbors) # this matrix is ranked in each column, not scaled by Ne or Mu
+  }
+
+  rank.list <- unlist(rank.list,recursive = FALSE) # flatten the per-chunk lists into one list with an element per column of M
+
+  attr(rank.list,"from_recipient") <- fwd$from_recipient
+  attr(rank.list,"to_recipient")   <- fwd$to_recipient
+
+  class(rank.list) <- c("kalisClades","list") # rank.list is a list where each element is a vector of ranks with attributes clades
+
+  rank.list
+}
+
+
+#' Neighbors
+#'
+#' Utility for calling tied nearest neighbors for each recipient haplotype
+#' @param x a \code{kalisClades} object returned by \code{\link{Clades}}
+#' @param use.forking a logical, should forked processes be used? Ignored when \code{x} already carries pre-calculated neighbors.
+#' @param nthreads the number of CPU cores to use; only used when \code{use.forking = TRUE}, as \code{mc.cores} of \code{parallel::mclapply}
+#' @return
+#'   a \code{kalisNeighbors} encoding the nearest neighbors for each recipient haplotype
+#'
+#' @export Neighbors
+Neighbors <- function(x,
+                      #use.bettermc = FALSE,
+                      use.forking = FALSE, nthreads = 1L){
+  # currently only supports list x but should support matrix x as well
+
+  if(!is.null(attr(x[[1]],"neighbors"))){
+    # neighbors were pre-calculated (only the first element is inspected): just extract them
+    neighbors <- lapply(x,function(z){attr(z,"neighbors")})
+
+  } else {
+
+
+    call_neighbors <- function(z){
+      # z should be a vector of ranks with attribute "clades"
+      clades <- attr(z,"clades")
+      if(nrow(clades)){
+        match(2:clades[1,1],z) # positions holding ranks 2 .. clades[1,1] (the first called clade)
+      } else {
+        NA_integer_
+      }
+    }
+
+    if(use.forking){
+      # if(use.bettermc){
+      #   neighbors <- bettermc::mclapply(x, call_neighbors, mc.cores = nthreads, mc.share.copy = FALSE)
+      # } else {
+        neighbors <- parallel::mclapply(x, call_neighbors, mc.cores = nthreads)
+      #}
+    } else {
+      neighbors <- lapply(x,call_neighbors)
+    }
+  }
+
+  attr(neighbors,"from_recipient") <- attr(x,"from_recipient")
+  attr(neighbors,"to_recipient")   <- attr(x,"to_recipient")
+  class(neighbors) <- c("kalisNeighbors","list")
+
+  neighbors
+}
+
+
+#' Sprigs (legacy implementation)
+#'
+#' Utility for calling sprigs from probabilistic clades. Haplotypes are visited in random order,
+#' so repeated runs on the same input can differ slightly.
+#' @param x a \code{kalisNeighbors} object returned by \code{\link{Neighbors}}, a \code{kalisClades} object returned by \code{\link{Clades}} with \code{neighbors = TRUE}, or a list
+#' @param use.forking a logical, should forked processes be used? Currently ignored.
+#' @param nthreads the number of CPU cores to use. Currently, no parallelism is used.
+#' @param add.self a logical, should each haplotype be appended to its own neighborhood before sprigs are called?
+#' @return a \code{kalisSprigs} object assigning each haplotype to a sprig
+#'
+#' @export Sprigs_old
+Sprigs_old <- function(x, use.forking = FALSE, nthreads = 1L, add.self = TRUE){
+
+  # this version of Sprigs still has a bit of randomness in its sprig building between runs on the same input
+  # which can be seen by running table(is.na(s),is.na(s1)) where s and s1 are the output of Sprigs
+  # for the same data run twice. it's relatively minor
+
+  # remember the recipient range now: the lapply/mapply calls below return plain lists
+  # that no longer carry the attributes of the object that was passed in
+  from_recipient <- attr(x,"from_recipient")
+  to_recipient   <- attr(x,"to_recipient")
+
+  if(inherits(x,"kalisClades")){
+    if(!is.null(attr(x[[1]],"neighbors"))){
+      x <- lapply(x,function(z){attr(z,"neighbors")})
+    } else {
+      stop("The kalisClades provided do not have the Neighbors pre-calculated, use kalis::Neighbors to obtain them and then pass them to Sprigs")
+    }
+  }
+
+  # x here is a list that's N long st x[[i]] gives the indices of the (tied) nearest neighbors of i
+  roster <- rep(NA_integer_,length(x))
+
+  label <- 0L
+  # add self to own neighborhood; SIMPLIFY = FALSE keeps x a list even when every neighborhood
+  # has the same length (mapply would otherwise collapse the result into a matrix)
+  if(add.self){x <- mapply(c,x,seq_along(x),SIMPLIFY = FALSE)}
+
+  done <- rep(FALSE,length(x))
+
+  # haplotypes are visited in random order; the randomness is not essential to the algorithm
+  for(i in sample.int(length(x))){
+    if(!done[i]){
+
+      # pulling out cliques in the graph that are fully connected bi-directionally:
+      # if i is in a clique, rather trivially, this will return the full clique
+      # Note, we require i %in% proposed.set to prevent called cliques from being broken up later in the for loop:
+      # if i is not in a clique, then it's still possible for a partial clique to be returned that doesn't include i if i projects onto
+      # a superset or subset of a clique.  If i supersedes a clique member and projects
+      # onto a subset, this clique subset will be overwritten later by the larger clique.  However, it would still be possible for a i that comes
+      # after all of the clade members in our for loop to break up the clique by projecting onto a subset of them.
+      # Enforcing i %in% proposed.set avoids that possibility.
+
+      # we also require that length(proposed.set) > 1 so that we don't end up with solo cliques being called that are just i by itself.
+
+      proposed.set <- Reduce(intersect,x[x[[i]]])
+      # we can really speed up this Reduce by using table and looking for entries that are present in all groups
+
+      # in case the neighborhood of i overshoots into previously established cliques, it has a BIG effect in real data
+      proposed.set <- proposed.set[!done[proposed.set]]
+
+      if(length(proposed.set) > 1 && i %in% proposed.set){
+
+        label <- label + 1L
+        # this repeated intersection step has truly a small effect but
+        # helps guard us against the case where i might have erroneously added some candidates in its neighborhood that
+        # do not belong in the clade and do not include some clade members.  This steps helps us recover those clade members
+        proposed.set <- Reduce(intersect,x[proposed.set])
+        proposed.set <- proposed.set[!done[proposed.set]]
+
+        roster[proposed.set] <- label
+        done[proposed.set] <- TRUE
+      }
+    }
+
+    # individuals that are not part of a fully connected clique are left with NA_integer_ on the roster
+  }
+
+  # Size frequency spectrum: table(table(roster))
+
+  # attach bookkeeping attributes (assigning NULL leaves the attribute unset)
+  attr(roster,"n.sprigs") <- label
+  attr(roster,"from_recipient") <- from_recipient
+  attr(roster,"to_recipient")   <- to_recipient
+  class(roster) <- c("kalisSprigs","integer")
+
+  roster
+}
+
+#Testing Sprigs
+# kalis::Sprigs(list(
+#   1:2,
+#   1:2,
+#   3:7,
+#   1:10,
+#   1:10,
+#   1:10,
+#   5:11
+# ))
+
+#' CladeMat OLD
+#'
+#' Utility for constructing a probabilistic clade matrix
+#' @param x a \code{kalisClades} object returned by \code{\link{Clades}}
+#' @param ploidy an integer, the ploidy of the organism (1 or 2)
+#' @param sprigs.to.prune a \code{kalisSprigs} object returned by \code{\link{Sprigs_old}} encoding sprigs that should be excluded from the matrix returned
+#' @param assemble a logical, if FALSE return the clade matrix as a list of columns rather than as a symmetrized matrix
+#' @param use.forking a logical, should forked processes be used?
+#' @param forking.chunk.size the maximum number of recipient samples processed per chunk (passed to \code{chunk_int})
+#' @param mc.preschedule passed to \code{parallel::mclapply} when \code{use.forking = TRUE}
+#' @param nthreads the number of CPU cores to use; only used when \code{use.forking = TRUE}, as \code{mc.cores} of \code{parallel::mclapply}
+#' @return a matrix representation of the probabilistic clades provided, or a list of its columns when \code{assemble = FALSE}
+#' @export CladeMat_old
+CladeMat_old <- function(x, ploidy = 2L, sprigs.to.prune = NULL, assemble = TRUE,
+                         #use.bettermc = FALSE,
+                         use.forking = FALSE, forking.chunk.size = 100L, mc.preschedule = FALSE, nthreads = 1L){
+
+  # prepare sprigs
+  if(is.null(sprigs.to.prune)){sprigs.to.prune <- integer()}
+  sl <- length(sprigs.to.prune)
+  if(sl){sprig.sizes <- tabulate(sprigs.to.prune)} # number of haplotypes assigned to each sprig label
+
+  n.recipient.samples <- as.integer(length(x)/ploidy)
+
+  chunks <- chunk_int(n.recipient.samples, chunk.size = forking.chunk.size)
+
+  if(ploidy == 1){
+    omega_func <- function(s){
+      omega_func_res <- as.list(1:length(s))
+      for(j in 1:length(s)){
+
+        N <- length(x[[s[j]]])
+
+        idx <- attr(x[[s[j]]],"clades")[,1]
+        phi <- attr(x[[s[j]]],"clades")[,2]
+
+        # prune sprig
+        if(sl && !is.na(sprigs.to.prune[s[j]]) && length(idx) && sprig.sizes[sprigs.to.prune[s[j]]] == idx[1]){
+          idx <- idx[-1]
+          phi <- phi[-1]
+        }
+
+        # we know that phi[N] = 0, so there must always be a 0 appended
+        omega_func_res[[j]] <-  inverse.rle(list("values" =  c(rev(cumsum(rev(phi/idx))),0),
+                                                 "lengths" = diff(c(0,idx,N))))[x[[s[j]]]]
+
+      }
+      omega_func_res
+    }
+
+  } else if(ploidy == 2){
+    # sample s[j] owns haplotypes 2*s[j]-1 and 2*s[j]
+    omega_func <- function(s){
+      omega_func_res <- as.list(1:length(s))
+      for(j in 1:length(s)){
+        N <- length(x[[s[j]]])
+
+        idx <- attr(x[[s[j]*2-1]],"clades")[,1]
+        phi <- attr(x[[s[j]*2-1]],"clades")[,2]
+
+        idx2 <- attr(x[[s[j]*2]],"clades")[,1]
+        phi2 <- attr(x[[s[j]*2]],"clades")[,2]
+
+        # prune sprig, separately for each of the two haplotypes
+        if(sl && !is.na(sprigs.to.prune[s[j]*2-1]) && length(idx) && sprig.sizes[sprigs.to.prune[s[j]*2-1]] == idx[1]){
+          idx <- idx[-1]
+          phi <- phi[-1]
+        }
+
+        if(sl && !is.na(sprigs.to.prune[s[j]*2]) && length(idx2) && sprig.sizes[sprigs.to.prune[s[j]*2]] == idx2[1]){
+          idx2 <- idx2[-1]
+          phi2 <- phi2[-1]
+        }
+
+        # we know that phi[N] = 0, so there must always be a 0 appended
+        w <- inverse.rle(list("values" =  c(rev(cumsum(rev(phi/idx))),0),
+                              "lengths" = diff(c(0,idx,N))))[x[[s[j]*2-1]]] +
+          inverse.rle(list("values" =  c(rev(cumsum(rev(phi2/idx2))),0),
+                           "lengths" = diff(c(0,idx2,N))))[x[[s[j]*2]]]
+
+        omega_func_res[[j]] <- w[seq(1,N,by=2)] + w[seq(2,N,by=2)] # add up each (odd, even) pair of entries of w
+      }
+      omega_func_res
+    }
+
+  } else {
+    stop("Relatedness currently only supports ploidy  = 1 or 2")
+  }
+
+  # we don't simplify this list to a matrix at this stage to help preserve memory.
+  if(use.forking){
+    # if(use.bettermc){
+    #   res <- bettermc::mclapply(chunks, omega_func, mc.preschedule = mc.preschedule, mc.cores=nthreads, mc.share.copy = FALSE)
+    # } else {
+      res <- parallel::mclapply(chunks, omega_func, mc.preschedule = mc.preschedule, mc.cores=nthreads)
+    #}
+  } else {
+    res <- lapply(chunks, omega_func)
+  }
+
+  res <- unlist(res, recursive = FALSE) # flatten the per-chunk lists into one list with an element per recipient sample
+
+  if(assemble){
+    res <- do.call(cbind,res)
+    res <- 0.5 * (res + t(res)) # symmetrize
+  }
+
+  res
+}
+
+chunk_int <- function(n, chunk.size = 100){
+  # Split 1:n into consecutive integer runs, each holding at most chunk.size values;
+  # the runs are returned as a list (the last one may be shorter).
+  if(n < 1){stop("n must be an integer >= 1")}
+  lo <- seq(1,n,by=chunk.size)
+  hi <- c(lo[-1]-1,n)
+  lapply(seq_along(lo), function(k){
+    seq.int(lo[k],hi[k])
+  })
+}
+#
+# use.forking <- FALSE
+# use.forking <- TRUE
+# nthreads <- 8L
+#
+# require(kalis)
+# haps.file <-"~/Dropbox/Benchmarking_StatGen/kalis_benchmarking_tests/benchmark_on_msprime_simulations/msprime_sim_N_100000_L_10000.hdf5"
+# CacheHaplotypes(haps = haps.file,loci.idx = 1:1000,hap.idx = 1:24000)#SmallHaps)
+# #CacheHaplotypes(SmallHaps)
+# pars <- Parameters(rep(1e-2, L() - 1))
+# fwd <- MakeForwardTable(pars)
+# bck <- MakeBackwardTable(pars)
+# Forward(fwd,pars,floor(L()/2),1)
+# Backward(bck,pars,floor(L()/2),1)
+# #
+# start <- proc.time()
+# rl2 <- Clades(fwd, bck, pars, neighbors = TRUE, safety.checks = FALSE, use.forking = use.forking, nthreads = nthreads)
+# finish <- proc.time() - start
+# print(finish)
+# #
+# sprigs <- Sprigs(rl2)
+# start <- proc.time()
+# M <- CladeMat(rl2, sprigs.to.prune = sprigs, use.forking = use.forking, nthreads=nthreads)
+# finish <- proc.time() - start
+# print(finish)
+#
+
+# rl<- readRDS("~/Downloads/clades_test.rds")
+# all.equal(rl,rl2)
+
+# sprigs <- CallSprigs(rl, use.forking = use.forking, nthreads = nthreads)
+#
+# #hist(sapply(rl,function(x){nrow(attr(x,"clades"))}),breaks=20)
+# #mean(unlist(lapply(rl,function(x){attr(x,"clades")[,2]}))>0.5)
+#
+# rl <- CladeMat(rl, ploidy = 2L, sprigs.to.prune = sprigs, assemble = FALSE, use.forking = use.forking, nthreads = nthreads)
+# rl <- do.call(cbind,rl)
+# rl <- 0.5 * (rl + t(rl))
+#
+# r2 <- -r2
+# class(r2) <- c("kalisDistanceMatrix","matrix")
+# plot(r2)
+#
+# M <- DistMat(fwd,bck)
+# M <- M + t(M)
+#
+# perm <- fastcluster::hclust(stats::as.dist(M),method="average")$order
+#
+# layout(matrix(1:3,1))
+# print(lattice::levelplot(M[perm,][,rev(perm)],
+#                          useRaster = TRUE,
+#                          col.regions = grDevices::colorRampPalette(RColorBrewer::brewer.pal(9,name = "BuPu"))(100),
+#                          yaxt = "n", xaxt = "n", xlab = "", ylab = "", xaxt = "n"))
+# print(lattice::levelplot(r1[perm,][,rev(perm)],
+#                          useRaster = TRUE,
+#                          col.regions = grDevices::colorRampPalette(RColorBrewer::brewer.pal(9,name = "BuPu"))(100),
+#                          yaxt = "n", xaxt = "n", xlab = "", ylab = "", xaxt = "n"))
+# print(lattice::levelplot(r2[perm,][,rev(perm)],
+#                          useRaster = TRUE,
+#                          col.regions = grDevices::colorRampPalette(RColorBrewer::brewer.pal(9,name = "BuPu"))(100),
+#                          yaxt = "n", xaxt = "n", xlab = "", ylab = "", xaxt = "n"))
+#
+
diff --git a/R/GoldMasterClades.R b/R/GoldMasterClades.R
new file mode 100644
index 0000000..96e6e09
--- /dev/null
+++ b/R/GoldMasterClades.R
@@ -0,0 +1,58 @@
+##### Gold Master #####
+
+goldmaster.blobby <- function(alpha,beta,recipient_hap, unit.dist = 1, thresh = 0.2){
+  nlp <- -log((alpha * beta)/sum(alpha * beta)) # negative log of the normalized alpha*beta products
+  nlp[recipient_hap] <- 0
+  nlp[!is.finite(nlp)] <- 744.4400719213812180897
+  ord <- order(nlp)
+  gaps <- c(diff(nlp[ord])/unit.dist,0) # scaled gap to the next sorted distance; the last gap is 0
+  gaps <- ifelse(gaps<thresh,0,pmin(gaps,1)) # gaps below thresh become 0, the rest are capped at 1
+  psi <- gaps/seq_len(length(alpha))
+  psi[ord] <- rev(cumsum(rev(psi))) # suffix sums, written back in the original (unsorted) order
+  psi
+}
+
+
+goldmaster.blobby.dedip <- function(alpha,beta,left_recipient_hap, unit.dist = 1, thresh = 0.2){
+  # Gold-master values for one diploid recipient: the goldmaster.blobby vectors of its two haplotypes
+  # (columns 1 and 2 of alpha/beta) are added and then summed over consecutive (odd, even) row pairs.
+  if(ncol(alpha) != 2){stop("alpha must be a matrix with 2 columns")}
+  if(ncol(beta) != 2){stop("beta must be a matrix with 2 columns")}
+  if(left_recipient_hap <= 0 || left_recipient_hap > nrow(alpha)-1 || as.integer(left_recipient_hap)!=left_recipient_hap){
+    stop("left_recipient_hap must be an integer in [1,nrow(alpha)-1]")
+  }
+  if(thresh < 0 || thresh > 1){stop("thresh must be in [0,1]")} # validate thresh itself, not the base function c
+  v <- goldmaster.blobby(alpha[,1],beta[,1],recipient_hap=left_recipient_hap,unit.dist,thresh)
+  v <- v + goldmaster.blobby(alpha[,2],beta[,2],recipient_hap=left_recipient_hap+1L,unit.dist,thresh)
+  v[seq.int(1,length(v),2)] + v[seq.int(2,length(v),2)]
+}
+
+goldmaster.blobby.full <- function(alpha,beta,left_recipient_hap, unit.dist, thresh){
+  # Gold-master clade matrix: column k is built from haplotype columns 2k-1 and 2k of alpha/beta;
+  # their two goldmaster.blobby vectors are added and then summed over consecutive (odd, even) row pairs.
+  if(ncol(alpha) != ncol(beta)){stop("alpha and beta must have the same number of columns")}
+  if(nrow(alpha) != nrow(beta)){stop("alpha and beta must have the same number of rows")}
+  if( nrow(alpha)%%2 || ncol(alpha)%%2 ){stop("alpha must be a matrix with an even number of rows and columns")}
+  if(left_recipient_hap <= 0 || left_recipient_hap > nrow(alpha)-1 || as.integer(left_recipient_hap)!=left_recipient_hap){
+    stop("left_recipient_hap must be an integer in [1,nrow(alpha)-1]")
+  }
+  if(thresh < 0 || thresh > 1){stop("thresh must be in [0,1]")}
+
+  n.pairs <- ncol(alpha)/2
+  out <- matrix(0,n.pairs,n.pairs)
+  for(k in 1:n.pairs){
+    odd.col <- 2*k-1
+    even.col <- 2*k
+    w1 <- goldmaster.blobby(alpha[,odd.col],beta[,odd.col],recipient_hap=left_recipient_hap+2*k-2L,unit.dist,thresh)
+    w2 <- goldmaster.blobby(alpha[,even.col],beta[,even.col],recipient_hap=left_recipient_hap+2*k-1L,unit.dist,thresh)
+    w <- w1 + w2
+    out[,k] <- w[seq.int(1,length(w),2)] + w[seq.int(2,length(w),2)]
+  }
+  out
+}
+
+
+CladeMat.GM <- function(fwd,bck,unit.dist,thresh = 0.2){
+  # thin wrapper: evaluates goldmaster.blobby.full on fwd$alpha and bck$beta, starting at bck$from_recipient
+  goldmaster.blobby.full(fwd$alpha, bck$beta, left_recipient_hap = bck$from_recipient, unit.dist = unit.dist, thresh = thresh)
+}
\ No newline at end of file

From 2805f3110909b8484e23722fec700dda36a610c7 Mon Sep 17 00:00:00 2001
From: ryanchrist <ryan.christ7@gmail.com>
Date: Mon, 23 Sep 2024 12:11:06 -0500
Subject: [PATCH 04/43] Introducing optimal checkpointing routines and iterator
 interface for using checkpointing to have kalis sequentially visit (infer
 ancestries at) consecutive target variants

---
 R/Iterator.R    | 694 ++++++++++++++++++++++++++++++++++++++++++++++++
 R/TableCache.R  | 427 +++++++++++++++++++++++++++++
 src/R_OptCkpt.c |  58 ++++
 src/R_OptCkpt.h |  10 +
 4 files changed, 1189 insertions(+)
 create mode 100644 R/Iterator.R
 create mode 100644 R/TableCache.R
 create mode 100644 src/R_OptCkpt.c
 create mode 100644 src/R_OptCkpt.h

diff --git a/R/Iterator.R b/R/Iterator.R
new file mode 100644
index 0000000..e28a095
--- /dev/null
+++ b/R/Iterator.R
@@ -0,0 +1,694 @@
+#' Build an efficient iterator over loci
+#'
+#' Create a \code{kalisForwardIterator} for propagating a forward table iteratively over target loci using a table cache and optimal checkpointing.
+#'
+#' See example.
+#'
+#'
+#' @param ram.ckpts an integer specifying the number of checkpoints to store in RAM
+#' @param targets a vector of loci to iterate over (starting with the most downstream target)
+#' @param base.fwd.table a \code{kalisForwardTable} either at the most upstream target, or if the targets are evenly spaced, one interval upstream of the most upstream target.
+#' NULL (the default) is interpreted as the prior \code{Pi}, see \code{\link{Parameters}}
+#' @param disk.ckpts an integer specifying the number of checkpoints to store on disk
+#' @param disk.dir a path to a directory where a temporary folder may be made to store checkpoints on disk
+#' @param force.unif a logical, if TRUE iterate over targets as if they were uniformly spaced. WARNING: DO NOT use this in conjunction with the targets method, still experimental. With force.unif = TRUE, the resulting iterator appears to be targeting the first length(targets) variants with all methods, but in fact will be silently iterating over the original targets.
+#' @seealso \code{\link{MakeForwardTable}} to create a \code{kalisForwardTable}.
+#'
+#' @examples
+#' \dontrun{
+#' data("SmallHaps")
+#' CacheHaplotypes(SmallHaps)
+#' pars <- Parameters()
+#' fwd <- MakeForwardTable(pars)
+#' bck <- MakeBackwardTable(pars)
+#' Iter <- ForwardIterator(2)
+#' for(t in targets(Iter)){
+#'   Iter(fwd,pars,t)
+#'   Backward(bck,pars,t)
+#'   print(paste("Mean Distance at locus",t,"is",mean(DistMat(fwd,bck))))
+#' }
+#' }
+#'
+#' @export
+ForwardIterator <- function(pars,
+                            ram.ckpts = 1L,
+                            targets = 1:kalis:::pkgVars$L,
+                            base.fwd.table = NULL,
+                            disk.ckpts = 0,
+                            disk.dir = NULL,
+                            from_recipient = 1,
+                            to_recipient = Inf,
+                            lookup.tables = NULL,
+                            cache = NULL,
+                            save.cache = FALSE,
+                            exact = TRUE,
+                            force.unif = FALSE){
+
+  force(force.unif)
+
+  # Sanity checks
+  ####################
+  ram.ckpts <- as.integer(ram.ckpts)
+  if(ram.ckpts <= 0){stop("ram.ckpts must be a positive integer")}
+
+
+  # Check to ensure that the cache provided can actually be recycled for this problem
+
+  if(!is.null(cache)){
+    for(i in 1:length(cache)){
+      if(cache[[i]]$from_recipient!=from_recipient){stop("The provided cache must have the same from_recipient as currently requested.")}
+      if(cache[[i]]$to_recipient!=min(to_recipient,kalis:::pkgVars$N)){stop("The provided cache must have the same to_recipient as currently requested.")}
+    }
+  }
+
+
+
+  # Only RAM checkpoints for now
+  ##################
+  # for now we ignore disk checkpoints:
+  num.available.ckpts <- ram.ckpts
+
+  if(disk.ckpts != 0 | !is.null(disk.dir)){
+    warning("disk checkpoints not yet implemnted, proceeding ignoring disk.ckpts and disk.dir")
+  }
+
+
+  # Cover case when base.fwd.table provided
+  ##################
+
+  if(is.null(base.fwd.table)){
+    use.pi <- TRUE
+  }else{
+    if( !("kalisForwardTable" %in% class(base.fwd.table)) ){stop("base.fwd.table is not a kalisForwardTable")}
+    if(any(targets < base.fwd.table$l)){stop("no targets may be less than base.fwd.table$l")}
+    use.pi <- FALSE
+  }
+
+
+  if(force.unif){
+
+    if(!use.pi){
+      if(targets[1] != base.fwd.table$l){stop("When using force.unif, for now, base.fwd.table$l must be AT the first target")}
+    }
+
+    targets.idx <- targets
+    targets <- 1:length(targets)
+    base.fwd.table.l <- 1
+
+  } else {
+    targets.idx <- NULL
+    base.fwd.table.l <- base.fwd.table$l
+  }
+
+
+  # Figure out whether using uniform or general checkpointing
+  ####################
+  # by default
+  uniform.ckpts <- FALSE
+  first.target.given <- FALSE
+
+  intervals <- unique(diff(targets))
+
+  if(length(intervals) == 1){
+    if(use.pi){
+      if(targets[1] == intervals){ uniform.ckpts <- TRUE }
+    }else{
+      if(targets[1] == base.fwd.table.l){ uniform.ckpts <- TRUE; first.target.given <- TRUE}
+      if( (targets[1] - intervals) == base.fwd.table.l){ uniform.ckpts <- TRUE; first.target.given <- FALSE}
+    }
+  }
+  rm(intervals)
+
+
+  # Perform Table Benchmarking
+  ####################
+  # bench <- BenchmarkTables()
+
+  propagation.cost <- 1:length(targets)
+
+
+  # Solve Optimal Checkpointing
+  ###############################
+
+  if(uniform.ckpts){
+
+    if(is.null(lookup.tables)){
+      message("Calculating Optimal Checkpoint Schedule")
+      lookup.tables <- calc_tables(propagation.cost,num.available.ckpts)
+    }
+
+    cost.table <- lookup.tables$cost
+    index.table <- lookup.tables$index
+
+
+
+
+    if(!first.target.given){
+
+      uniform_SolveSchedule <- uniform_MakeSolveSchedule(targets,cost.table,index.table)
+      assign("uniform_SolveSchedule",uniform_SolveSchedule,envir = environment(uniform_SolveSchedule))
+
+      uniform_SolveSchedule(1,length(targets),num.available.ckpts)
+
+      cost <- uniform_LookupCost(length(targets),num.available.ckpts,cost.table)
+
+    }else{
+
+      uniform_SolveSchedule <- uniform_MakeSolveSchedule(targets[-1],cost.table,index.table)
+      assign("uniform_SolveSchedule",uniform_SolveSchedule,envir = environment(uniform_SolveSchedule))
+
+      uniform_SolveSchedule(1,length(targets)-1,num.available.ckpts)
+      cost <- uniform_LookupCost(length(targets)-1,num.available.ckpts,cost.table)
+
+    }
+
+    sch <- uniform_trim.sch(uniform_SolveSchedule)
+
+    # I don't believe we need to modify this schedule in order to still request the baseline locus as our last target
+
+  }else{
+
+    # Solve general problem
+    SolveSchedule <- MakeSolveSchedule(exact = exact)
+    environment(obj_func_for_SolveSchedule) <- environment(SolveSchedule)
+
+    if(!first.target.given){
+      cost <- SolveSchedule(d = c(targets[1],diff(targets)),targets, num.available.ckpts)
+    }else{
+      cost <- SolveSchedule(d = diff(targets),targets[-1], num.available.ckpts)
+    }
+    sch <- trim.sch(SolveSchedule)
+
+  }
+
+
+  # Construct Table Cache
+  ########################
+
+  max.tables <- max(sch$k)
+
+  if(is.null(cache) || length(cache) < max.tables){
+    cache <- CreateForwardTableCache(pars = pars,size = Inf, from_recipient = from_recipient, to_recipient = to_recipient, max.tables = max.tables)
+
+  }else{
+
+    for(i in 1:length(cache)){
+
+      if(i > max.tables){
+        cache[[i]] <- NULL
+      }else{
+        # check if parameters match, if not, overwrite with warning
+        if(cache[[i]]$pars.sha256!=pars$sha256){
+          warning("The provided cache was initialized with parameters that are different from those currently in pars.  Overwritting the pars in the provided cache...")
+          cache[[i]]$pars.sha256 <- pars$sha256
+        }
+        kalis:::ResetTable(cache[[i]])
+      }
+    }
+
+  }
+
+  rm(pars); gc()
+
+
+  # Construct Iterator
+  ######################
+
+  UpdateCache <- MakeUpdateCache(sch, use.pi, targets.idx = targets.idx)
+
+  current.sch <- data.frame("i" = Inf)
+
+  current.target.index <- length(targets)
+
+  iter.internal <- function(fwd, pars, t, nthreads = 1){
+
+    if(force.unif){t <- match(t,targets.idx)}
+
+    if(current.target.index == 0){warning("This iterator has been exhausted."); return()}
+
+    if(t == targets[current.target.index]){
+      current.target.index <<- current.target.index - 1
+    }else{
+      stop(paste("The next target locus for this iterator is",targets[current.target.index],"not",t))
+    }
+
+    if(identical(lobstr::obj_addr(fwd),lobstr::obj_addr(base.fwd.table))){
+      stop("base.fwd.table cannot point to the same table as fwd: they must be created independently.")
+    }
+
+    #print(c(current.sch$i, t))
+    if(current.sch$i > t){ current.sch <<- UpdateCache(cache, pars, nthreads, base.fwd.table) }
+
+    if(current.sch$k != 0){
+      CopyTable(to = fwd, from = cache[[current.sch$k]])
+    }else{
+      if(use.pi){
+        kalis:::ResetTable(fwd)
+      }else{
+        CopyTable(to = fwd, from = base.fwd.table)
+      }
+    }
+
+    # Clean Up cache unless we're instructed to save it
+    if(current.target.index == 0){
+      if(!save.cache){
+        cache <<- NULL
+        gc()
+      }
+    }
+
+    if(force.unif){
+      Forward(fwd = fwd, pars = pars, t = targets.idx[t], nthreads = nthreads)
+    } else {
+      Forward(fwd = fwd, pars = pars, t = t, nthreads = nthreads)
+    }
+  }
+
+  class(iter.internal) <- c("kalisIterator",class(iter.internal))
+
+  iter.internal
+}
+
+
+targets <- function(x) { # S3 generic; declared both above and below targets.kalisIterator on purpose, because definition order seemed to determine whether targets is recognized
+  UseMethod("targets")
+}
+
+targets.kalisIterator <- function(iter){ # returns the iterator's stored targets in reversed order
+  if(!"kalisIterator"%in%class(iter)){stop("argument must be a kalisIterator")}
+  rev(get("targets", envir = environment(iter))) # `targets` is read from the closure environment of the iterator function
+}
+
+targets <- function(x) { # intentional repeat of the S3 generic already declared before targets.kalisIterator
+  UseMethod("targets")
+}
+
+print.kalisIterator <- function(iter, ...){ # S3 print method; reports via message(), reading state from the iterator's closure environment
+  if(!"kalisIterator"%in%class(iter)){stop("argument must be a kalisIterator")}
+  # current.target.index is the position of the next target still to be visited; 0 means none are left
+  if(get("current.target.index", envir=environment(iter)) == 0){
+    message("This is an exhausted kalisIterator.") # was a bare string: only a return value, so nothing was shown when the iterator was auto-printed
+  }else{
+    target.range <- range(get("targets", envir = environment(iter)))
+    message(paste("A kalisIterator for",length(get("targets", envir = environment(iter))),"targets ranging from",target.range[1],"to",target.range[2]),appendLF = TRUE)
+    message(paste("Contains",get("max.tables", envir = environment(iter)),"checkpoints using ~",utils::object.size(get("cache", envir = environment(iter)))/1e9,"Gb of RAM"),appendLF = TRUE)
+    message(paste("Next target locus:",get("targets", envir = environment(iter))[get("current.target.index", envir = environment(iter))]),appendLF = TRUE)
+    message("",appendLF = TRUE)
+  }
+}
+
+plot.kalisIterator <- function(iter){ # plots the checkpoint schedule stored in the iterator's closure environment
+  if(!"kalisIterator"%in%class(iter)){stop("argument must be a kalisIterator")}
+  sch <- get("sch",envir = environment(iter)) # schedule with columns k and i
+  loci <- get("targets",envir = environment(iter))
+  plot(sch$i[-c(1,nrow(sch))],sch$k[-c(1,nrow(sch))],type="h",lwd=1,bty="n",ylab="K",xlab="locus",las=1,ylim=c(0,max(sch$k)),xlim=range(loci),xaxt="n",yaxt="n") # one vertical line per schedule row (first and last rows dropped): x = sch$i, height = sch$k
+  p.loci <- pretty(loci)
+  axis(1,at = p.loci ,pos=0) # axes are drawn by hand because the plot() call suppresses both
+  axis(2,at = pretty(0:max(sch$k)),pos=p.loci[1],las=2)
+}
+
+# Tabulates, for every problem length n <= length(propagation.cost) and every checkpoint count k <= max.num.checkpoints, the minimal cost and the minimising index; returns list(cost, index).
+#' @export
+calc_tables <- function(propagation.cost,max.num.checkpoints, use.R = FALSE){
+  start <- proc.time()
+
+  propagation.cost <- as.numeric(propagation.cost)
+
+  max.n <- length(propagation.cost)
+
+  # the first row corresponds to solving a 0 locus problem
+  cost.table <- matrix(0,nrow=max.n + 1,ncol= max.num.checkpoints + 1)
+  index.table <- matrix(0L,nrow=max.n,ncol= max.num.checkpoints)
+  # the first column (no checkpoints) is the cumulative propagation cost
+  cost.table[,1] <- c(0,cumsum(as.numeric(propagation.cost)))
+
+  if(use.R){
+    # pure-R version of the recursion; seq_len() leaves the loops empty when there are 0 checkpoints or 0 loci (1:0 would iterate over c(1, 0))
+    for(k in seq_len(max.num.checkpoints)){
+      for(n in seq_len(max.n)){
+        # now solving a n long problem with k checkpoints
+        v <- cost.table[1:n,k + 1] + propagation.cost[1:n] + cost.table[n:1,k]
+        x <- which.min(v)
+        index.table[n, k] <- x
+        cost.table[n + 1,k + 1] <- v[x]
+      }
+      print(paste(k,"done at",c(proc.time() - start)[3]/3600,"hours from start."))
+    }
+  }else{
+    invisible(.Call(CCall_OptCkpt, cost.table, index.table, propagation.cost)) # the C routine writes its results into cost.table and index.table in place
+  }
+  # drop the 0-locus row; drop = FALSE keeps a matrix even when a single row or column remains
+  cost.table <- cost.table[-1,,drop = FALSE]
+  return(list("cost" = cost.table,"index" = index.table))
+}
+
+
+MakeUpdateCache <- function(sch, use.pi, cost.list = NULL, targets.idx = NULL){
+  # Returns a closure that walks the schedule `sch`, refreshing tables in `cache` as it goes, and returns the schedule row to use next.
+  force(targets.idx)
+
+  track.cost <- FALSE
+
+  if(!is.null(cost.list)){
+    # optional cost accounting; only set up when a cost.list is supplied
+    mem.copy.cost = cost.list$mem.copy.cost
+    disk.read.cost = cost.list$disk.read.cost
+    disk.write.cost = cost.list$disk.write.cost
+    num.ram.ckpts = cost.list$num.ram.ckpts
+    num.disk.ckpts = cost.list$num.disk.ckpts
+    K <- num.ram.ckpts + num.disk.ckpts
+    track.cost <- TRUE
+    cost <- 0
+
+    transfer.cost <- function(to_k,from_k){
+      from_ram <- from_k <= num.ram.ckpts
+      to_ram <- to_k <= num.ram.ckpts
+
+      if(from_ram & to_ram){
+        return(mem.copy.cost)
+      }
+
+      if(!from_ram & to_ram){
+        return(disk.read.cost)
+      }
+    } # NOTE(review): falls through (NULL) when to_k is not a RAM slot -- confirm whether that case can occur
+
+    write.cost <- function(k){
+      if(k <= num.ram.ckpts ){
+        return(0)
+      }else{
+        return(disk.write.cost)
+      }
+    }
+
+  }
+
+  # state carried between calls of the returned closure (updated with <<-)
+  exhausted <- FALSE
+  current.ins <- leading.ins <- 1
+  ancestor <- 1
+  cost <- 0
+
+  function(cache, pars, nthreads, base.fwd.table){
+
+    if(exhausted){
+      warning("This iterator has been exhausted.")
+      return(data.frame("k" = 0L,"i" = 0L))
+    }
+
+    repeat{
+      # ancestor: among the instructions before current.ins whose locus is <= the current one, the one with the largest locus
+      candidates <- which(sch$i[1:(current.ins-1)] <= sch$i[current.ins])
+      ancestor <<- candidates[which.max(sch$i[candidates])]
+
+      if(sch$i[leading.ins + 1] < sch$i[ancestor]){ # if the next checkpoint destination is on the left side of the current ancestor
+        current.ins <<- ancestor
+        return(sch[current.ins,])
+      } else {
+        leading.ins <<- leading.ins + 1
+        current.ins <<- leading.ins
+      }
+
+      candidates <- which(sch$i[1:(current.ins-1)] <= sch$i[current.ins])
+      ancestor <<- candidates[which.max(sch$i[candidates])]
+
+      # a schedule row with i == 0 marks the end of the schedule
+      if(sch$i[current.ins] != 0){ # we're not at the end yet
+
+        # Update Cache
+        kk <- sch$k[current.ins]
+        akk <- sch$k[ancestor]
+
+        if(akk != 0){
+          if(track.cost){ cost <<- cost + transfer.cost(kk,akk) }
+          CopyTable(cache[[ kk ]],cache[[ akk ]])
+        }else{
+          if(track.cost){ cost <<- cost + transfer.cost(kk,0) }
+          if(use.pi){
+            kalis:::ResetTable(cache[[kk]]) # Pi could also be the baseline table here for the entire interval
+          }else{
+            CopyTable(to = cache[[kk]],base.fwd.table)
+          }
+        }
+
+        # advance cache table from ancestor to current checkpoint destination
+        if(track.cost){ cost <<- cost + sum( d[ (sch$i[ancestor] + 1) : sch$i[current.ins] ])} # NOTE(review): `d` is not defined in this function; only reached when cost.list is supplied
+        if(!is.null(targets.idx)){
+          Forward(cache[[kk]],pars,targets.idx[sch$i[current.ins]],nthreads)
+        } else {
+          Forward(cache[[kk]],pars,sch$i[current.ins],nthreads)
+        }
+        if(sch$i[current.ins + 1] > sch$i[current.ins]){
+          next
+        }else{
+          return(sch[current.ins,])
+        }
+
+      }else{ # we are at the end
+        exhausted <<- TRUE
+        rm(cache)
+        rm(sch, envir = parent.env(environment())) # remove large objects from memory
+        gc()
+        return(data.frame("k" = 0L,"i" = 0L))
+      }
+    }
+  }
+}
+
+
+
+
+uniform_MakeSolveSchedule <- function(loci,cost.table,index.table){
+  # Returns a recursive solver that records its schedule in sch.k / sch.i, which live in this closure environment.
+  uniform_SolveSchedule <- function(){NULL} # placeholder; the caller is expected to overwrite this binding with the returned solver so the recursive calls below resolve
+
+  sch.k <- 0L
+  sch.i <- 0L
+  nrow.sch <- 1
+
+  function(i,j,num.available.ckpts){ # i is the index of the first locus and j is the index of the last locus in the problem to solve (from loci[i] to loci[j])
+
+    l.d <- j-i+1
+
+    k <- as.integer(min(l.d-1,num.available.ckpts))
+    if(k==0){return(cost.table[l.d,1])}
+
+    # at this point, we know that num.available.ckpts is at least 1
+    # and l.d is at least 2
+
+    # Since k > 0, create a new instruction
+    ins <- which.max(sch.k < 0) # this is the first empty slot for an instruction (unused slots hold -1)
+    if(ins == nrow.sch){ # then we're about to assign to the last schedule entry and need to add on space for instructions before recursing
+      sch.k <<- c(sch.k, rep(-1L,50))
+      sch.i <<- c(sch.i, rep(-1L,50))
+      nrow.sch <<- length(sch.k)
+      ins <- which.max(sch.k < 0)
+    }
+
+    sch.k[ins] <<- k
+    ckpt.location <- index.table[l.d,k]
+    sch.i[ins] <<- loci[i-1+ckpt.location]
+
+    # solve right problem if the interval to the right contains at least one target locus
+    if(l.d > ckpt.location){ uniform_SolveSchedule(i+ckpt.location, j, num.available.ckpts - 1) }
+    #if(l.d > ckpt.location){ get("uniform_SolveSchedule", envir = parent.frame())(i+ckpt.location, j, num.available.ckpts - 1) }
+
+
+    # solve left problem if the interval to the left contains at least one target locus
+    if(ckpt.location > 1){ uniform_SolveSchedule(i, i-2+ckpt.location,num.available.ckpts) }
+    #if(ckpt.location > 1){ get("uniform_SolveSchedule", envir = parent.frame())(i, i-2+ckpt.location,num.available.ckpts) }
+
+    # the schedule is recorded as a side effect; NULL is returned on this path
+    return()
+  }
+}
+
+uniform_LookupCost<- function(L,num.available.ckpts,cost.table){cost.table[L,as.integer(min(L-1,num.available.ckpts)) + 1]} # row L, column (checkpoints used) + 1, where checkpoints used is capped at L-1
+
+uniform_trim.sch <- function(f){ # f is the solver closure returned by uniform_MakeSolveSchedule
+  closure.env <- environment(f)
+  k.vec <- get("sch.k",envir = closure.env)
+  i.vec <- get("sch.i",envir = closure.env)
+  # drop the unused (-1) slots: keep only what precedes the first one
+  unused <- k.vec == -1
+  if(any(unused)){
+    keep <- 1:(which.max(unused) - 1)
+    k.vec <- k.vec[keep]; i.vec <- i.vec[keep]
+  }
+
+  # assemble the schedule, terminated by a (k = 0, i = 0) row; it is the (invisible) value of this final assignment
+  sch <- data.frame("k" = c(k.vec,0L), "i" = c(i.vec,0L))
+}
+
+
+
+
+obj_func_for_SolveSchedule <- function(i,ins,d,indicies,num.available.ckpts){
+  # Cost of placing the checkpoint for instruction `ins` at locus floor(i); passed to optimize() as the objective in MakeSolveSchedule.
+  i <- floor(i)
+
+  # clear out schedule for all entries below this instruction
+  sch.k[(ins+1):nrow.sch] <<- -1L # sch.k, sch.i, nrow.sch and SolveSchedule are free variables, resolved through this function's environment
+  sch.i[(ins+1):nrow.sch] <<- -1L
+
+  proposed.location <- which(indicies==i)
+  # NOTE(review): proposed.location is empty when floor(i) is not one of `indicies` -- confirm this cannot happen for the values optimize() proposes
+  # solve right problem
+  if(length(d) > proposed.location){ # if the interval to the right contains at least one target locus
+    right.cost <- SolveSchedule(d[(proposed.location+1):length(d)],
+                                indicies[(proposed.location+1):length(d)],
+                                num.available.ckpts - 1)
+  }else{
+    right.cost <- 0
+  }
+
+
+  # solve left problem
+  if(proposed.location > 1){ # if the interval to the left contains at least one target locus
+    left.cost <- SolveSchedule(d[1:(proposed.location-1)],
+                               indicies[1:(proposed.location-1)],
+                               num.available.ckpts)
+  }else{
+    left.cost <- 0
+  }
+
+  # total up the cost
+  sum(d[1:proposed.location]) + left.cost + right.cost  # Cost to initialize and place and record the checkpoint is first
+}
+
+
+MakeSolveSchedule <- function(exact = TRUE){
+  # Returns a recursive solver for arbitrarily spaced targets; the schedule is recorded in sch.k / sch.i in this closure environment.
+  sch.k <- 0L
+  sch.i <- 0L
+  nrow.sch <- 1
+
+  function(d, indicies, num.available.ckpts){
+    # d and indicies are parallel vectors (same length) supplied by the caller; the returned value is the cost of the sub-problem
+    l.d <- length(d)
+    if(l.d==0){return(0)} # nothing to solve
+
+    k <- as.integer(min(l.d-1,num.available.ckpts))
+    if(k==0){return(sum(d*(l.d:1)))}
+
+
+    # at this point, we know that num.available.ckpts is at least 1
+    # and l.d is at least 2
+
+
+    # Since k > 0, create a new instruction
+    ins <- which.max(sch.k < 0) # this is the first empty slot for an instruction (unused slots hold -1)
+    if(ins == nrow.sch){ # then we're about to assign to the last schedule entry and need to add on space for instructions before we can call obj.func
+      sch.k <<- c(sch.k, rep(-1L,50))
+      sch.i <<- c(sch.i, rep(-1L,50))
+      # NOTE(review): `sequential`, `first.index` and `last.index` are not defined in this closure; they must be found in an enclosing environment or this errors
+      if(sequential){
+        first.index <<- c(first.index, rep(NA_integer_,50))
+        last.index <<- c(last.index, rep(NA_integer_,50))
+      }
+      nrow.sch <<- length(sch.k)
+      ins <- which.max(sch.k < 0)
+    }
+
+    sch.k[ins] <<- k
+    # NOTE(review): `SolveSchedule` below is a free variable; nothing in this closure binds it, so the recursion relies on an outside definition -- confirm
+    if( (l.d-1) <= num.available.ckpts ){ # We know what the solution is to this problem
+      cost <- d[1] + SolveSchedule(d[-1],
+                                   indicies[-1],
+                                   num.available.ckpts - 1)
+      sch.i[ins] <<- indicies[1]
+
+    }else{
+
+      if(exact){
+        tol <- 1e-4
+      }else{
+        tol <- l.d / 20 * 0.4
+      }
+
+      ans <- optimize(obj_func_for_SolveSchedule,
+                      lower = indicies[1],  # NOTE THIS WILL NEED TO BE CHANGED BACK TO LOWER IF ABOVE UNCOMMENTED
+                      upper=tail(indicies,1),
+                      ins = ins,
+                      d = d,
+                      indicies = indicies,
+                      num.available.ckpts = num.available.ckpts,
+                      tol = tol)
+      # choose tol so that we will get the exact solution when we have 20 or fewer locations to choose from
+      # slight approximation for larger sequences, but those being a bit off shouldn't be as critical to having the low level
+      # solutions all correct.
+
+      cost <- ans$objective
+      sch.i[ins] <<- as.integer(floor(ans$minimum))
+    }
+
+    cost
+  }
+}
+
+trim.sch <- function(f){
+  sch.k <- get("sch.k",envir = environment(f))
+  sch.i <- get("sch.i",envir = environment(f))
+  lookup.available <- get("lookup.available",envir = environment(f))
+  # NOTE(review): MakeSolveSchedule does not create lookup.available, first.index or last.index; these get() calls only succeed if an enclosing environment provides them
+  if(lookup.available){
+    first.index <- get("first.index",envir = environment(f))
+    last.index <- get("last.index",envir = environment(f))
+  }
+
+  # prune: drop the unused (-1) slots, keeping everything before the first one
+  if(any(sch.k == -1)){
+    upper.limit <- which.max(sch.k == -1) - 1
+    sch.k <- sch.k[1:upper.limit]
+    sch.i <- sch.i[1:upper.limit]
+    if(lookup.available){
+      first.index <- first.index[1:upper.limit]
+      last.index <- last.index[1:upper.limit]
+    }
+  }
+
+  # create dataframe schedule
+  sch <- data.frame("k" = c(sch.k,0L), "i" = c(sch.i,0L))
+
+  # Expand any incomplete parts of the schedule
+  while(!all(is.na(first.index))){
+
+    # identify an entry that needs to be expanded
+    c.row <- which.min(is.na(first.index))
+
+    # separate that entry from entries above and below
+    if(c.row!=1){sch.above <- sch[1:(c.row-1),]}else{sch.above <- data.frame("k" = 0L, "i" = 0L); sch.above <- sch.above[-1,]}
+    if(c.row!=nrow(sch)){sch.below <- sch[(c.row+1):nrow(sch),]}else{sch.below <- data.frame("k" = 0L, "i" = 0L); sch.below <- sch.below[-1,]}
+
+    kk <- sch$k[c.row] # this is the number of checkpoints we must apply over the range first.index to last.index
+
+    # NOTE(review): nothing in this loop changes first.index, so it cannot terminate once entered; the expansion step appears unfinished
+  }
+  # NOTE(review): `sch` is not returned; the function's value is that of the while loop
+}
+
+
+# Some code for file backed checkpointing:
+
+# X2 <- list(x=X)
+# system.time(fst:::fststore(normalizePath("~/test.fst", mustWork = FALSE), X2,
+#                            as.integer(50), TRUE))
+#
+# library(fst)
+# X.res <- matrix(0, 10000, 40000)
+#
+# # from and to index rows from massive 1 column data.frame
+# # split it up to read in 10 to 20 blocks of columns
+# # check if assignment to column is triggering a copy.
+#
+# Read to a block and then use a C function like the substitution one I have
+# to write in C from a vector to fwd$alpha
+#
+# system.time({
+#   for(i in 1:100) {
+#     X.res[,i] <- read_fst("~/test.fst", from=(i-1)*10000+1, to=i*10000)
+#   }
+# })
+#
+
+
+
diff --git a/R/TableCache.R b/R/TableCache.R
new file mode 100644
index 0000000..e6a3428
--- /dev/null
+++ b/R/TableCache.R
@@ -0,0 +1,427 @@
+#' Create cache for forward tables
+#'
+#' Create an in-memory cache for forward tables to improve efficiency when
+#' iterating in reverse along the haplotype sequences.
+#'
+#' If the objective is to run the Li and Stephens hidden Markov model both
+#' forwards and backwards to the same locus (and to do so for every possible
+#' locus), then considerable efficiency can be achieved by first performing a
+#' full scan forwards, filling a geometrically spaced cache whilst doing so.
+#' Then, by working backwards, the backward propagation moves one locus at a
+#' time and the forward propagation can move backwards by moving forward from a
+#' recently cached local table.
+#'
+#' Memory for a cache can be allocated using this function and should then be
+#' filled with \code{\link{FillTableCache}}.
+#' To use the cache, then instead of using the \code{\link{Forward}} function,
+#' use \code{\link{ForwardUsingTableCache}}.
+#'
+#' @param pars a \code{kalisParameters} object, as returned by
+#'   \code{Parameters}.
+#' @param size the maximum amount of RAM (in GB) to devote to this cache.
+#' @param from_recipient,to_recipient first and last recipient haplotype if
+#'   creating a partial forward table cache.  By default all recipient
+#'   haplotypes are included.
+#' @param max.tables the maximum number of tables to allocate; the default, 0, allows up to \code{floor(log2(L))} tables (\code{L} being the number of loci).
+#'
+#' @return
+#'   A list of forward tables representing a cache and ready to be filled is
+#'   returned.
+#'
+#' @seealso
+#'   \code{\link{MakeForwardTable}} to make a forward table;
+#'   \code{\link{FillTableCache}} to fill a cache;
+#'   \code{\link{ForwardUsingTableCache}} to use a cache;
+#'   \code{\link{Forward}} for forward function without using a cache.
+#'
+#' @examples
+#' \dontrun{
+#' # This code assumes you have already:
+#' #  i) cached the haplotypes using CacheHaplotypes function
+#' #  ii) setup parameters in a variable called pars
+#' #  iii) set the number of loci in a variable called L
+#'
+#' # Allocate up to 10GB to a cache, with parameters already setup in pars ...
+#' cache <- CreateForwardTableCache(pars, 10)
+#' # ... and fill it
+#' FillTableCache(cache, pars, nthreads = 8)
+#'
+#' # Create forward and backward tables
+#' fwd <- MakeForwardTable(pars)
+#' bck <- MakeBackwardTable(pars)
+#'
+#' # Then reach every locus faster by iterating backwards, using the cache to
+#' # move the forward table into position faster
+#' for(l in L:1) {
+#'   Backward(bck, pars, l, nthreads = 8)
+#'   ForwardUsingTableCache(fwd, pars, cache, l, nthreads = 8)
+#'   # Do whatever work is required at
+#'   # every locus here using fwd and bck
+#' }
+#' }
+#'
+#' @export
+CreateForwardTableCache <- function(pars, size = 1, from_recipient = 1, to_recipient = Inf, max.tables = 0) {
+  if(!("kalisParameters" %in% class(pars))) {
+    stop("The pars argument is not a valid parameters object.")
+  }
+
+  N <- get("N", envir = pkgVars)
+  L <- get("L", envir = pkgVars)
+
+  if(anyNA(N)) {
+    stop("No haplotypes cached ... cannot determine table size until cache is loaded with CacheAllHaplotypes().")
+  }
+  # clamp the recipient range to 1..N first, so the ordering check below sees the values actually used
+  if(from_recipient < 1) {
+    from_recipient <- 1
+  }
+  if(to_recipient > N) {
+    to_recipient <- N
+  }
+  if(from_recipient>to_recipient) {
+    stop("from_recipient must be smaller than to_recipient.")
+  }
+  delN <- to_recipient-from_recipient+1
+  if(!is.vector(max.tables) || !is.numeric(max.tables) || length(max.tables) != 1 || is.na(max.tables) || max.tables < 0) {
+    stop("max.tables must be a non-negative scalar (0 selects the default number of tables).")
+  }
+
+  cat("Found", N, "haplotypes in the cache.")
+  if((delN*N+2*delN+1)*8/1e9 > size) {
+    stop(size, "GB is not big enough for even 1 table.")
+  }
+  cat("  Constructing table cache of appropriate size ...\n")
+  # max.tables == 0 is the sentinel for "use the default", floor(log2(L))
+  if(max.tables == 0) {
+    max.tables <- floor(log2(L))
+  }
+  cache <- list()
+  i <- 1
+  while((length(cache) == 0 || ((utils::object.size(cache)*(length(cache)+1))/length(cache))/1e9 < size) && length(cache)<max.tables) {
+    cache[[i]] <- MakeForwardTable(pars, from_recipient, to_recipient)
+    i <- i+1
+  }
+  cat("Cache constructed, can hold ", length(cache), " tables for recipients ", from_recipient, " ... ", to_recipient, ".  Actual size approx ", ceiling(utils::object.size(cache)/1e6)/1e3, "GB.\n", sep = "")
+
+  class(cache) <- c("kalisCheckpointTable", class(cache))
+  cache
+}
+
+
+
+#' Fill a forward table cache
+#'
+#' An in-memory cache for forward tables can be filled using this function, for
+#' either the whole sequence length or some sub-sequence.
+#'
+#' If the objective is to run the Li and Stephens hidden Markov model both
+#' forwards and backwards to the same locus (and to do so for every possible
+#' locus), then considerable efficiency can be achieved by first performing a
+#' full scan forwards, filling a geometrically spaced cache whilst doing so.
+#' Then, by working backwards, the backward propagation moves one locus at a
+#' time and the forward propagation can move backwards by moving forward from a
+#' recently cached local table.
+#'
+#' Memory for a cache can be allocated using
+#' \code{\link{CreateForwardTableCache}} and should then be filled with this
+#' function.
+#' To use the cache, then instead of using the \code{\link{Forward}} function,
+#' use \code{\link{ForwardUsingTableCache}}.
+#'
+#' @param cache a cache of forward tables as generated by
+#'   \code{\link{CreateForwardTableCache}}
+#' @param pars a \code{kalisParameters} object, as returned by
+#'   \code{Parameters}.
+#' @param from the first locus which the geometrically spaced cache should be
+#'   built from.
+#'   By default the whole sequence length will be cached so this defaults to 1.
+#' @param to the last locus up to which the geometrically spaced cache should be
+#'   built.
+#'   By default the whole sequence length will be cached so this defaults to
+#'   \code{Inf}.
+#' @param nthreads the number of CPU cores to use.  By default this is the smaller of
+#'   the number of physical cores and the number of recipients covered by the cache.
+#'
+#' @return
+#' There is nothing returned.
+#' For performance reasons, \code{cache} is updated in-place.
+#'
+#' @seealso
+#'   \code{\link{MakeForwardTable}} to make a forward table;
+#'   \code{\link{CreateForwardTableCache}} to generate a cache;
+#'   \code{\link{ForwardUsingTableCache}} to use a cache;
+#'   \code{\link{Forward}} for forward function without using a cache.
+#'
+#' @examples
+#' \dontrun{
+#' # This code assumes you have already:
+#' #  i) cached the haplotypes using CacheHaplotypes function
+#' #  ii) setup parameters in a variable called pars
+#' #  iii) set the number of loci in a variable called L
+#'
+#' # Allocate up to 10GB to a cache, with parameters already setup in pars ...
+#' cache <- CreateForwardTableCache(pars, 10)
+#' # ... and fill it
+#' FillTableCache(cache, pars, nthreads = 8)
+#'
+#' # Create forward and backward tables
+#' fwd <- MakeForwardTable(pars)
+#' bck <- MakeBackwardTable(pars)
+#'
+#' # Then reach every locus faster by iterating backwards, using the cache to
+#' # move the forward table into position faster
+#' for(l in L:1) {
+#'   Backward(bck, pars, l, nthreads = 8)
+#'   ForwardUsingTableCache(fwd, pars, cache, l, nthreads = 8)
+#'   # Do whatever work is required at
+#'   # every locus here using fwd and bck
+#' }
+#' }
+#'
+#' @export
+FillTableCache <- function(cache, pars,
+                           nthreads = min(parallel::detectCores(logical = FALSE), cache[[1]]$to_recipient-cache[[1]]$from_recipient+1),
+                           from = 1, to = Inf) {
+  if(!("kalisCheckpointTable" %in% class(cache))) {
+    stop("The cache argument is not a valid forward table cache.")
+  }
+  if(!("kalisParameters" %in% class(pars))) {
+    stop("The pars argument is not a valid parameters object.")
+  }
+  if(cache[[1]]$pars.sha256 != pars$sha256) {
+    stop("The forward table provided was created with different parameter values (SHA-256 mismatch).")
+  }
+
+  L <- get("L", envir = pkgVars)
+
+  # `from` and `to` are locus positions (validated against L below).  They used to be overwritten
+  # here with cache[[1]]$from_recipient, a recipient index, which collapsed the range to a single value.
+
+  if(from < 1 || from > L) {
+    stop("from argument is invalid.")
+  }
+  if(is.infinite(to)) {
+    to <- L
+  }
+  if(to < 1 || to > L) {
+    stop("to argument is invalid.")
+  }
+
+  pos <- 0.5
+  if(from > 1) {
+    pos <- 1
+  }
+
+  for(i in 1:length(cache)) {
+    t <- floor((1.0-pos)*(to-from))+from
+    if(t == cache[[i]]$l) {
+      ResetTable(cache[[i]])
+      break
+    }
+    pos <- pos*0.5
+
+    cat(glue("Computing cache entry {i} up to locus {t} for recipients {cache[[i]]$from_recipient} to {cache[[i]]$to_recipient} from "))
+    if(cache[[i]]$l < 1) {
+      cat("start\n")
+    } else {
+      cat(glue("locus {cache[[i]]$l}"), "\n")
+    }
+
+    Forward(cache[[i]], pars, t, nthreads)
+
+    if(i < length(cache)) {
+      CopyTable(cache[[i+1]], cache[[i]])
+    }
+  }
+}
+
+
+
+#' Use a forward table cache to propagate
+#'
+#' An in-memory cache for forward tables, which has already been filled, can be
+#' used to move more quickly to a specified locus.
+#'
+#' If the objective is to run the Li and Stephens hidden Markov model both
+#' forwards and backwards to the same locus (and to do so for every possible
+#' locus), then considerable efficiency can be achieved by first performing a
+#' full scan forwards, filling a geometrically spaced cache whilst doing so.
+#' Then, by working backwards, the backward propagation moves one locus at a
+#' time and the forward propagation can move backwards by moving forward from a
+#' recently cached local table.
+#'
+#' Memory for a cache can be allocated using
+#' \code{\link{CreateForwardTableCache}} and should then be filled with
+#' \code{\link{FillTableCache}}.
+#' To use the cache, then instead of using the \code{\link{Forward}} function,
+#' use this function.
+#'
+#' Note that the \code{cache} which is passed to this function will be
+#' dynamically updated based on the locus requested: the assumption is that
+#' the cache is used to propagate in reverse so any cache entries for a locus
+#' position past \code{t} are taken to be no longer needed and that space will be
+#' redeployed to more densely fill the cache with earlier locus positions.
+#'
+#' @param fwd a \code{kalisForwardTable} object, as returned by
+#'   \code{\link{MakeForwardTable}}.
+#' @param pars a \code{kalisParameters} object, as returned by
+#'   \code{Parameters}.
+#' @param cache a cache of forward tables as generated by
+#'   \code{\link{CreateForwardTableCache}} and filled using
+#'   \code{\link{FillTableCache}}.
+#' @param t a locus position to move the forward table to, starting the forward
+#'   propagation from whatever table in the \code{cache} variable is immediately
+#'   before locus \code{t}.
+#'   By default, it simply advances to the previous locus (which is the natural
+#'   direction to move when using the cache).
+#' @param nthreads the number of CPU cores to use.  By default this is the smaller of
+#'   the number of physical cores and the number of recipients covered by \code{fwd}.
+#'
+#' @return
+#'   There is nothing returned.
+#'   For performance reasons, \code{fwd} is updated in-place.
+#'
+#' @seealso
+#'   \code{\link{MakeForwardTable}} to make a forward table;
+#'   \code{\link{CreateForwardTableCache}} to generate a cache;
+#'   \code{\link{FillTableCache}} to fill a cache;
+#'   \code{\link{Forward}} for forward function without using a cache.
+#'
+#' @examples
+#' \dontrun{
+#' # This code assumes you have already:
+#' #  i) cached the haplotypes using CacheHaplotypes function
+#' #  ii) setup parameters in a variable called pars
+#' #  iii) set the number of loci in a variable called L
+#'
+#' # Allocate up to 10GB to a cache, with parameters already setup in pars ...
+#' cache <- CreateForwardTableCache(pars, 10)
+#' # ... and fill it
+#' FillTableCache(cache, pars, nthreads = 8)
+#'
+#' # Create forward and backward tables
+#' fwd <- MakeForwardTable(pars)
+#' bck <- MakeBackwardTable(pars)
+#'
+#' # Then reach every locus faster by iterating backwards, using the cache to
+#' # move the forward table into position faster
+#' for(l in L:1) {
+#'   Backward(bck, pars, l, nthreads = 8)
+#'   ForwardUsingTableCache(fwd, pars, cache, l, nthreads = 8)
+#'   # Do whatever work is required at
+#'   # every locus here using fwd and bck
+#' }
+#' }
+#'
+#' @export
+ForwardUsingTableCache <- function(fwd, pars, cache, t = fwd$l-1,
+                                   nthreads = min(parallel::detectCores(logical = FALSE), fwd$to_recipient-fwd$from_recipient+1)) {
+  if(!("kalisForwardTable" %in% class(fwd))) {
+    stop("The fwd argument is not a valid forward table.")
+  }
+  if(!("kalisParameters" %in% class(pars))) {
+    stop("The pars argument is not a valid parameters object.")
+  }
+  if(fwd$pars.sha256 != pars$sha256) {
+    stop("The forward table provided was created with different parameter values (SHA-256 mismatch).")
+  }
+  if(!("kalisCheckpointTable" %in% class(cache))) {
+    stop("The cache argument is not a valid forward table cache.")
+  }
+  if(cache[[1]]$pars.sha256 != pars$sha256) {
+    stop("The forward table cache provided was created with different parameter values (SHA-256 mismatch).")
+  }
+
+  if(!all(sapply(cache,function(x){x$from_recipient}) == fwd$from_recipient)){
+    stop("from_recipient is not consistent across fwd and the tables in the cache.")
+  }
+
+  if(!all(sapply(cache,function(x){x$to_recipient}) == fwd$to_recipient)){
+    stop("to_recipient is not consistent across fwd and the tables in the cache.")
+  }
+
+  # l holds the locus currently stored in each cache table
+  l <- sapply(cache, function(x) { x$l })
+  if(any(l==t)) {
+    CopyTable(fwd, cache[[which(l==t)[1]]]) # [1]: a vector index inside [[ ]] would be treated as recursive indexing if several tables matched
+    return()
+  }
+  todo <- which(l>t)
+  l[todo] <- -1
+  # Is the max -1?  Then we've passed the half way mark.  Fill up the first slot
+  # and march on
+  if(max(l) == -1) {
+    ResetTable(cache[[1]]) # Have to do this in C++ as must in place modify
+    Forward(cache[[1]], pars, 1, nthreads)
+    l[1] <- 1
+    todo <- which(l==-1)
+  }
+  from <- max(l)
+  from.idx <- which.max(l)
+
+  # First, check if there are any spare slots -- we might just be accessing after
+  # the last checkpoint already.  If so, run forward and return right away
+  if(length(todo)==0) {
+    CopyTable(fwd, cache[[from.idx]])
+    Forward(fwd, pars, t, nthreads)
+    return()
+  }
+
+  # If we want at most one step after the jumping off checkpoint, then we just wind forward to it right away though I have spare
+  # checkpoint slots.  `<=` also covers t <= from (slot 1 just seeded at locus 1 above), where 1:(t-from-1) below would count downwards
+  if(t <= from+1) {
+    CopyTable(fwd, cache[[from.idx]])
+    Forward(fwd, pars, t, nthreads)
+    return()
+  }
+
+  # Now figure out how to fill in
+  if(t-from <= length(todo)) {
+    # In here, we have more spare slots than there are steps to reach t,
+    # so do one step at a time and store into a cache element
+
+    # NB t-from >= 2 due to if statement above
+    for(i in 1:(t-from-1)) {
+      CopyTable(cache[[todo[i]]], cache[[from.idx]])
+      Forward(cache[[todo[i]]], pars, from+i, nthreads)
+      from.idx <- todo[i]
+    }
+    CopyTable(fwd, cache[[from.idx]])
+    Forward(fwd, pars, t, nthreads)
+  } else {
+    # We have more steps than spare slots, so we need a schedule to fill in the
+    # gaps
+
+    # NB t-from-1 >= 1 due to if statement above
+    geom.spacing <- ceiling( (1-0.5^{1:length(todo)})*(t-from-1)+from )
+    fillin <- rep(NA, length(geom.spacing))
+
+    fillin[length(geom.spacing)] <- geom.spacing[length(geom.spacing)]
+    if(length(geom.spacing)>1) {
+      for(i in (length(geom.spacing)-1):1) {
+        fillin[i] <- min(geom.spacing[i], fillin[i+1]-1)
+      }
+    }
+    fillin <- unique(fillin[fillin>from & fillin<t])
+
+    for(i in 1:length(fillin)) {
+      CopyTable(cache[[todo[i]]], cache[[from.idx]])
+      Forward(cache[[todo[i]]], pars, fillin[i], nthreads)
+      from.idx <- todo[i]
+    }
+    CopyTable(fwd, cache[[from.idx]])
+    Forward(fwd, pars, t, nthreads)
+  }
+}
+
+
+
+#' @export
+print.kalisCheckpointTable <- function(x, ...) { # summarises a table cache: number of tables, the locus held by each, and memory used
+  if(!("kalisCheckpointTable" %in% class(x))) stop("Not a kalisCheckpointTable object")
+  loci <- sapply(x, function(tbl) { tbl$l })
+  gb <- ceiling(utils::object.size(x)/1e6)/1e3
+  cat("Checkpoint Table object containing", length(x), "checkpoints.\n  Loci of checkpoints:\n")
+  cat("   ", loci, "\n"); cat("  Memory consumed: ", gb, "GB.\n")
+}
\ No newline at end of file
diff --git a/src/R_OptCkpt.c b/src/R_OptCkpt.c
new file mode 100644
index 0000000..241dcaf
--- /dev/null
+++ b/src/R_OptCkpt.c
@@ -0,0 +1,58 @@
+#include "R_OptCkpt.h"
+
+#include <float.h>  // DBL_MAX
+#include <limits.h>
+#include "R_Kalis.h"
+
+// Fills Rcost_table and Rindex_table in place, one checkpoint column (k) at a
+// time.  Column 0 and row 0 of the cost table are only read here, so the caller
+// must have initialised them.  Rcost_table needs one more row and one more
+// column than Rindex_table; Rpropagation_cost is indexed by index-table row.
+// Dimension problems are reported with REprintf and the function returns early.
+SEXP OptCkpt(SEXP Rcost_table, SEXP Rindex_table, SEXP Rpropagation_cost) {
+
+  int cost_nr = Rf_nrows(Rcost_table);
+  int index_nr = Rf_nrows(Rindex_table);
+
+  if(cost_nr != index_nr + 1) {
+    REprintf("Error: incorrect number of rows in cost/index table combination.\n");
+    KALIS_RETURN;
+  }
+  if(Rf_ncols(Rcost_table) != Rf_ncols(Rindex_table) + 1) {
+    REprintf("Error: incorrect number of cols in cost/index table combination.\n");
+    KALIS_RETURN;
+  }
+  // s[i] is read below for every i in 0..index_nr-1; reject shorter vectors
+  if(Rf_xlength(Rpropagation_cost) < (R_xlen_t) index_nr) {
+    REprintf("Error: propagation cost vector is shorter than the index table.\n");
+    KALIS_RETURN;
+  }
+
+  int maxckpt = Rf_ncols(Rindex_table);
+  int maxn = index_nr;
+
+  double * p_c = REAL(Rcost_table);
+  int * p_i = INTEGER(Rindex_table);
+  double * s = REAL(Rpropagation_cost);
+
+  for(int k = 0; k < maxckpt; k++) {
+    for(int n = 0; n < maxn; n++) {
+      double x = DBL_MAX; // lowest cost seen so far for this (n, k)
+      int xi = 0;         // the i that achieved x
+
+      // Scan i downwards from n, stopping at the first strict increase in cost
+      for(int i = n; i > -1; i--) {
+        double y = p_c[i + cost_nr*(k+1)] + s[i] + p_c[n-i + cost_nr*k];
+        if(y <= x) {
+          xi = i;
+          x = y;
+        } else {
+          break;
+        }
+      }
+      p_i[n + index_nr * k] = xi+1; // stores xi+1, presumably as a 1-based R index
+      p_c[n+1 + cost_nr * (k+1)] = x;
+    }
+  }
+  KALIS_RETURN;
+}
diff --git a/src/R_OptCkpt.h b/src/R_OptCkpt.h
new file mode 100644
index 0000000..a317dc4
--- /dev/null
+++ b/src/R_OptCkpt.h
@@ -0,0 +1,10 @@
+#ifndef R_OPTCKPT_H
+#define R_OPTCKPT_H
+
+#define R_NO_REMAP
+#include <R.h>
+#include <Rinternals.h>
+
+SEXP OptCkpt(SEXP Rcost_table, SEXP Rindex_table, SEXP Rpropagation_cost);
+
+#endif

From ca8fc820d09dfdbc138cb7b4e3cd1bd32c6b8bfd Mon Sep 17 00:00:00 2001
From: ryanchrist <ryan.christ7@gmail.com>
Date: Mon, 23 Sep 2024 12:12:26 -0500
Subject: [PATCH 05/43] Introducing efficient algorithm for parallelized
 implicit matrix trace and Hilbert-Schmidt norm calculation

---
 R/CalcTraces.R     |   6 ++
 src/R_CalcTraces.c | 169 +++++++++++++++++++++++++++++++++++++++++++++
 src/R_CalcTraces.h |  14 ++++
 3 files changed, 189 insertions(+)
 create mode 100644 R/CalcTraces.R
 create mode 100644 src/R_CalcTraces.c
 create mode 100644 src/R_CalcTraces.h

diff --git a/R/CalcTraces.R b/R/CalcTraces.R
new file mode 100644
index 0000000..aa8b32c
--- /dev/null
+++ b/R/CalcTraces.R
@@ -0,0 +1,6 @@
+#' @export
+CalcTraces <- function(M, tX, tQ, J, # matrices; the C routine documents M as r x c and tX, tQ, J as p x r
+                       from_recipient = 1L, # 1-based; the C routine subtracts 1 to form a column offset
+                       nthreads = min(parallel::detectCores(logical = FALSE), ncol(M))) {
+  .Call(CCall_CalcTraces, M, tX, tQ, J, from_recipient, nthreads) # list with elements trace, hsnorm2, diag
+}
diff --git a/src/R_CalcTraces.c b/src/R_CalcTraces.c
new file mode 100644
index 0000000..7bb95c7
--- /dev/null
+++ b/src/R_CalcTraces.c
@@ -0,0 +1,169 @@
+#include "R_CalcTraces.h"
+
+#define _GNU_SOURCE
+#include <pthread.h>
+#include <math.h>
+
+
+
+struct CalcTraces_A_core_args { // inputs shared by every worker
+  const double *restrict M;   // r rows, column-major (read as M[i + j*r])
+  const double *restrict tX;  // p rows; read as tX[l + i*p]
+  const double *restrict tQ;  // p rows; read as tQ[l + i*p] and tQ[l + (from_off+j)*p]
+  const double *restrict J;   // p rows; read as J[l + (from_off+j)*p]
+  double *diag;               // receives the i == j entries, written at diag[j]
+  size_t r;                   // number of rows of M
+  size_t from_off;            // column offset applied when indexing tQ and J
+  size_t p;                   // length of the inner sum over l
+};
+struct CalcTraces_A_args { // per-worker slice and accumulators
+  struct CalcTraces_A_core_args *core_args;
+  double *restrict res;       // accumulates the i == j entries (trace contribution)
+  double *restrict res2;      // accumulates squared entries (squared HS norm contribution)
+  size_t from;                // first column of M handled by this worker
+  size_t N;                   // number of columns handled by this worker
+};
+
+// Worker routine with a pthread start-routine signature.  For every column j in
+// [from, from+N) and every row i it forms
+//   a_ij = M[i,j] + sum_l ( tX[l,i]*tQ[l,from_off+j] - tQ[l,i]*J[l,from_off+j] )
+// adds a_ij^2 to *res2 and, when i == j, adds a_ij to *res and stores it in
+// diag[j].  Always returns NULL.
+void* CalcTraces_A(void *args) {
+  struct CalcTraces_A_args *work = (struct CalcTraces_A_args *) args;
+  struct CalcTraces_A_core_args *shared = work->core_args;
+  const double *restrict M = shared->M;
+  const double *restrict tX = shared->tX;
+  const double *restrict tQ = shared->tQ;
+  const double *restrict J = shared->J;
+  double *restrict res = work->res;
+  double *restrict res2 = work->res2;
+  double *diag = shared->diag;
+  const size_t r = shared->r, p = shared->p;
+  const size_t col_end = work->from + work->N;
+
+  for(size_t j = work->from; j < col_end; j++) {
+    const size_t jp = (shared->from_off + j) * p; // start of column from_off+j in tQ and J
+    for(size_t i = 0; i < r; i++) {
+      const size_t ip = i * p;                    // start of column i in tX and tQ
+      double entry = M[i + j*r];
+      for(size_t l = 0; l < p; l++) {
+        entry += tX[l + ip] * tQ[l + jp] - tQ[l + ip] * J[l + jp];
+      }
+      *res2 += entry * entry;  // part of the HS norm
+      if(i == j) {
+        *res += entry;         // add to the trace (for the expected value of the quadratic form)
+        diag[j] = entry;       // diagonal component of the variance of the quadratic form
+      }
+    }
+  }
+
+  return(NULL);
+}
+
+
+// // [[Rcpp::export]]
+// List CalcTraces(NumericMatrix M,  // r x c
+//                 NumericMatrix tX, // p x r
+//                 NumericMatrix tQ, // p x r
+//                 NumericMatrix J,  // p x r (will only use a subset of these rows)
+//                 size_t from_recipient,
+//                 size_t nthreads) {
+// Summarises A = M + t(tX) tQ - t(tQ) J (tQ/J columns offset by from_recipient-1):
+// "trace" sums entries whose row and column index agree, "hsnorm2" sums all
+// squared entries, "diag" holds those i == j entries.  Columns of M are split
+// evenly over nthreads pthreads; leftover columns run on the calling thread.
+SEXP CalcTraces(SEXP RM,  // r x c
+                SEXP RtX, // p x r
+                SEXP RtQ, // p x r
+                SEXP RJ,  // p x r (will only use a subset of these rows)
+                SEXP Rfrom_recipient,
+                SEXP Rnthreads) {
+  size_t p = (size_t) Rf_nrows(RtX);
+  size_t r = (size_t) Rf_nrows(RM);
+  size_t c = (size_t) Rf_ncols(RM);
+
+  // NA or non-positive requests use the single-threaded path instead of wrapping to a huge size_t
+  int nthreads_in = Rf_asInteger(Rnthreads);
+  size_t nthreads = (nthreads_in == NA_INTEGER || nthreads_in < 1) ? 1 : (size_t) nthreads_in;
+
+  SEXP Rtrace = PROTECT(Rf_allocVector(REALSXP, 1));
+  REAL(Rtrace)[0] = 0.0;
+  SEXP Rhsnorm = PROTECT(Rf_allocVector(REALSXP, 1));
+  REAL(Rhsnorm)[0] = 0.0;
+  SEXP Rdiag = PROTECT(Rf_allocVector(REALSXP, r));
+  for(size_t i=0; i<r; i++) {
+    REAL(Rdiag)[i] = 0.0;
+  }
+
+  size_t from_off = (size_t) (Rf_asInteger(Rfrom_recipient)-1);
+  struct CalcTraces_A_core_args core_args = {
+    .M = REAL(RM),
+    .tX = REAL(RtX),
+    .tQ = REAL(RtQ),
+    .J = REAL(RJ),
+    .diag = REAL(Rdiag),
+    .r = r,
+    .from_off = from_off,
+    .p = p
+  };
+
+  if(nthreads > 1) {
+    pthread_t threads[nthreads];
+    int spawned[nthreads]; // non-zero when threads[i] was created and must be joined
+    pthread_attr_t attr;
+    pthread_attr_init(&attr);
+    pthread_attr_setdetachstate(&attr, PTHREAD_CREATE_JOINABLE);
+
+    // Workers only add to their slot and the ragged-end slot may never run, so zero every accumulator
+    double res_perth[nthreads+1];
+    double res_perth2[nthreads+1];
+    for(size_t i=0; i<nthreads+1; i++) {
+      res_perth[i] = 0.0;
+      res_perth2[i] = 0.0;
+    }
+
+    size_t num_perth = c/nthreads;
+    size_t rag_end   = c%nthreads;
+    struct CalcTraces_A_args args[nthreads+1];
+    for(size_t i=0; i<nthreads+1; i++) {
+      args[i].core_args = &core_args;
+      args[i].res = res_perth + i;
+      args[i].res2 = res_perth2 + i;
+      args[i].from = i*num_perth;
+      args[i].N = (i < nthreads) ? num_perth : rag_end; // last slot is the ragged end
+    }
+
+    for(size_t i=0; i<nthreads; ++i) {
+      spawned[i] = (pthread_create(&threads[i], &attr, CalcTraces_A, (void*) &args[i]) == 0);
+      if(!spawned[i]) CalcTraces_A((void*) &args[i]); // could not spawn: do this slice here
+    }
+    if(rag_end != 0) CalcTraces_A((void*) &args[nthreads]); // tidy ragged end
+
+    for(size_t i=0; i<nthreads; i++) {
+      if(spawned[i]) pthread_join(threads[i], NULL);
+    }
+    pthread_attr_destroy(&attr);
+
+    for(size_t j = 0; j < nthreads+1; j++) {
+      REAL(Rtrace)[0] += res_perth[j];
+      REAL(Rhsnorm)[0] += res_perth2[j];
+    }
+  } else {
+    struct CalcTraces_A_args args;
+    args.core_args = &core_args;
+    args.res = REAL(Rtrace);
+    args.res2 = REAL(Rhsnorm);
+    args.from = 0;
+    args.N = c;
+    CalcTraces_A((void*) &args);
+  }
+
+  const char *names[] = {"trace", "hsnorm2", "diag", ""};
+  SEXP RL = PROTECT(Rf_mkNamed(VECSXP, names));
+  SET_VECTOR_ELT(RL, 0, Rtrace);
+  SET_VECTOR_ELT(RL, 1, Rhsnorm);
+  SET_VECTOR_ELT(RL, 2, Rdiag);
+  UNPROTECT(4);
+  return(RL);
+}
diff --git a/src/R_CalcTraces.h b/src/R_CalcTraces.h
new file mode 100644
index 0000000..536d5e6
--- /dev/null
+++ b/src/R_CalcTraces.h
@@ -0,0 +1,14 @@
+#ifndef R_CALCTRACES_H
+#define R_CALCTRACES_H
+
+#define R_NO_REMAP
+#include <R.h>
+#include <Rinternals.h>
+
+SEXP CalcTraces(SEXP RM,
+                SEXP RtX,
+                SEXP RtQ,
+                SEXP RJ,
+                SEXP Rfrom_recipient,
+                SEXP Rnthreads);
+#endif

From add21d5379beeb4d35daea0d0e0476a414843e51 Mon Sep 17 00:00:00 2001
From: ryanchrist <ryan.christ7@gmail.com>
Date: Mon, 23 Sep 2024 12:14:11 -0500
Subject: [PATCH 06/43] Introducing tests for CladeMat

---
 tests/testthat/test-CladeMat.R | 22 ++++++++++++++++++++++
 1 file changed, 22 insertions(+)
 create mode 100644 tests/testthat/test-CladeMat.R

diff --git a/tests/testthat/test-CladeMat.R b/tests/testthat/test-CladeMat.R
new file mode 100644
index 0000000..842bd2e
--- /dev/null
+++ b/tests/testthat/test-CladeMat.R
@@ -0,0 +1,22 @@
+test_that("CladeMat Matches GoldMaster CladeMat", {
+
+  CacheHaplotypes(SmallHaps)
+  map <- SmallMap
+
+  target.idx <- floor(L()/2) # both tables are propagated to this locus
+  pars <- Parameters(CalcRho(diff(map),s = 0.01),mu = 0.0001) # specify HMM parameters
+  fwd <- MakeForwardTable(pars)
+  bck <- MakeBackwardTable(pars)
+  Forward(fwd, pars, target.idx)
+  Backward(bck, pars, target.idx)
+
+  unit.dist <- -log(pars$pars$mu)
+  thresh <- 0.2
+
+  M <- matrix(0,N()/2,N()/2) # NOTE(review): presumably filled in place by CladeMat, since M itself is compared below -- confirm
+  neigh <- CladeMat(fwd,bck,M,unit.dist = unit.dist, thresh = thresh ,max1var = TRUE) # neigh is not used by this test
+
+  M2 <- kalis:::CladeMat.GM(fwd,bck,unit.dist = unit.dist, thresh = thresh) # gold master reference result
+
+  expect_equal(M, M2)
+})

From 9a6a9e6aaae22471df572f2abec4fe02a78269b0 Mon Sep 17 00:00:00 2001
From: ryanchrist <ryan.christ7@gmail.com>
Date: Mon, 23 Sep 2024 12:14:26 -0500
Subject: [PATCH 07/43] Adding vignette for iterating over target loci
 sequentially

---
 vignettes/Iterating_Over_Loci.Rmd | 49 +++++++++++++++++++++++++++++++
 1 file changed, 49 insertions(+)
 create mode 100644 vignettes/Iterating_Over_Loci.Rmd

diff --git a/vignettes/Iterating_Over_Loci.Rmd b/vignettes/Iterating_Over_Loci.Rmd
new file mode 100644
index 0000000..657c4ae
--- /dev/null
+++ b/vignettes/Iterating_Over_Loci.Rmd
@@ -0,0 +1,49 @@
+---
+title: "Iterating Over Loci"
+author: "Louis Aslett & Ryan Christ"
+date: "`r Sys.Date()`"
+output: rmarkdown::html_vignette
+vignette: >
+  %\VignetteIndexEntry{Iterating Over Loci}
+  %\VignetteEngine{knitr::rmarkdown}
+  %\VignetteEncoding{UTF-8}
+---
+
+```{r setup, include = FALSE}
+knitr::opts_chunk$set(
+  collapse = TRUE
+  )
+```
+
+Here we show how to use **kalis** to efficiently iterate over loci sequentially.
+
+
+```{r, results='hide'}
+require(kalis)
+# 
+# total.nthreads <- 4
+# n.checkpoints <- 7
+# 
+# nthreads <- as.integer(0:(total.nthreads-1))
+# CacheHaplotypes(SmallHaps)
+# 
+# m <- rbeta(L()-1,1,10)*1e-6
+# pars <- Parameters(CalcRho(cM = m, s = 1, gamma = 1), mu = 1e-8, use.speidel = TRUE)
+# 
+# fwd <- MakeForwardTable(pars)
+# bck <- MakeBackwardTable(pars)
+# M <- matrix(0,N(),N())
+# 
+# Iter <- ForwardIterator(pars,n.checkpoints)
+# 
+# start.time <- proc.time()
+# 
+# for(t in L():1){
+#   Iter(fwd,pars,t,nthreads = nthreads)
+#   Backward(bck,pars,t, nthreads = nthreads)
+#   # Optional: DistMat(fwd,bck,M,type="minus.min", nthreads = total.nthreads)
+#   print(paste("At locus",t))
+# }
+# 
+# print(proc.time() - start.time)
+```
\ No newline at end of file

From a23711f4d709be87493ac7a9b4d2ba82dec9322a Mon Sep 17 00:00:00 2001
From: ryanchrist <ryan.christ7@gmail.com>
Date: Mon, 23 Sep 2024 12:16:36 -0500
Subject: [PATCH 08/43] Registrations required for previous C commits

---
 src/R_Registrations.c | 8 ++++++++
 1 file changed, 8 insertions(+)

diff --git a/src/R_Registrations.c b/src/R_Registrations.c
index 8a280de..35de9c5 100644
--- a/src/R_Registrations.c
+++ b/src/R_Registrations.c
@@ -2,12 +2,16 @@
 
 #include "R_Backward.h"
 #include "R_Cache.h"
+#include "R_CalcTraces.h"
 #include "R_ComputeStatus.h"
 #include "R_Forward.h"
 #include "R_MatAndMul.h"
 #include "R_MatAndMulBtwVar.h"
+#include "R_OptCkpt.h"
 #include "R_TableCache.h"
 #include "R_TableMaker.h"
+#include "R_CladeMat.h"
+
 
 #define CALLDEF(name, n)  {#name, (DL_FUNC) &name, n}
 
@@ -22,15 +26,19 @@ static const R_CallMethodDef callMethods[] = {
   CALLDEF(CacheHaplotypes_hapgz_2, 5),
   CALLDEF(QueryCache2_ind, 1),
   CALLDEF(QueryCache2_loc, 1),
+  CALLDEF(CalcTraces, 6),
   CALLDEF(ComputeStatus, 0),
   CALLDEF(VectorBitWidth, 0),
   CALLDEF(ResetForwardTable, 1),
   CALLDEF(Forward, 8),
   CALLDEF(MatAndMul, 9),
   CALLDEF(MatAndMulBtwVar, 11),
+  CALLDEF(OptCkpt, 3),
   CALLDEF(CopyFBTable, 2),
   CALLDEF(MakeForwardTable, 3),
   CALLDEF(MakeBackwardTable, 3),
+  CALLDEF(CladeMat, 7),
+  CALLDEF(UpdateRealInPlace,3),
   { NULL, NULL, 0 }
 };
 

From bd5eb3cd5ff2f523e9e0e32acc05a3662060d692 Mon Sep 17 00:00:00 2001
From: ryanchrist <ryan.christ7@gmail.com>
Date: Mon, 23 Sep 2024 12:19:41 -0500
Subject: [PATCH 09/43] Reducing memory footprint of loading haplotypes

---
 R/CacheHaplotypes_hdf5.R | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

diff --git a/R/CacheHaplotypes_hdf5.R b/R/CacheHaplotypes_hdf5.R
index 41fda9e..d5934a9 100644
--- a/R/CacheHaplotypes_hdf5.R
+++ b/R/CacheHaplotypes_hdf5.R
@@ -112,6 +112,7 @@ CacheHaplotypes.hdf5.hdf5r <- function(hdf5.file,
       else
         res <- t(h5.haps[hap.idx[current.step:upto],loci.idx])
       current.step <<- upto + 1
+      storage.mode(res) <- "integer"
       res
     }
   }
@@ -201,10 +202,11 @@ CacheHaplotypes.hdf5.rhdf5 <- function(hdf5.file,
       }
       upto <- min(current.step + step.size - 1, N)
       if(!transpose)
-        res <- matrix(as.integer(rhdf5::h5read(hdf5.file, haps.path, index = list(loci.idx, hap.idx[current.step:upto]))), nrow = length(loci.idx))
+        res <- rhdf5::h5read(hdf5.file, haps.path, index = list(loci.idx, hap.idx[current.step:upto]))
       else
-        res <- t(matrix(as.integer(rhdf5::h5read(hdf5.file, haps.path, index = list(hap.idx[current.step:upto], loci.idx))), ncol = length(loci.idx)))
+        res <- t(rhdf5::h5read(hdf5.file, haps.path, index = list(hap.idx[current.step:upto], loci.idx)))
       current.step <<- upto + 1
+      storage.mode(res) <- "integer"
       res
     }
   }

From 073ec6382d802c18677c19815d9ea6d3a1c4391e Mon Sep 17 00:00:00 2001
From: ryanchrist <ryan.christ7@gmail.com>
Date: Mon, 23 Sep 2024 13:00:44 -0500
Subject: [PATCH 10/43] Changing rhdf5 h5write call to h5writeDataset based on
 some prior failed runs -- might need to revisit this if in the new context we
 need to revert back to h5write .

---
 R/IndividualSequenceIO_H5.R | 8 +++++---
 1 file changed, 5 insertions(+), 3 deletions(-)

diff --git a/R/IndividualSequenceIO_H5.R b/R/IndividualSequenceIO_H5.R
index c06ca58..0fea53f 100644
--- a/R/IndividualSequenceIO_H5.R
+++ b/R/IndividualSequenceIO_H5.R
@@ -99,6 +99,7 @@ WriteHaplotypes <- function(hdf5.file, haps,
     write.loci.ids <- TRUE
   }
 
+  # NOTE: this previously had to be removed to allow running on WashU cluster -- if error triggers here again LA and RC to discuss
   if(length(find.package("rhdf5", quiet = TRUE)) == 0) {
     stop("The WriteHaplotypes function requires the optional rhdf5 package to be installed (see Bioconductor https://bioconductor.org/packages/rhdf5)")
   }
@@ -248,12 +249,12 @@ WriteHaplotypes <- function(hdf5.file, haps,
   # Write
   message(glue("Writing {N} haplotype(s) of size {L} ...\n"))
 
-  rhdf5::h5write(as.array(haps), h5, haps.name, index = list(NULL, (N.old+1):(N.old+N)))
+  rhdf5::h5writeDataset(as.array(haps), h5, haps.name, index = list(NULL, (N.old+1):(N.old+N)))
   if(write.hap.ids) {
-    rhdf5::h5write(as.array(as.character(hap.ids)), h5, hap.ids.name, index = list((N.old+1):(N.old+N)))
+    rhdf5::h5writeDataset(as.array(as.character(hap.ids)), h5, hap.ids.name, index = list((N.old+1):(N.old+N)))
   }
   if(write.loci.ids) {
-    rhdf5::h5write(as.array(as.character(loci.ids)), h5, loci.ids.name, index = list(1:L))
+    rhdf5::h5writeDataset(as.array(as.character(loci.ids)), h5, loci.ids.name, index = list(1:L))
   }
 
   rhdf5::h5closeAll()
@@ -351,6 +352,7 @@ ReadHaplotypes <- function(hdf5.file,
   if(!identical(loci.ids, NA) && !identical(loci.idx, NA)) {
     stop("Can only specify one of loci.ids or loci.idx argument.")
   }
+  # NOTE: this previously had to be removed to allow running on WashU cluster -- if error triggers here again LA and RC to discuss
   if(length(find.package("rhdf5", quiet = TRUE)) == 0) {
     stop("The ReadHaplotypes function requires the optional rhdf5 package to be installed (see Bioconductor https://bioconductor.org/packages/rhdf5)")
   }

From d7e3e6f58d87a7b4ccb8e5e42dd05b69f58240fd Mon Sep 17 00:00:00 2001
From: ryanchrist <ryan.christ7@gmail.com>
Date: Mon, 23 Sep 2024 13:15:49 -0500
Subject: [PATCH 11/43] Minor bug fixes to Probs

---
 R/Probs.R | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/R/Probs.R b/R/Probs.R
index 3396a07..1361f75 100644
--- a/R/Probs.R
+++ b/R/Probs.R
@@ -221,7 +221,7 @@ DistMat <- function(fwd, bck, type = "raw", M = NULL, beta.theta.opts = NULL,
                     nthreads = min(parallel::detectCores(logical = FALSE), fwd$to_recipient-fwd$from_recipient+1)){
 
   if(identical(nthreads, "R")) {
-    if(!is.null(M)){stop("M cannot be NULL when requesting the gold master R version with R nthreads")}
+    if(!is.null(M)){stop("M must be NULL when requesting the gold master R version with R nthreads")}
     warning("Warning: using gold master R implementation.")
     return(invisible(DistMat.GM(fwd, bck, type, beta.theta.opts)))
   }
@@ -256,7 +256,7 @@ DistMat <- function(fwd, bck, type = "raw", M = NULL, beta.theta.opts = NULL,
 
 
 
-input_checks_for_probs_and_dist_mat <-  function(fwd,bck,beta.theta.opts){
+input_checks_for_probs_and_dist_mat <-  function(fwd,bck,beta.theta.opts = NULL){
 
   # RUN GENERAL CHECKS
   if(fwd$l == 2147483647L){stop("forward table has not been initialized but not propagated to a variant in {1,...,L}.")}
@@ -295,7 +295,7 @@ input_checks_for_probs_and_dist_mat <-  function(fwd,bck,beta.theta.opts){
 
       if(!inherits(beta.theta.opts$pars,"kalisParameters")){stop("beta.theta.opts$pars must be kalisParameters object.")}
 
-      if(!is.numeric(beta.theta.opts$bias) || beta.theta.opts$bias<=0 || beta.theta.opts$bias>=1 ){stop("bias must be numeric and within (0,1). To obtain a distance matrix AT a particular variant, advance bck to that variant in beta space.")}
+      if(!is.numeric(beta.theta.opts$bias) || beta.theta.opts$bias<0 || beta.theta.opts$bias>1 ){stop("bias must be numeric and within [0,1]. To obtain a distance matrix AT a particular variant, advance bck to that variant in beta space.")}
 
       total.rho <- sum(beta.theta.opts$pars$pars$rho[fwd$l:(bck$l - 1)])
 
@@ -304,12 +304,12 @@ input_checks_for_probs_and_dist_mat <-  function(fwd,bck,beta.theta.opts){
 
     }
 
-    return(list("rho.fwd" = rho.fwd, "rho.bck" = rho.bck))
+    return(invisible(list("rho.fwd" = rho.fwd, "rho.bck" = rho.bck)))
 
   }else{
 
     if(bck$l != fwd$l){stop("variant position of the forward table and backward table do not match.")}
-    return(NULL)
+    return(invisible(NULL))
   }
 }
 

From 7f9252b3bb45263d4e4f062bd38397cff2278a69 Mon Sep 17 00:00:00 2001
From: ryanchrist <ryan.christ7@gmail.com>
Date: Mon, 23 Sep 2024 13:29:56 -0500
Subject: [PATCH 12/43] roxygenize all updates

---
 NAMESPACE                      | 17 ++++++
 R/Iterator.R                   |  3 ++
 man/CladeMat.Rd                | 20 +++++++
 man/CladeMat_old.Rd            | 36 +++++++++++++
 man/Clades.Rd                  | 43 +++++++++++++++
 man/CreateForwardTableCache.Rd | 81 ++++++++++++++++++++++++++++
 man/FillTableCache.Rd          | 88 ++++++++++++++++++++++++++++++
 man/ForwardIterator.Rd         | 61 +++++++++++++++++++++
 man/ForwardUsingTableCache.Rd  | 97 ++++++++++++++++++++++++++++++++++
 man/Neighbors.Rd               | 21 ++++++++
 man/PruneCladeMat.Rd           | 11 ++++
 man/Sprigs.Rd                  | 11 ++++
 man/Sprigs_old.Rd              | 21 ++++++++
 13 files changed, 510 insertions(+)
 create mode 100644 man/CladeMat.Rd
 create mode 100644 man/CladeMat_old.Rd
 create mode 100644 man/Clades.Rd
 create mode 100644 man/CreateForwardTableCache.Rd
 create mode 100644 man/FillTableCache.Rd
 create mode 100644 man/ForwardIterator.Rd
 create mode 100644 man/ForwardUsingTableCache.Rd
 create mode 100644 man/Neighbors.Rd
 create mode 100644 man/PruneCladeMat.Rd
 create mode 100644 man/Sprigs.Rd
 create mode 100644 man/Sprigs_old.Rd

diff --git a/NAMESPACE b/NAMESPACE
index e67a690..2dcd5a3 100644
--- a/NAMESPACE
+++ b/NAMESPACE
@@ -1,27 +1,44 @@
 # Generated by roxygen2: do not edit by hand
 
 S3method(plot,kalisDistanceMatrix)
+S3method(plot,kalisIterator)
 S3method(print,kalisBackwardTable)
+S3method(print,kalisCheckpointTable)
 S3method(print,kalisForwardTable)
+S3method(print,kalisIterator)
 S3method(print,kalisParameters)
+S3method(targets,kalisIterator)
 export(Backward)
 export(CacheHaplotypes)
 export(CacheSummary)
 export(CalcRho)
+export(CalcTraces)
+export(CladeMat)
+export(CladeMat_old)
+export(Clades)
 export(ClearHaplotypeCache)
 export(CopyTable)
+export(CreateForwardTableCache)
 export(DistMat)
+export(FillTableCache)
 export(Forward)
+export(ForwardIterator)
+export(ForwardUsingTableCache)
 export(L)
 export(MakeBackwardTable)
 export(MakeForwardTable)
 export(N)
+export(Neighbors)
 export(Parameters)
 export(PostProbs)
+export(PruneCladeMat)
 export(QueryCache)
 export(ReadHaplotypes)
 export(ResetTable)
+export(Sprigs)
+export(Sprigs_old)
 export(WriteHaplotypes)
+export(calc_tables)
 import(checkmate)
 import(dplyr)
 importFrom(digest,digest)
diff --git a/R/Iterator.R b/R/Iterator.R
index e28a095..51cb1d7 100644
--- a/R/Iterator.R
+++ b/R/Iterator.R
@@ -274,6 +274,7 @@ targets <- function(x) { # put this declaration above and below because it seems
   UseMethod("targets")
 }
 
+#' @export
 targets.kalisIterator <- function(iter){
   if(!"kalisIterator"%in%class(iter)){stop("argument must be a kalisIterator")}
   rev(get("targets", envir = environment(iter)))
@@ -283,6 +284,7 @@ targets <- function(x) {
   UseMethod("targets")
 }
 
+#' @export
 print.kalisIterator <- function(iter){
   if(!"kalisIterator"%in%class(iter)){stop("argument must be a kalisIterator")}
 
@@ -297,6 +299,7 @@ print.kalisIterator <- function(iter){
   }
 }
 
+#' @export
 plot.kalisIterator <- function(iter){
   if(!"kalisIterator"%in%class(iter)){stop("argument must be a kalisIterator")}
   sch <- get("sch",envir = environment(iter))
diff --git a/man/CladeMat.Rd b/man/CladeMat.Rd
new file mode 100644
index 0000000..7eed863
--- /dev/null
+++ b/man/CladeMat.Rd
@@ -0,0 +1,20 @@
+% Generated by roxygen2: do not edit by hand
+% Please edit documentation in R/CladeMat.R
+\name{CladeMat}
+\alias{CladeMat}
+\title{Fast Clade Matrix Construction}
+\usage{
+CladeMat(
+  fwd,
+  bck,
+  M,
+  unit.dist,
+  thresh = 0.2,
+  max1var = FALSE,
+  nthreads = min(parallel::detectCores(logical = FALSE), fwd$to_recipient -
+    fwd$from_recipient + 1)
+)
+}
+\description{
+Fast Clade Matrix Construction
+}
diff --git a/man/CladeMat_old.Rd b/man/CladeMat_old.Rd
new file mode 100644
index 0000000..aebb53c
--- /dev/null
+++ b/man/CladeMat_old.Rd
@@ -0,0 +1,36 @@
+% Generated by roxygen2: do not edit by hand
+% Please edit documentation in R/Clades.R
+\name{CladeMat_old}
+\alias{CladeMat_old}
+\title{CladeMat OLD}
+\usage{
+CladeMat_old(
+  x,
+  ploidy = 2L,
+  sprigs.to.prune = NULL,
+  assemble = TRUE,
+  use.forking = FALSE,
+  forking.chunk.size = 100L,
+  mc.preschedule = FALSE,
+  nthreads = 1L
+)
+}
+\arguments{
+\item{x}{a \code{kalisClades} object returned by \code{\link{kalisClades}}}
+
+\item{ploidy}{an integer, the ploidy of the organism}
+
+\item{sprigs.to.prune}{a \code{kalisSprigs} object returned by \code{\link{kalisSprigs}} encoding sprigs that should be excluded from the matrix returned}
+
+\item{assemble}{a logical, if FALSE return the clade matrix as a list of columns rather than as a symmetrized matrix}
+
+\item{use.forking}{a logical, should forked processes be used?}
+
+\item{nthreads}{the number of CPU cores to use. Currently, no parallelism is used.}
+}
+\value{
+a matrix representation of the probabilistic clades provided
+}
+\description{
+Utility for constructing a probabilistic clade matrix
+}
diff --git a/man/Clades.Rd b/man/Clades.Rd
new file mode 100644
index 0000000..cae541b
--- /dev/null
+++ b/man/Clades.Rd
@@ -0,0 +1,43 @@
+% Generated by roxygen2: do not edit by hand
+% Please edit documentation in R/Clades.R
+\name{Clades}
+\alias{Clades}
+\title{Probabilistic Clades}
+\usage{
+Clades(
+  fwd,
+  bck,
+  pars,
+  beta.theta.opts = NULL,
+  safety.checks = FALSE,
+  neighbors = FALSE,
+  use.forking = FALSE,
+  forking.chunk.size = 100L,
+  mc.preschedule = FALSE,
+  nthreads = 1L
+)
+}
+\arguments{
+\item{fwd}{a forward table as returned by \code{\link{MakeForwardTable}}}
+
+\item{bck}{a backward table as returned by \code{\link{MakeBackwardTable}}}
+
+\item{pars}{a \code{kalisParameters} object, as returned by
+\code{\link{Parameters}}.}
+
+\item{beta.theta.opts}{a list; see Details for \code{\link{DistMat}}.}
+
+\item{safety.checks}{a logical, should safety checks be applied to the distances?  See \code{\link{DistMat}}.}
+
+\item{neighbors}{a logical, should nearest neighbors be pre-calculated?  See \code{\link{Neighbors}}.}
+
+\item{use.forking}{a logical, should forked processes be used?}
+
+\item{nthreads}{the number of CPU cores to use. Currently, no parallelism is used.}
+}
+\value{
+a \code{kalisClades} object encoding probabilistic clade calls
+}
+\description{
+Utility for calling probabilistic clades at, in between, or excluding variants.
+}
diff --git a/man/CreateForwardTableCache.Rd b/man/CreateForwardTableCache.Rd
new file mode 100644
index 0000000..ff224ed
--- /dev/null
+++ b/man/CreateForwardTableCache.Rd
@@ -0,0 +1,81 @@
+% Generated by roxygen2: do not edit by hand
+% Please edit documentation in R/TableCache.R
+\name{CreateForwardTableCache}
+\alias{CreateForwardTableCache}
+\title{Create cache for forward tables}
+\usage{
+CreateForwardTableCache(
+  pars,
+  size = 1,
+  from_recipient = 1,
+  to_recipient = Inf,
+  max.tables = 0
+)
+}
+\arguments{
+\item{pars}{a \code{kalisParameters} object, as returned by
+\code{Parameters}.}
+
+\item{size}{the maximum amount of RAM (in GB) to devote to this cache.}
+
+\item{from_recipient}{first recipient haplotype if creating a partial forward
+table cache.  By default includes from the first recipient haplotype.}
+
+\item{to_recipient}{last recipient haplotype if creating a partial forward
+table cache.  By default includes to the last recipient haplotype.}
+}
+\value{
+A list of forward tables representing a cache and ready to be filled is
+returned.
+}
+\description{
+Create an in-memory cache for forward tables to improve efficiency when
+iterating in reverse along the haplotype sequences.
+}
+\details{
+If the objective is to run the Li and Stephens hidden Markov model both
+forwards and backwards to the same locus (and to do so for every possible
+locus), then considerable efficiency can be achieved by first performing a
+full scan forwards, filling a geometrically spaced cache whilst doing so.
+Then, by working backwards, the backward propagation moves one locus at a
+time and the forward propagation can move backwards by moving forward from a
+recently cached local table.
+
+Memory for a cache can be allocated using this function and should then be
+filled with \code{\link{FillTableCache}}.
+To use the cache, then instead of using the \code{\link{Forward}} function,
+use \code{\link{ForwardUsingTableCache}}.
+}
+\examples{
+\dontrun{
+# This code assumes you have already:
+#  i) cached the haplotypes using CacheHaplotypes function
+#  ii) setup parameters in a variable called pars
+#  iii) set the number of loci in a variable called L
+
+# Allocate up to 10GB to a cache, with parameters already setup in pars ...
+cache <- CreateForwardTableCache(pars, 10)
+# ... and fill it
+FillTableCache(cache, pars, nthreads = 8)
+
+# Create forward and backward tables
+fwd <- MakeForwardTable(pars)
+bck <- MakeBackwardTable(pars)
+
+# Then reach every locus faster by iterating backwards, using the cache to
+# move the forward table into position faster
+for(l in L:1) {
+  Backward(bck, pars, l, nthreads = 8)
+  ForwardUsingTableCache(fwd, pars, cache, l, nthreads = 8)
+  # Do whatever work is required at
+  # every locus here using fwd and bck
+}
+}
+
+}
+\seealso{
+\code{\link{MakeForwardTable}} to make a forward table;
+\code{\link{FillTableCache}} to fill a cache;
+\code{\link{ForwardUsingTableCache}} to use a cache;
+\code{\link{Forward}} for forward function without using a cache.
+}
diff --git a/man/FillTableCache.Rd b/man/FillTableCache.Rd
new file mode 100644
index 0000000..b1fc2f8
--- /dev/null
+++ b/man/FillTableCache.Rd
@@ -0,0 +1,88 @@
+% Generated by roxygen2: do not edit by hand
+% Please edit documentation in R/TableCache.R
+\name{FillTableCache}
+\alias{FillTableCache}
+\title{Fill a forward table cache}
+\usage{
+FillTableCache(
+  cache,
+  pars,
+  nthreads = min(parallel::detectCores(logical = FALSE), cache[[1]]$to_recipient -
+    cache[[1]]$from_recipient + 1)
+)
+}
+\arguments{
+\item{cache}{a cache of forward tables as generated by
+\code{\link{CreateForwardTableCache}}}
+
+\item{pars}{a \code{kalisParameters} object, as returned by
+\code{Parameters}.}
+
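+\item{nthreads}{the number of CPU cores to use.
+By default, the smaller of the number of physical cores and the number of recipient haplotypes covered by the first table in the cache.}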
+
+\item{from}{the first locus which the geometrically spaced cache should be
+built from.
+By default the whole sequence length will be cached so this defaults to 1.}
+
+\item{to}{the last locus up to which the geometrically spaced cache should be
+built.
+By default the whole sequence length will be cached so this defaults to
+\code{Inf}.}
+}
+\value{
+There is nothing returned.
+For performance reasons, \code{cache} is updated in-place.
+}
+\description{
+An in-memory cache for forward tables can be filled using this function, for
+either the whole sequence length or some sub-sequence.
+}
+\details{
+If the objective is to run the Li and Stephens hidden Markov model both
+forwards and backwards to the same locus (and to do so for every possible
+locus), then considerable efficiency can be achieved by first performing a
+full scan forwards, filling a geometrically spaced cache whilst doing so.
+Then, by working backwards, the backward propagation moves one locus at a
+time and the forward propagation can move backwards by moving forward from a
+recently cached local table.
+
+Memory for a cache can be allocated using
+\code{\link{CreateForwardTableCache}} and should then be filled with this
+function.
+To use the cache, then instead of using the \code{\link{Forward}} function,
+use \code{\link{ForwardUsingTableCache}}.
+}
+\examples{
+\dontrun{
+# This code assumes you have already:
+#  i) cached the haplotypes using CacheHaplotypes function
+#  ii) setup parameters in a variable called pars
+#  iii) set the number of loci in a variable called L
+
+# Allocate up to 10GB to a cache, with parameters already setup in pars ...
+cache <- CreateForwardTableCache(pars, 10)
+# ... and fill it
+FillTableCache(cache, pars, nthreads = 8)
+
+# Create forward and backward tables
+fwd <- MakeForwardTable(pars)
+bck <- MakeBackwardTable(pars)
+
+# Then reach every locus faster by iterating backwards, using the cache to
+# move the forward table into position faster
+for(l in L:1) {
+  Backward(bck, pars, l, nthreads = 8)
+  ForwardUsingTableCache(fwd, pars, cache, l, nthreads = 8)
+  # Do whatever work is required at
+  # every locus here using fwd and bck
+}
+}
+
+}
+\seealso{
+\code{\link{MakeForwardTable}} to make a forward table;
+\code{\link{CreateForwardTableCache}} to generate a cache;
+\code{\link{ForwardUsingTableCache}} to use a cache;
+\code{\link{Forward}} for forward function without using a cache.
+}
diff --git a/man/ForwardIterator.Rd b/man/ForwardIterator.Rd
new file mode 100644
index 0000000..668137f
--- /dev/null
+++ b/man/ForwardIterator.Rd
@@ -0,0 +1,61 @@
+% Generated by roxygen2: do not edit by hand
+% Please edit documentation in R/Iterator.R
+\name{ForwardIterator}
+\alias{ForwardIterator}
+\title{Build an efficient iterator over loci}
+\usage{
+ForwardIterator(
+  pars,
+  ram.ckpts = 1L,
+  targets = 1:kalis:::pkgVars$L,
+  base.fwd.table = NULL,
+  disk.ckpts = 0,
+  disk.dir = NULL,
+  from_recipient = 1,
+  to_recipient = Inf,
+  lookup.tables = NULL,
+  cache = NULL,
+  save.cache = FALSE,
+  exact = TRUE,
+  force.unif = FALSE
+)
+}
+\arguments{
+\item{ram.ckpts}{an integer specifying the number of checkpoints to store in RAM}
+
+\item{targets}{a vector of loci to iterate over (starting with the most downstream target)}
+
+\item{base.fwd.table}{a \code{kalisForwardTable} either at the most upstream target, or if the targets are evenly spaced, one interval upstream of the most upstream target.
+NULL (the default) is interpreted as the prior \code{Pi}, see \code{\link{Parameters}}}
+
+\item{disk.ckpts}{an integer specifying the number of checkpoints to store on disk}
+
+\item{disk.dir}{a path to a directory where a temporary folder may be made to store checkpoints on disk}
+
+\item{force.unif}{a logical, if TRUE iterate over targets as if they were uniformly spaced. WARNING: DO NOT use this in conjunction with the targets method, still experimental. With force.unif = TRUE, the resulting iterator will appear to be targeting the first length(targets) variants with all methods, but in fact will be silently iterating over the original targets.}
+}
+\description{
+Create a \code{kalisForwardIterator} for propagating a forward table iteratively over target loci using a table cache and optimal checkpointing.
+}
+\details{
+See example.
+}
+\examples{
+\dontrun{
+data("SmallHaps")
+CacheHaplotypes(SmallHaps)
+pars <- Parameters()
+fwd <- MakeForwardTable(pars)
+bck <- MakeBackwardTable(pars)
+Iter <- ForwardIterator(2)
+for(t in targets(Iter)){
+  Iter(fwd,pars,t)
+  Backward(bck,pars,t)
+  print(paste("Mean Distance at locus",t,"is",mean(DistMat(fwd,bck))))
+}
+}
+
+}
+\seealso{
+\code{\link{MakeForwardTable}} to create a \code{kalisForwardTable}.
+}
diff --git a/man/ForwardUsingTableCache.Rd b/man/ForwardUsingTableCache.Rd
new file mode 100644
index 0000000..87b26e9
--- /dev/null
+++ b/man/ForwardUsingTableCache.Rd
@@ -0,0 +1,97 @@
+% Generated by roxygen2: do not edit by hand
+% Please edit documentation in R/TableCache.R
+\name{ForwardUsingTableCache}
+\alias{ForwardUsingTableCache}
+\title{Use a forward table cache to propagate}
+\usage{
+ForwardUsingTableCache(
+  fwd,
+  pars,
+  cache,
+  t = fwd$l - 1,
+  nthreads = min(parallel::detectCores(logical = FALSE), fwd$to_recipient -
+    fwd$from_recipient + 1)
+)
+}
+\arguments{
+\item{fwd}{a \code{kalisForwardTable} object, as returned by
+\code{\link{MakeForwardTable}}.}
+
+\item{pars}{a \code{kalisParameters} object, as returned by
+\code{Parameters}.}
+
+\item{cache}{a cache of forward tables as generated by
+\code{\link{CreateForwardTableCache}} and filled using
+\code{\link{FillTableCache}}.}
+
+\item{t}{a locus position to move the forward table to, starting the forward
+propagation from whatever table in the \code{cache} variable is immediately
+before locus \code{t}.
+By default, it simply advances to the previous locus (which is the natural
+direction to move when using the cache).}
+
+\item{nthreads}{the number of CPU cores to use.
+By default, the smaller of the number of physical cores detected and the number of recipients covered by \code{fwd} is used.}
+}
+\value{
+There is nothing returned.
+For performance reasons, \code{fwd} is updated in-place.
+}
+\description{
+An in-memory cache for forward tables, which has already been filled, can be
+used to move more quickly to a specified locus.
+}
+\details{
+If the objective is to run the Li and Stephens hidden Markov model both
+forwards and backwards to the same locus (and to do so for every possible
+locus), then considerable efficiency can be achieved by first performing a
+full scan forwards, filling a geometrically spaced cache whilst doing so.
+Then, by working backwards, the backward propagation moves one locus at a
+time and the forward propagation can move backwards by moving forward from a
+recently cached local table.
+
+Memory for a cache can be allocated using
+\code{\link{CreateForwardTableCache}} and should then be filled with
+\code{\link{FillTableCache}}.
+To use the cache, then instead of using the \code{\link{Forward}} function,
+use this function.
+
+Note that the \code{cache} which is passed to this function will be
+dynamically updated based on the locus requested: the assumption is that
+the cache is used to propagate in reverse so any cache entries for a locus
+position past \code{t} are taken to be no longer needed and that space will
+be redeployed to more densely fill the cache with earlier locus positions.
+}
+\examples{
+\dontrun{
+# This code assumes you have already:
+#  i) cached the haplotypes using CacheHaplotypes function
+#  ii) setup parameters in a variable called pars
+#  iii) set the number of loci in a variable called L
+
+# Allocate up to 10GB to a cache, with parameters already setup in pars ...
+cache <- CreateForwardTableCache(pars, 10)
+# ... and fill it
+FillTableCache(cache, pars, nthreads = 8)
+
+# Create forward and backward tables
+fwd <- MakeForwardTable(pars)
+bck <- MakeBackwardTable(pars)
+
+# Then reach every locus faster by iterating backwards, using the cache to
+# move the forward table into position faster
+for(l in L:1) {
+  Backward(bck, pars, l, nthreads = 8)
+  ForwardUsingTableCache(fwd, pars, cache, l, nthreads = 8)
+  # Do whatever work is required at
+  # every locus here using fwd and bck
+}
+}
+
+}
+\seealso{
+\code{\link{MakeForwardTable}} to make a forward table;
+\code{\link{CreateForwardTableCache}} to generate a cache;
+\code{\link{FillTableCache}} to fill a cache;
+\code{\link{Forward}} for forward function without using a cache.
+}
diff --git a/man/Neighbors.Rd b/man/Neighbors.Rd
new file mode 100644
index 0000000..3aac88f
--- /dev/null
+++ b/man/Neighbors.Rd
@@ -0,0 +1,21 @@
+% Generated by roxygen2: do not edit by hand
+% Please edit documentation in R/Clades.R
+\name{Neighbors}
+\alias{Neighbors}
+\title{Neighbors}
+\usage{
+Neighbors(x, use.forking = FALSE, nthreads = 1L)
+}
+\arguments{
+\item{x}{a \code{kalisClades} object returned by \code{\link{kalisClades}}}
+
+\item{use.forking}{a logical, should forked processes be used?}
+
+\item{nthreads}{the number of CPU cores to use. Currently, no parallelism is used.}
+}
+\value{
+a \code{kalisNeighbors} encoding the nearest neighbors for each recipient haplotype
+}
+\description{
+Utility for calling tied nearest neighbors for each recipient haplotype
+}
diff --git a/man/PruneCladeMat.Rd b/man/PruneCladeMat.Rd
new file mode 100644
index 0000000..2cd1b48
--- /dev/null
+++ b/man/PruneCladeMat.Rd
@@ -0,0 +1,11 @@
+% Generated by roxygen2: do not edit by hand
+% Please edit documentation in R/Clades.R
+\name{PruneCladeMat}
+\alias{PruneCladeMat}
+\title{PruneCladeMat}
+\usage{
+PruneCladeMat(M, neigh, sprigs, prune = "singleton.info", from.recipient = 1L)
+}
+\description{
+PruneCladeMat
+}
diff --git a/man/Sprigs.Rd b/man/Sprigs.Rd
new file mode 100644
index 0000000..c7afd3b
--- /dev/null
+++ b/man/Sprigs.Rd
@@ -0,0 +1,11 @@
+% Generated by roxygen2: do not edit by hand
+% Please edit documentation in R/Clades.R
+\name{Sprigs}
+\alias{Sprigs}
+\title{Sprigs}
+\usage{
+Sprigs(x, old.sprigs = FALSE)
+}
+\description{
+Sprigs
+}
diff --git a/man/Sprigs_old.Rd b/man/Sprigs_old.Rd
new file mode 100644
index 0000000..d8dc6f0
--- /dev/null
+++ b/man/Sprigs_old.Rd
@@ -0,0 +1,21 @@
+% Generated by roxygen2: do not edit by hand
+% Please edit documentation in R/Clades.R
+\name{Sprigs_old}
+\alias{Sprigs_old}
+\title{Sprigs}
+\usage{
+Sprigs_old(x, use.forking = FALSE, nthreads = 1L, add.self = TRUE)
+}
+\arguments{
+\item{x}{a \code{kalisNeighbors} object returned by \code{\link{kalisNeighbors}}, a \code{kalisClades} object returned by \code{\link{kalisClades}} with \code{neighbors = TRUE}, or a list}
+
+\item{use.forking}{a logical, should forked processes be used?}
+
+\item{nthreads}{the number of CPU cores to use. Currently, no parallelism is used.}
+}
+\value{
+a \code{kalisSprigs} object assigning each haplotype to a sprig
+}
+\description{
+Utility for calling sprigs from probabilistic clades
+}

From 9749c4b52fa06d4a12b0e6115aa2d748bfffd239 Mon Sep 17 00:00:00 2001
From: ryanchrist <ryan.christ7@gmail.com>
Date: Mon, 23 Sep 2024 13:30:36 -0500
Subject: [PATCH 13/43] reintroducing inputting haplotypes to kalis vignette

---
 vignettes/Reading_Haplotype_Data.Rmd | 52 ++++++++++++++++++++++++++++
 1 file changed, 52 insertions(+)
 create mode 100644 vignettes/Reading_Haplotype_Data.Rmd

diff --git a/vignettes/Reading_Haplotype_Data.Rmd b/vignettes/Reading_Haplotype_Data.Rmd
new file mode 100644
index 0000000..bfbdc7a
--- /dev/null
+++ b/vignettes/Reading_Haplotype_Data.Rmd
@@ -0,0 +1,52 @@
+---
+title: "Reading Haplotype Data"
+author: "Louis Aslett & Ryan Christ"
+date: "`r Sys.Date()`"
+output: rmarkdown::html_vignette
+vignette: >
+  %\VignetteIndexEntry{Reading Haplotype Data}
+  %\VignetteEngine{knitr::rmarkdown}
+  %\VignetteEncoding{UTF-8}
+---
+
+```{r setup, include = FALSE}
+knitr::opts_chunk$set(
+collapse = TRUE,
+comment = "#>"
+)
+```
+
+`kalis` calculates pairwise genetic distances at loci of interest for a set of phased haplotypes stored in a `L x N` matrix `H` where `H[l,i] = 1` if haplotype `i` carries the alternative allele at locus `l` and `H[l,i] = 0` if it carries the reference allele.  For efficiency `kalis` internally must load and store `H` as a matrix of bits.
+
+*For all of the data input types below, it is assumed that the haplotypes have already been phased, as required to run `kalis`.*
+
+# Reading from BCF/VCF
+
+To read phased haplotypes stored in a compressed or uncompressed BCF or VCF, the file must first be converted to HAP/SAMPLE/LEGEND format.  For example, for a given compressed VCF, we simply call `bcftools` as follows.
+
+```{r, engine = 'bash', eval = FALSE}
+bcftools convert -h my.vcf.gz
+```
+
+Then, from `R`, we read in the haplotypes by calling
+
+```{r load.data, results = "hide", message=FALSE, eval=FALSE}
+require(kalis)
+CacheHaplotypes("my.hap.gz")
+```
+
+See <http://samtools.github.io/bcftools/bcftools.html#convert> for more details.
+
+For increased reading efficiency `CacheHaplotypes` will look for the `my.legend` file that was produced by `bcftools` in the same directory as `my.hap.gz` so it's worthwhile keeping the `.legend` files. 
+
+`bcftools` can read from many different formats into BCF/VCF, making it an easy tool for conversion into HAP/SAMPLE/LEGEND format.  
+
+
+`kalis`  <http://hgdownload.cse.ucsc.edu/gbdb/hg19/1000Genomes/phase3/>
+
+ALL.chr21.phase3_shapeit2_mvncall_integrated_v5a.20130502.genotypes.hap.gz
+
+
+
+
+

From 2fbd289f39907bf6cd194610ca48f5db7d6b90e9 Mon Sep 17 00:00:00 2001
From: ryanchrist <ryan.christ7@gmail.com>
Date: Mon, 23 Sep 2024 13:35:24 -0500
Subject: [PATCH 14/43] iterating ready to go!

---
 vignettes/Iterating_Over_Loci.Rmd | 51 +++++++++++++++----------------
 1 file changed, 25 insertions(+), 26 deletions(-)

diff --git a/vignettes/Iterating_Over_Loci.Rmd b/vignettes/Iterating_Over_Loci.Rmd
index 657c4ae..f8dafe2 100644
--- a/vignettes/Iterating_Over_Loci.Rmd
+++ b/vignettes/Iterating_Over_Loci.Rmd
@@ -20,30 +20,29 @@ Here show how to use \pkg{kalis} to efficiently iterate over loci sequentially.
 
 ```{r, results='hide'}
 require(kalis)
-# 
-# total.nthreads <- 4
-# n.checkpoints <- 7
-# 
-# nthreads <- as.integer(0:(total.nthreads-1))
-# CacheHaplotypes(SmallHaps)
-# 
-# m <- rbeta(L()-1,1,10)*1e-6
-# pars <- Parameters(CalcRho(cM = m, s = 1, gamma = 1), mu = 1e-8, use.speidel = TRUE)
-# 
-# fwd <- MakeForwardTable(pars)
-# bck <- MakeBackwardTable(pars)
-# M <- matrix(0,N(),N())
-# 
-# Iter <- ForwardIterator(pars,n.checkpoints)
-# 
-# start.time <- proc.time()
-# 
-# for(t in L():1){
-#   Iter(fwd,pars,t,nthreads = nthreads)
-#   Backward(bck,pars,t, nthreads = nthreads)
-#   # Optional: DistMat(fwd,bck,M,type="minus.min", nthreads = total.nthreads)
-#   print(paste("At locus",t))
-# }
-# 
-# print(proc.time() - start.time)
+
+n.checkpoints <- 7
+
+nthreads <- 4
+CacheHaplotypes(SmallHaps)
+
+m <- rbeta(L()-1,1,10)*1e-6
+pars <- Parameters(CalcRho(cM = m, s = 1, gamma = 1), mu = 1e-8, use.speidel = TRUE)
+
+fwd <- MakeForwardTable(pars)
+bck <- MakeBackwardTable(pars)
+M <- matrix(0,N(),N())
+
+Iter <- ForwardIterator(pars,n.checkpoints)
+
+start.time <- proc.time()
+
+for(t in L():1){
+  Iter(fwd,pars,t,nthreads = nthreads)
+  Backward(bck,pars,t, nthreads = nthreads)
+  if(t==200){plot(DistMat(fwd,bck,M,type="minus.min", nthreads = nthreads))}
+  print(paste("At locus",t))
+}
+
+print(proc.time() - start.time)
 ```
\ No newline at end of file

From 1338a48f236658948b49b4ab2f424e5e335dbf16 Mon Sep 17 00:00:00 2001
From: Louis Aslett <louis.aslett@durham.ac.uk>
Date: Wed, 25 Sep 2024 17:21:48 +0100
Subject: [PATCH 15/43] Fixes for CHECK error:
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

W  checking dependencies in R code (488ms)
   '::' or ':::' import not declared from: ‘data.table’
   Namespaces in Imports field not imported from:
     ‘methods’ ‘prettyunits’
     All declared Imports should be used.
   There are ::: calls to the package's namespace in its code. A package
     almost never needs to use ::: for its own objects:
     ‘ResetTable’ ‘pkgVars’
---
 DESCRIPTION            |  4 ++--
 NAMESPACE              |  2 ++
 R/CacheSummary.R       |  1 +
 R/Clades.R             |  1 +
 R/Iterator.R           | 10 +++++-----
 man/ForwardIterator.Rd |  2 +-
 6 files changed, 12 insertions(+), 8 deletions(-)

diff --git a/DESCRIPTION b/DESCRIPTION
index 3a696fd..f4c25b9 100644
--- a/DESCRIPTION
+++ b/DESCRIPTION
@@ -25,7 +25,6 @@ LazyData: TRUE
 Depends: R (>= 3.5.0)
 Imports:
     utils,
-    methods,
     stats,
     parallel,
     dplyr,
@@ -36,7 +35,8 @@ Imports:
     grDevices,
     RColorBrewer,
     lobstr,
-    prettyunits
+    prettyunits,
+    data.table
 RoxygenNote: 7.3.2
 Roxygen: list(markdown = TRUE)
 Suggests: 
diff --git a/NAMESPACE b/NAMESPACE
index 2dcd5a3..41c51cd 100644
--- a/NAMESPACE
+++ b/NAMESPACE
@@ -41,8 +41,10 @@ export(WriteHaplotypes)
 export(calc_tables)
 import(checkmate)
 import(dplyr)
+importFrom(data.table,frank)
 importFrom(digest,digest)
 importFrom(glue,glue)
 importFrom(glue,glue_collapse)
+importFrom(prettyunits,pretty_bytes)
 importFrom(rlang,duplicate)
 useDynLib(kalis, .registration = TRUE, .fixes = "CCall_")
diff --git a/R/CacheSummary.R b/R/CacheSummary.R
index b89510a..396f4f9 100644
--- a/R/CacheSummary.R
+++ b/R/CacheSummary.R
@@ -24,6 +24,7 @@
 #' N()
 #' L()
 #'
+#' @importFrom prettyunits pretty_bytes
 #' @export
 CacheSummary <- function() {
   N <- get("N", envir = pkgVars)
diff --git a/R/Clades.R b/R/Clades.R
index 398c49a..f46b8d5 100644
--- a/R/Clades.R
+++ b/R/Clades.R
@@ -211,6 +211,7 @@ PruneCladeMat <- function(M, neigh, sprigs, prune = "singleton.info", from.recip
 #' @return
 #'   a \code{kalisClades} object encoding probabilistic clade calls
 #'
+#' @importFrom data.table frank
 #' @export Clades
 Clades <- function(fwd, bck, pars, beta.theta.opts = NULL,
                    safety.checks = FALSE, neighbors = FALSE,
diff --git a/R/Iterator.R b/R/Iterator.R
index 51cb1d7..06f0e10 100644
--- a/R/Iterator.R
+++ b/R/Iterator.R
@@ -32,7 +32,7 @@
 #' @export
 ForwardIterator <- function(pars,
                             ram.ckpts = 1L,
-                            targets = 1:kalis:::pkgVars$L,
+                            targets = 1:L(),
                             base.fwd.table = NULL,
                             disk.ckpts = 0,
                             disk.dir = NULL,
@@ -57,7 +57,7 @@ ForwardIterator <- function(pars,
   if(!is.null(cache)){
     for(i in 1:length(cache)){
       if(cache[[i]]$from_recipient!=from_recipient){stop("The provided cache must have the same from_recipient as currently requested.")}
-      if(cache[[i]]$to_recipient!=min(to_recipient,kalis:::pkgVars$N)){stop("The provided cache must have the same to_recipient as currently requested.")}
+      if(cache[[i]]$to_recipient!=min(to_recipient,N())){stop("The provided cache must have the same to_recipient as currently requested.")}
     }
   }
 
@@ -202,7 +202,7 @@ ForwardIterator <- function(pars,
           warning("The provided cache was initialized with parameters that are different from those currently in pars.  Overwritting the pars in the provided cache...")
           cache[[i]]$pars.sha256 <- pars$sha256
         }
-        kalis:::ResetTable(cache[[i]])
+        ResetTable(cache[[i]])
       }
     }
 
@@ -243,7 +243,7 @@ ForwardIterator <- function(pars,
       CopyTable(to = fwd, from = cache[[current.sch$k]])
     }else{
       if(use.pi){
-        kalis:::ResetTable(fwd)
+        ResetTable(fwd)
       }else{
         CopyTable(to = fwd, from = base.fwd.table)
       }
@@ -428,7 +428,7 @@ MakeUpdateCache <- function(sch, use.pi, cost.list = NULL, targets.idx = NULL){
         }else{
           if(track.cost){ cost <<- cost + transfer.cost(kk,0) }
           if(use.pi){
-            kalis:::ResetTable(cache[[kk]]) # Pi could also be the baseline table here for the entire interval
+            ResetTable(cache[[kk]]) # Pi could also be the baseline table here for the entire interval
           }else{
             CopyTable(to = cache[[kk]],base.fwd.table)
           }
diff --git a/man/ForwardIterator.Rd b/man/ForwardIterator.Rd
index 668137f..2954e86 100644
--- a/man/ForwardIterator.Rd
+++ b/man/ForwardIterator.Rd
@@ -7,7 +7,7 @@
 ForwardIterator(
   pars,
   ram.ckpts = 1L,
-  targets = 1:kalis:::pkgVars$L,
+  targets = 1:L(),
   base.fwd.table = NULL,
   disk.ckpts = 0,
   disk.dir = NULL,

From 31c64cc5c4db26726236bc0709eb194caa7d7c12 Mon Sep 17 00:00:00 2001
From: Louis Aslett <louis.aslett@durham.ac.uk>
Date: Wed, 25 Sep 2024 17:31:04 +0100
Subject: [PATCH 16/43] Fixes for CHECK errors:
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

W  checking S3 generic/method consistency ...
   targets:
     function(x)
   targets.kalisIterator:
     function(iter)

   print:
     function(x, ...)
   print.kalisIterator:
     function(iter)

   plot:
     function(x, ...)
   plot.kalisIterator:
     function(iter)
   See section ‘Generic functions and methods’ in the ‘Writing R
   Extensions’ manual.
---
 R/Iterator.R | 30 +++++++++++++++---------------
 1 file changed, 15 insertions(+), 15 deletions(-)

diff --git a/R/Iterator.R b/R/Iterator.R
index 06f0e10..4e48635 100644
--- a/R/Iterator.R
+++ b/R/Iterator.R
@@ -275,9 +275,9 @@ targets <- function(x) { # put this declaration above and below because it seems
 }
 
 #' @export
-targets.kalisIterator <- function(iter){
-  if(!"kalisIterator"%in%class(iter)){stop("argument must be a kalisIterator")}
-  rev(get("targets", envir = environment(iter)))
+targets.kalisIterator <- function(x){
+  if(!"kalisIterator"%in%class(x)){stop("argument must be a kalisIterator")}
+  rev(get("targets", envir = environment(x)))
 }
 
 targets <- function(x) {
@@ -285,26 +285,26 @@ targets <- function(x) {
 }
 
 #' @export
-print.kalisIterator <- function(iter){
-  if(!"kalisIterator"%in%class(iter)){stop("argument must be a kalisIterator")}
+print.kalisIterator <- function(x, ...){
+  if(!"kalisIterator"%in%class(x)){stop("argument must be a kalisIterator")}
 
-  if(get("current.target.index", envir=environment(iter)) == 0){
+  if(get("current.target.index", envir=environment(x)) == 0){
     "This is an exhausted kalisIterator."
   }else{
-    target.range <- range(get("targets", envir = environment(iter)))
-    message(paste("A kalisIterator for",length(get("targets", envir = environment(iter))),"targets ranging from",target.range[1],"to",target.range[2]),appendLF = TRUE)
-    message(paste("Contains",get("max.tables", envir = environment(iter)),"checkpoints using ~",utils::object.size(get("cache", envir = environment(iter)))/1e9,"Gb of RAM"),appendLF = TRUE)
-    message(paste("Next target locus:",get("targets", envir = environment(iter))[get("current.target.index", envir = environment(iter))]),appendLF = TRUE)
+    target.range <- range(get("targets", envir = environment(x)))
+    message(paste("A kalisIterator for",length(get("targets", envir = environment(x))),"targets ranging from",target.range[1],"to",target.range[2]),appendLF = TRUE)
+    message(paste("Contains",get("max.tables", envir = environment(x)),"checkpoints using ~",utils::object.size(get("cache", envir = environment(x)))/1e9,"Gb of RAM"),appendLF = TRUE)
+    message(paste("Next target locus:",get("targets", envir = environment(x))[get("current.target.index", envir = environment(x))]),appendLF = TRUE)
     message("",appendLF = TRUE)
   }
 }
 
 #' @export
-plot.kalisIterator <- function(iter){
-  if(!"kalisIterator"%in%class(iter)){stop("argument must be a kalisIterator")}
-  sch <- get("sch",envir = environment(iter))
-  loci <- get("targets",envir = environment(iter))
-  plot(sch$i[-c(1,nrow(sch))],sch$k[-c(1,nrow(sch))],type="h",lwd=1,bty="n",ylab="K",xlab="locus",las=1,ylim=c(0,max(sch$k)),xlim=range(loci),xaxt="n",yaxt="n")
+plot.kalisIterator <- function(x, ...){
+  if(!"kalisIterator"%in%class(x)){stop("argument must be a kalisIterator")}
+  sch <- get("sch",envir = environment(x))
+  loci <- get("targets",envir = environment(x))
+  plot(sch$i[-c(1,nrow(sch))],sch$k[-c(1,nrow(sch))],type="h",lwd=1,bty="n",ylab="K",xlab="locus",las=1,ylim=c(0,max(sch$k)),xlim=range(loci),xaxt="n",yaxt="n", ...)
   p.loci <- pretty(loci)
   axis(1,at = p.loci ,pos=0)
   axis(2,at = pretty(0:max(sch$k)),pos=p.loci[1],las=2)

From 718f617d61c73016d5eca7e7ab78d477d588c194 Mon Sep 17 00:00:00 2001
From: Louis Aslett <louis.aslett@durham.ac.uk>
Date: Wed, 25 Sep 2024 17:46:39 +0100
Subject: [PATCH 17/43] Partial fix for CHECK errors:
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

N  checking R code for possible problems (3.8s)
   DistMat.GM: no visible binding for global variable ‘sd’
   MakeSolveSchedule : <anonymous>: no visible binding for global variable
     ‘sequential’
   MakeSolveSchedule : <anonymous>: no visible binding for '<<-'
     assignment to ‘first.index’
   MakeSolveSchedule : <anonymous>: no visible binding for global variable
     ‘first.index’
   MakeSolveSchedule : <anonymous>: no visible binding for '<<-'
     assignment to ‘last.index’
   MakeSolveSchedule : <anonymous>: no visible binding for global variable
     ‘last.index’
   MakeSolveSchedule : <anonymous>: no visible global function definition
     for ‘SolveSchedule’
   MakeSolveSchedule : <anonymous>: no visible global function definition
     for ‘optimize’
   MakeSolveSchedule : <anonymous>: no visible global function definition
     for ‘tail’
   MakeUpdateCache : <anonymous>: no visible binding for global variable
     ‘d’
   UpdateMatrixInPlace: no visible global function definition for
     ‘getFromNamespace’
   obj_func_for_SolveSchedule: no visible binding for '<<-' assignment to
     ‘sch.k’
   obj_func_for_SolveSchedule: no visible binding for global variable
     ‘sch.k’
   obj_func_for_SolveSchedule: no visible binding for global variable
     ‘nrow.sch’
   obj_func_for_SolveSchedule: no visible binding for '<<-' assignment to
     ‘sch.i’
   obj_func_for_SolveSchedule: no visible binding for global variable
     ‘sch.i’
   obj_func_for_SolveSchedule: no visible global function definition for
     ‘SolveSchedule’
   plot.kalisIterator: no visible global function definition for ‘axis’
   Undefined global functions or variables:
     SolveSchedule axis d first.index getFromNamespace last.index nrow.sch
     optimize sch.i sch.k sd sequential tail
   Consider adding
     importFrom("graphics", "axis")
     importFrom("stats", "optimize", "sd")
     importFrom("utils", "getFromNamespace", "tail")
   to your NAMESPACE file.
---
 NAMESPACE      | 5 +++++
 R/Clades.R     | 2 +-
 R/Iterator.R   | 3 +++
 R/Parameters.R | 1 +
 R/kalis.R      | 1 +
 5 files changed, 11 insertions(+), 1 deletion(-)

diff --git a/NAMESPACE b/NAMESPACE
index 41c51cd..3d211fa 100644
--- a/NAMESPACE
+++ b/NAMESPACE
@@ -45,6 +45,11 @@ importFrom(data.table,frank)
 importFrom(digest,digest)
 importFrom(glue,glue)
 importFrom(glue,glue_collapse)
+importFrom(graphics,axis)
 importFrom(prettyunits,pretty_bytes)
 importFrom(rlang,duplicate)
+importFrom(stats,optimize)
+importFrom(stats,sd)
+importFrom(utils,getFromNamespace)
+importFrom(utils,tail)
 useDynLib(kalis, .registration = TRUE, .fixes = "CCall_")
diff --git a/R/Clades.R b/R/Clades.R
index f46b8d5..122f529 100644
--- a/R/Clades.R
+++ b/R/Clades.R
@@ -108,7 +108,7 @@ Sprigs <- function(x, old.sprigs = FALSE){
 }
 
 
-
+#' @importFrom utils getFromNamespace
 UpdateMatrixInPlace <- function(M,row.idx,col.idx,x){
   invisible(.Call(getFromNamespace("CCall_UpdateRealInPlace","kalis"),M,
                   as.integer(row.idx + (col.idx-1L)*nrow(M)),x))
diff --git a/R/Iterator.R b/R/Iterator.R
index 4e48635..4272942 100644
--- a/R/Iterator.R
+++ b/R/Iterator.R
@@ -299,6 +299,7 @@ print.kalisIterator <- function(x, ...){
   }
 }
 
+#' @importFrom graphics axis
 #' @export
 plot.kalisIterator <- function(x, ...){
   if(!"kalisIterator"%in%class(x)){stop("argument must be a kalisIterator")}
@@ -559,6 +560,8 @@ obj_func_for_SolveSchedule <- function(i,ins,d,indicies,num.available.ckpts){
 }
 
 
+#' @importFrom stats optimize
+#' @importFrom utils tail
 MakeSolveSchedule <- function(exact = TRUE){
 
   sch.k <- 0L
diff --git a/R/Parameters.R b/R/Parameters.R
index bf40ca1..846ef91 100644
--- a/R/Parameters.R
+++ b/R/Parameters.R
@@ -238,6 +238,7 @@ Parameters <- function(rho = rep(0, get("L", envir = pkgVars)-1),
   res
 }
 
+#' @importFrom utils tail
 #' @export
 print.kalisParameters <- function(x, ...) {
   if(is.matrix(x$pars$Pi)) {
diff --git a/R/kalis.R b/R/kalis.R
index e3f75a2..49c9c74 100644
--- a/R/kalis.R
+++ b/R/kalis.R
@@ -3,6 +3,7 @@
 #' @importFrom glue glue glue_collapse
 #' @importFrom rlang duplicate
 #' @importFrom digest digest
+#' @importFrom stats sd
 #'
 #' @useDynLib kalis, .registration = TRUE, .fixes = "CCall_"
 NULL

From 2b0341b4e97bbf50aae521a7cc953488d6aaaad8 Mon Sep 17 00:00:00 2001
From: Louis Aslett <louis.aslett@durham.ac.uk>
Date: Wed, 25 Sep 2024 17:51:49 +0100
Subject: [PATCH 18/43] Fix N  checking Rd line widths ...    Rd file
 'WriteHaplotypes.Rd':      \examples lines wider than 100 characters:        
 # ... write them to a file, giving alphabetic letters "A" through "T" as the
 #' # haplotype names ...

   These lines will be truncated in the PDF manual.
---
 R/IndividualSequenceIO_H5.R | 3 ++-
 man/WriteHaplotypes.Rd      | 3 ++-
 2 files changed, 4 insertions(+), 2 deletions(-)

diff --git a/R/IndividualSequenceIO_H5.R b/R/IndividualSequenceIO_H5.R
index 0fea53f..ac3f74c 100644
--- a/R/IndividualSequenceIO_H5.R
+++ b/R/IndividualSequenceIO_H5.R
@@ -38,7 +38,8 @@
 #' haps <- matrix(sample(0:1, n.haps*n.vars, replace = TRUE),
 #'                nrow = n.vars, ncol = n.haps)
 #'
-#' # ... write them to a file, giving alphabetic letters "A" through "T" as the #' # haplotype names ...
+#' # ... write them to a file, giving alphabetic letters "A" through "T" as the
+#' # haplotype names ...
 #' WriteHaplotypes("~/myhaps.h5", haps, hap.ids = LETTERS[1:20])
 #'
 #' # ... and confirm we can read a chosen portion back.  Try to read back
diff --git a/man/WriteHaplotypes.Rd b/man/WriteHaplotypes.Rd
index b6f4fb6..5d2d0fe 100644
--- a/man/WriteHaplotypes.Rd
+++ b/man/WriteHaplotypes.Rd
@@ -78,7 +78,8 @@ n.vars <- 200
 haps <- matrix(sample(0:1, n.haps*n.vars, replace = TRUE),
                nrow = n.vars, ncol = n.haps)
 
-# ... write them to a file, giving alphabetic letters "A" through "T" as the #' # haplotype names ...
+# ... write them to a file, giving alphabetic letters "A" through "T" as the
+# haplotype names ...
 WriteHaplotypes("~/myhaps.h5", haps, hap.ids = LETTERS[1:20])
 
 # ... and confirm we can read a chosen portion back.  Try to read back

From 5d325b5d484cdc672ed2bb8bc44c70bee0fe6e85 Mon Sep 17 00:00:00 2001
From: Louis Aslett <louis.aslett@durham.ac.uk>
Date: Wed, 25 Sep 2024 18:18:31 +0100
Subject: [PATCH 19/43] =?UTF-8?q?Change=20to=20markdown=20\code=20and=20\l?=
 =?UTF-8?q?ink's=20and=20also=20fix=20W=20=20checking=20Rd=20cross-referen?=
 =?UTF-8?q?ces=20...=20=20=20=20Missing=20link=20or=20links=20in=20Rd=20fi?=
 =?UTF-8?q?le=20'CladeMat=5Fold.Rd':=20=20=20=20=20=20=E2=80=98kalisClades?=
 =?UTF-8?q?=E2=80=99=20=E2=80=98kalisSprigs=E2=80=99?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

   Missing link or links in Rd file 'Neighbors.Rd':
     ‘kalisClades’

   Missing link or links in Rd file 'Sprigs_old.Rd':
     ‘kalisNeighbors’ ‘kalisClades’

   See section 'Cross-references' in the 'Writing R Extensions' manual.
---
 R/Clades.R          | 29 ++++++++++++++---------------
 man/CladeMat_old.Rd |  6 +++---
 man/Clades.Rd       | 13 ++++++-------
 man/Neighbors.Rd    |  2 +-
 man/Sprigs_old.Rd   |  2 +-
 5 files changed, 25 insertions(+), 27 deletions(-)

diff --git a/R/Clades.R b/R/Clades.R
index 122f529..0a29988 100644
--- a/R/Clades.R
+++ b/R/Clades.R
@@ -199,17 +199,16 @@ PruneCladeMat <- function(M, neigh, sprigs, prune = "singleton.info", from.recip
 #' Probabilistic Clades
 #'
 #' Utility for calling probabilistic clades at, in between, or excluding variants.
-#' @param fwd a forward table as returned by \code{\link{MakeForwardTable}}
-#' @param bck a backward table as returned by \code{\link{MakeBackwardTable}}
-#' @param pars a \code{kalisParameters} object, as returned by
-#'   \code{\link{Parameters}}.
-#' @param beta.theta.opts a list; see Details for \code{\link{DistMat}}.
-#' @param safety.checks a logical, should safety checks be applied to the distances?  See \code{\link{DistMat}}.
-#' @param neighbors a logical, should nearest neighbors be pre-calculated?  See \code{\link{Neighbors}}.
+#' @param fwd a forward table as returned by [MakeForwardTable()]
+#' @param bck a backward table as returned by [MakeBackwardTable()]
+#' @param pars a `kalisParameters` object, as returned by [Parameters()].
+#' @param beta.theta.opts a list; see Details for [DistMat()].
+#' @param safety.checks a logical, should safety checks be applied to the distances?  See [DistMat()].
+#' @param neighbors a logical, should nearest neighbors be pre-calculated?  See [Neighbors()].
 #' @param use.forking a logical, should forked processes be used?
 #' @param nthreads the number of CPU cores to use. Currently, no parallelism is used.
 #' @return
-#'   a \code{kalisClades} object encoding probabilistic clade calls
+#'   a `kalisClades` object encoding probabilistic clade calls
 #'
 #' @importFrom data.table frank
 #' @export Clades
@@ -295,11 +294,11 @@ Clades <- function(fwd, bck, pars, beta.theta.opts = NULL,
 #' Neighbors
 #'
 #' Utility for calling tied nearest neighbors for each recipient haplotype
-#' @param x a \code{kalisClades} object returned by \code{\link{kalisClades}}
+#' @param x a `kalisClades` object returned by [Clades()]
 #' @param use.forking a logical, should forked processes be used?
 #' @param nthreads the number of CPU cores to use. Currently, no parallelism is used.
 #' @return
-#'   a \code{kalisNeighbors} encoding the nearest neighbors for each recipient haplotype
+#'   a `kalisNeighbors` encoding the nearest neighbors for each recipient haplotype
 #'
 #' @export Neighbors
 Neighbors <- function(x,
@@ -346,11 +345,11 @@ Neighbors <- function(x,
 #' Sprigs
 #'
 #' Utility for calling sprigs from probabilistic clades
-#' @param x a \code{kalisNeighbors} object returned by \code{\link{kalisNeighbors}}, a \code{kalisClades} object returned by \code{\link{kalisClades}} with \code{neighbors = TRUE}, or a list
+#' @param x a `kalisNeighbors` object returned by [Neighbors()], a `kalisClades` object returned by [Clades()] with `neighbors = TRUE`, or a list
 #' @param use.forking a logical, should forked processes be used?
 #' @param nthreads the number of CPU cores to use. Currently, no parallelism is used.
 #' @return
-#'   a \code{kalisSprigs} object assigning each haplotype to a sprig
+#'   a `kalisSprigs` object assigning each haplotype to a sprig
 #'
 #' @export Sprigs_old
 Sprigs_old <- function(x, use.forking = FALSE, nthreads = 1L, add.self = TRUE){
@@ -446,10 +445,10 @@ Sprigs_old <- function(x, use.forking = FALSE, nthreads = 1L, add.self = TRUE){
 #' CladeMat OLD
 #'
 #' Utility for contructing a probabilistic clade matrix
-#' @param x a \code{kalisClades} object returned by \code{\link{kalisClades}}
+#' @param x a `kalisClades` object returned by [Clades()]
 #' @param ploidy an integer, the ploidy of the organism
-#' @param sprigs.to.prune a \code{kalisSprigs} object returned by \code{\link{kalisSprigs}} encoding sprigs that should be excluded from the matrix returned
-#' @param assemble a logical, if FALSE return the clade matrix as a list of columns rather than as a symmetrized matrix
+#' @param sprigs.to.prune a `kalisSprigs` object returned by [Sprigs()] encoding sprigs that should be excluded from the matrix returned
+#' @param assemble a logical, if `FALSE` return the clade matrix as a list of columns rather than as a symmetrized matrix
 #' @param use.forking a logical, should forked processes be used?
 #' @param nthreads the number of CPU cores to use. Currently, no parallelism is used.
 #' @return
diff --git a/man/CladeMat_old.Rd b/man/CladeMat_old.Rd
index aebb53c..7695578 100644
--- a/man/CladeMat_old.Rd
+++ b/man/CladeMat_old.Rd
@@ -16,13 +16,13 @@ CladeMat_old(
 )
 }
 \arguments{
-\item{x}{a \code{kalisClades} object returned by \code{\link{kalisClades}}}
+\item{x}{a \code{kalisClades} object returned by \code{\link[=Clades]{Clades()}}}
 
 \item{ploidy}{an integer, the ploidy of the organism}
 
-\item{sprigs.to.prune}{a \code{kalisSprigs} object returned by \code{\link{kalisSprigs}} encoding sprigs that should be excluded from the matrix returned}
+\item{sprigs.to.prune}{a \code{kalisSprigs} object returned by \code{\link[=Sprigs]{Sprigs()}} encoding sprigs that should be excluded from the matrix returned}
 
-\item{assemble}{a logical, if FALSE return the clade matrix as a list of columns rather than as a symmetrized matrix}
+\item{assemble}{a logical, if \code{FALSE} return the clade matrix as a list of columns rather than as a symmetrized matrix}
 
 \item{use.forking}{a logical, should forked processes be used?}
 
diff --git a/man/Clades.Rd b/man/Clades.Rd
index cae541b..b5552c5 100644
--- a/man/Clades.Rd
+++ b/man/Clades.Rd
@@ -18,18 +18,17 @@ Clades(
 )
 }
 \arguments{
-\item{fwd}{a forward table as returned by \code{\link{MakeForwardTable}}}
+\item{fwd}{a forward table as returned by \code{\link[=MakeForwardTable]{MakeForwardTable()}}}
 
-\item{bck}{a backward table as returned by \code{\link{MakeBackwardTable}}}
+\item{bck}{a backward table as returned by \code{\link[=MakeBackwardTable]{MakeBackwardTable()}}}
 
-\item{pars}{a \code{kalisParameters} object, as returned by
-\code{\link{Parameters}}.}
+\item{pars}{a \code{kalisParameters} object, as returned by \code{\link[=Parameters]{Parameters()}}.}
 
-\item{beta.theta.opts}{a list; see Details for \code{\link{DistMat}}.}
+\item{beta.theta.opts}{a list; see Details for \code{\link[=DistMat]{DistMat()}}.}
 
-\item{safety.checks}{a logical, should safety checks be applied to the distances?  See \code{\link{DistMat}}.}
+\item{safety.checks}{a logical, should safety checks be applied to the distances?  See \code{\link[=DistMat]{DistMat()}}.}
 
-\item{neighbors}{a logical, should nearest neighbors be pre-calculated?  See \code{\link{Neighbors}}.}
+\item{neighbors}{a logical, should nearest neighbors be pre-calculated?  See \code{\link[=Neighbors]{Neighbors()}}.}
 
 \item{use.forking}{a logical, should forked processes be used?}
 
diff --git a/man/Neighbors.Rd b/man/Neighbors.Rd
index 3aac88f..63e1695 100644
--- a/man/Neighbors.Rd
+++ b/man/Neighbors.Rd
@@ -7,7 +7,7 @@
 Neighbors(x, use.forking = FALSE, nthreads = 1L)
 }
 \arguments{
-\item{x}{a \code{kalisClades} object returned by \code{\link{kalisClades}}}
+\item{x}{a \code{kalisClades} object returned by \code{\link[=Clades]{Clades()}}}
 
 \item{use.forking}{a logical, should forked processes be used?}
 
diff --git a/man/Sprigs_old.Rd b/man/Sprigs_old.Rd
index d8dc6f0..4e76fb2 100644
--- a/man/Sprigs_old.Rd
+++ b/man/Sprigs_old.Rd
@@ -7,7 +7,7 @@
 Sprigs_old(x, use.forking = FALSE, nthreads = 1L, add.self = TRUE)
 }
 \arguments{
-\item{x}{a \code{kalisNeighbors} object returned by \code{\link{kalisNeighbors}}, a \code{kalisClades} object returned by \code{\link{kalisClades}} with \code{neighbors = TRUE}, or a list}
+\item{x}{a \code{kalisNeighbors} object returned by \code{\link[=Neighbors]{Neighbors()}}, a \code{kalisClades} object returned by \code{\link[=Clades]{Clades()}} with \code{neighbors = TRUE}, or a list}
 
 \item{use.forking}{a logical, should forked processes be used?}
 

From 2ea7fddd62c86a1d0221263b57ed5fadb1494a82 Mon Sep 17 00:00:00 2001
From: Louis Aslett <louis.aslett@durham.ac.uk>
Date: Wed, 25 Sep 2024 18:19:41 +0100
Subject: [PATCH 20/43] Update all doc \code and \link to markdown versions,
 including spotting a few instances in v1 codebase.

---
 R/CacheHaplotypes.R            |  2 +-
 R/CacheSummary.R               |  8 ++--
 R/Iterator.R                   | 10 ++---
 R/Probs.R                      |  4 +-
 R/TableCache.R                 | 75 ++++++++++++++++------------------
 R/TableMaker.R                 |  2 +-
 man/CacheHaplotypes.Rd         |  2 +-
 man/CreateForwardTableCache.Rd | 17 ++++----
 man/FillTableCache.Rd          | 19 ++++-----
 man/ForwardIterator.Rd         |  6 +--
 man/ForwardUsingTableCache.Rd  | 23 +++++------
 11 files changed, 81 insertions(+), 87 deletions(-)

diff --git a/R/CacheHaplotypes.R b/R/CacheHaplotypes.R
index d900e11..dcc6b3c 100644
--- a/R/CacheHaplotypes.R
+++ b/R/CacheHaplotypes.R
@@ -36,7 +36,7 @@ assign("L", NA, envir = pkgVars) # must be integer
 #'
 #' (num rows)x(num cols) = (num variants)x(num haplotypes).
 #'
-#' It is fine to delete this matrix from R after calling \code{CacheHaplotypes}.
+#' It is fine to delete this matrix from R after calling [CacheHaplotypes()].
 #'
 #'
 #' **HDF5 format**
diff --git a/R/CacheSummary.R b/R/CacheSummary.R
index 396f4f9..8c5b77a 100644
--- a/R/CacheSummary.R
+++ b/R/CacheSummary.R
@@ -1,12 +1,12 @@
 #' Retrieve information about the haplotype cache
 #'
 #' @return
-#'   \code{CacheSummary()} prints information about the current state of the kalis cache.
-#'     Also invisibly returns a vector giving the dimensions of the cached haplotype data (num variants, num haplotypes), or \code{NULL} if the cache is empty.
+#'   `CacheSummary()` prints information about the current state of the kalis cache.
+#'     Also invisibly returns a vector giving the dimensions of the cached haplotype data (num variants, num haplotypes), or `NULL` if the cache is empty.
 #'
-#'   \code{N()} returns the number of haplotypes currently in the kalis cache, or \code{NULL} if the cache is empty.
+#'   `N()` returns the number of haplotypes currently in the kalis cache, or `NULL` if the cache is empty.
 #'
-#'   \code{L()} returns the number of variants currently in the kalis cache, or \code{NULL} if the cache is empty.
+#'   `L()` returns the number of variants currently in the kalis cache, or `NULL` if the cache is empty.
 #'
 #' @examples
 #' # First fill the cache with the toy data included in the package
diff --git a/R/Iterator.R b/R/Iterator.R
index 4272942..79d2c80 100644
--- a/R/Iterator.R
+++ b/R/Iterator.R
@@ -1,18 +1,18 @@
 #' Build an efficient iterator over loci
 #'
-#' Create a \code{kalisForwardIterator} for propagating a forward table iteratively over target loci using a table cache and optimal checkpointing.
+#' Create a `kalisForwardIterator` for propagating a forward table iteratively over target loci using a table cache and optimal checkpointing.
 #'
 #' See example.
 #'
 #'
 #' @param ram.ckpts an integer specifying the number of checkpoints to store in RAM
 #' @param targets a vector of loci to iterate over (starting with the most downstream target)
-#' @param base.fwd.table a \code{kalisForwardTable} either at the most upstream target, or if the targets are evenly spaced, one interval upstream of the most upstream target.
-#' NULL (the default) is interpretted as the prior \code{Pi}, see \code{\link{Parameters}}
+#' @param base.fwd.table a `kalisForwardTable` either at the most upstream target, or if the targets are evenly spaced, one interval upstream of the most upstream target.
+#' `NULL` (the default) is interpreted as the prior `Pi`, see [Parameters()]
 #' @param disk.ckpts an integer specifying the number of checkpoints to store on disk
 #' @param disk.dir a path to a directory where a temporary folder may be made to store checkpoints on disk
-#' @param force.unif a logical, if TRUE iterate over targets as if they were uniformly spaced. WARNING: DO NOT use this in conjunction with the targets method, still experimental. With force.unif = TRUE, the resulting iterator appear to be targeting the first length(targets) variants with all methods, but in fact will be silently iterating over the original targets.
-#' @seealso \code{\link{MakeForwardTable}} to create a \code{kalisForwardTable}.
+#' @param force.unif a logical, if `TRUE` iterate over targets as if they were uniformly spaced. WARNING: DO NOT use this in conjunction with the targets method, still experimental. With `force.unif = TRUE`, the resulting iterator appears to be targeting the first length(targets) variants with all methods, but in fact will be silently iterating over the original targets.
+#' @seealso [MakeForwardTable()] to create a `kalisForwardTable`.
 #'
 #' @examples
 #' \dontrun{
diff --git a/R/Probs.R b/R/Probs.R
index 1361f75..152a8ef 100644
--- a/R/Probs.R
+++ b/R/Probs.R
@@ -41,7 +41,7 @@
 #'
 #' When provided, `M` must have dimensions matching that of `fwd$alpha`.
 #' Typically, that is simply \eqn{N \times N}{N x N} for \eqn{N} haplotypes.
-#' However, if kalis is being run in a distributed manner, \code{M} will be a \eqn{N \times R}{N x R} matrix where \eqn{R} is the number of recipient haplotypes on the current machine.
+#' However, if kalis is being run in a distributed manner, `M` will be a \eqn{N \times R}{N x R} matrix where \eqn{R} is the number of recipient haplotypes on the current machine.
 #'
 #' @param fwd a forward table as returned by [MakeForwardTable()] and propagated to a target variant by [Forward()].
 #'   Must be at the same variant as `bck` (unless `bck` is in "beta-theta space" in which case if must be downstream ... see [Backward()] for details).
@@ -162,7 +162,7 @@ PostProbs <- function(fwd, bck, unif.on.underflow = FALSE, M = NULL, beta.theta.
 #'
 #' When provided, `M` must have dimensions matching that of `fwd$alpha`.
 #' Typically, that is simply \eqn{N \times N}{N x N} for \eqn{N} haplotypes.
-#' However, if kalis is being run in a distributed manner, \code{M} will be a \eqn{N \times R}{N x R} matrix where \eqn{R} is the number of recipient haplotypes on the current machine.
+#' However, if kalis is being run in a distributed manner, `M` will be a \eqn{N \times R}{N x R} matrix where \eqn{R} is the number of recipient haplotypes on the current machine.
 #'
 #' @param fwd a forward table as returned by [MakeForwardTable()] and propagated to a target variant by [Forward()].
 #'   Must be at the same variant as `bck` (unless `bck` is in "beta-theta space" in which case if must be downstream ... see [Backward()] for details).
diff --git a/R/TableCache.R b/R/TableCache.R
index e6a3428..5de70dc 100644
--- a/R/TableCache.R
+++ b/R/TableCache.R
@@ -12,12 +12,11 @@
 #' recently cached local table.
 #'
 #' Memory for a cache can be allocated using this function and should then be
-#' filled with \code{\link{FillTableCache}}.
-#' To use the cache, then instead of using the \code{\link{Forward}} function,
-#' use \code{\link{ForwardUsingTableCache}}.
+#' filled with [FillTableCache()].
+#' To use the cache, then instead of using the [Forward()] function,
+#' use [ForwardUsingTableCache()].
 #'
-#' @param pars a \code{kalisParameters} object, as returned by
-#'   \code{Parameters}.
+#' @param pars a `kalisParameters` object, as returned by [Parameters()].
 #' @param size the maximum amount of RAM (in GB) to devote to this cache.
 #' @param from_recipient first recipient haplotype if creating a partial forward
 #'   table cache.  By default includes from the first recipient haplotype.
@@ -29,10 +28,10 @@
 #'   returned.
 #'
 #' @seealso
-#'   \code{\link{MakeForwardTable}} to make a forward table;
-#'   \code{\link{FillTableCache}} to fill a cache;
-#'   \code{\link{ForwardUsingTableCache}} to use a cache;
-#'   \code{\link{Forward}} for forward function without using a cache.
+#'   [MakeForwardTable()] to make a forward table;
+#'   [FillTableCache()] to fill a cache;
+#'   [ForwardUsingTableCache()] to use a cache;
+#'   [Forward()] for forward function without using a cache.
 #'
 #' @examples
 #' \dontrun{
@@ -124,34 +123,33 @@ CreateForwardTableCache <- function(pars, size = 1, from_recipient = 1, to_recip
 #' recently cached local table.
 #'
 #' Memory for a cache can be allocated using
-#' \code{\link{CreateForwardTableCache}} and should then be filled with this
+#' [CreateForwardTableCache()] and should then be filled with this
 #' function.
-#' To use the cache, then instead of using the \code{\link{Forward}} function,
-#' use \code{\link{ForwardUsingTableCache}}.
+#' To use the cache, then instead of using the [Forward()] function,
+#' use [ForwardUsingTableCache()].
 #'
 #' @param cache a cache of forward tables as generated by
-#'   \code{\link{CreateForwardTableCache}}
-#' @param pars a \code{kalisParameters} object, as returned by
-#'   \code{Parameters}.
+#'   [CreateForwardTableCache()]
+#' @param pars a `kalisParameters` object, as returned by [Parameters()].
 #' @param from the first locus which the geometrically spaced cache should be
 #'   built from.
 #'   By default the whole sequence length will be cached so this defaults to 1.
 #' @param to the last locus up to which the geometrically spaced cache should be
 #'   built.
 #'   By default the whole sequence length will be cached so this defaults to
-#'   \code{Inf}.
+#'   `Inf`.
 #' @param nthreads the number of CPU cores to use.
 #'   By default no parallelism is used.
 #'
 #' @return
 #' There is nothing returned.
-#' For performance reasons, \code{cache} is updated in-place.
+#' For performance reasons, `cache` is updated in-place.
 #'
 #' @seealso
-#'   \code{\link{MakeForwardTable}} to make a forward table;
-#'   \code{\link{CreateForwardTableCache}} to generate a cache;
-#'   \code{\link{ForwardUsingTableCache}} to use a cache;
-#'   \code{\link{Forward}} for forward function without using a cache.
+#'   [MakeForwardTable()] to make a forward table;
+#'   [CreateForwardTableCache()] to generate a cache;
+#'   [ForwardUsingTableCache()] to use a cache;
+#'   [Forward()] for forward function without using a cache.
 #'
 #' @examples
 #' \dontrun{
@@ -252,27 +250,26 @@ FillTableCache <- function(cache,
 #' recently cached local table.
 #'
 #' Memory for a cache can be allocated using
-#' \code{\link{CreateForwardTableCache}} and should then be filled with
-#' \code{\link{FillTableCache}}.
-#' To use the cache, then instead of using the \code{\link{Forward}} function,
+#' [CreateForwardTableCache()] and should then be filled with
+#' [FillTableCache()].
+#' To use the cache, then instead of using the [Forward()] function,
 #' use this function.
 #'
-#' Note that the \code{cache} which is passed to this function will be
+#' Note that the `cache` which is passed to this function will be
 #' dynamically updated based on the locus requested: the assumption is that
 #' the cache is used to propagate in reverse so any cache entries for a locus
-#' position past \code{t} are taken to be no longer needed and that space will
+#' position past `t` are taken to be no longer needed and that space will be
 #' redeployed to more densely fill the cache with earlier locus positions.
 #'
-#' @param fwd a \code{kalisForwardTable} object, as returned by
-#'   \code{\link{MakeForwardTable}}.
-#' @param pars a \code{kalisParameters} object, as returned by
-#'   \code{Parameters}.
+#' @param fwd a `kalisForwardTable` object, as returned by
+#'   [MakeForwardTable()].
+#' @param pars a `kalisParameters` object, as returned by [Parameters()].
 #' @param cache a cache of forward tables as generated by
-#'   \code{\link{CreateForwardTableCache}} and filled using
-#'   \code{\link{FillTableCache}}.
+#'   [CreateForwardTableCache()] and filled using
+#'   [FillTableCache()].
 #' @param t a locus position to move the forward table to, starting the forward
-#'   propagation from whatever table in the \code{cache} variable is immediately
-#'   before locus \code{t}.
+#'   propagation from whatever table in the `cache` variable is immediately
+#'   before locus `t`.
 #'   By default, it simply advances to the previous locus (which is the natural
 #'   direction to move when using the cache).
 #' @param nthreads the number of CPU cores to use.
@@ -280,13 +277,13 @@ FillTableCache <- function(cache,
 #'
 #' @return
 #'   There is nothing returned.
-#'   For performance reasons, \code{fwd} is updated in-place.
+#'   For performance reasons, `fwd` is updated in-place.
 #'
 #' @seealso
-#'   \code{\link{MakeForwardTable}} to make a forward table;
-#'   \code{\link{CreateForwardTableCache}} to generate a cache;
-#'   \code{\link{FillTableCache}} to fill a cache;
-#'   \code{\link{Forward}} for forward function without using a cache.
+#'   [MakeForwardTable()] to make a forward table;
+#'   [CreateForwardTableCache()] to generate a cache;
+#'   [FillTableCache()] to fill a cache;
+#'   [Forward()] for forward function without using a cache.
 #'
 #' @examples
 #' \dontrun{
diff --git a/R/TableMaker.R b/R/TableMaker.R
index 4cdd55f..8792c21 100644
--- a/R/TableMaker.R
+++ b/R/TableMaker.R
@@ -140,7 +140,7 @@ print.kalisForwardTable <- function(x, ...) {
 #'   Haplotypes are indexed from 1.
 #'
 #' @return
-#'   A specialized list of class \code{kalisBackwardTable}.
+#'   A specialized list of class `kalisBackwardTable`.
 #'   The elements of the backward table list are:
 #'   \describe{
 #'     \item{`l`}{denotes the current variant position.
diff --git a/man/CacheHaplotypes.Rd b/man/CacheHaplotypes.Rd
index a54430f..b22bed1 100644
--- a/man/CacheHaplotypes.Rd
+++ b/man/CacheHaplotypes.Rd
@@ -86,7 +86,7 @@ That is, the dimensions should be:
 
 (num rows)x(num cols) = (num variants)x(num haplotypes).
 
-It is fine to delete this matrix from R after calling \code{CacheHaplotypes}.
+It is fine to delete this matrix from R after calling \code{\link[=CacheHaplotypes]{CacheHaplotypes()}}.
 
 \strong{HDF5 format}
 
diff --git a/man/CreateForwardTableCache.Rd b/man/CreateForwardTableCache.Rd
index ff224ed..865844d 100644
--- a/man/CreateForwardTableCache.Rd
+++ b/man/CreateForwardTableCache.Rd
@@ -13,8 +13,7 @@ CreateForwardTableCache(
 )
 }
 \arguments{
-\item{pars}{a \code{kalisParameters} object, as returned by
-\code{Parameters}.}
+\item{pars}{a \code{kalisParameters} object, as returned by \code{\link[=Parameters]{Parameters()}}.}
 
 \item{size}{the maximum amount of RAM (in GB) to devote to this cache.}
 
@@ -42,9 +41,9 @@ time and the forward propagation can move backwards by moving forward from a
 recently cached local table.
 
 Memory for a cache can be allocated using this function and should then be
-filled with \code{\link{FillTableCache}}.
-To use the cache, then instead of using the \code{\link{Forward}} function,
-use \code{\link{ForwardUsingTableCache}}.
+filled with \code{\link[=FillTableCache]{FillTableCache()}}.
+To use the cache, then instead of using the \code{\link[=Forward]{Forward()}} function,
+use \code{\link[=ForwardUsingTableCache]{ForwardUsingTableCache()}}.
 }
 \examples{
 \dontrun{
@@ -74,8 +73,8 @@ for(l in L:1) {
 
 }
 \seealso{
-\code{\link{MakeForwardTable}} to make a forward table;
-\code{\link{FillTableCache}} to fill a cache;
-\code{\link{ForwardUsingTableCache}} to use a cache;
-\code{\link{Forward}} for forward function without using a cache.
+\code{\link[=MakeForwardTable]{MakeForwardTable()}} to make a forward table;
+\code{\link[=FillTableCache]{FillTableCache()}} to fill a cache;
+\code{\link[=ForwardUsingTableCache]{ForwardUsingTableCache()}} to use a cache;
+\code{\link[=Forward]{Forward()}} for forward function without using a cache.
 }
diff --git a/man/FillTableCache.Rd b/man/FillTableCache.Rd
index b1fc2f8..dc3865a 100644
--- a/man/FillTableCache.Rd
+++ b/man/FillTableCache.Rd
@@ -13,10 +13,9 @@ FillTableCache(
 }
 \arguments{
 \item{cache}{a cache of forward tables as generated by
-\code{\link{CreateForwardTableCache}}}
+\code{\link[=CreateForwardTableCache]{CreateForwardTableCache()}}}
 
-\item{pars}{a \code{kalisParameters} object, as returned by
-\code{Parameters}.}
+\item{pars}{a \code{kalisParameters} object, as returned by \code{\link[=Parameters]{Parameters()}}.}
 
 \item{nthreads}{the number of CPU cores to use.
 By default no parallelism is used.}
@@ -48,10 +47,10 @@ time and the forward propagation can move backwards by moving forward from a
 recently cached local table.
 
 Memory for a cache can be allocated using
-\code{\link{CreateForwardTableCache}} and should then be filled with this
+\code{\link[=CreateForwardTableCache]{CreateForwardTableCache()}} and should then be filled with this
 function.
-To use the cache, then instead of using the \code{\link{Forward}} function,
-use \code{\link{ForwardUsingTableCache}}.
+To use the cache, then instead of using the \code{\link[=Forward]{Forward()}} function,
+use \code{\link[=ForwardUsingTableCache]{ForwardUsingTableCache()}}.
 }
 \examples{
 \dontrun{
@@ -81,8 +80,8 @@ for(l in L:1) {
 
 }
 \seealso{
-\code{\link{MakeForwardTable}} to make a forward table;
-\code{\link{CreateForwardTableCache}} to generate a cache;
-\code{\link{ForwardUsingTableCache}} to use a cache;
-\code{\link{Forward}} for forward function without using a cache.
+\code{\link[=MakeForwardTable]{MakeForwardTable()}} to make a forward table;
+\code{\link[=CreateForwardTableCache]{CreateForwardTableCache()}} to generate a cache;
+\code{\link[=ForwardUsingTableCache]{ForwardUsingTableCache()}} to use a cache;
+\code{\link[=Forward]{Forward()}} for forward function without using a cache.
 }
diff --git a/man/ForwardIterator.Rd b/man/ForwardIterator.Rd
index 2954e86..9c2cb82 100644
--- a/man/ForwardIterator.Rd
+++ b/man/ForwardIterator.Rd
@@ -26,13 +26,13 @@ ForwardIterator(
 \item{targets}{a vector of loci to iterate over (starting with the most downstream target)}
 
 \item{base.fwd.table}{a \code{kalisForwardTable} either at the most upstream target, or if the targets are evenly spaced, one interval upstream of the most upstream target.
-NULL (the default) is interpretted as the prior \code{Pi}, see \code{\link{Parameters}}}
+\code{NULL} (the default) is interpreted as the prior \code{Pi}, see \code{\link[=Parameters]{Parameters()}}}
 
 \item{disk.ckpts}{an integer specifying the number of checkpoints to store on disk}
 
 \item{disk.dir}{a path to a directory where a temporary folder may be made to store checkpoints on disk}
 
-\item{force.unif}{a logical, if TRUE iterate over targets as if they were uniformly spaced. WARNING: DO NOT use this in conjunction with the targets method, still experimental. With force.unif = TRUE, the resulting iterator appear to be targeting the first length(targets) variants with all methods, but in fact will be silently iterating over the original targets.}
+\item{force.unif}{a logical, if \code{TRUE} iterate over targets as if they were uniformly spaced. WARNING: DO NOT use this in conjunction with the targets method, still experimental. With \code{force.unif = TRUE}, the resulting iterator appears to be targeting the first length(targets) variants with all methods, but in fact will be silently iterating over the original targets.}
 }
 \description{
 Create a \code{kalisForwardIterator} for propagating a forward table iteratively over target loci using a table cache and optimal checkpointing.
@@ -57,5 +57,5 @@ for(t in targets(Iter)){
 
 }
 \seealso{
-\code{\link{MakeForwardTable}} to create a \code{kalisForwardTable}.
+\code{\link[=MakeForwardTable]{MakeForwardTable()}} to create a \code{kalisForwardTable}.
 }
diff --git a/man/ForwardUsingTableCache.Rd b/man/ForwardUsingTableCache.Rd
index 87b26e9..09f1bad 100644
--- a/man/ForwardUsingTableCache.Rd
+++ b/man/ForwardUsingTableCache.Rd
@@ -15,14 +15,13 @@ ForwardUsingTableCache(
 }
 \arguments{
 \item{fwd}{a \code{kalisForwardTable} object, as returned by
-\code{\link{MakeForwardTable}}.}
+\code{\link[=MakeForwardTable]{MakeForwardTable()}}.}
 
-\item{pars}{a \code{kalisParameters} object, as returned by
-\code{Parameters}.}
+\item{pars}{a \code{kalisParameters} object, as returned by \code{\link[=Parameters]{Parameters()}}.}
 
 \item{cache}{a cache of forward tables as generated by
-\code{\link{CreateForwardTableCache}} and filled using
-\code{\link{FillTableCache}}.}
+\code{\link[=CreateForwardTableCache]{CreateForwardTableCache()}} and filled using
+\code{\link[=FillTableCache]{FillTableCache()}}.}
 
 \item{t}{a locus position to move the forward table to, starting the forward
 propagation from whatever table in the \code{cache} variable is immediately
@@ -51,9 +50,9 @@ time and the forward propagation can move backwards by moving forward from a
 recently cached local table.
 
 Memory for a cache can be allocated using
-\code{\link{CreateForwardTableCache}} and should then be filled with
-\code{\link{FillTableCache}}.
-To use the cache, then instead of using the \code{\link{Forward}} function,
+\code{\link[=CreateForwardTableCache]{CreateForwardTableCache()}} and should then be filled with
+\code{\link[=FillTableCache]{FillTableCache()}}.
+To use the cache, then instead of using the \code{\link[=Forward]{Forward()}} function,
 use this function.
 
 Note that the \code{cache} which is passed to this function will be
@@ -90,8 +89,8 @@ for(l in L:1) {
 
 }
 \seealso{
-\code{\link{MakeForwardTable}} to make a forward table;
-\code{\link{CreateForwardTableCache}} to generate a cache;
-\code{\link{FillTableCache}} to fill a cache;
-\code{\link{Forward}} for forward function without using a cache.
+\code{\link[=MakeForwardTable]{MakeForwardTable()}} to make a forward table;
+\code{\link[=CreateForwardTableCache]{CreateForwardTableCache()}} to generate a cache;
+\code{\link[=FillTableCache]{FillTableCache()}} to fill a cache;
+\code{\link[=Forward]{Forward()}} for forward function without using a cache.
 }

From 6550df11bd2bc80f15056423926c83d1bc12fdbf Mon Sep 17 00:00:00 2001
From: Louis Aslett <louis.aslett@durham.ac.uk>
Date: Wed, 25 Sep 2024 18:27:15 +0100
Subject: [PATCH 21/43] Correct indentation of YAML and markdown blocks

---
 vignettes/Reading_Haplotype_Data.Rmd | 11 +++--------
 1 file changed, 3 insertions(+), 8 deletions(-)

diff --git a/vignettes/Reading_Haplotype_Data.Rmd b/vignettes/Reading_Haplotype_Data.Rmd
index bfbdc7a..b576d67 100644
--- a/vignettes/Reading_Haplotype_Data.Rmd
+++ b/vignettes/Reading_Haplotype_Data.Rmd
@@ -7,9 +7,9 @@ vignette: >
   %\VignetteIndexEntry{Reading Haplotype Data}
   %\VignetteEngine{knitr::rmarkdown}
   %\VignetteEncoding{UTF-8}
-  ---
-  
-  ```{r setup, include = FALSE}
+---
+
+```{r setup, include = FALSE}
 knitr::opts_chunk$set(
 collapse = TRUE,
 comment = "#>"
@@ -45,8 +45,3 @@ For increased reading efficiency `CacheHaplotypes` look will look for the `my.le
 `kalis`  <http://hgdownload.cse.ucsc.edu/gbdb/hg19/1000Genomes/phase3/>
 
 ALL.chr21.phase3_shapeit2_mvncall_integrated_v5a.20130502.genotypes.hap.gz
-
-
-
-
-

From 8fa8200c14ff4af34e0481e7d2d27737ef92603f Mon Sep 17 00:00:00 2001
From: Louis Aslett <louis.aslett@durham.ac.uk>
Date: Thu, 26 Sep 2024 16:46:13 +0100
Subject: [PATCH 22/43] Turn off tests on package check for speed (kalis tests
 take ~30 minutes)

---
 kalis.Rproj | 1 +
 1 file changed, 1 insertion(+)

diff --git a/kalis.Rproj b/kalis.Rproj
index 175b662..2eb25a2 100644
--- a/kalis.Rproj
+++ b/kalis.Rproj
@@ -17,4 +17,5 @@ StripTrailingWhitespace: Yes
 BuildType: Package
 PackageUseDevtools: Yes
 PackageInstallArgs: --no-multiarch --with-keep.source --configure-vars="PKG_CFLAGS='-march=native -mtune=native -O3'"
+PackageCheckArgs: --no-tests
 PackageRoxygenize: rd,collate,namespace,vignette

From d8f78a01345a0562c78fecbff1d19303ed620fcd Mon Sep 17 00:00:00 2001
From: Louis Aslett <louis.aslett@durham.ac.uk>
Date: Thu, 26 Sep 2024 17:15:58 +0100
Subject: [PATCH 23/43] Eliminate compiler warnings about printing size_t's
 when int expected (no concern here, these do not affect the algorithm so cast
 freely to ints)

---
 src/R_Cache.c    | 14 +++++++-------
 src/R_CladeMat.c |  4 ++--
 2 files changed, 9 insertions(+), 9 deletions(-)

diff --git a/src/R_Cache.c b/src/R_Cache.c
index 875b6f5..e403b00 100644
--- a/src/R_Cache.c
+++ b/src/R_Cache.c
@@ -282,7 +282,7 @@ SEXP CacheHaplotypes_hapgz_2(SEXP Rfile, SEXP Rloci_idx, SEXP Rhap_idx, SEXP RL,
   for(size_t l=0; l<hap_size_file; l++) {
     line = gzgets(fd, buf, bufsize);
     if(line == NULL) {
-      REprintf("Error: only reached line %d ... there are not %d loci in the file!\n", l+1, hap_size_file);
+      REprintf("Error: only reached line %d ... there are not %d loci in the file!\n", (int) l+1, (int) hap_size_file);
       ClearHaplotypeCache2();
       gzclose(fd);
       KALIS_RETURN;
@@ -300,13 +300,13 @@ SEXP CacheHaplotypes_hapgz_2(SEXP Rfile, SEXP Rloci_idx, SEXP Rhap_idx, SEXP RL,
       if(i != next_i) {
         // Check that there is at least valid data at this position ...
         if(*line != '0' && *line != '1') {
-          REprintf("Error: line %d contains an invalid character!\n", l);
+          REprintf("Error: line %d contains an invalid character!\n", (int) l);
           ClearHaplotypeCache2();
           gzclose(fd);
           KALIS_RETURN;
         }
         if((i < num_inds_file-1 && *(line+1) != ' ') || (i == num_inds_file-1 && *(line+1) != '\n')) {
-          REprintf("Error: line %d does not contain a space (or EOL) after haplotype << %d!\n", l, i+1);
+          REprintf("Error: line %d does not contain a space (or EOL) after haplotype << %d!\n", (int) l, (int) i+1);
           ClearHaplotypeCache2();
           gzclose(fd);
           KALIS_RETURN;
@@ -319,7 +319,7 @@ SEXP CacheHaplotypes_hapgz_2(SEXP Rfile, SEXP Rloci_idx, SEXP Rhap_idx, SEXP RL,
       // Process line
       x = *(line++); // should be a 0/1
       if(x == '\0') {
-        REprintf("Error: line %d is of the incorrect length!\n", l);
+        REprintf("Error: line %d is of the incorrect length!\n", (int) l);
         ClearHaplotypeCache2();
         gzclose(fd);
         KALIS_RETURN;
@@ -329,7 +329,7 @@ SEXP CacheHaplotypes_hapgz_2(SEXP Rfile, SEXP Rloci_idx, SEXP Rhap_idx, SEXP RL,
       } else if(x == '0') {
         hap_locus[next_ll][next_ii/32] ^= (-0 ^ hap_locus[next_ll][next_ii/32]) & (1 << next_ii%32);
       } else {
-        REprintf("Error: line %d contains an invalid character!\n", l);
+        REprintf("Error: line %d contains an invalid character!\n", (int) l);
         ClearHaplotypeCache2();
         gzclose(fd);
         KALIS_RETURN;
@@ -337,13 +337,13 @@ SEXP CacheHaplotypes_hapgz_2(SEXP Rfile, SEXP Rloci_idx, SEXP Rhap_idx, SEXP RL,
 
       x = *(line++); // should be a space following the 0/1 unless last hap on the line
       if(i < num_inds_file-1 && x != ' ') {
-        REprintf("Error: line %d does not contain a space after haplotype << %d!\n", l, i+1);
+        REprintf("Error: line %d does not contain a space after haplotype << %d!\n", (int) l, (int) i+1);
         ClearHaplotypeCache2();
         gzclose(fd);
         KALIS_RETURN;
       }
       if(i == num_inds_file-1 && x != '\n') {
-        REprintf("Error: line %d does not end at the right place!\n", l);
+        REprintf("Error: line %d does not end at the right place!\n", (int) l);
         ClearHaplotypeCache2();
         gzclose(fd);
         KALIS_RETURN;
diff --git a/src/R_CladeMat.c b/src/R_CladeMat.c
index 6c26f30..55e01fc 100644
--- a/src/R_CladeMat.c
+++ b/src/R_CladeMat.c
@@ -24,7 +24,7 @@ void printblob(blob* bobtheblob) {
   Rprintf("Blob %p (%p): # = %d, range = (%lf, %lf), prv = %p, nxt = %p, lp = %p, mp = %p \n",
           bobtheblob,
           (bobtheblob==bobtheblob->blob?NULL:bobtheblob->blob),
-          bobtheblob->num_in_blob,
+          (int) bobtheblob->num_in_blob,
           bobtheblob->lower,
           bobtheblob->upper,
           bobtheblob->prev,
@@ -675,7 +675,7 @@ void blobby_A(const double* const restrict alpha,
       pthread_create(&threads[i], &attr, blobby_B, (void*) &args[i]);
       //blobby_B((void*) &args[i]);
     }
-    Rprintf("%d threads created (rag end left over = %d)\n", nthreads, rag_end);
+    Rprintf("%d threads created (rag end left over = %d)\n", (int) nthreads, (int) rag_end);
 
     // Tidy ragged end
     if(rag_end != 0) {

From 43d2d4cee21041834f7e7ebda558c39cfec231b9 Mon Sep 17 00:00:00 2001
From: Louis Aslett <louis.aslett@durham.ac.uk>
Date: Thu, 26 Sep 2024 17:16:32 +0100
Subject: [PATCH 24/43] Avoid compiler warnings about using undefined pointers

---
 src/R_CladeMat.c | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/src/R_CladeMat.c b/src/R_CladeMat.c
index 55e01fc..ab27131 100644
--- a/src/R_CladeMat.c
+++ b/src/R_CladeMat.c
@@ -371,7 +371,7 @@ void blobby_B1(double* alpha1, double* beta1, size_t recipient, size_t n, double
   double maxd = 744.4400719213812180897;
   blob blobs[(int) (maxd/thres+2)];
   blob** x_in_blob[n];
-  double* n_clade;
+  double* n_clade = NULL;
   blobby_BB(alpha1, beta1, recipient, n, blobs, x_in_blob, n_clade, thres, maxd, unitdist, max1var);
 }
 
@@ -509,8 +509,8 @@ SEXP blobbyB2(SEXP ALPHA, SEXP BETA, SEXP FROMRECIPIENT, SEXP THRES, SEXP UNITDI
   blob* blobs1 = malloc(sizeof(blob)*((int) (maxd/thres+2)));
   blob* blobs2 = malloc(sizeof(blob)*((int) (maxd/thres+2)));
 
-  double* n_clade1;
-  double* n_clade2;
+  double* n_clade1 = NULL;
+  double* n_clade2 = NULL;
 
   blobby_B2(alpha, beta, alpha+n, beta+n, from_recipient, n, thres, unitdist, max1var, dedip,
             &neigh1, &neigh2, &n_neigh[0], &n_neigh[1], n_clade1, n_clade2,

From 7beab0a4ddc241724a6b18de303e547adbe27b31 Mon Sep 17 00:00:00 2001
From: Louis Aslett <louis.aslett@durham.ac.uk>
Date: Thu, 26 Sep 2024 17:16:50 +0100
Subject: [PATCH 25/43] Eliminate apparently redundant variable causing
 compiler warnings

---
 src/R_CladeMat.c | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/R_CladeMat.c b/src/R_CladeMat.c
index ab27131..8512caa 100644
--- a/src/R_CladeMat.c
+++ b/src/R_CladeMat.c
@@ -331,10 +331,10 @@ blob* blobby_BB(const double* alpha, const double* beta, const size_t recipient,
   double j = n, diff = 0.0, temp_n_mut = 0.0;
   cur = tail;
   cur->c3 = 0.0;
-  int num_surv_blob = 0;
+  // int num_surv_blob = 0; // This does not seem to be used, except on line 337, which has no side effects
   *n_clade = 0.0;
   while(cur->prev != NULL) {
-    num_surv_blob++;
+    // num_surv_blob++;
     j -= cur->num_in_blob;
     diff = cur->lower - cur->prev->upper + 2*thres;
     temp_n_mut = diff/unitdist;

From 667c798dda5d2f3d4ec0ed637a635325a93ea200 Mon Sep 17 00:00:00 2001
From: Louis Aslett <louis.aslett@durham.ac.uk>
Date: Thu, 26 Sep 2024 18:38:55 +0100
Subject: [PATCH 26/43] Update configure script to have strict POSIX shell
 support

---
 configure | 50 ++++++++++++++++++++++++++++++++++----------------
 1 file changed, 34 insertions(+), 16 deletions(-)

diff --git a/configure b/configure
index 42179bb..d8755da 100755
--- a/configure
+++ b/configure
@@ -1,4 +1,4 @@
-#!/bin/bash
+#!/bin/sh
 # Anticonf (tm, Jeroen Ooms) style alternative to autoconf written by Louis
 # Aslett based on work by Jeroen Ooms (cf github: jeroen/curl & jeroen/openssl)
 
@@ -57,21 +57,21 @@ fi
 # Check combinations of intrinsics flags
 counter=0
 intrinsics=""
-[[ ! -z ${NOASM+isset} ]] && ((counter+=1)) && PKG_CFLAGS="$PKG_CFLAGS -DKALIS_ISA_NOASM" && intrinsics="No special assembly"
-[[ ! -z ${AVX512+isset} ]] && ((counter+=1)) && PKG_CFLAGS="$PKG_CFLAGS -DKALIS_ISA_AVX512" && intrinsics="AVX-512 family of"
-[[ ! -z ${AVX2+isset} ]] && ((counter+=1)) && PKG_CFLAGS="$PKG_CFLAGS -DKALIS_ISA_AVX2" && intrinsics="AVX2 family of"
-[[ ! -z ${NEON+isset} ]] && ((counter+=1)) && PKG_CFLAGS="$PKG_CFLAGS -DKALIS_ISA_NEON" && intrinsics="NEON family of"
+[ -n "${NOASM+isset}" ] && counter=$((counter + 1)) && PKG_CFLAGS="$PKG_CFLAGS -DKALIS_ISA_NOASM" && intrinsics="No special assembly"
+[ -n "${AVX512+isset}" ] && counter=$((counter + 1)) && PKG_CFLAGS="$PKG_CFLAGS -DKALIS_ISA_AVX512" && intrinsics="AVX-512 family of"
+[ -n "${AVX2+isset}" ] && counter=$((counter + 1)) && PKG_CFLAGS="$PKG_CFLAGS -DKALIS_ISA_AVX2" && intrinsics="AVX2 family of"
+[ -n "${NEON+isset}" ] && counter=$((counter + 1)) && PKG_CFLAGS="$PKG_CFLAGS -DKALIS_ISA_NEON" && intrinsics="NEON family of"
 # Were zero/one options chosen?
-if ((counter > 1)); then
+if [ "$counter" -gt 1 ]; then
   echo "ERROR: At most one set of instructions can be specified (NOASM, AVX512, AVX2 or NEON)"
   exit 1
 fi
 # Was an option forced?
-if ((counter == 1)); then
+if [ "$counter" -eq 1 ]; then
   echo "$intrinsics instruction set extentions will by used (forced by user)."
 fi
 # If no option force by user, then attempt to auto-detect
-if ((counter == 0)); then
+if [ "$counter" -eq 0 ]; then
 
   intrindetected=0
 
@@ -87,7 +87,7 @@ if ((counter == 0)); then
   intrin=$((intrin+$?))
   echo "#include <immintrin.h>" | ${CC} ${PKG_CFLAGS} ${CFLAGS} -Wno-error -E -xc - >/dev/null 2>&1
   intrin=$((intrin+$?))
-  if ((intrindetected == 0 && intrin == 0)); then
+  if [ "$intrindetected" -eq 0 ] && [ "$intrin" -eq 0 ]; then
     PKG_CFLAGS="$PKG_CFLAGS -DKALIS_ISA_AVX512"
     intrinsics="AVX-512 family of"
     intrindetected=1
@@ -109,7 +109,7 @@ if ((counter == 0)); then
   intrin=$((intrin+$?))
   echo "#include <immintrin.h>" | ${CC} ${PKG_CFLAGS} ${CFLAGS} -Wno-error -E -xc - >/dev/null 2>&1
   intrin=$((intrin+$?))
-  if ((intrindetected == 0 && intrin == 0)); then
+  if [ "$intrindetected" -eq 0 ] && [ "$intrin" -eq 0 ]; then
     PKG_CFLAGS="$PKG_CFLAGS -DKALIS_ISA_AVX2"
     intrinsics="AVX2 family of"
     intrindetected=1
@@ -123,13 +123,13 @@ if ((counter == 0)); then
   intrin=$((intrin+$?))
   echo "#include <arm_neon.h>" | ${CC} ${PKG_CFLAGS} ${CFLAGS} -Wno-error -E -xc - >/dev/null 2>&1
   intrin=$((intrin+$?))
-  if ((intrindetected == 0 && intrin == 0)); then
+  if [ "$intrindetected" -eq 0 ] && [ "$intrin" -eq 0 ]; then
     PKG_CFLAGS="$PKG_CFLAGS -DKALIS_ISA_NEON"
     intrinsics="NEON family of"
     intrindetected=1
   fi
 
-  if ((intrindetected == 0)); then
+  if [ "$intrindetected" -eq 0 ]; then
     PKG_CFLAGS="$PKG_CFLAGS -DKALIS_ISA_NOASM"
     intrinsics="No special assembly"
   fi
@@ -138,15 +138,33 @@ if ((counter == 0)); then
 fi
 
 # Check if we have access to pthreads (checking functions and headers, so no -E on compiler)
-echo -e "#define _GNU_SOURCE\n#include <pthread.h>\nmain() { pthread_t threads[2]; pthread_attr_t attr; pthread_attr_init(&attr); pthread_create(&threads[0], &attr, NULL, NULL); }" | ${CC} ${PKG_CFLAGS} ${CFLAGS} -Wno-error -pthread -xc - >/dev/null 2>&1
-if [ $? -eq 0 ]; then
+echo "#define _GNU_SOURCE
+#include <pthread.h>
+int main() {
+  pthread_t threads[2];
+  pthread_attr_t attr;
+  pthread_attr_init(&attr);
+  pthread_create(&threads[0], &attr, NULL, NULL);
+  return 0;
+}" | ${CC} ${PKG_CFLAGS} ${CFLAGS} -Wno-error -pthread -xc - >/dev/null 2>&1
+if [ "$?" -eq 0 ]; then
   PKG_CFLAGS="$PKG_CFLAGS -pthread"
   PKG_LIBS="$PKG_LIBS -lpthread -pthread"
+  echo "Threading support detected."
 fi
 # NB: MacOS has pthreads but not pthread_setaffinity_np
-echo -e "#define _GNU_SOURCE\n#include <pthread.h>\nmain() { cpu_set_t cpus; CPU_ZERO(&cpus); CPU_SET(1, &cpus); pthread_setaffinity_np(0,0,0); }" | ${CC} ${PKG_CFLAGS} ${CFLAGS} -Wno-error -pthread -xc - >/dev/null 2>&1
-if [ $? -eq 0 ]; then
+echo "#define _GNU_SOURCE
+#include <pthread.h>
+int main() {
+  cpu_set_t cpus;
+  CPU_ZERO(&cpus);
+  CPU_SET(1, &cpus);
+  pthread_setaffinity_np(0,0,0);
+  return 0;
+}" | ${CC} ${PKG_CFLAGS} ${CFLAGS} -Wno-error -pthread -xc - >/dev/null 2>&1
+if [ "$?" -eq 0 ]; then
   PKG_CFLAGS="$PKG_CFLAGS -DKALIS_AFFINITY"
+  echo "Thread affinity support detected."
 fi
 
 # To customise unroll depth

From e641ceb66561e997eb96271827e6766be67ae011 Mon Sep 17 00:00:00 2001
From: Louis Aslett <louis.aslett@durham.ac.uk>
Date: Thu, 26 Sep 2024 18:48:38 +0100
Subject: [PATCH 27/43] Eliminate dangling a.out.dSYM after configure run on
 Macs

---
 configure | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/configure b/configure
index d8755da..3d222ee 100755
--- a/configure
+++ b/configure
@@ -181,6 +181,9 @@ sed -e "s|@cflags@|$PKG_CFLAGS|" -e "s|@libs@|$PKG_LIBS|" src/Makevars.in > src/
 if [ -f a.out ] ; then
     rm a.out
 fi
+if [ -e a.out.dSYM ] ; then
+    rm -rf a.out.dSYM
+fi
 
 # Success
 exit 0

From ff8ee3ed9fb06e31341208bae52999570f62a8d7 Mon Sep 17 00:00:00 2001
From: Louis Aslett <louis.aslett@durham.ac.uk>
Date: Mon, 30 Sep 2024 18:42:20 +0100
Subject: [PATCH 28/43] Add cleanup script to remove temporary files created
 during configure run

---
 cleanup | 3 +++
 1 file changed, 3 insertions(+)
 create mode 100755 cleanup

diff --git a/cleanup b/cleanup
new file mode 100755
index 0000000..d2331f2
--- /dev/null
+++ b/cleanup
@@ -0,0 +1,3 @@
+#!/bin/sh
+
+rm -rf src/Makevars a.out.dSYM

From e7df962131fd0c45ae1cd6c04ebd0a4c71c830b2 Mon Sep 17 00:00:00 2001
From: Louis Aslett <louis.aslett@durham.ac.uk>
Date: Tue, 1 Oct 2024 17:40:57 +0100
Subject: [PATCH 29/43] Remove general checkpointing solution into separate dev
 branch and eliminate from release code base

---
 NAMESPACE    |   1 -
 R/Iterator.R | 187 +--------------------------------------------------
 2 files changed, 1 insertion(+), 187 deletions(-)

diff --git a/NAMESPACE b/NAMESPACE
index 3d211fa..f280572 100644
--- a/NAMESPACE
+++ b/NAMESPACE
@@ -48,7 +48,6 @@ importFrom(glue,glue_collapse)
 importFrom(graphics,axis)
 importFrom(prettyunits,pretty_bytes)
 importFrom(rlang,duplicate)
-importFrom(stats,optimize)
 importFrom(stats,sd)
 importFrom(utils,getFromNamespace)
 importFrom(utils,tail)
diff --git a/R/Iterator.R b/R/Iterator.R
index 79d2c80..60e4046 100644
--- a/R/Iterator.R
+++ b/R/Iterator.R
@@ -168,16 +168,7 @@ ForwardIterator <- function(pars,
 
   }else{
 
-    # Solve general problem
-    SolveSchedule <- MakeSolveSchedule(exact = exact)
-    environment(obj_func_for_SolveSchedule) <- environment(SolveSchedule)
-
-    if(!first.target.given){
-      cost <- SolveSchedule(d = c(targets[1],diff(targets)),targets, num.available.ckpts)
-    }else{
-      cost <- SolveSchedule(d = diff(targets),targets[-1], num.available.ckpts)
-    }
-    sch <- trim.sch(SolveSchedule)
+    stop("Solving the non-uniform checkpointing problem is not yet implemented.")
 
   }
 
@@ -522,179 +513,3 @@ uniform_trim.sch <- function(f){
   # create dataframe schedule
   sch <- data.frame("k" = c(sch.k,0L), "i" = c(sch.i,0L))
 }
-
-
-
-
-obj_func_for_SolveSchedule <- function(i,ins,d,indicies,num.available.ckpts){
-
-  i <- floor(i)
-
-  # clear out schedule for all entries below this instruction
-  sch.k[(ins+1):nrow.sch] <<- -1L
-  sch.i[(ins+1):nrow.sch] <<- -1L
-
-  proposed.location <- which(indicies==i)
-
-  # solve right problem
-  if(length(d) > proposed.location){ # if the interval to the right contains at least one target locus
-    right.cost <- SolveSchedule(d[(proposed.location+1):length(d)],
-                                indicies[(proposed.location+1):length(d)],
-                                num.available.ckpts - 1)
-  }else{
-    right.cost <- 0
-  }
-
-
-  # solve left problem
-  if(proposed.location > 1){ # if the interval to the left contains at least one target locus
-    left.cost <- SolveSchedule(d[1:(proposed.location-1)],
-                               indicies[1:(proposed.location-1)],
-                               num.available.ckpts)
-  }else{
-    left.cost <- 0
-  }
-
-  # total up the cost
-  sum(d[1:proposed.location]) + left.cost + right.cost  # Cost to initialize and place and record the checkpoint is first
-}
-
-
-#' @importFrom stats optimize
-#' @importFrom utils tail
-MakeSolveSchedule <- function(exact = TRUE){
-
-  sch.k <- 0L
-  sch.i <- 0L
-  nrow.sch <- 1
-
-  function(d, indicies, num.available.ckpts){
-
-    l.d <- length(d)
-    if(l.d==0){return(0)} # nothing to solve
-
-    k <- as.integer(min(l.d-1,num.available.ckpts))
-    if(k==0){return(sum(d*(l.d:1)))}
-
-
-    # at this point, we know that num.available.ckpts is at least 1
-    # and l.d is at least 2
-
-
-    # If neither of the above cases, create a new instruction
-    ins <- which.max(sch.k < 0) # this is the first emtpy slot for an instruction
-    if(ins == nrow.sch){ # then we're about to assign to the last schedule entry and need to add on space for instructions before we can call obj.func
-      sch.k <<- c(sch.k, rep(-1L,50))
-      sch.i <<- c(sch.i, rep(-1L,50))
-
-      if(sequential){
-        first.index <<- c(first.index, rep(NA_integer_,50))
-        last.index <<- c(last.index, rep(NA_integer_,50))
-      }
-      nrow.sch <<- length(sch.k)
-      ins <- which.max(sch.k < 0)
-    }
-
-    sch.k[ins] <<- k
-
-    if( (l.d-1) <= num.available.ckpts ){ # We know what the solution is to this problem
-      cost <- d[1] + SolveSchedule(d[-1],
-                                   indicies[-1],
-                                   num.available.ckpts - 1)
-      sch.i[ins] <<- indicies[1]
-
-    }else{
-
-      if(exact){
-        tol <- 1e-4
-      }else{
-        tol <- l.d / 20 * 0.4
-      }
-
-      ans <- optimize(obj_func_for_SolveSchedule,
-                      lower = indicies[1],  # NOTE THIS WILL NEED TO BE CHANGED BACK TO LOWER IF ABOVE UNCOMMENTED
-                      upper=tail(indicies,1),
-                      ins = ins,
-                      d = d,
-                      indicies = indicies,
-                      num.available.ckpts = num.available.ckpts,
-                      tol = tol)
-      # choose tol so that we will get the exact solution when we have 20 or fewer locations to choose from
-      # slight approximation for larger sequences, but those being a bit off shouldn't be as critical to having the low level
-      # solutions all correct.
-
-      cost <- ans$objective
-      sch.i[ins] <<- as.integer(floor(ans$minimum))
-    }
-
-    cost
-  }
-}
-
-trim.sch <- function(f){
-  sch.k <- get("sch.k",envir = environment(f))
-  sch.i <- get("sch.i",envir = environment(f))
-  lookup.available <- get("lookup.available",envir = environment(f))
-
-  if(lookup.available){
-    first.index <- get("first.index",envir = environment(f))
-    last.index <- get("last.index",envir = environment(f))
-  }
-
-  # prune
-  if(any(sch.k == -1)){
-    upper.limit <- which.max(sch.k == -1) - 1
-    sch.k <- sch.k[1:upper.limit]
-    sch.i <- sch.i[1:upper.limit]
-    if(lookup.available){
-      first.index <- first.index[1:upper.limit]
-      last.index <- last.index[1:upper.limit]
-    }
-  }
-
-  # create dataframe schedule
-  sch <- data.frame("k" = c(sch.k,0L), "i" = c(sch.i,0L))
-
-  # Expand any incomplete parts of the schedule
-  while(!all(is.na(first.index))){
-
-    # identify an entry that needs to be expanded
-    c.row <- which.min(is.na(first.index))
-
-    # separate that entry from entries above and below
-    if(c.row!=1){sch.above <- sch[1:(c.row-1),]}else{sch.above <- data.frame("k" = 0L, "i" = 0L); sch.above <- sch.above[-1,]}
-    if(c.row!=nrow(sch)){sch.below <- sch[(c.row+1):nrow(sch),]}else{sch.below <- data.frame("k" = 0L, "i" = 0L); sch.below <- sch.below[-1,]}
-
-    kk <- sch$k[c.row] # this is the number of checkpoints we must apply over the range first.index to last.index
-
-
-  }
-
-}
-
-
-# Some code for file backed checkpointing:
-
-# X2 <- list(x=X)
-# system.time(fst:::fststore(normalizePath("~/test.fst", mustWork = FALSE), X2,
-#                            as.integer(50), TRUE))
-#
-# library(fst)
-# X.res <- matrix(0, 10000, 40000)
-#
-# # from and to index rows from massive 1 column data.frame
-# # split it up to read in 10 to 20 blocks of columns
-# # check if assignment to column is triggering a copy.
-#
-# Read to a block and then use a C function like the substitution one I have
-# to write in C from a vector to fwd$alpha
-#
-# system.time({
-#   for(i in 1:100) {
-#     X.res[,i] <- read_fst("~/test.fst", from=(i-1)*10000+1, to=i*10000)
-#   }
-# })
-#
-
-
-

From f595d726591d53d25d4eb33475fe7c32843cc0bf Mon Sep 17 00:00:00 2001
From: Louis Aslett <louis.aslett@durham.ac.uk>
Date: Tue, 1 Oct 2024 17:55:41 +0100
Subject: [PATCH 30/43] Remove incorrectly tracked vignette files from version
 control

---
 vignettes/.gitignore                     |   2 +
 vignettes/Decoding_a_Single_Variant.R    |  37 --
 vignettes/Decoding_a_Single_Variant.html | 416 ------------------
 vignettes/lct_example.R                  | 121 ------
 vignettes/lct_example.html               | 532 -----------------------
 5 files changed, 2 insertions(+), 1106 deletions(-)
 create mode 100644 vignettes/.gitignore
 delete mode 100644 vignettes/Decoding_a_Single_Variant.R
 delete mode 100644 vignettes/Decoding_a_Single_Variant.html
 delete mode 100644 vignettes/lct_example.R
 delete mode 100644 vignettes/lct_example.html

diff --git a/vignettes/.gitignore b/vignettes/.gitignore
new file mode 100644
index 0000000..097b241
--- /dev/null
+++ b/vignettes/.gitignore
@@ -0,0 +1,2 @@
+*.html
+*.R
diff --git a/vignettes/Decoding_a_Single_Variant.R b/vignettes/Decoding_a_Single_Variant.R
deleted file mode 100644
index 3e24034..0000000
--- a/vignettes/Decoding_a_Single_Variant.R
+++ /dev/null
@@ -1,37 +0,0 @@
-## ----setup, include = FALSE---------------------------------------------------
-knitr::opts_chunk$set(
-  collapse = TRUE,
-  comment = "#>"
-)
-
-## -----------------------------------------------------------------------------
-require(kalis)
-data("SmallHaps")
-
-## -----------------------------------------------------------------------------
-CacheHaplotypes(SmallHaps)
-
-## -----------------------------------------------------------------------------
-m <- rbeta(400-1,1,10)*1e-6
-pars <- Parameters(CalcRho(cM = m, s = 1, gamma = 1), mu = 1e-8)
-
-## -----------------------------------------------------------------------------
-fwd <- MakeForwardTable(pars)
-bck <- MakeBackwardTable(pars)
-
-Forward(fwd, pars, 250)
-Backward(bck, pars, 250)
-
-## -----------------------------------------------------------------------------
-
-p <- PostProbs(fwd,bck)
-d <- DistMat(fwd,bck)
-
-
-## ---- results='asis'----------------------------------------------------------
-plot(d)
-
-## ---- results='asis'----------------------------------------------------------
-d <- 0.5*(d + t(d))
-plot(d)
-
diff --git a/vignettes/Decoding_a_Single_Variant.html b/vignettes/Decoding_a_Single_Variant.html
deleted file mode 100644
index 0c07a51..0000000
--- a/vignettes/Decoding_a_Single_Variant.html
+++ /dev/null
@@ -1,416 +0,0 @@
-<!DOCTYPE html>
-
-<html>
-
-<head>
-
-<meta charset="utf-8" />
-<meta name="generator" content="pandoc" />
-<meta http-equiv="X-UA-Compatible" content="IE=EDGE" />
-
-<meta name="viewport" content="width=device-width, initial-scale=1" />
-
-<meta name="author" content="Louis Aslett &amp; Ryan Christ" />
-
-<meta name="date" content="2022-12-17" />
-
-<title>Decoding a Single Variant</title>
-
-<script>// Pandoc 2.9 adds attributes on both header and div. We remove the former (to
-// be compatible with the behavior of Pandoc < 2.8).
-document.addEventListener('DOMContentLoaded', function(e) {
-  var hs = document.querySelectorAll("div.section[class*='level'] > :first-child");
-  var i, h, a;
-  for (i = 0; i < hs.length; i++) {
-    h = hs[i];
-    if (!/^h[1-6]$/i.test(h.tagName)) continue;  // it should be a header h1-h6
-    a = h.attributes;
-    while (a.length > 0) h.removeAttribute(a[0].name);
-  }
-});
-</script>
-
-<style type="text/css">
-code{white-space: pre-wrap;}
-span.smallcaps{font-variant: small-caps;}
-span.underline{text-decoration: underline;}
-div.column{display: inline-block; vertical-align: top; width: 50%;}
-div.hanging-indent{margin-left: 1.5em; text-indent: -1.5em;}
-ul.task-list{list-style: none;}
-</style>
-
-
-
-<style type="text/css">
-code {
-white-space: pre;
-}
-.sourceCode {
-overflow: visible;
-}
-</style>
-<style type="text/css" data-origin="pandoc">
-pre > code.sourceCode { white-space: pre; position: relative; }
-pre > code.sourceCode > span { display: inline-block; line-height: 1.25; }
-pre > code.sourceCode > span:empty { height: 1.2em; }
-.sourceCode { overflow: visible; }
-code.sourceCode > span { color: inherit; text-decoration: inherit; }
-div.sourceCode { margin: 1em 0; }
-pre.sourceCode { margin: 0; }
-@media screen {
-div.sourceCode { overflow: auto; }
-}
-@media print {
-pre > code.sourceCode { white-space: pre-wrap; }
-pre > code.sourceCode > span { text-indent: -5em; padding-left: 5em; }
-}
-pre.numberSource code
-{ counter-reset: source-line 0; }
-pre.numberSource code > span
-{ position: relative; left: -4em; counter-increment: source-line; }
-pre.numberSource code > span > a:first-child::before
-{ content: counter(source-line);
-position: relative; left: -1em; text-align: right; vertical-align: baseline;
-border: none; display: inline-block;
--webkit-touch-callout: none; -webkit-user-select: none;
--khtml-user-select: none; -moz-user-select: none;
--ms-user-select: none; user-select: none;
-padding: 0 4px; width: 4em;
-color: #aaaaaa;
-}
-pre.numberSource { margin-left: 3em; border-left: 1px solid #aaaaaa; padding-left: 4px; }
-div.sourceCode
-{ }
-@media screen {
-pre > code.sourceCode > span > a:first-child::before { text-decoration: underline; }
-}
-code span.al { color: #ff0000; font-weight: bold; } 
-code span.an { color: #60a0b0; font-weight: bold; font-style: italic; } 
-code span.at { color: #7d9029; } 
-code span.bn { color: #40a070; } 
-code span.bu { color: #008000; } 
-code span.cf { color: #007020; font-weight: bold; } 
-code span.ch { color: #4070a0; } 
-code span.cn { color: #880000; } 
-code span.co { color: #60a0b0; font-style: italic; } 
-code span.cv { color: #60a0b0; font-weight: bold; font-style: italic; } 
-code span.do { color: #ba2121; font-style: italic; } 
-code span.dt { color: #902000; } 
-code span.dv { color: #40a070; } 
-code span.er { color: #ff0000; font-weight: bold; } 
-code span.ex { } 
-code span.fl { color: #40a070; } 
-code span.fu { color: #06287e; } 
-code span.im { color: #008000; font-weight: bold; } 
-code span.in { color: #60a0b0; font-weight: bold; font-style: italic; } 
-code span.kw { color: #007020; font-weight: bold; } 
-code span.op { color: #666666; } 
-code span.ot { color: #007020; } 
-code span.pp { color: #bc7a00; } 
-code span.sc { color: #4070a0; } 
-code span.ss { color: #bb6688; } 
-code span.st { color: #4070a0; } 
-code span.va { color: #19177c; } 
-code span.vs { color: #4070a0; } 
-code span.wa { color: #60a0b0; font-weight: bold; font-style: italic; } 
-</style>
-<script>
-// apply pandoc div.sourceCode style to pre.sourceCode instead
-(function() {
-  var sheets = document.styleSheets;
-  for (var i = 0; i < sheets.length; i++) {
-    if (sheets[i].ownerNode.dataset["origin"] !== "pandoc") continue;
-    try { var rules = sheets[i].cssRules; } catch (e) { continue; }
-    var j = 0;
-    while (j < rules.length) {
-      var rule = rules[j];
-      // check if there is a div.sourceCode rule
-      if (rule.type !== rule.STYLE_RULE || rule.selectorText !== "div.sourceCode") {
-        j++;
-        continue;
-      }
-      var style = rule.style.cssText;
-      // check if color or background-color is set
-      if (rule.style.color === '' && rule.style.backgroundColor === '') {
-        j++;
-        continue;
-      }
-      // replace div.sourceCode by a pre.sourceCode rule
-      sheets[i].deleteRule(j);
-      sheets[i].insertRule('pre.sourceCode{' + style + '}', j);
-    }
-  }
-})();
-</script>
-
-
-
-
-<style type="text/css">body {
-background-color: #fff;
-margin: 1em auto;
-max-width: 700px;
-overflow: visible;
-padding-left: 2em;
-padding-right: 2em;
-font-family: "Open Sans", "Helvetica Neue", Helvetica, Arial, sans-serif;
-font-size: 14px;
-line-height: 1.35;
-}
-#TOC {
-clear: both;
-margin: 0 0 10px 10px;
-padding: 4px;
-width: 400px;
-border: 1px solid #CCCCCC;
-border-radius: 5px;
-background-color: #f6f6f6;
-font-size: 13px;
-line-height: 1.3;
-}
-#TOC .toctitle {
-font-weight: bold;
-font-size: 15px;
-margin-left: 5px;
-}
-#TOC ul {
-padding-left: 40px;
-margin-left: -1.5em;
-margin-top: 5px;
-margin-bottom: 5px;
-}
-#TOC ul ul {
-margin-left: -2em;
-}
-#TOC li {
-line-height: 16px;
-}
-table {
-margin: 1em auto;
-border-width: 1px;
-border-color: #DDDDDD;
-border-style: outset;
-border-collapse: collapse;
-}
-table th {
-border-width: 2px;
-padding: 5px;
-border-style: inset;
-}
-table td {
-border-width: 1px;
-border-style: inset;
-line-height: 18px;
-padding: 5px 5px;
-}
-table, table th, table td {
-border-left-style: none;
-border-right-style: none;
-}
-table thead, table tr.even {
-background-color: #f7f7f7;
-}
-p {
-margin: 0.5em 0;
-}
-blockquote {
-background-color: #f6f6f6;
-padding: 0.25em 0.75em;
-}
-hr {
-border-style: solid;
-border: none;
-border-top: 1px solid #777;
-margin: 28px 0;
-}
-dl {
-margin-left: 0;
-}
-dl dd {
-margin-bottom: 13px;
-margin-left: 13px;
-}
-dl dt {
-font-weight: bold;
-}
-ul {
-margin-top: 0;
-}
-ul li {
-list-style: circle outside;
-}
-ul ul {
-margin-bottom: 0;
-}
-pre, code {
-background-color: #f7f7f7;
-border-radius: 3px;
-color: #333;
-white-space: pre-wrap; 
-}
-pre {
-border-radius: 3px;
-margin: 5px 0px 10px 0px;
-padding: 10px;
-}
-pre:not([class]) {
-background-color: #f7f7f7;
-}
-code {
-font-family: Consolas, Monaco, 'Courier New', monospace;
-font-size: 85%;
-}
-p > code, li > code {
-padding: 2px 0px;
-}
-div.figure {
-text-align: center;
-}
-img {
-background-color: #FFFFFF;
-padding: 2px;
-border: 1px solid #DDDDDD;
-border-radius: 3px;
-border: 1px solid #CCCCCC;
-margin: 0 5px;
-}
-h1 {
-margin-top: 0;
-font-size: 35px;
-line-height: 40px;
-}
-h2 {
-border-bottom: 4px solid #f7f7f7;
-padding-top: 10px;
-padding-bottom: 2px;
-font-size: 145%;
-}
-h3 {
-border-bottom: 2px solid #f7f7f7;
-padding-top: 10px;
-font-size: 120%;
-}
-h4 {
-border-bottom: 1px solid #f7f7f7;
-margin-left: 8px;
-font-size: 105%;
-}
-h5, h6 {
-border-bottom: 1px solid #ccc;
-font-size: 105%;
-}
-a {
-color: #0033dd;
-text-decoration: none;
-}
-a:hover {
-color: #6666ff; }
-a:visited {
-color: #800080; }
-a:visited:hover {
-color: #BB00BB; }
-a[href^="http:"] {
-text-decoration: underline; }
-a[href^="https:"] {
-text-decoration: underline; }
-
-code > span.kw { color: #555; font-weight: bold; } 
-code > span.dt { color: #902000; } 
-code > span.dv { color: #40a070; } 
-code > span.bn { color: #d14; } 
-code > span.fl { color: #d14; } 
-code > span.ch { color: #d14; } 
-code > span.st { color: #d14; } 
-code > span.co { color: #888888; font-style: italic; } 
-code > span.ot { color: #007020; } 
-code > span.al { color: #ff0000; font-weight: bold; } 
-code > span.fu { color: #900; font-weight: bold; } 
-code > span.er { color: #a61717; background-color: #e3d2d2; } 
-</style>
-
-
-
-
-</head>
-
-<body>
-
-
-
-
-<h1 class="title toc-ignore">Decoding a Single Variant</h1>
-<h4 class="author">Louis Aslett &amp; Ryan Christ</h4>
-<h4 class="date">2022-12-17</h4>
-
-
-
-<p>In order to demonstrate how to use to calculate and plot a local
-distance matrix <span class="math inline">\(d^{\ell}\)</span>, the
-package comes with an toy dataset of 300 simulated haplotypes, , stored
-as a <span class="math inline">\(L = 400\)</span> by <span class="math inline">\(N = 300\)</span> .</p>
-<div class="sourceCode" id="cb1"><pre class="sourceCode r"><code class="sourceCode r"><span id="cb1-1"><a href="#cb1-1" aria-hidden="true" tabindex="-1"></a><span class="fu">require</span>(kalis)</span>
-<span id="cb1-2"><a href="#cb1-2" aria-hidden="true" tabindex="-1"></a><span class="fu">data</span>(<span class="st">&quot;SmallHaps&quot;</span>)</span></code></pre></div>
-<p> maintains a special cache for loading a haplotype dataset (see next
-section for details). Since is designed for much larger datasets than
-this toy example that we would often never want load into , haplotypes
-can be imported directly into the cache using . can only cache and
-operate on one haplotype dataset at a time. Currently, requires that the
-haplotypes be stored in our custom HDF5 format but support for other
-common formats will be added shortly. In the following section we
-provide simple instructions for converting common file formats like VCFs
-and HAP/SAMPLE/LEGEND generated by SHAPEIT2 to our HDF5 format. However,
-if the haplotypes are loaded into a , we can easily import them straight
-into the cache using .</p>
-<div class="sourceCode" id="cb2"><pre class="sourceCode r"><code class="sourceCode r"><span id="cb2-1"><a href="#cb2-1" aria-hidden="true" tabindex="-1"></a><span class="fu">CacheHaplotypes</span>(SmallHaps)</span></code></pre></div>
-<p>From we can inspect the haplotype cache to ensure that the data has
-loaded correctly using . With the haplotypes loaded, next we must
-specify our model parameters. First we supply a recombination map, <span class="math inline">\(m\)</span>, where <span class="math inline">\(m^\ell\)</span> is the distance between variant
-<span class="math inline">\(\ell\)</span> and <span class="math inline">\(\ell + 1\)</span> in Morgans. Here we randomly
-generate a recombination map and set the remaining parameters to their
-default values.</p>
-<div class="sourceCode" id="cb3"><pre class="sourceCode r"><code class="sourceCode r"><span id="cb3-1"><a href="#cb3-1" aria-hidden="true" tabindex="-1"></a>m <span class="ot">&lt;-</span> <span class="fu">rbeta</span>(<span class="dv">400-1</span>,<span class="dv">1</span>,<span class="dv">10</span>)<span class="sc">*</span><span class="fl">1e-6</span></span>
-<span id="cb3-2"><a href="#cb3-2" aria-hidden="true" tabindex="-1"></a>pars <span class="ot">&lt;-</span> <span class="fu">Parameters</span>(<span class="fu">CalcRho</span>(<span class="at">cM =</span> m, <span class="at">s =</span> <span class="dv">1</span>, <span class="at">gamma =</span> <span class="dv">1</span>), <span class="at">mu =</span> <span class="fl">1e-8</span>)</span></code></pre></div>
-<p>Next we must initialize a forward table object with our parameters
-that will start at variant <span class="math inline">\(0\)</span> and a
-backward table object that will start at the variant <span class="math inline">\(L+1\)</span>. We then use the <code>Forward</code> function to
-propagate the forward table <code>fwd</code> using parameters <code>pars</code> to target variant <span class="math inline">\(250\)</span>. We do the same with the backward
-table <code>bck</code> using the <code>Backward</code> function. Note that <code>Forward</code> and <code>Backward</code> do not return anything; the
-tables <code>fwd</code> and <code>bck</code> are updated in place.</p>
-<div class="sourceCode" id="cb4"><pre class="sourceCode r"><code class="sourceCode r"><span id="cb4-1"><a href="#cb4-1" aria-hidden="true" tabindex="-1"></a>fwd <span class="ot">&lt;-</span> <span class="fu">MakeForwardTable</span>(pars)</span>
-<span id="cb4-2"><a href="#cb4-2" aria-hidden="true" tabindex="-1"></a>bck <span class="ot">&lt;-</span> <span class="fu">MakeBackwardTable</span>(pars)</span>
-<span id="cb4-3"><a href="#cb4-3" aria-hidden="true" tabindex="-1"></a></span>
-<span id="cb4-4"><a href="#cb4-4" aria-hidden="true" tabindex="-1"></a><span class="fu">Forward</span>(fwd, pars, <span class="dv">250</span>)</span>
-<span id="cb4-5"><a href="#cb4-5" aria-hidden="true" tabindex="-1"></a><span class="fu">Backward</span>(bck, pars, <span class="dv">250</span>)</span></code></pre></div>
-<p>Now that <code>fwd</code> and <code>bck</code> are at the same variant, they can be combined to obtain
-the posterior marginal copying probabilities, <span class="math inline">\(p^\ell\)</span>, or a matrix of distances based on
-the negative log of those copying probabilities, <span class="math inline">\(d^\ell\)</span>, as follows.</p>
-<div class="sourceCode" id="cb5"><pre class="sourceCode r"><code class="sourceCode r"><span id="cb5-1"><a href="#cb5-1" aria-hidden="true" tabindex="-1"></a></span>
-<span id="cb5-2"><a href="#cb5-2" aria-hidden="true" tabindex="-1"></a>p <span class="ot">&lt;-</span> <span class="fu">PostProbs</span>(fwd,bck)</span>
-<span id="cb5-3"><a href="#cb5-3" aria-hidden="true" tabindex="-1"></a>d <span class="ot">&lt;-</span> <span class="fu">DistMat</span>(fwd,bck)</span></code></pre></div>
-<p>The distance matrix can be easily clustered and visualized just by
-calling</p>
-<div class="sourceCode" id="cb6"><pre class="sourceCode r"><code class="sourceCode r"><span id="cb6-1"><a href="#cb6-1" aria-hidden="true" tabindex="-1"></a><span class="fu">plot</span>(d)</span></code></pre></div>
-<p><img src="data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAASAAAAEgCAYAAAAUg66AAAAEDmlDQ1BrQ0dDb2xvclNwYWNlR2VuZXJpY1JHQgAAOI2NVV1oHFUUPpu5syskzoPUpqaSDv41lLRsUtGE2uj+ZbNt3CyTbLRBkMns3Z1pJjPj/KRpKT4UQRDBqOCT4P9bwSchaqvtiy2itFCiBIMo+ND6R6HSFwnruTOzu5O4a73L3PnmnO9+595z7t4LkLgsW5beJQIsGq4t5dPis8fmxMQ6dMF90A190C0rjpUqlSYBG+PCv9rt7yDG3tf2t/f/Z+uuUEcBiN2F2Kw4yiLiZQD+FcWyXYAEQfvICddi+AnEO2ycIOISw7UAVxieD/Cyz5mRMohfRSwoqoz+xNuIB+cj9loEB3Pw2448NaitKSLLRck2q5pOI9O9g/t/tkXda8Tbg0+PszB9FN8DuPaXKnKW4YcQn1Xk3HSIry5ps8UQ/2W5aQnxIwBdu7yFcgrxPsRjVXu8HOh0qao30cArp9SZZxDfg3h1wTzKxu5E/LUxX5wKdX5SnAzmDx4A4OIqLbB69yMesE1pKojLjVdoNsfyiPi45hZmAn3uLWdpOtfQOaVmikEs7ovj8hFWpz7EV6mel0L9Xy23FMYlPYZenAx0yDB1/PX6dledmQjikjkXCxqMJS9WtfFCyH9XtSekEF+2dH+P4tzITduTygGfv58a5VCTH5PtXD7EFZiNyUDBhHnsFTBgE0SQIA9pfFtgo6cKGuhooeilaKH41eDs38Ip+f4At1Rq/sjr6NEwQqb/I/DQqsLvaFUjvAx+eWirddAJZnAj1DFJL0mSg/gcIpPkMBkhoyCSJ8lTZIxk0TpKDjXHliJzZPO50dR5ASNSnzeLvIvod0HG/mdkmOC0z8VKnzcQ2M/Yz2vKldduXjp9bleLu0ZWn7vWc+l0JGcaai10yNrUnXLP/8Jf59ewX+c3Wgz+B34Df+vbVrc16zTMVgp9um9bxEfzPU5kPqUtVWxhs6OiWTVW+gIfywB9uXi7CGcGW/zk98k/kmvJ95IfJn/j3uQ+4c5zn3Kfcd+AyF3gLnJfcl9xH3OfR2rUee80a+6vo7EK5mmXUdyfQlrYLTwoZIU9wsPCZEtP6BWGhAlhL3p2N6sTjRdduwbHsG9kq32sgBepc+xurLPW4T9URpYGJ3ym4+8zA05u44QjST8ZIoVtu3qE7fWmdn5LPdqvgcZz8Ww8BWJ8X3w0PhQ/wnCDGd+LvlHs8dRy6bLLDuKMaZ20tZrqisPJ5ONiCq8yKhYM5cCgKOu66Lsc0aYOtZdo5QCwezI4wm9J/v0X23mlZXOfBjj8Jzv3WrY5D+CsA9D7aMs2gGfjve8ArD6mePZSeCfEYt8CONWDw8FXTxrPqx/r9Vt4biXeANh8vV7/+/16ffMD1N8AuKD/A/8leAvFY9bLAAAAOGVYSWZNTQAqAAAACAABh2kABAAAAAEAAAAaAAAAAAACoAIABAAAAAEAAAEgoAMABAAAAAEAAAEgAAAAAKtAJY0AAEAASURBVHgB7V0JmF1Fla4kHTB7WAOJJs2+yY5oEFAZFY3IOiKDIphBBgdkwBFZRDDjKKiDSAQHlyFsyjKgIoJsSkCEEIeYsIQdEjCBsGQhGyEhb+qv7v/26eqqevfdezuv0zn1fd1Vdbaq+7/7zqu9+tRsMBoUAUVAEWgCAn2bUKYWqQgoAoqAQ0AdkL4IioAi0DQE1AE1DXotWBFQBNQB6TugCCgCTUNAHVDToNeCFQFFQB2QvgOKgCLQNATUATUNei1YEVAE1AHpO6AIKAJNQ0AdUNOg14IVAUVAHZC+A4qAItA0BNQBNQ16LVgRUATUAek7oAgoAk1DQB1Q06DXghUBRUAdkL4DioAi0DQE1AE1DXotWBFQBNQB6TugCCgCTUNAHVDToNeCFQFFQB2QvgOKgCLQNATUATUNei1Y
EVAE1AHpO6AIKAJNQ0AdUNOg14IVAUVAHZC+A4qAItA0BNQBNQ16LVgRUATUAek7oAgoAk1DQB1Q06DXghUBRUAdkL4DioAi0DQE1AE1DXotWBFQBNQB6TugCCgCTUNAHVDToNeCFQFFQB2QvgOKgCLQNATUATUNei1YEVAE1AHpO6AIKAJNQ0AdUNOg14IVAUVAHZC+A4qAItA0BNQBNQ16LVgRUATUAek7oAgoAk1DQB1Q06DXghUBRUAdkL4DioAi0DQE1AE1DXotWBFQBNQB6TugCCgCTUNAHVDToNeCFQFFQB2QvgOKgCLQNATUATUNei1YEVAE1AHpO6AIKAJNQ0AdUNOg14IVAUVAHZC+A4qAItA0BNQBNQ16LVgRUATUAek7oAgoAk1DQB1Q06DXghUBRUAdkL4DioAi0DQE1AE1DXotWBFQBNQB6TugCCgCTUNAHVDToNeCFQFFQB2QvgOKgCLQNATUATUNei1YEVAE1AHpO6AIKAJNQ0AdUNOg14IVAUVAHZC+A4qAItA0BNQBNQ16LVgRUATUAek7oAgoAk1DQB3QGoD+zDPPNNdee23lJf3gBz8wl1xySeV2f/GLX5hvf/vbldv9zW9+Y0499dTK7d53333mmGOOqdzuY489Zj71qU9VblcNdiDQ0pHUVHchMH/+fLNkyZLKzS9cuNCsXLmycruLFy82CxYsqNzu0qVLzRtvvFG53eXLl5vXXnutcrtvv/22eeWVVyq3qwY7ENAWUAcWmlIEFIE1jIA6oDUMuBanCCgCHQioA+rAQlOKgCKwhhFQB7SGAdfiFAFFoAMBdUAdWGhKEVAE1jAC69ws2Jw5c5IQT5482ay//vpJmUaZzz//vOnbt6/ZYIMNGlVNyj/xxBPmXe96l7nxxhuTco0yZ8yYYV5//fXK7U6dOtXMnj27crvTp093s1VV44DP7c033zSpd2bw4MFm2LBhjUJcV/6RRx4xt9xyi9l+++3rykIASwbGjBljhgwZUld+0aJFZtmyZebkk0+uK9vdAn1qNnR3IT3FPqast9hii2h1ME2Mqe19DxjnZFa8sTQq2wgDdvu1tJh3VezYli1bbvr0MWbAgAGNVKeu7PK33jKrV682gwYOrCvbiMCKFSvssoFVZvDgQY2o1ZXF5/qWrXOXL1//fm26K9+J24CM5AudVatWmb89/hczcuRIi7MFOhCOPfZY853vfCfAKUf60Y9+ZCacO8GMGDIil6HX3nzNDBs4zKzXsl5d+WUrlpm+g/qaWbNn1ZXtboF1qgXUv39/8/e//z2K6fe+9z1zy3UPmjvuuMksWLLCXHLKzeatO20r4+M7ZDpLrr4/Sw8+Zl/HJ2HVvPAaF8hJPcrH4pYRG5mYrZhOWXqZMqHLwHrntSd1aaNwHPm9QJ0aLYfP8VjLVIOWUNWt4nrPuPXWW5sRQzc1G8/pwDals7GxcjmXmi00LWajHfPZTZVZBW+dckB5AOu38SDnfDYYvL5Z/coS++IOd2pIIwz52ifMyjufyWjkgyDTTqD9H3ThhFbNeFmSu6T7jhhiVs9b7Oi+rZZdN6+r38VggwS/zAbVnTicNZ9T2kP9ETLeGngeV6D9J+tBWr0405lZT1L5ZRBQB+Sht+DPM8xXN/iCo05aeb05b8+LnSOiGJ0P8nQW5KVifvFSMil7efRTttcUL1ZPn+7n11T9tJyehYA6oMTnAecz4eF/c05Itk6o4tOYRxwLkpdyOL4+beel+3L18iH7IZpvRz6Pzwvl8cyN6oTsdDetkc+mu+vSm+2rA0p8uviiTBh3uXNCiENfHJ/m533zZV7smO0Y3S+7Xj5kJ0SrZyfFr9peqqwyvKye2gVzMGKQ/513ug7mYwIEM7wImGSYN2+eGT16tMvn+acOKAdKcD7n3TbeOSPpQPCShvLZy5vDdiMisizq+XUgvYo4j+1GnxXPENNJ8fg8IQzIi9U3VR51NU4jcPDBB5u77rqri9C0adPM
7rvvbv7jP/7D/PjHPzbrrbee2Wyzzcxtt91mRoyoP4OnDsiDdIAZaEbvso9565HnzAe+9Q9myrf+6CR+fN3fMickVfyX289DdsAntjHLb28buJa6jaZDtmEjRm/Ufki+atspeyke6xaS6bvZ4GycjnxJo64fU9and8prC8jB8fvf/75TC+j00083Tz/9tNltt93MX/7yF4MjXB5++GGz6aabmhNPPNGcccYZ5oorrugEZSijDshDZblZZl585AFHfeDLv824r//gPnOe/cOYkOuO2Zc+NJAaeqmXXjkts1M0Ie3iy8XA2Tnm/Tj0RZT6lIcdSadd0ORzoh6ypeK3SFhPKcMyQrGvH5LxaawD6SxL2mLal6UOY9YXeeogLenINyP0N/3NKNM2e1hl+f1NP7O6QYNo2TDcf//95vrrrzdYAIr1UTjn6TOf+UzW9fra175m9t57bzNp0qTo+inaUgdEJHLG7I59e/wNOTWqF6NzyGM5JBuiwVaIHqLlKVdlei4Cb5m3zCsvvWYuuOCCLpXcd999Df5iAQtUjz/+eLf4ctSoUU7shRdeMB/+8IczFazIxhlNOPtp4403zuihhO4FC6GSoKFFcM2dT5tvXn5kQqp7WagD/0Ilgccg05JGfcbgMS11ZDrTT8zyUUbjnotAzdTMO6veMdiS4f9hIDkV7r77bvPqq692OoESh7YNHTo0U8P2FIQ8h9ppCyiDrS2BMaDWjx3oMhy7QTxg08Fm+atL3FjOcz+630zAX3t3zDPRJbvx6fub+Vf9rQu9KKFeq0TyZZrlhWjgheigpbojMV6MzjowzitHecYhvRAN8jE6bTHOK0f5tTUeYAa4LUnnn39+w4/w85//3Hzxi1/stP1no402MjhFk4FpbGGpF9QBeQhhDGjZXdPNq2ae2bK9JYEB5BWiVUEVbNfIExa2r5zOI6syikBPRQB7Gm+++WY39iPriGl3dMMYkN5kk03MoEH19/ypAyJqIobzQZAtApmm6MQjf+m6LeiOYUwoJEM7coCT+o3E68qvcyOY1JNF9zH2mdTTVX5XBJ588kmD/ZT+Dn1cCHD44Ye7llFra6sbWzrqqKO6GghQ1AEFQGmEtMVRu2VjQhigjgV1IDFkuo8+/OPbVNr17b6arh2WZ86caXbcccds4SFr/f73v9+MHz/e7LXXXu7IGUzNo6uWJ6gDSqCEVgsch4ylOHjPnPUHRzrPxnLbBogcwMWvcJ4WEMuSZTAd48Xo1CsT57ENmUYCsQzppHiUT+Ho1xdLJxBidUzZYnkadyCAlk7s+iNc4/SNb3zDHYsyfHjbBu4OzXhKHVAcm+zF5QuMmE4FanAs5CGPFpAcmG60+V/vC8Gy/DpwpznqwICytzp1X/PCddNJyrojUp9M9yxinIt1h22mKVsm5jOEbKR4lK8nU49PO4hzyepCRAlZMo3D8fDXSFAH5KGFWbBUqPdl5DohnicEW+7L3WBLwa8DnAbLZgwZ0qVTceVZeTgfKevb9PPUo460SVmWh7xMSz7StEU6Y5/OssiXcci+5Pf2dIs9t2dTU387Q6M4vG1WmvlmYaNq3SLfYxwQFi1hY9tA7xQ+XA4nN8Fh5aX0skU2wDWCpP8lQJ4h9OUBH84H5wn1GdEua1sjVQRZtrTn02VepkP1DdmBTkwWY15YhiDtyjTtkQZ52Qoj3ZdDHmVKPvDzF6rF6kV7sVjapUzKVkieehpXh0DTHRBG1k866SR3VjCczf77729++tOfZlN4WNKNM4oZMAKPs5ARim6Ao61Q3H/0Jmb0gH0cC+t/GglcK3TN79va7V84bX+nfp3dR5YnUD8kG+PF6CEbjdJCtuc+Oc/tbYvZgg4C1kwhvWD+UoPBYAbSZZ7pYLx5Y2NMsBGqd9B2HuJ1eYRUpigCTXdA3/3ud92+EaywhAM68MADzdVXX+02tCGPkfdZs2a5TW54SJ7NW2YDXAqsN1+cbV5c0bYXrPX2xl7+5e2GuWbo
vg0Hmc9/fNvcG1GpH6pfjBejh2w0SitiW+rItCw7RpcyZdKV2l9nTkwvg3hx3aY6IJyHv+2225rjjjvOORacu4s9JX/4wx+cA3r88ced48HeEhw8jjUIDEU3wMGpxQIOIccY0JbHHOG6AxzExS/4BtaZIMjuBOipRYaQ/bb9w1EejewdQ9ejNq+ablvsWaumo86tH9m6Ez55yuCzMkaXDYE4k57HVkrG7wqmZH0e3hn+8Pm8fv36GfytKwFDHi+//LLBeh8/FBkOaaoDwod6zjnnZM+BD/pXv/qVcz4gYrctDjvab7/9DK50QfcLO2z32GMPt/Ky0Q1wcGJdbk7ISjdurGlbs7V5/uqb3ODfc+08bKOY356WM1Xz7ZiFzGNWBXl/doUD03BC+ELJQEcDOr/AoCH/vsN2MlMve8il35nxSqeyaINlMl9lnMd29qwWi+dsHeuFLvhwfKwdy+eYpyEvL/GmCONYfUHHuJUfUrYou9L+KGGrQcwB4eiJiy++mOK9Op44caI577zz3C0heNDLL7/cYA0QQtHhkKY6IFfz9n9wPkcffbQ7zOiUU05xVLSQPvjBD2Yf8Nlnn20OO+wwdw5JagNcbAcuWlCpzXa4FeOX511t5rzzspljXjZj520lq1g3zReaMRXwBaATQiwDBzvhYPAFRt4Njtov3hR+odu/nFKPab8s0quI89jOI+PXJaWT4vl2/HxMN0b39UP5/vY6JextWtO3YoTq0kzao48+6pwPDiDD1VaXXnqpOfPMM80999yz9p8HhMvfDj30UHea2u23325a7IeOgNWV+GOYMGGCawHhErYyG+BoLxQPHT3GjB3wD4416Ng9GhrQ5OAnB2JpnwOvPNQMu+k/tc8Yw8FqytWLYccPLNOnV5HPY9t/1nrlEouQXIpH+RAG5MXiWB1z2TozZnXdol922WXmS1/6Unav3gknnGAOOuggB0LR4RAoN70FhOl3DDxvt912zrnIg4+w8Q23iWJmDAHNYPS3sfmtzAY4Zyzxj90KvriMoSJfWklPmHNODGNImBHCFD0Gpu+YOtuNK4GG8PmDdjS3PjDbySAPeTgp0OisWJ6sA2TzBug3oos6QJ7lhsrhc0neIQd0zHqBfvOfOk6DTNmSPNiQerTPZ5Cy4MXqmXpe2pK2me4JcZ/+diWQuHOtsjqtWGjeXvFq8I48HKshj9Zgmc8995wbnz3iiCPccMiee+7pWkHglzkPqOkOCEu74Uwuuugidw0uHggtICznRssIzTyM/6AJ/F//9V/mQx/6kNtpW2YDHMqIBcyCzXrmjk4LwLJukacUm20J0r+we6aNFhCcEFpEDHA0MsAx0SEhjh3nwbLYlUutbaGsLCeVfmH6y647mNJbyC5juyHU40pv93+qTrHyYUPq+c8XqlOIBvs+3bfFOvhyjt4LZ8EWvjPfTJs+zYwdO5aPnsVf/epXzWmnnZblmZg7d677/l144YWuK3buueeas846y1x11VXuWmzptOR5QLHhENptqgPC+h7MeCGgGccAYB544AE3JjRlyhSz8847uxPWcALbDTe0nURYZgMcy0nF2BHf2i4gvwgpnRQPs2Wwc0n7lxOzY9hFD2fEwJkf5rFWFTr4ktcLVdTRLyOPTV/Gz/s28+Z9O34+r52QXJW2QvZ7Om2jlk3M2N3Gmsn3Tc5dVTiYXXfd1eAqagSMl6IV9JOf/KTUcEhTHRAeKHU1PbpbGOzCLAPubPe9adENcCnUMQbU2tpxIBmb6Yylrk9jHnEo+N2VF233Bi0hdMsWL1vpul/oivljQ9QLdSdYZqi8srQ8tmPPGis71lWCfIpHeyEMyIvFsTrmsjU5ZnXdomMpDG67YBg2bJhrFCxbtqzUcEhTHRAfpl6MLpnvfKhTZAMcdUMxu2Dgtdo/NssZg87g05hnTDnEaPYvslPrnHYHjQsVsW0D3Sy0kqZuuWGXtUVsCUHHD6GyfJmi+Ty288j45ad0UjzfTt58
KZu9sAuWFzcph1MQ0fo59dRTzeabb+5aPrvssotbp1dmOGStcEASiO5OYyGi3ADI8QKU6zfdwZM05qUO64uFcBjXQWuGAYPLaP0goCV0jY1fW7jCcDGeY9h/240ebm7//uROZZHHMplvJO6362YG0/+xkMd26Flj9kAHXjGdFI82Jd6k1YtT5dXTVX4bAh/96EfNySefbN773ve6tXRoAWGSCKHMcIg6oDZ8s/84kpUnIrZaauqF93nMM86M2gTGd7C4cKFY4XyrpcMJIWBWDIvluPraEdv/zbJ6IZtgx+hSP5ZOOZ+8touUn9JJ8WLPUY/eHTbrldkb+Rh0xpU7OGwe93/JUHQ4RB2QRNGm5RjQhmLmyhNrOMuWD6fdaWDqzLYWCFo+KM+NCbVPv0OGraYF9lweDU1AYHITyuzBRWIxr+98WN0iwyHqgIhezlgOXPqDtMzHBj1957P/bh23Buxgy8e6Fx7lIasDOfBk2eSzTOarjPPYjj1rrB54hphOikd7IQzIi9U3VR51e2Tc0s+uAxpeedX6LbGTJH0qN1vIoDogDzY5CO2xumT9wU3mGUsFTKWjCya7PRiEZheMa31utTR/Oh5y9dYBybKqSoeew7edR6YRnSL2aD+mG6NTLxnrIHQSnrJMdUAeghiEHjliR7Nq3hudBkvhPOQMlqeWzEL3pG/8g5vpMnbHuAxwPAwY/0H4xNc/bOa/udzsveNmbTqWFhtIdQoV/Cv7fD42ZexV8DhqYi1BQB2Q90HhQLKWAcNd03f93drGXdCE/8Buo8w9dz7VSfojH9/OTJk+J9g1koKQwzofdqXAw5iQ7IINGdjfrf/hNoYRGw50Olwn9HN7EFi3hwKHf2V1CumGaJnCWpLQA8m69YNSBxSAl3vByMK4AxyNH/I4H+hAjosJORgN+hOz3nDT7khvMnx9J8P9T5TDuNFXjurYxgFZDYpAb0FAHZD3ScoxoFbBC40jhGhCJUtCjucJMQaT5w35aeSl3AR7HtEpN3zO4CJEP6Br1l3TzEVs1+sqoq5SJlb3ImX72FSS1zGgDEYcmVP1+ezqgDJ42xJDd9jatG7SthUjNA3Plgmk/Vkt0NjSYRpxSA70RgLGinCyImbJ5LhRIzYgi7rIZ6C+T5d5WX8+H21IHmxJOtMsIxT7+iGZejTWqZ5cI/ys7pMb0erdst1xPnuPcUCxWzHwkaaOekzxCr0OS1fa/lBcs94XRvJlOm4xHwe2OEVf1C6/VDF90uvJpWpMG5CRaeqUdRZSP1XP0J461iEVQw+hjJNP2V9beWj9dMf57E13QPVuxUgd9ZjiFf2gZRcsZKNe9wEzWaHjP0O2GqVNtF0xBLSE/vOs21wa0/qyTo5o/8muDrd2+NfpUNaPsfcMgTZkN4ldQ8Ztkvn/Sz20MGPLC2IWoc/umbTlyxMryvp85n0+9cg32gVzUHTH+eww3HQHlLoVI3XzRYqXvTwFEv5eMJiQLym/zKD7jgZyCLzOhwvgGv2SOSPeP07Rg4yWEKb1ERr5pcYXftEMe6C4txQAdrD2SD7brHueNVvZ/WtYp4SxJz4bZKQs0tJBsZ7cVgLbqZByIik9nyc/o0Z4kOWzhZ7DTPatrbl8n5a+Xc4Xr6L0hSsXm+kzpruztXx72HR63HHH+eTKz2dnAU11QPVuxUgd9ZjixQ4Q50OnYn8vGGTli+kvEpS2ICedkhykLnMuMcqQdi+xX/qTJx7iLj8EnV8g1oX1JR15+QV9QexHkzry2dyz2NYVykKgTdaDMfUZS7pMk19FzLpIWyEa+DE6dWP8rO69sAU0aP1hpnVMq8H+LT/g2I1QqPp8dpbRVAdU71aM1FGPKV7s6A7cihHjARCMJ225qpXYBOPYCxsUFkR/al+wciWlA0EdOCOG7pg86J5OB0ZlXUNpypLHmBUin3nEsh6h7iZ1YItpqe/T/TKlbE9I46qmTTbZJHorBs5Jxkmda1NYr9/6ZvjQ4dlRx3nq
3l3nszfVAckHD92Kkbr5IsWLORlspHvppZdksZ3SOBb2rt/8zWy5yxGOLm/0pCAHPpGPDbJSlnFIjry8sSwXOlzEiEPNODtGW+iWgY/FjQh+N43bPygvZcCjPOXkAWk8q5kLJhd4G3ZZTzwzFm9iQSXCfdPnupj1Zr4INijD1wvRUGCM7irTzmda2uRztExuMTgPOXYrhjzDnHZ6Y9xd57P3CAcUuxUjdfNFipd6AeTZtb4cdvO++eSz5vkZNzlW6ytt0/FSTh6PGvr19s9Ipm7ZLth8e7UPA1oW7C7xckR0yRDgLHCwGb9M8uJEtj5wDIgf0OWAXfA4rjPR0vyBYpwAgzGtSfbP58GmHNO5rV2Gx9GCL9c+IV8kyDKoH6KBF6Pn1rNdMLwzMQdEO7097q7z2ZvugFK3YqRuvkjxevvLIJ8PzgCOA8d6HLj3GOd84GhIl7JMY4A5FnyedGDQkQPqMh2zl6pHTEfpPQ8B3NnXHeez97GDS00dZhs3bpxBywP3DuEWVATeivHQQw+Zww8/3Nxxxx2mtbXV3UuE/jhuaEzxin58OGj7luseNPvt/FlnomgXjK0PNuOZL1ov6NGWbwNbOHCWEGIEOCEedE8a+DKQDho2vMJ5UYb2KI/80893tCPYpUHs86DDeuKZmaatUFwEG9ZB2gvRwI/RqSvrKOtC+smH7tqUiwl///vfm/NO/4756Hs67sVjncvGs+c/aV4Z9LCZfO/khk1hTCx0PjsMvfXWW+4PN9rkDU1tAdW7FSN11GOKl/fhQ3Irn5hrlky/37HYxUILg+lDrjgyU5t03A2dBmUh93nbFbrklLajKo29Ox4hT0shMxpL2LEWfik4jgJR7B3jeAzyGBPiOA6cCzbB4qwhhCvPvM1Nte/QulEbwf53fJt/WtiBPMdoIIvroRk2sNPwaBUhhtPCtL48YsS0jwm5Z/bGh2DDdwgSG4kzywvG1q7s1jkZS5OtLX5eqE8XWWlU1FHWZYP2kwmkqKbbGgexMdYiB5I1vQWU50NNedYUL49tKYMW0O9+fLfZZ6NPOnJ/60DWszu63355cSYm19CguwI+A+TAn9u+c53rgPAlLRuGiRMR6Yhgk7/akoYd9LhzTNIgy3qN3H4Esp0CeJKOPOoPG9SDAmjy4DD/gDA+s5TpVJCX8fU9dtOyfI5vjt+neS2gsy8wH9/tpMoxmP3K42buivsLtYCqrkxTW0B5HyblWVO8vPalXJ+B62WLv/il58so5ZAmn3TIofVxje1+yODLSV7etO9MqBeiu4sP7ZYC3LbB7hjkUT/I+90s8KTz8fPy+VkeY8jKIOkyLWXKpmGXjpe2QjTwYnSpx7S02V11Z1katyGwVjigNflh1duKUW8WrMtS/vbKVz0LRkzY1UD3hQE0zGCBhssPsU6I3RvUH4fc+4EHivEgMWmXaehwNIixb0fSZdqXK5MP2Q3RUEaMzvJj/Ize1BFS1rL3xuqAvM9WbsWQX2qKye0KnAonDzG3KkhaFWlZF78OMs+y8GuOX3G0gLBOCLduYCwnJEsdP8bzSXnk9z7x/Z0GveX4kK9fLw9bUh9lhTD17YTkJI1OFHqS7tshn/Q8ZVNW42oQUAfk4YgTEQe27uaooVkwKR7iY4BYNuWlfFVplMFBYr8Okofy0CXE3jHMjnE2C10wP8iZNM6I0TafB3nakDTfVt48Brifbh+ohw5sssx6Nny5lK4v69tOPoueiOjDZVavXm2effZZs+2223biFTmZQh1QJwhtZlB/113xybE8WhkcU8GLTMcAeY4j8AWP2chDpy2UFSqDNsijPFc1g4+TFTE4HQp+HZGnDcZ59Cgr9aUesQKNdSUfun49yGNMGcRcqY1npB7Lp5Olw6S+jLe1t9BKPnRxCSQCzuSmI5Y6mjbmhz/8oTn//PMN1vAxFD2ZQh0QEWRszwOSYx4ky1h+uZDmyw+ZWLqq2R5ZtiyPXzxZPvigkwbnAyeEqXo/0Bmw
BUU9xlI+RCOfZSEv0yE+aYxD8uQxhgzLl1tEJB9p2qIs+TKG85F86EyxfxriCGDpDE6wkBu+y5xMoQ7Ix9prAfEFZQxxpBnzRWfeMRL/qAsRqZtQcSypJ2XxKy5/qUNykgYnhEO3ZMsI9lAXyNERIe/bhhxkKIt8vcCWCLt4MvZ1Y2VKOcjgL29I1TVlS2KWt6zeLoclL1/4whfcLvpzzz03e9wyJ1OoA8pgbE94LSC+7IyluE9Dnl9QKYc0W0CMfX4jefnl4K94Hn3Uj4sWedsG9dia4CJG0EO2+cyMqR+LpRzTjEM6sksU4hehpcqL2SuiE7NVmG7PA8KAetVh+cKVZu6sueZnP/tZF9N77rmnwV8onHHGGebggw82Y8eO7cQucjIFDagDIhJraSydkXwEfIFiPMhlx7vaAepGgnSwMh2zkUcmpqv07kFg1coVZsmSJebhhx/uUsDIkR239UomtkM98MAD7u/RRx+VLFPkZAoaUAdEJNrjlS++ZpY903YIl5z6ptgi8YvEtTPkIQY/RK83riRthNIrxDoflCFXZPvyWKEt+dxginrJ21ilE8J2BfdsdtaM8lxACR4Dt2JwZknyKMOYMshTjjTmKdtj4164Dmjo0E3cDNZPf/rTXLAvWrTI4DwgDDT/3//9n3nqqacM9oQ9+OCDZrfddjNFT6ZA4eqAcn0E5YVCzqwRq3JtC/ToJOBokH7fYTuZDYcOME+9uLCTWbmNAgyOyVAITggh1NTHFpINrP1QiPFkPSmDmPaRRpByIfspWkg3RMtTDusFWfnDkdF7yB3qKTy6m/f666+bESNGmEsvvdQVtWzZMrN06VJz0kknmRtvvNGUOZmiRzkgrC3AkZA4OIyhO+4iou1Q3H+Hkabl5Y7Nmv5CNtmywMI1/qLTVqjLUcWvPVsjKAdlMKCrhTphcJeD0cizC/al8Xu7AWc4HoyvYINqKJxz/jjXLQOPzwgb0FsQWasDPp5fDlaDhsApbuRl3R1T/JO6gpxM0onyeSEMGvN+OjSWxQKkLGmI+RyStq6mt9pqKzNt2rTs8ZH+2Mc+ltGOOeYYd2oFzpPGqRUXXHCBOeqoozL5VKLHOCCcNfLhD3/YPP/880b2Q7vjLqIUIMYOQq+3y3ucCL5c/JKFdHznE5IBLa9cTB906XSkXF46v5xSV6YxNT/a7hVjiwg82Pb1QAMmLBdpOXAMutsPZw9Go4wsx09LXZ+XyoccBGmMpX6IJvlIS5k8dff119V8mZMpmu6AcBwRRuO/8Y1vuDOZ5YfYXXcRyTL8dNm9YLETEf1yGs1ne5OsYqg7l3UZLJ9dCdAutd0z5jEOdat1EGxByDpwSwT2jsktCbAhj9vg83FPnD+2hXpiHxoCZZCmHOvOPHiNBtZB6kl8JD0km4ef2euFY0Dy+Yuk99hjj06LEGEDB9zjO4yp+rXmPCBU/E9/+pNzQLfccovZZ599QMpCd91FlBUQSAwdPcaMHtBWD1yvg53gcupc7gyXdJqSfNJCcuTljUN2oYtfavnLnbKHemBMaIF9JgSe74z0+rtt7p4V64TQYoMsy1wujhwBTfKgmwqN1o9lwmaoHNAaDdKm1E3ZynQmSw1NpxAocjJF01tAH/zgB910IG6s8MP06dPdKYn77befmTp1qtl+++3NpEmTDDxwkbUHKGOHHXg8l1+abYIvWGC2GTnWtLSfvcOXkDE06jXNQ184qd+11MYpfh38PCzCKYXokvbErDey8RtJhz63bbixHJv3+ZAhLa8DhE4q+Dj5eeiChnL9MkM0yKfqSFuQQ/BtgobZnh133LHTyl/QGT7/+c+bb33rW8xWGvfp36/TeVNVGW9Zai8KmNczRteb7oDgNWOh6ruIMLiN9QyxgGnJv9z5VCc2X2zGkunT+LIzlrJ8uSWPNCkXS8cGa9Gd4rGq1MW4DeQZOI7D+koeZGADYzGkQ57bNrCLHoF1hQzSlEXZclU1bGE2DnupEFza0hhg
W3YBWTfwYZf4QEbyqA8Z1oU0qevzaJN2fR1fnnzK9+vXYtA6jx1KP2zYMKpoXACBpjugVJ274y4ijOjHAtYz9Fm2yo1XcKyCLzBfVG6AhA2sHuaLSpvg45hTGXBsKgPtMJ83xs5xtt143Q50URb+/Nkt0KQcZbHVwpcFD192SYdTwcA0aHIWCfWALGIEuREUeewlQ5gyfU626ppX84DOZ0AaAUfBykB8GEse08Dc54dokOfn48tLW1z9LWX4HH1sQwHvTMwB0Y7GxRDo0Q6ou+4iSkElFyJyoDQbkLSKl4hFeeD7A624SZR6dGLMp8qtx7tSlFtPNsVHXXjbqZTz6RgHwhnSCMdeMM45Mzgb7hVjDL48S5n1hD2mIRMLEpvQRYe+HjCdb20TW/JBQwjRYVfWkTq0xUFzqZvVXQehCVe3xD3aAXXXXUQpJENXM0t5+YUBPZX3edJOo+k1YUuWIb+waMFhTCi07slf4yRtyHSe55UtkJi8tCnTvrzkyVk9KSdlQPfzUlbT3YNAj3ZA3XUXUQpKzIK1th7oRHDxnh/YpAc9zxfG168i30gd/K6J1K1XFzwf5NEdwfogTNH7R3lga4fEwS+vXhmS72blJCGSRhlca+SLcLMtu70pWejWre9kv4R1O48V0GgYbL755l2AWKsPJMMAsX9FWb9+/dzy74svvjh4F1HRtQddkIsQQtO0fGER+9PEzFOPszjMR4rJyJCPydJWJlwwQafiq/t0OhUMBvPLDB20hORB9/5WD9olFszHYvm8KEfmQzrAAXXj7n3KxPQg+/PLp1KsU0xb1K0K406F9KLM8ccfb+68806D7+WoUaPMb3/7W8Mrenr1gWS4qJAP6n+eRdYe+DY65e15QMvu6tiMirEQ2c3gGhq82Cumv2xG2nOM/eC/yJBD877frpt1WtTn67XNG/nUtvwA2xqD00Ogc2jjpP9L2Xr6UpZWMQCN84MQ3ICzbQnJozz8G0Co52NAOh0481IO5fiOhXKMqc9nIZ0xx6bIxzPJMiiHmLbIp46U0XQbAr/+9a/d5lNsl0JjAReGfuc73zEXXXSR0QPJKnxLcDGhMaMyi9L5gIjNlFxZjLw/voCVw5IPGQQMcIIuBzrbOPn+o9xFQpT7tQQpS6JO2MOGgBbMX3/zuEsvtOUjkOcy7f+gg7rDLja3oq6Ug+NBcBtg7SwfpuZxxjS6ZT4+sIEg9ZHn5llsbsUXnXmJFVZp+/agKwO32sZOHXA7+q2CtCv1ZZq2SJN5Pgd5vSmu1Vabd955x2BTqR/gXPDnh5122slce+21Zr311nMsbJeaN2+eS+uBZD5aJfKNHErfSDFs5jeiI2X5K00aWyt+qwFfbrTayEfsbwYlj7/4yEMHQcojDRlOSVMPU/BwPrh3jHqsl4yp79uEjF8n0NxYky2zbECdWdeytpqp39ceSOZ/7lXUZ8G0ufZcn78YXHPuB2ynOPvss32y2W677RztySefdIuBcXU0WkUIRRYFO0X7r0cPQrOSazKW0/Aoly0WzpAwDx5oqTxkEKjbliv2X54HBAuydUJHQstoRZAPGls05EseaNBnSw48mQYf3Rq0pFzrxHaTkMcgMJwQZsskBpBnoHPy7YPPFpdsqWBAu14LiLZTsWzJQM7/nFK6XXi9cBp+89HbmP32299MnnxPl8etR3jsscfMrFmz3DjQiy++6E5P1APJ6qFWks8XGLF0JvjihfL+F1LKSZ7UzVNFKf9c+4ZPaVvaIF/SmA7xuAZH8uAkWOZz7coTj/ylS8m1M5gd44ppbmrlnV++M4B91JlOkCueEUOXXR86JuSZZv0bjVFeo3b43I2W1dvl//Ef/9HgDwPQxx13nDnooINKHUjWt7cD1hOej1+qnlCXWB3Y6onxU3TMimFMSK6kpiNK6YV4OFgNf1WH7rBZdR17sr3//d//Nffc09FiwjE5OClx9uzZvedAsp7yAbxq2gbXWkWFQr+IPs3PU13+gsdk
KLu2xhwTarT+3O/FGPoynbLnYxlrDYIesplXP1WHdYWHQeuTTz7ZPPTQQ25bCu4G23LLLd1frziQrKd8kBiETi1EbKSeHJupYkAUtkJ2YvRG6hmTzWsb9eL0+ckTD8n2h/H5aR/dLLmvDHT5TBgzgqMAjeNH1C0bF7Y5uWzJvUP/yCOPdAfS77zzzmb58uVuABuzX3379jVr9YFkPe3jwSD0rGfiO+Zjv7J8DsnnPjH5Sws+vlwYbJV06sdi2vL5/hgL+LCLcvzA8mI8jAOxKwbZRXbdElpv1IM9Pl/IBvjYK4cxIblYkTZfgIANoTqDjnL4nBgj4ngReAyyLqTVi2N1TdnKdHrhIHQ9vEJ8OJqJEyeaCy+80MyfP9+dES3lii4K1lkwiaJN40zo1k3iWzE88ULZvFsOpPG8rRGp00iah5PJlkeeMiHD3eQsD9s1sFiR2zZkK4cyjNlK8m24rRbtywAoixi2qJOyK3WQls/SkL7eDd8JSqwRwgH1oVBkUbA6IA9JLERcZg9CQ8h+BT2ZvFkOPssxIOgWmW6OLbzDSYZvv7y4U5VQHssGwy9f8qjI3d/gUX55u23mIUs+bWBxpNxdDzq6WpiqhxPC7BhvwoC+XzcujpQ2IHer/UMrka0llgd90iCXN0idRhYrmia2gPr165s527zPmUduyJD4GVx59KuU6VEOKHQrBh42tcktxasSKNri9DHy7FqQh1iuo+Fq5ZCc1MmTxixOaCDV6W7f+ReJU9u+XdaD9ZJ88Pxn2/UDo12Z1IM8dJGnDa5opi3QMRvGbRtIR+ttlaRt2qg6ptNsxG6GhbaAGoGtYdke44Bit2KkNrmleA0j0a5QbyW0bPbL7grLA9+n+/mQDPVjMQdnfb7ftYBt/OHEQgz4ysB6gO8H8CQdeZZJPehARspiRTO7NLTpnI+V4xYOtoRoT8pnX/R223welsM8bReJWZ58vnp2GpGtZ0v5cQSa7oBSt2KkNrmlePHHrc95540lnW5G9X892RWAJdk1oWXJ596tkBzl88bbnvj+bP+U1GEZoMn0X9svAJSyrIesI/ngSTryfleFfF9WlouWGveekf59exD+10/Zz/znWW0HnIEu5WQdWCZp2Dvmd+HIyxv7NqlHPJiXMZ9V0jRdPQJNd0CpWzFSm9xSvD59ih+43W+jweZd7247thXjKy6IWyFG2u4Ofx1D+7tCe3dCco1+lGg9hPZPhVo6Mduox0c+vp07LtWXAU/WXeZl/SHzgd1GORuh1kmonpDDWBAuP8RZ02yRoLtGLFEflHOUPe6Dx38gD758blkX/xlieT4Xdf18SA8yrp4Xh7jrLg0XO7zxxhtms826XnBZZDik6Q4odStGapNbihc7ugM3HOCGjViYM2eOGdl/B/PWI20bD/rePsTgap7lt3ecW8zjOGADdPAZcOzGANt18YPU93m58944D/WwMdTvapHnx/hS3WMP3ecX0OfLPOo80k7LwwEgjQF5dJeQpw2k0To58Ni9MlUeRg8eHU22mdXuHUNgHudDz5vfsSMbdv0AZ8fyfF7ePGb4UE7IfsoGnmGVXYC3//77u/UuIdkjjjjCfO1rXwuxehUNPZUTTjjB3H777WbQoEFm0003Nd///vfNBz7wAfecRYdDmu6AUrdipDa5pXgxB4SDlHB+SSxcffXV5q+/mGrkSmg4FXz5uGbE3ywpnQvkfL5flpxZo01fJpSPDdbGZtTQhfC7GCzP39iK8sDz6XITK/hcl+PLyvvoOSgtu3B8HvDQ6sENrHKdEPnA8kqLtwxPWceLz6DNdbXVU/LzpG9ub83ADkIeW8Sin13/8oMf/CA7hsIvL9QS8GV6Qx6737EK+oknnjCDBw82WAmNnfN//OMfe+95QLilYvHijilmpnEWSYoX+8DRNaPHDsnce++9Ztrgx8ym89tmlaSzYFp+sUkL2QKN4wixDXf19KVdbu6UNKT5hffpdD556+vXReZlGuUgT7t8
Rr98SUcdMeYzywrBkf6nzaM7hm4ZumwMtMs8ngG60lYMS+qEYv8sJdpL2aIM3hms9F3Xb8VYvXq1u/MdzgfhwAMPdC0/3IRaZjik6S2g0AtD2ujRo91ZI8yj24UzTNAETPEoXyRevXS5awFtaka4VgG+FGw5wN6G7auYkZZ05BHkl5VOICTXJp3/v/yi5tfqPFDOesg6olsFpwCepLt8e0HkdYrbeXxG1gktHL+1hi8z6k8edLB3zH8mWSbt+fYh02jwHQ1tpmzhc252aGnp0+kOtarqM+PNV8xjjz9mDjvssC4mjzrqKPPZz362C/2QQw7pRLviiiucY0YPpshwCI31aAeU2uSW4vHhysTohrUGDMjbIgLsqFNKvewhOz6NTsKn48vVqG0pz+M3fEfLcigbi+m0sHIZ4ZJTbqZqFuMLT6cEO9CRU/RwRgg43pXjRpSng6Qx6GIZAORYd/JSsW8nJCsxyD7nJi5EDNWxCtrgocPNZnY187HHHtvFHG4frheuvPJK8z//8z/mvvvuc6JFhkNYRo92QKlNbikeH66nxPzylqlPFTZS5Ze1T4eSKkPyMMCLgLEgrBNCjC8994JRlo6IedQTcp1XOJEbj307IcmyGIRs9kTaoMFDzMa2J3HooYc2XL0LLrjA4JIIzF6/973vdfpFhkNYcI9xQNhj4t+KgUqmNrmleHzAIjG6X36Qv47k+TTmEfuBL7fkkebLhvK0HeJVQStjHyuveRYQt1Sg28WuTqh+bOmg5YSxIOeEhCAdhj/2hXqiNYNAGaEWTfp2ICg/C1+xkc/G1+2t+a9//evuGNY///nPZuutt84es8xwSI9xQNnTBBKpTW4pXsBUXRI2ow7eeV8nx6Y+f61B5BcHaUlHHgF8nx6itUkX+49zoKfOfMUp+8db0CLqIOsKeohG+dD2Dcr7z0MdxhjL4XXUXDVd75lpE3rQx8ZVOCPaoW13FXS7wyEtJEdeKEZZITshWdJYPzOZlHU7xpgPZonvvvtuM3z4cPP66687QDbccENTZjhkrXBAa/SjX7qy05hK9iK2V8LP+3UL8UM0X6+RPM/eoU7MfogeosFOo3SWzZjnRDMfirnjXvKgh4AYdZD3jiFPPnVA85+fvFRM+ykZ5cUROP/88w3GetjtouRLL72k5wERjCri0KH0eZvj7MaEmva0IXmk5ak3bfuyPMvZp8fkfTnmQ/IhGuUZQ2YD20LhIDTXQWH7A7tg7DLBCWD8BnVmYGtmyMD+zrFgQBrdMayYhq3P2wPO6HD8Fh3LAo6oB0IIU9xwi3JCA+RSHnLZ4DMr2AsHoflojcRPPfVUUrzocIi2gDxY0QUbuEnbGANeyHpdCU+9bhb2sBK40V/kWD3QIghdIV23IjkEYmVKVcggcBAazgbPB4fC7hS3VkAOdUWdGajn59ES+rElgs8yKMOY3T3mUzHs0BFSTtaDtC5YTiZH43oIFBkOUQcUQJW/pgFWaRJeevmFzGsw9GXJq5tHLuRsWGbMAcAuZCSfzxeyV68e0g5XSqPlIp2UlPHtoWyMj0l5PgPrKnX8OkrbUk/qaLpaBNQBBfCUzfIAO0riCy1fZAqXfaFpm/YYx+jkl4lpO1V3yMhZMPnlB88PsCXp0GXAYDT3iaGFCDlcfugHtiBJp03Is7tGHmLQfUcGeui5QjTINiO02G0gGw4dUHnRQwetb4pv1662OuqAPDxxIuKs6XdkVKxLyeuQuDaFcWakgkSsHjF6o0WG7IRovl3IzLLjPTyCg+M+sWl4YAkdBugyQFduLUGe2zZ4lAdo/vQ7bcY+J5R3qd3SwbqxPF8++Lw6BkS4uiVWBxSAleuA2BVjHBBtmCTHLTiImtdIqB4Y1/C/kHnt+XK+/Ty2/XEV36afR11jOuBhuwYD8+iOgc5WjP+8rDdj6jNmedTz81KOMqRp3L0IqAPy8JWD0KF1QJ54qax0RkUNoctQhZ1Y+VXYlt0a2JN52R3zy5J5OB8E
xNiy0UhAeSiHjoe60j5o6A4u8PeA6ZGshCuLcR4Q7gnDkRwyFDkPyN+nJ+2ts2n8ksZ+TX1Q8GLzz+dVnS9bDvRjIcSjo2C5oZgytIs8aTJNPg5QiwW/DjLPsSWMCYXqkaKlypN6GINiHoPZSGvojMDSpUvNAQccYK699tpODJwH9O53v9uMHTvW3Rc/b17b5Z6dhAIZbQH5oNiFiKvajzPFrRAIPEkPaXmYF+iSR75PA72KQLt+HWBb0pCHrE+ba49G9WmQRaDTaMu1/acN6NUL/LKyjpCXaerPsPWSAXoom/rkgQZ9eUIiB5i5WJF1Zj1D5eF5QYf90HP4eNDGz3M8M+u6rsQPP/ywGT9+vDsTSD5zmeORe7wDevvtt11zjw+M81mw3oChSLOPuqH4zRdnmxdXPOBYrfZExOWekJ/32F3kyV89r+NcI9IaifuOGJKJh+pQhpYZDiRCdn0xyPgD73n0YAcnTHJzKVqd/sDwJHtImR8m2MWM59023kwYd3nGYnlsudIO6c8F7ECZ/MyQn9BB6AyRf/qnfzKnnXaaOxUxI9pErz0PCA+59957mxkzZmTPi+MCcCobQtFjIDNjORKhL0UONRXJiYBceUynkVLl5wHnAyeEjaxTvvVHt8ARtvLYSNlfF3hLFi8yr732mrnpppu6PO6OO+5odtgBh+V2DfgeDhgwwNxxR8csMaR67XlAaP3MnDnTzJo1KxvwQgsIoUyzzxmI/BtgBhrMgvFYVgxc1jt3xv/VDZmWLZgQPy+NX8C88lKujK60UyadqkOK55cJWWzbOHDvMWaqTaOLhVYY6DKkHJJfXiO6sozuSre09DUjNhxYufm+7yw38+a92mUcBwXhDviYA4LzCYVeex7Q448/7hzPmDFjDE7jx5EdDGWafbQRijkL1mqZ3DbA5fkcrwjprQlas8vv7mfM83yUQcyBadxFj71j+JxAR+CUPdIcK0JaBspKGtPQcQPmk0npPfGo94xxm0pvvPHGSh6qV5wHFEJiur0iua9dDYqbLKZOnWrQ/Zo0aZLZY489CjX7cCvG4YcfHirK0XAz67B+bVfyUIgvPPKxF5my3R03u/zufr5G7dPJYJ0QPydiROfEfMy25PvbOHDUCaab8c7gQoNQGDdunDnxxBNDrHWG1mvPA8IBZbi2ByewIZx99tnuHNunn37aHQ0wdOjQ7EPmYdkLFiwwqVsxvvSlL2U6fgK/CM9OX2jefuSldtbumQhfcLl4EN0zuXCNeX+9CYzIFz0z2kAC5cuyqMoyma8ypu3YqmaUFXrWVB3wDDGdFI82iQHueufhZ+ShJYQxIYSplz1EcrA8OC9/d/wldve9H/r06Wv++Z//uVPrW8psscUWMrtOpnvteUCY8sMfw4QJE1wL6LHHHit8K8anP/1pmusSY7zpyetvMnNXtHX11rvqPdnsjj/LA2V/bIh5xrKAsrNg88UsmLQbKkvyy6Rpu5/dLhEbS6FMI+XEdDAGE+P59v3xG/C/Pf4GAyeEFpGsb8gmptmljG+f+b52zPFTn/rUOn8rBvEIxWWOR+7R0/A333yz2WCDDdzFcHhwDECjKYwmX5lmXwhE0nA3fGvrgYYOA+MKcqaG40GQB33cDw+iavQCPcjlGYQOfaloHOXikj6EKdPnkOxiroORxBCNN5pKOabZwmNexuia4GgNXO7nD4peZ8de/LU0UtdPp+oQOrAspI97yLAhVV5qSEx4ntBfRw93qpCNrX/6iP3swGfrlPjKMi/a4ySZ1bRF4Le//W0XHIqeB9THdnN67EoHHAH53e9+143/4F6mM8880zz66KPmrrvucpekoW+OKcHW1laDrhWu7Jk4cWIXcPISvve975lfn3eTaV0x2qm0fuzATqopB9FJMJChQwuwcpHyOLBchtZyIfkZIM3gt2YwRY8WkU+nfCymTepddM9JZvGSxWu8BYSLAC++5Cfmx5d3XnEcq3cj9If+cp+54icXmXvu+VMj
at0i26NbQEcffbSZMmWK2Xnnnc3y5cvNqFGjzA033OCAKNPsSyG58SG7mtYFezsR2dpJtRDAQ+Avqcvov25BQH4OxB0F+dijG4buGM6ajp2/BH0OZNMGB6Ize5PB0dBdCPRoB4Tu1qWXXuoGoRcuXNhlcLlosy8F5qKnX+t0HAdleVQDf4EZgx8aH6Jed8T8lYZt/lLHypH1hIzUjenAJvUYx2TXNJ1rfVBHibtfT/CusX843lV2oWV9IbOB5XNgGzZvbR/sz3BtYv+gb98+7mRJWecq0gPeZb/2bcvpqjBXykaPdkB8spaWli7Oh7wix0BSNxS/+cSzZpTZvguLL6QfdxFcAwTWAUX5Xzy/eCkLnp/35ZmnHGPQQ2WBJoOUJz2PHmRDurQh45BciIbB5wn2D90xrBMKOSK5nQNlhAasZdmarhYB3Q3v4YmV0DL4XzDJW9fSoS85aZiqxx9DXtyowxh6/IMtphnTfiMxnA82sDKUsUUbGleDwFrRAqrmUfNZwSzY6AH7OOEBn9jGzfBwh3Q9C9x57c8K5dVP2adtXyZG9+WK5PPY9p/V7Np2gkCsvNDsHGWXbz6k7oxaCstUfeGE0BLCLBl31aPclD1Xr8nuv/7rJgTUAXnA1tsN74l3ynJnNeNOzJKZmM0YvWRxTj2P7Twyfl1SOimeb8fPx3RJv8aO76TGhHx7Lt/EMaBgfZpMrPr0CXVAiQ8UU+eY/paxFCePNOZDU+achpc80qifimnbl4nRfblG86wn6+jnaa/FtnjYDSMtFRPLkEyKR3nWh3kZx7BgHTkmRJ2ULcpo3IFAd5w+oQ6oA1+XGjp6jFuIiIychvfENFsHATldXkc0yPb1OeWeTY8HtfIR3WmH9mRFdMvqho6F+HVFe7NAd50+oQ7Ie2vQBZv1TNt5J/xFTv1SsmUAMyk5r5hCWZZVtJxYCwGVqceLVZgYkc+6YesI0+Qh9svhM0kZpOUUeyjvy6fyfh0n2pXpCBgT8mfButjRLpiDpLtOn1AH5L1xQ3fY2rRu0rYCusoWUN3BTq8efrbLYK8voPkgAmjtyEFnKcSBaSxaRAi2riY7VlP+tdh1QKF70cpWZtbTM829kyd3OlmUNs855xyDPz+UOXTMtyXz6oAkGjbt3wvmsQtnQ62BRowtj2xGbcRGb5bF1HpoLAo73EN0YvFty+eu/6BcL2wBvXeXXdz+Sv9kQ2CCNXehUObQsZA90sKlkatxZQjEuhqVFVDSUOwLXNJst6iH6gon4i8ihFzegG0b6I5RJ+iM8hrr4XLY1I1ztrC/Mm8oc+hYqgx1QB46y80yj1JNtmwLqLsd2NrwhWOXOLSi2Xc++NTyPBNkODuWa0yomtdhrbPSXadP6Epo71XwV0J7bM02EQE4npDzCVUJLRm2ZkJ80qQMD7rf6tQHc+rGAAALXElEQVR9yda4HQEcOnbdddcZnMW1ZMkSc8EFF9grk44qjY+2gEpDqAZ6EwJYKa2hKwLddfqEOiAPa9kFC3WbZFfIn9718zQdskNe3rjfrpuZd2a8klc8KpeqY+rZYgb9Z+tvrzZGPf1yWH+0ONDtYV7qo3yZD5VJGVlXyFGPdHa/SI/Z4iWU4EN34pG/dKLaHeuKWHecPqEOqCvOGYUvc0awCTTPOd7g8/089UBPfREol4pr89qOyIAMv1wp+RgvVUepE5OTMkj7cqhnjC67OzE5354z5v0LyYRooXp4prrUn3wcZgYndNFAPRGRmCCu+vQJdUACXdy68eiKx83CTRc56kMzpwlue/KErqR6lCX2Pu2Wvv3sh5d/1qGLzT/ZA1zsuhCzumNeeNmyZe6Y2th9TV1s5CQsf+sts3r1ajNoYOeTAXKpz4xIWfoKe88b7nobMtjOTsXkIuop8tv2yqa3bJ2HDum4PTYln4tn6/erbc5x10HFbsTIZaegEE7+vO/ee81eu+ycy8KcOXPMRhtvbN6VY2ZrqX1v3l7RM7qaPfpI1lzI
Vyz05JNPui9flWbPO+88dw/TZz7zmSrNmh/96EdmoHUSJ5xQwCsmanLllVe6W0fOOOOMhFTjrFtuucXcf//9BkffVhlg86qrrjI/+9nPqjTrLsXE/qdHHnmkUrt5jGHdDe7F23zz9OkCtOUc0EYbBRcXUoYxTheFw8aNM80O2gLyPgG0gqoOOFh/5MiRBtfeVhlwBvagQYMqt7vZZpu5X/6q6ztt2jQzfPjwyuv70ksvGVzLVHV98SWVl2FW+dnVs4XPAH95Q9XPnrfcsnI6DV8WQdVXBBSBwgioAyoMnSoqAopAWQTUAZVFUPUVAUWgMALqgApDp4qKgCJQFgF1QGURVH1FQBEojIDOghWGLr/iTjvtZN797nfnV8gpuc022+Sads1pLhPDTbOY3q86YCYQl0xWHTa261/23HPPqs2aoUOHmrFjx1ZuVw12IKDrgDqw0JQioAisYQS0C7aGAdfiFAFFoAMBdUAdWGhKEVAE1jAC6oDWMOBanCKgCHQgoA6oAwtNKQKKwBpGQB3QGgZci1MEFIEOBNQBdWBRSQrHTWC3Mf+woVEGXG374osvSlIyjWMxnnrqqaDMq6++ahYtajs6xBdI8Sj77LPPuk2nzCNmvRmvWrVKsk09u2+88YbBMSGhkNKth0vMLuvJ2K9vPbuheiptDSJQ01ApArvuuisO7Mn+7O76zP6ECRNqds1Kza6Hqe2xxx41e+RCxoslzjzzzJo9NqET257JWzvggANqdm1RzZ4FVPu3f/u3mnVUTibFk0YefPDBmr0VoWaPccjI1tFl9eYzfPOb38xl94knnnB12mqrrWrvec97ap/73OdqqAtCvTqlcEnZTdUX5absgq+h+QiY5leh99TA/trW7PENtVmzZtVsK8D92V9m94D2zBr3xZw9e3YNtGOPPdb9xZ5+/vz5tS9+8YvOnu+ATjvttNrRRx9ds62r2vPPP1/Dl/7WW291plI8CMBRXXbZZTV7zYpzNtIBXX/99bV99903qzueYeXKlbns2kPLa3CWsI96fehDH6r993//d13derik7KbqW8+uq5j+azoC6oAq/AjseTe1UaNGOYu2K9bJ8r//+7/XvvrVr2Y0e+Kda72w5ZIx2hNf/vKXa8cdd1zt0ksv7dICslek1NCCYTj33HNr+KIipHjg33333a719cADD3RxQGeddVbt1FNPhVjNr3/KLp7Bnhdcs+fyOF38s4ew1Q4++GCXT+mmcKlnN1XflN2skppoOgI6BlRhd3f69Onuwrf99tvPHZBlu2MGh3AhvPDCCwZbHBjGjBnjxlswthEKF154oZk0aZIZNmxYJ7ZtkZi///3vXWyBluLRCE7Be/jhh81ee+1FUhb/7W9/M1OnTjXbbrutq79tZZnFixfXtYuL7nCdL7ebYBzsV7/6lbGtoLq6KVxSdlHpWH3BS9kFX0PPQEAdUIWfg/05ccdc3nTTTQan9L3vfe8zhx12mMFAaOpq21AVYuc8YyDXtgzcPiXqDbFnIS9YsMANEMd4lMWh4rGAPVWHHnqowXnEtoVlZsyYYWwrI5dd2oTzgePCaX6nnHJKXd28uPh2UV6svuDltQtZDc1DQB1QhdiPHz/eXHvttWbTTTd1f3YQ1LVWcJlbVVfbwg4CWiYMb775pjvyNcWjbCq++uqrzemnn+6u7LWD5OZf/uVfzG233ebqDr1QmdIe6vGJT3zCXVx3++23u3vG69UpDy4huyg3Vl/w8tiFnIbmIqAOqEL8b775ZnPfffdlFtGFwI0KdgzE/aFbwIA0z3QmLU+MFgz0fFvo3qV49Wyj+4Zu3+uvv56Jov5bbrllLrvoStqZOXeI+u9+97tsN329OgEb/1kkLjG7qfriAerZzR5SE81FoOmjUL2oAvZmhhqm3e0vdg0zYpiR+uhHP+qecMqUKW76HYPPtiVRs9fa1r7yla/UffprrrmmyyA0Blht165m1wDVZs6cWbPOp3bvvfc6WymeLAyD
zPbN6zQN/+lPf9oNlGPwd+7cuTUsKbA3TeSy+8lPftLVad68ebXXXnvN/dluYV3derik7KbqW8+uxELTzUNAZ8EqxN4ugqv967/+a80OMNdsN6y2++6715555pmsBDtQ69be2PGRmu2qOEeUMSOJkAOyrRQ3zW27GbURI0a4GSiqp3iUQRxyQPYamNq4ceNqW2yxRc2eB1Q7/vjj3ZQ65FN27eC7c2ZwaPLPnqUD1aQu+DFc6tlN1TdlFzwNPQMBPQ+oGxqgWI27cOFCN0jqm8fKaPzhepqyAd0l2Glp6XquXIpXr1ysrraLFIOHnZWxm9Itg0uqvmXs1sNJ+eURUAdUHkO1oAgoAgUR0EHogsCpmiKgCJRHQB1QeQzVgiKgCBREQB1QQeBUTRFQBMojoA6oPIZqQRFQBAoioA6oIHCqpggoAuURUAdUHkO1oAgoAgURUAdUEDhVUwQUgfIIqAMqj6FaUAQUgYIIqAMqCJyqKQKKQHkE1AGVx1AtKAKKQEEE1AEVBE7VFAFFoDwC6oDKY6gWFAFFoCAC6oAKAqdqioAiUB4BdUDlMVQLioAiUBABdUAFgVM1RUARKI+AOqDyGKoFRUARKIiAOqCCwKmaIqAIlEdAHVB5DNWCIqAIFERAHVBB4FRNEVAEyiOgDqg8hmpBEVAECiKgDqggcKqmCCgC5RFQB1QeQ7WgCCgCBRFQB1QQOFVTBBSB8gioAyqPoVpQBBSBggioAyoInKopAopAeQTUAZXHUC0oAopAQQTUARUETtUUAUWgPALqgMpjqBYUAUWgIALqgAoCp2qKgCJQHgF1QOUxVAuKgCJQEAF1QAWBUzVFQBEoj4A6oPIYqgVFQBEoiIA6oILAqZoioAiUR0AdUHkM1YIioAgUREAdUEHgVE0RUATKI6AOqDyGakERUAQKIqAOqCBwqqYIKALlEVAHVB5DtaAIKAIFEVAHVBA4VVMEFIHyCKgDKo+hWlAEFIGCCKgDKgicqikCikB5BNQBlcdQLSgCikBBBNQBFQRO1RQBRaA8AuqAymOoFhQBRaAgAuqACgKnaoqAIlAeAXVA5TFUC4qAIlAQAXVABYFTNUVAESiPgDqg8hiqBUVAESiIgDqggsCpmiKgCJRHQB1QeQzVgiKgCBREQB1QQeBUTRFQBMojoA6oPIZqQRFQBAoioA6oIHCqpggoAuURUAdUHkO1oAgoAgURUAdUEDhVUwQUgfIIqAMqj6FaUAQUgYIIqAMqCJyqKQKKQHkE1AGVx1AtKAKKQEEE1AEVBE7VFAFFoDwC6oDKY6gWFAFFoCAC/w89Lthpxi605QAAAABJRU5ErkJggg==" /><!-- --></p>
-<p>In some applications, one might want to symmetrize the matrix before
-plotting as follows.</p>
-<div class="sourceCode" id="cb7"><pre class="sourceCode r"><code class="sourceCode r"><span id="cb7-1"><a href="#cb7-1" aria-hidden="true" tabindex="-1"></a>d <span class="ot">&lt;-</span> <span class="fl">0.5</span><span class="sc">*</span>(d <span class="sc">+</span> <span class="fu">t</span>(d))</span>
-<span id="cb7-2"><a href="#cb7-2" aria-hidden="true" tabindex="-1"></a><span class="fu">plot</span>(d)</span></code></pre></div>
-<p><img src="data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAASAAAAEgCAYAAAAUg66AAAAEDmlDQ1BrQ0dDb2xvclNwYWNlR2VuZXJpY1JHQgAAOI2NVV1oHFUUPpu5syskzoPUpqaSDv41lLRsUtGE2uj+ZbNt3CyTbLRBkMns3Z1pJjPj/KRpKT4UQRDBqOCT4P9bwSchaqvtiy2itFCiBIMo+ND6R6HSFwnruTOzu5O4a73L3PnmnO9+595z7t4LkLgsW5beJQIsGq4t5dPis8fmxMQ6dMF90A190C0rjpUqlSYBG+PCv9rt7yDG3tf2t/f/Z+uuUEcBiN2F2Kw4yiLiZQD+FcWyXYAEQfvICddi+AnEO2ycIOISw7UAVxieD/Cyz5mRMohfRSwoqoz+xNuIB+cj9loEB3Pw2448NaitKSLLRck2q5pOI9O9g/t/tkXda8Tbg0+PszB9FN8DuPaXKnKW4YcQn1Xk3HSIry5ps8UQ/2W5aQnxIwBdu7yFcgrxPsRjVXu8HOh0qao30cArp9SZZxDfg3h1wTzKxu5E/LUxX5wKdX5SnAzmDx4A4OIqLbB69yMesE1pKojLjVdoNsfyiPi45hZmAn3uLWdpOtfQOaVmikEs7ovj8hFWpz7EV6mel0L9Xy23FMYlPYZenAx0yDB1/PX6dledmQjikjkXCxqMJS9WtfFCyH9XtSekEF+2dH+P4tzITduTygGfv58a5VCTH5PtXD7EFZiNyUDBhHnsFTBgE0SQIA9pfFtgo6cKGuhooeilaKH41eDs38Ip+f4At1Rq/sjr6NEwQqb/I/DQqsLvaFUjvAx+eWirddAJZnAj1DFJL0mSg/gcIpPkMBkhoyCSJ8lTZIxk0TpKDjXHliJzZPO50dR5ASNSnzeLvIvod0HG/mdkmOC0z8VKnzcQ2M/Yz2vKldduXjp9bleLu0ZWn7vWc+l0JGcaai10yNrUnXLP/8Jf59ewX+c3Wgz+B34Df+vbVrc16zTMVgp9um9bxEfzPU5kPqUtVWxhs6OiWTVW+gIfywB9uXi7CGcGW/zk98k/kmvJ95IfJn/j3uQ+4c5zn3Kfcd+AyF3gLnJfcl9xH3OfR2rUee80a+6vo7EK5mmXUdyfQlrYLTwoZIU9wsPCZEtP6BWGhAlhL3p2N6sTjRdduwbHsG9kq32sgBepc+xurLPW4T9URpYGJ3ym4+8zA05u44QjST8ZIoVtu3qE7fWmdn5LPdqvgcZz8Ww8BWJ8X3w0PhQ/wnCDGd+LvlHs8dRy6bLLDuKMaZ20tZrqisPJ5ONiCq8yKhYM5cCgKOu66Lsc0aYOtZdo5QCwezI4wm9J/v0X23mlZXOfBjj8Jzv3WrY5D+CsA9D7aMs2gGfjve8ArD6mePZSeCfEYt8CONWDw8FXTxrPqx/r9Vt4biXeANh8vV7/+/16ffMD1N8AuKD/A/8leAvFY9bLAAAAOGVYSWZNTQAqAAAACAABh2kABAAAAAEAAAAaAAAAAAACoAIABAAAAAEAAAEgoAMABAAAAAEAAAEgAAAAAKtAJY0AAEAASURBVHgB7Z0J3F5Fdf8nC4EkLAlbIGxBEDWAIAgVLaLUreCGVj/UWlncqKKCtYorUqu4tiKlVbug4l+BQhUFBIpVqSIGkYR9J4AsIZAFsm/vf77z3N/Neee9975P3ve+eUJyTj7POzNnzjkzc3Ln3DPLnRnVFyE4uAZcA66BHmhgdA/K9CJdA64B10DSgBsgfxBcA66BnmnADVDPVO8FuwZcA26A/BlwDbgGeqYBN0A9U70X7BpwDbgB8mfANeAa6JkG3AD1TPVesGvANeAGyJ8B14BroGcacAPUM9V7wa4B14AbIH8GXAOugZ5pwA1Qz1TvBbsGXANugPwZcA24BnqmATdAPVO9F+wacA24AfJnwDXgGuiZBtwA9Uz1XrBrwDXgBsifAdeAa6BnGnAD1DPVe8GuAdeAGyB/BlwD
roGeacANUM9U7wW7BlwDboD8GXANuAZ6pgE3QD1TvRfsGnANuAHyZ8A14BromQbcAPVM9V6wa8A14AbInwHXgGugZxpwA9Qz1XvBrgHXgBsgfwZcA66BnmnADVDPVO8FuwZcA26A/BlwDbgGeqYBN0A9U70X7BpwDbgB8mfANeAa6JkG3AD1TPVesGvANeAGyJ8B14BroGcacAPUM9V7wa4B14AbIH8GXAOugZ5pwA1Qz1TvBbsGXANugPwZcA24BnqmATdAPVO9F+wacA24AfJnwDXgGuiZBtwA9Uz1XrBrwDXgBsifAdeAa6BnGnAD1DPVe8GuAdeAGyB/BlwDroGeacANUM9U7wW7BlwDboD8GXANuAZ6pgE3QD1TvRfsGnANuAHyZ8A14BromQbcAPVM9V6wa8A14AbInwHXgGugZxpwA9Qz1XvBrgHXgBsgfwZcA66BnmnADVDPVO8FuwZcA26A/BlwDbgGeqYBN0A9U70X7BpwDbgB8mfANeAa6JkG3AD1TPVesGvANeAGyJ8B14BroGcacAPUM9V7wa4B14AbIH8GXAOugZ5pwA1Qz1TvBbsGXANugPwZcA24BnqmATdA60H1p512WvjhD3/Yeklf+cpXwj//8z+3Lvff//3fw+c+97nW5f7oRz8Kp5xySutyr7nmmvDXf/3Xrcu95ZZbwtFHH926XBe4VgNj10Y9NlIamDdvXli0aFHr4hcsWBBWrlzZutynn346zJ8/v3W5ixcvDk8++WTrcpcuXRrmzp3butwVK1aExx57rHW5LnCtBtwDWqsLj7kGXAPrWQNugNazwr0414BrYK0G3ACt1YXHXAOugfWsATdA61nhXpxrwDWwVgNugNbqwmOuAdfAetbAJrcK9vDDDzeq+Je//GXYfPPNG2nWNfO+++4Lo0ePDpMnT15X1kb622+/PWyxxRbhoosuaqRb18xZs2aFJ554onW5M2bMCA888EDrcmfOnJlWq9rWA/9vTz31VGh6ZrbccsuwzTbbrKuKB6W/6aabwk9/+tPw3Oc+d1BaCNgysMcee4StttpqUPqFCxeGJUuWhJNPPnlQ2pEmGNUXYaQL2VDks2S955571laHZWKWto963RvC3EefDmvmLgqjNhsT+laujr9VYWVY0Y93szCuX5p8cGN22CqsWbC05F20YGEYO3ZMNGxb9JMBrXgQNGqzsakcxQkpFxg9YfOwfMnTYdxmE1J6xcolYRVZsW5jx49J5ZKBDPLyusGvdiQBFX+gWbNkeVi2bGkIW4wLW4QxA6iQD6AXAXIBcPADyAJIS+6KvtUhajKMHzU24eAbNWFcWLNwSdLD5hOi3iK91QMyJEvyctzKqKMl8xaEbaZsT1YYNWl86Iv6V10kT6H4VTfSorVlrVq9Osy8f0aYOnVqGDVqFGQD4Ljjjguf//znB+CHi/j6178ezvjMGWHKVlO6EjX3qblhmwnbhHFj+z+TVcxLli8JoyeODrMfmF2VvV5xm5QHtNlmm4U//vGPtQr+0pe+FO558NFw1llfC5878cKw6Pe/rqW1GWOnbBdWzVm7v2XCvgeGFY89FMbts1tY8j8zQ54P741hZtgl7JzE7P78F4cHb7o2TJ0yPTwy57ZAetWcBWURyEYGedAAwq2aH/PGbVfSjt1+Ulh2071lWpEJrzwwrJnzdL881YsQGDthUlj1dCx3sxDG7dupe8IX+Ske5QOjp6x90yJXOLV33J67pfKQJ7njnr9boltx00MJR2LsATuHZVfdntpDHeHf4vl7pfZLp+AFaoPao3rAN+FFHbokf0rUwz33Jr2hE/RZhjEPPtVDccqg3hZufejGgCfUtldsy6iK77333mHK1juG7R9e+39bRSfc9iHSdbnVLGoibDe9O7mSP1LhJmWAulHiHTMfScbn0//51nDCeReHHcOU8HiY08w6p3/+7rFDYix2/J8nO7xZPsJkfIhjfCzIgMjokDeVB8xAqpPkKkx00yvr
OzV2eqBfW8RXhFNDxwBCN/UmQ1vkowsZvmAMJPQJIk71gh9IRrOQm+MSwaz0N/FRx8R/05x+elfdJY+wxBX1gE84GS7VZcc5nf/Dsn3xv0vGHhxtoZ4duSnwP+tJA26AMkWvumNOWHTtr5PxOXflBckYTXhsUXqbZ6RlkjeovACQm73q2WFa4SFgjPL8krGIKB9vYPdZnbfz6J22TLmkAeURAqKz5YIXHXEL1KlvzqJ+fCoXOuKUOe2xjgdg41aO6jVqSqd+5CFX6WmzOvxjDtgpsZGWLELohINg8wN3DstnPprqRR13v6rTfvKm8SeC+CiH+tFmaC3AJ9zqWY8Fyldd4Of/UPWQTGTZeoJXmrIStP8FTUfuM+zvsmXLwuo4JM1h/PjxaX4T/PLly8Oc+LLafffdc7LatK+CZaoZs92WyW1nGPTlb/xfwBPioUwdlE5a8UOExW9TGAnhFVoai1PchsTprOJRnFBx0YuGsAonfM5naYmTL7Bx4erCwWir8sEJT6g6lmFhgCnT0pEWDXGBDDNpDE0VSA55Nl5Hm2iqp36qWDZq3Otf//rAhHv+Y8EC+Pu///uw6667hsMOOywcfPDByRB1oxA3QJmWVj+5KA0zGBYtveLucMZR/xk+deZRpYfD29f+xG5xC2c9WtLbfMW7Dcu3cMFAGQLFbbnCiYZQ+cStPNEqJL+XoHqUYfRYBKq3QuFtuCrqXLDG8ApHaPlt3NIoTn6i2WSWaNTy6vDSSy9NK2esnvF7//vfH175yleGAw88MPzmN78JfMB8ww03hHvvvTfsv//+4WMf+1i1oAzrBihTyJrFcQWoADoDv9MPPiucccOHBhgV+yZWnJAhgEAdCrzkCWfTFideQtGow5QdoyBSuVU84MgXjX3rg9NwQ2WrDPhsnDQAvZXRwXZoabM8P8lVfl1IGQy/4FUdCbd9xwv6eTEqU2GVPPGTN/41/YdnVfTgBqtnU3l1MjdW/Lhx4wLDLX4YmgsuuCCce+65aXWQUw7e8pa3pKEX20I+8pGPhAsvvDB0s8DuBih7YpaGJRmm04llhOyDro4Lg42TFp1C8onrJxqlCXngU7qYKynTMW9SnPMQje0YebmigxYgP6cRPhHEP6K1cm1cdNawCkcILZ0Zzy8HDYcIc5mk9zz2wMRr61glR3IlT2mFln9F3ELRDVQZ2W74nuk0a8KasGz5svDQQw8N+LHvqQnWrFkT3vWud6WtB7vssksivf/++8O0adNKNvYjcUJBNycf+CR0qbZOZHzo7LOxaB5uOinDMQvquOCI204gHktfFbd06hAMIXgz2A6rYd3oOWvnN9IbPA7BbblNnVfli09pwrqObfNUH4WWnzge0LzC+xu3c1zmZi9VbMuYaGgU5jyPxEn/wQC9UCZh3fDK/l+o7MHk1rVjML71lb9Z3A9hV0vbKndJWBxmzZwVXvKSlwwQeeqppwZ+dXD11VeHxx9/vN/5SxxZsvXWW5cszBMBHOmy/fadvVllZhZxA5QppMoDgsR2coZj7BNi3sE++DJCFicDY3EqUjIVYgRED03qcNH4AdbwpHQ0eHgklh58acQKPnCCUl5htMaEzuQ6+XUGQnlJBsYkejo5yDNaaDKsF0K5VXyQMwSjbKufVM+IE8hQEGKYq4wQeqA91vigTzxCjLIMulx+yYQ+QWEw83TYCCehtwlbhz/5kz8Jv7rmV1Jx1+G//du/hRNOOCENxcS03XbbBc6QEijOBs7BQP8fg9F5vtEAxofVsRyavIicdrhpW5aND1fuhsAv4zCSdcHQaM6qrpzSGNURbGJ4vhS45JJLwjvf+c5+LWfZnWGYgPgOO+wQJk6cKFRt6AYoU03VEAwS+4bG89Gc0FH/+Nry7Z57RJno2qSVXUuUZcgLgFdxSwLe/uhMyYOIeGAoZdZ5MeAxgnUdmnLxkuSdqZ55Wnjk1BlV2kp5016+d/qJh2V4cHheMi7QzvvejeXQTZ4VeOjwjAj5
seJJHZVWKPkehnDHHXcEvibIv0/jONzzzz8/fY/GyZ9f/OIXw7HHHtuVynwI1pWaqonmL+p891Sd61jXwMalgdtuuy1Mnz693Hio1jGcO/HEE8MLX/jC9ME1S/MM1boBN0AVWkrfRsUdnbmXkKfP+fzPEzf7hNi0yFsUsG/vnCcRFH9sHnF5KOJXGnLFCROYOZIOovM35Vfk8UbPAU9haTFpnOflaeoEveTYeJ0nk8so615kkK7ibZpIVz3mz1tcisdjWnDV3WH2L+5JdSQjzfvEOqvMfA4IGtpQgo2XSI9YDeDp1B3+zyUGn/zkJ+OHzMvCpEmd3fuWty7uBqhCM/qWSJPDkGAglJbh0OQrxuejHzw8nFEYIFx8TQ5XhSrSykt0cYWrxMXOk4YMZhJaNOKvCsWjOiaeYtiV08uY5PiqtIYtdXlV+BxH3WQQyLPGh3oyiVwFlo96MHG9QoY4Mix9vLM6xmqbbRO04JJOiriVb2kt3uND0wB7gPitC/gc0Lpoq4H2+jseb8j1LNeAa6BKA26AMq10swwPC0MBeSsMvS7/8KXh9MtPLHGZ2HI4h2ci70Q0kqN0N6GGacnDiXWxgHzwkqsweQKFRyWc5SOO3LrJZnl80FV5D1VDJ+RRLjKt94MMlsgFA3QSPRaB5Ut6N3nQUBe1xw6roGV4Bj9xC9CRR5j/LN7yeLx9DfgQLNPp1s/bO0zY4cCwe+yofF3Nw8kDbjsfLLj36jTqFGxUBIchwiP6xVV3VvLCL94Uj50DeamjYKBiWp1OdMoTnvqoU8ErSPlF3VQv8lI7Yog88WEYBMKRBp/KyzqtaAmRJ+CYNqWXR95Djtk3zLruwZRNWl+8IxM6cAAGi53QzN1Y/VK+rXsizv6k9sT/F5W7OrZLcdUfvTA3JJ1ZEfyfMpRTnnRBXasMqeVdX/Gx8dwejkBpG1bE49/mhQVtix2SvA3GALFtm+9MJkzovxOZy+HsMQCcTGfHmUM5AqBJU6sfnB+NxkPpfBiO1GCSVm9XOq/ikpFw8UG3eIzPIc/dMVz53d+XHYv8nN+mU76dA1IBRUgHEQ0oladQ5GxYTHTU1dSLDicZOb/aoB3L5Nu4ZBPKZbZnQyJXacq87rM/L70o0slDiSG80IHT3AwyVS/mgPL2KB9DkegiL4BMG8InnOSTT5xybQheOOoBkA9IBmUl4+Qfoya9jNSfnhsg9hbwZS1nBWNsXvrSl4Zvfetb5SamQw89NOiTf5TAHgTOQgY4AuDss88OfCi30047hcsvvzxMmTK8N8aY3SeHcTvsFj2gSWUnomPoDU1nrQKLv/PBBcn4pLd0JE7eSsFn6dJQJ+5K5m3Pjwdex0rozayOShpe4SVHoeokOtJ8lKmVOdLKk7ejkDzFFQon74U0oPLlbSSk8Ybk3SifNHFCeBW3slQvcLRHdZBRUJmJLtIID73A6kH8ylOY5GCQCl3LmJIPzspVmRvjTmjpY0MI7f9BT+rzhS98IWBk7r777vTjyNTzzjsv1QWDxN6D2bNnl0cB3HjjjSlvOEcANDUUD4jjPTmOY2V03/lhQOybmbh+kqU0oYYUL3/Vc9JRHtCArwMefD38ivMGFihPaUIrz5Zt+WR8LG3ipTzaUITCKVR5hMhIdEUdkc8PT6HqJ1rlkSZOKD7iAn0LZusoGaJRmwgtr/IJc36bp7jkSIbCxG/qRFq08QhrB6MBRhz0xyog78EHH6zKqsX11ADxuf4+++yTPCCGVpy7+7KXvSz87Gc/SxW+9dZbw4477phO+x87dmwaomn4NdQjADBqdb9V8ZR3juPQGcnpbVzhuQjf763Lm7v4yVtiYpp5IeaEJh53UL//BDqM6JRRPvRCxNDS2E6WyopvbUDlEpZv7pTT+QNeHonQ4PDACC3gCdR5ENAh35YhubaedhJbsjQJDb1wyGMehnbj+UkWnpulUXl4Y8Kz6xlQaNsIv/AqFz7kEEpGXk/w1EET16mA+C1Y3fMC
3k4PJPqN+M83vvGNNNI4+uijw7777ht+97vfla19Rh5IhtH51Kc+lU5SoyX8h/7gBz8IRxxxRGoY161wnc3hhx+eTmI74IADwh/+8IeUN5QjALgVg2tL6n6nn356vGliVTqQjELo8PrZdKpA9scaB9Eq1D6hjKWUnZchOjqm8mScCBW3b3Dx1IV4IZJXRyO8OrzSeajywUtuTlOXljdEPh1d0E1b4BXgZQLyoIgrn1D54IFu5EMjGR2ueOlIvHGDjy3rnpkPf/jDIt2ow5tvvjnQP+h/OAbve9/7wmmnnZbaPJzRSE89IPs/hvF529velizsBz/4wZSFh8SRARdffHE6t+SQQw4JxxxzTDp7tukIACvXxvmOBTex7sf1KnhaOchLIFS8jqYKzzAGT+iDF/5Vv2zJU0hmisc3MZDe2EWZihM2GYjcw0iCij+SYXHE5REIj4GRNyKcPAfwtnyl8SasQcn5ZbTAqzxWm/BqJE+dX6HKbgoHo8Uzo2yVWSdLBor62VWwzeI1RHzdXffMnHXWWXUiNyr8N7/5zfDud7+7vNbqPe95T/jOd76T2jjU0QjMA3tbErl+/3AI0hvf+MY0mXzFFVeURoDvS/gJzjjjjHQKG5ewDecIAMmrCpv2AdUZH+TgqZCvsEr2N976/9JwjG/Ivn7EN6tIGnHIrtstLEY6pDoTuLr6VMlKRiN2wCqQTOTToWU0LK3tuDIM0EmucPCAG7/j2r05mrwmD/kqj/RwQMMsDJFWvKrkYaAokzpiSG1bquifybjF8TwgRhCf+MQnBjTjz/7szwK/HDhqlemRN7/5zYELJjn3+ZxzzklkyCJPYA8kG+w8oJ57QCy/H3nkkWHnnXcOP/nJT/otw/Pp/zXXXKN2peMfx4wZk45+HM4RAKXAHkQwPpO33LwHJXuRzzQNcJEi85Gt/+JNrnj6VcPKuvvPHnnkkfDVr341cDj9ZZddllT58Y9/PIVDGY3o/6LnHhAft2FM/umf/ildg0vFUA4ftOEZMc7E4qIYFMD8EGeNwPemN70pHY7EcZDrcgSAGl8X2ksDocFbsGFKVPwRXZ5l8fJ8ONRMH7Dyluatb5e85WHoDY5M64FZmbY87QOyOGh1oJnlY4UPSPnRe9PhYODqhizUE1DIvh7iqi95ydso2oRXgXdDiEztA6IszhKAD36OMmEimrqoPqqr6o5s5KR8czJkwts2FmUlWVc9XcpNuol5AG9e1Ym0lcvmxRI2wlWwCaMnht132z3IgJRtbYhw4iFzsNwEC3CJJ17Qv/zLvwxrNNJTA8T+Hq14MY4UcLXHtddem+aErrvuunTKPmfMcgYth10DwzkCQOVUhVttv3M4ZNVhKcvuybGdTJ1P/OpENs3Drk7JsMnyQ6eJ6S/H+NTnTgk7TNo8PG/aduH2F+2edhFreDJ5286hTnz9vbQYtoC7v+j0eV3snArlKJ/PHvhoU3VSfRRCa4ceNk6eIA2nYkL1E16hTkXUfBBDGcnSsAsa5dMW2sa+XOpIqDpquCk+6s8QCd3azzgoW/zEyzKjcQPgRyahhoGKqx7wUJ7SlJXg/E6wqf9lWMVeO8E20YuiT3JDxnBGIz01QFjUppPzGW4xzmSijzvb8/HkUI8AkBKrwqefeDQ8srxzS6YuBbRzO3orW17lC6d07rHYNDus/yF2Jo7y0Gcb8M9dsDx1EjoKnUQdgXQyJnHSFpwOP6uqD29zgfIXFp6G8sDn9cQwaDndxiWLUHM19mt0m2/5wZOWLHjhE472LI3toW20ByOidsGruvdFzwhvCZCnovbIWMEHDkD+gsKroo3ywBRCozh0gPRCXZOeE5aEIpt2yDGseD+nnHJKmi7B83n+85+ftskMZzTSUwPU7X8pQ7Lc+Ih3KEcAiLcq5ERE3dVuDYZo1WlJ2/x++GIVSxOb4rWhVo302Qa7p/GAtp23JOwQv6XCEAnwjkiz5Iy3BGiQYOsg+jwUTeqsxjhBp7ycZ32k
qQ+elLwS0rY+Nk4ehsEODVN7iopaWlC5rLw9iTfqopRh9FLicqZNOP2KV7winHzyyWG//fZLc0d4QMzRAsMZjTwjDND6/n/XXe16A+cPt+ojL4K0aFM8Psw2LXob0pkYfvDBKsbn7a/aJ3lC855aGmZ883dlx8AL2iEOy9jXAs8jVkiM5+XYDipSaDQMFE4heXXtE81IhvLwVMZg9ZEHpOGZ5ctxyqsK+3k5FQSD5VewbPQo5oy484vbLtggbGGooxE3QFaLWdx2zLq4WPrlV3hANh8e5mrwbOZHDyCFcXVs7123Cff8sZNn51i23Xp8OY8i/NI4tAByuXqzp8ws3+aJT6HoRzJs8ixUjzIslsWpj/hUf9HYulbhbH4pp/B0kNW0LK8y/Vuw/lpkL11ufEQxlNFIz5fhVfkNMeRtzA9QqLjNy3F6S2teQfmEAlaBGFbhBWFgZtzWuU2Vr+gZkjApinfADy+JNG9l4VQf1UNh/uYWnnJtnuVXnUY6tOXnZeX1sboTn0LRWhlVOJtPXPyKa74qp1N+ovc5oCr1tIZzD6hClcwBLbvp3n7eBW/YquEN7DleaeZ59JBX8d9//sz0dmfOh2HXrGJClonps8+/MRkn5n3wevhhhLrxgOreKrzV8zxbL4Z7TM4CNp4QxZ/SMyjS0PUDZETjKjzL7sQJAVaZWM0TqD2c5wPIk0GHMkIqs6r+kiO+JKPwQJUnPoXgbVw8Kk/5hD31gMaOiXuAJqVqtPlnzKI4Wb+B3HfmBqjif3bVnAXh8TAnHUpGNg+3fcPauNircPaNm+fb/T14QnQIOiPeT9qsGD0jhmbM+eAlAXRcxZ8o5m4k13ZA25GUr/kR5YHP20XZyrfxVHjxRwaM+gLQ1QF56MDuFcKDszxqM/WhjmW9iqFSShdbGpBF/URry7U4aBheSZb4qDt5GDfhNAxTuyWT/ATuAUklIxK6AcrUOnri+ISZOmV6eTYPCB5adTq7MU7s8npIQ8cDbDcWWn7x1IVPL1lZTkqLRrdAEGKEtEfJlgut9TZIq67WI7F4Wy+8E5ahARvvYDp/JUc4eTBKE8pTIw+Do5A8VvGY9xIkgxrLZTkc2Sy5A9Ih9UOPCfCkolGjTXk94BNOXpdkwQ8f+TJ+ilse/s+UDpE2ge8D6uhhhP66AcoUy3EcIXq9j8y5LVTtA4KcN6tAnkcVDho6EsMwvY3FhwfEkRH6mlsPPuH5cfgF0Fm5beP7V92VOjI4eUDaL2PLJR/I3+bQqEMrT/VRCJ/26+Rx0gIN0ZAHqEMrX0NOGTLSK4qhKMZkdjQE4OQB4tUhg/YgU+0KhQeEXIZ0ef3zcsUPfSozhmor/MS19wcaxTU0VL0lF2OU2ugeEOoaMZBHPWIFPBMF61qe4dadh1kPdpMshloHxKV2GRc8BnkWGB+W6JWWHBk+pevCKgNVR+v4/hooh2H90ZtsihMr2P2sH3eAWRjKgWTuAVkNxjhDsLGTtgtTQ/wIsBgOQMLbm+3/DC80rBErb0qL09uafN70PMh2qCM+9vbg8TAHRJxhD0YLYyNjhIf0/cjw9tdOD5dd+0A4+sV7pBB5gMKUiH9UR6VVrzT5a+ZfwKve6U0fGeywy8Yli1CeGvHcKIKT5wO/0pIFLzzQKH+fZ20b7rovHpFuhmCqjwwAbWIox7AI/YCHX8M7yhG/5FMWXg6yiMOnEHrFCQF5QpLrQ7Ckln5/RuJ4ZDdA/VQcwuLFTw74FEMk86IbX+VR5JO5SstLEY/wyCOOcWJ4wEQznUpL7YR2pQgjdE40UKyOMUH90gOnhrs/3jk1UnVTWPc5gz5d0BBHQy+F8K/LEAz6qs8x5PHJEJGWXAxC/inGXYVRp16A6kdceqNNAoZS4NUe1UH8kk9ZkqXhlkJkKU4IaLhGXWX4UoYPwZIa8H50PLL2AXGgIGAPJCPvpJNOCh/72MfK84ISUc2fDcYA1d2KQb1x7ebEq5L56C2Hpryctpv0xInR
+5k0PZHKA+ItykNJKI/CysrxShMCrO6IX6tR4PW2Za4HI8Tb277V5QVBy8StPcqDuiG/X2eJdEy4qlz4VF+VpbzhekBV3g/lyfBQntLEweNtyENRfZIHFPPwYPB0MDaqo/RGm6QbPBnqLvmUAYifOGWRL1nW24EfEE5yMPqA0snjAuGT0GghnYKIceGjVE4WZUOiwB5IBo7d0nhL5557bjpCR3RVYc/ngLgVgwOQ+J6EGy/e/va3Ry9k7b3fTWfNNuVVNXZ94+TeD7VchlsWWB2zRsjmPVPjDD8FZacvELlxFZ3CnF54wqY8S1cVHw5vlbwNDTd32aPhN9f+Jmy77bYDfhyzUQVtH4+sMnruAelWjKuvvjqdCf3qV7863YqBG9fk2jXlqXFDCRmCrVr+ZGcf0KxJlSIYPjH3IrddKzbg5PZr+KB0EmRWdsh/ojh3Rh+WLo9vbej5zAJZ/xzzxU/6P75yTTkvdfI33hA4YREgT8AbXsMgcKqHhiySB56D8vkqX/XHcxCvjUs2oeZK5EmAEw9DSuKE8igwIoqLBxrkA/cXK1TEyUen7M2RTOHFSxqaXKZwMvrQ40nh0UBLPbQ8z7CXOR7yZGzER1of/GqFkjJ7AaPGji43ZrZZ/vZjp4VD9zg0XHrZpQPEcjdfFeh4ZB1By2mKHI981113haYDyeo+IlcZPTVAuhXj+OOPT66avRUDA9Tk2jXlaWyqRq5LyBCMSeg45mv8z5fxofMrTijjRJk2LRpbF2hzsDg6kNIalijU8a4Pxg5z7vGdM5KQlbu04k9DDvKLuacwq9Ph8/Lr0rRTZYsmyYwdXRPtdOh5GDQDtFsGBTprSAxZvyhyGFJV6UxekQwGxoIJfOqn+uhmVs7ipj76P6IeuqqIeti6yOBRR7YKbMwwetToNISaPHly180cqeORe2qAdCuGtKBbMTA+QNNZs015dVaXsWtdHuUxn7Tvqulh1eonSZbeA3E6rrwJ0kDCxQ4mIF84xcmr6kgJH+kByU4dpZABns6mMjWXow5IPsZn9zg3tD5AhsSWZTuwxdfFqXtuxOpo6/DSpcp+zqueE2ZHYuHhY1VN+aSHA9ySwgmcdS81DmrnpM6NHTh6A4PFxaEA+mjjeOSeGiD7n1Z1K0aTa9eUV2dkmDh76KGHbLH94hwLe9GZ/xXGbt/xgGymDAE4DIbeqpaGiWENcYS3hki4NkLKl+fDvWOfO7HjBaUOnhlFyqNDlgYtej/Ua/zOcXk781iq2qX6anhFWt4GobwKDYtET4g8AM8CSPRZmSkj/pEHhRxrUJRPmN/2yvXXAtqIfNWDsrUtAe+HPC3lE2dim4n+NNQir4C0KBBXHgHOouJAdrzzKuBW3k0BRup45A3CANXditF080VTXtMDwdm2dcBxAhPiv26gqoOAwzgJUmcuvBzhRiLE+Hz6P9+aPKLv/dM1A4qwdVJmFU55Ix2iFwzAULyUofDQnmR8ioZpBzqGym53yNutuSCemToDlPNsrGmuzBqJ45HzKYP1rr+mWzGazpptylvvjdgACux2OJYbHoyBvBPbDLyRbqBuOb6Kt1uZ8FIvgfgUCr8uoYwJITvPlUZGVVx061LGxkyr45HvueeetCTPBYV777132WQOJOPY5Ntvvz2d877llmv//0qiikjPPaCmWzGazpptyqtoZ9eotBM6HoEwNfT/GBUBcuftPAx4hj0WR1r7bLRfBzr71tecDniADqePLuG3b2zytUdGNHgCentAL89HR3mUw5C4Zwag87LCIw+C+mI8tJEPIwQNfAxXgDrDpJUjGYRt3/GCRM+fhfEnPGlorZFSmYT8GAKlQ+mLFUH0wCTy9T+6tWwfcqxMaEirHuSzoRCdSS446QBa7TonnB3zwIme8qUX+6GsPgBGlkNHA20fj9xTAzTYrRhNZ8025Q3nYWEZnrOA0nEcxTI8XgNzJuyEroSI11xPHib6gk+7b8GJzsrTR5MYFmgxLBrq0ZmY
XwIHaNUmJUy9OEfoA8e+IJzxvc4HrSpHnVF84FmaVxo5GA8ZUuhtXirH0FAPOq01qtDAgxwB8jByoiMEp/roY1TaCY6Qs5HUbuSIlji8oiUtAEd9ZEjA27oQZxmeEAMmmaIHD9i6J4T/GVEN9NQADXYrBi1vOmu2KW+oWuNQ+ibg4cUQAHY4IyMlnEIry3Yqi1c8GZfCmMjQKI+wSqbNJ07HwvgwMY0xeiLuHaoCK4s2AclIxJBOTlyfKZBHfcAzf8JBaoMB/HxgizEBMK7y3tQ2aAQYRLtLHO9LRoFyxTOYDiVPoQwOabweluWRIS9PdBtkuNmYfkPRtuo4OsS9Pmv3f7Yldkhy5MUPiXl9MTE5zEWFVdCUV0U/VJw6bDcdQB16qGW1wSdPqEoWK0k5qIPT2S0w9OOHsbAGhM7MD8AoAaRpuwwLR80CSqeE+SPvw6BSVMYuxw83La9nuHKcvz0N9NQDaq8ZIytJwxjCOrB5GCnSzP9Yg2VpJMfimBdS2r4ZwClPc0cJV6y4iQeZosPzOT3+uIH1jKP+MxWHcYFWy+YgSUuWHSJqODivGMolAfEPm/SQYzuzdjMzfKG9MiwskZOWLEKMC14JHg5yVKYMPOVgsHLvC/xwwRpX4jK6VXLLfP8YtUo9reHsc96a0I1VEJ3E/mw7hReOtDU+4EVDaEF40dg84fLOYmWIXzib5gZWPB55KaJRGaIlbcuwcdEONayTVYdvKsd6l/LAcvo6j8uWZ+M5P+kyfwM5O7mqjr3CrVmzJn2CkZfv5wHlGhlCeuz224QJ0w8MU296KGwWhx5NoAddb3zRgre4PA0dngoPuZ33oEPJs4CHFR2lU17kU6cDX1W+lUE51OPVx70wcNvG2XG1R/LIk0zigE3bOHmUxdK0XRnSChb5Lzpwl8CdZnPjcMzS4BVJFiEgHHG7Mkf+PnEFjAsaL8naDi0gegwqy+lzi1U0JrNVv1Qv+Dssqe7oQfWQbovsFIhWdbR5Hu+vgX/8x38MZ555ZmALjYAPw88+++zAxkyucL788svDlCmdSzRFUxW6B5RpZc3SFeUwCDdcP0smHA+1NTTgAXCKV6UTUfwjOaSJ07ksn/DCiUZ0Kh+8fuRZAH/Fl3+ZJqRZHcMYWSC/G7DtVBnW0Fw38+EkhmXudQGMBp1e9WD5/ZL/vTsZyrxNlKt6UDafXBByWBt41UehZKo+qje0xJVWvg0Hy7e0m1KclWs+ILdgPwxn1/j++++fzgOyNHVxnwPKNMOZ0FXL8PpiHHLNueTDGc2liMbm27wB+XGeBNBcCW8F5kBYvtYwDs/FLsPbTz5sfehcWj1CpsqF//ropeAJXRFlI5e3vuQwtIFGvOQprmEPnyzIACikDAHeCDzw4mVAgxFArkJoRUNcy/DUQ9sC4IdebUcv2q+kOkEj+H6MWJnCJ37moApZCsnPv+qvkpvk+ByQ1Bk4gvUd73hHWpn+zGc+U+KH82G4G6BSjQMj1oDY3MHw6rCE6kQ5T55Gfpp3KIxROQdhCrY8xCXf4g35gCVcJoUvjwaCJXpNTOe8qjtybFz1kWHBa6nyIOCBBiCk0ysUTp0/ERV/8nrYPJVtcYojGwMHEMfoKRSNQqtf4QYNN8I5oGUrFofH5z4eLrxw7SkK0sO+++4b+FUBpxy+/vWvD4cddli/7KF8GC4BboCkiYpQngVZdBCbFs6yydvA6IhWONEJr7QNtYIFTmNj0SuPEBBecXXg5DmwalYxCZ4Y459/+PjlyQgRCqgze2NkMG080cT83HBYLwgPgl3E8INP8y3RMChNSJu0GTBfBVM9COFdUOyMtviquK3Dy+OX8fbj1Jwe3awz9NIDiucBNRnfdW5LwbD88dXhiSeeCBdffPEAEaNHj640QFdeeWW49tpr0+/mm2/uxzeUD8MlwA2QNGHCsVM6X8OrU5NFh7ETxoa8fOMqXw+6PAh4BaJZGTuYlU8+D5vF2bTieiA5TEydj6/aBWni
OsrJgU4NaOiC8eGzjevveLzstMmrKbyIZEByITEtOWQpjgeiNhIKT8gQizqFonwmiGcbXgyNeKFX/dhzpPZJHmVqyGZxksk8FJPTzAFRJrQYpTsfXJC+eE+4Yo7MTljroH/kD4CzBmCe8YhJ20wJ06dPDxdccEFXbVm4cGHgPCAmmn//+9+HO++8M3BMyW9/+9tw4IEHhqF+GE7hboAq/gt0LU8/L+OqtXuArJGAPT/SApx4UzgLzEAQDfKIl15OTAPyZoiXeYUHZMtUHIPHXInmM+BLcqM8OjbyNOdDHsaHOSGGZQA04rXxlFn8AZ9DzmNpKFPzN/BJrqXJ+fPDyCxt0kn0pizOypSBoiyGYjI+mkeCH+AMbgwc9PfsPqm8n408a6hIb+qAt8SK1jnnnJNUsWTJknRs8vvf//5w0UUXpbPaGYYJiHOG0sSJnRt9ha8K3QBVaEUekLJKA1EYBuGbQnjkAYnOpmUYyrxCtvjk6ZAGcg/ITopLhnhIqywZOXCSQRywc0Ic6UGHZc4GwMPAEAjgpfMmmmJDIXlpvkVEJgQPaNimtDyTkrSgY3MkZfKpRKpnJNBwULRlWdEA1YG8JvKRqdMNpRt5VqIjRA8ybNolTj0dOhrYa6+9Al+/C4i/8pWvLHHD+TB8gzJAfOrPqfv2xH0OKlu9erXank5i4/MLQdu3YkguoTp/Hrc0ebzs+BWdxHYoK1syUiep4FP+YCGehIYz0KaOnBlN6kcntLuhdZ7QlTMeCHPjsjiQ9tgce2AZn3Xdg2F8NBBMPCOXoY7OTMZwgGdYc39hpGCkE+N5vOajL0tbAWQEktCKP5pMrshKKIyFPJgqmmSgIo1CaNAJbUb36IZ2k87rkuao8CAjv4xTVRmOG6iB4XwYvsEYIA47etnLXhbuu+++MHXq1LKVI3EZWim8IsJGxLHbdY7jkDHhYeXBzx/aCvYSxSSu7QjKAAfQMXN5dGSGE9DoDayhhvIIAeFTwvwRXVlOUe+SL87X0ME0V6PyMD6vPnSPNCxD3N67bhNm3NYZmpFOnkthZBi+aJ5FmxHJB0ebiIMHlkZjx9zMnoUxS8iKP3gq7FHCG6GuGDQZAtVdbBiqAbiYSbn8AELaJjrkpbxCtugScfzDUAzAiGJ82WPkUK2Bgw46qN8mRKiG+mF4zw0QB9N/+9vfDp/85CfTmcy2ySN1GZotI4+vemJhnGCLk5bxbvhpj+3WyZZXEkO9TXM+0spTqH0nMmSJp3jQkzckuYUwOgxvbPg0b5LPj8jwCA+rlU/nxFgy9CFUOZZP9aPTqTw8H80JEd7zx4XpxlbkAzIImjuRcWBymTwBZZIWTnRK0/EVtxPB8P3iqjtTfahrWfcYV91lmKmzcCpXOGgok1B1IU0cnRImKCa5S0MdXwhAMq6mjgnpf7rSACMTOzrphqnnBuh///d/kwH66U9/Gl784hf3q/Ott94aRuIytH6FdJlQp5UrD1v5MBcyePuz1Jw6fYEjyD0dkzXkKB6MyrfyeePLCKk+FKKOpjkZ6okxWBHlkMdbf8q2E5IRwvsB+LRCoIO6MBp0UoE8HaXp5Ll3QdrSKf6cOPl7XfSaAOoK3fI4DKI+mosiT14MfAz7+L9Qe8gHoAeHDJWvupBGJ4kn0gCiUQgt+aUHlKj8z0hroOcG6CUveUm44YYb0m2LeWPtZWgzZsxIFxdy2yIu4FA2P3ErxvOe97y8mDI9f/78sPfkA8K4/XeL34Kt9SzoHHR2O78Ck+34EgJOZ83wQMsDID91gIKQTpTzJ+NR0Klj6E2vPHVGOlQVfyG+PDqDjgmd5Kk+lld5W03YLMyJIw+8H1bHmkA8dTQyMrr7HTqWuxnW6TJCVqhERz6016uuZhmePCAtl8eQ4VpevoxNIqz4g974Xo0yGSracolrCIZRxPBSF4DlZpas627F4CLNz372s4m27T+j4nlA9plpS/7YxfHMqzkbxg7LnhugJpet7cvQmNxmQ1Ud
fOtb3wq/POsXYcn/zEwnIlYNwep4LV7ekpbHlZen85UsjI2GRHQogDSgPBkk4VNm8YcVJIykZICuGoLpZgnJZLVrbpyjkXGgg9IJmRP6/lV3JekaNulzDAwAOOEhwntAlsVzVAeT3uz34X77KqOMUaTO10cZhNQLgy9PUm0+JxpdtVs4ygXER1xlgLP3gl1p+aOeBNID6StjXSxwFjLeed2h9Nts0/EWLY/Hu9dAzw1QU1VH4jI0lhTrgA1VvOnyZfg6+sHwMkSD0Y1UPgeJ5ef5UKfBQN4Bxuftr9onDcswPDI6dHDRYGzSsKy4xsbKhn65RRTx/K1OeoBxruAbDCXDMxhdXX6VbngeeGbqDFCdLMd3pwGmAjZY4DK0a665pqxfW5ehlQJrItqIWJPdiLYHtDcSrodM652oOHkVSjeFDEeYkGZOCCMjeRgW5ow0TIGuCkSf5+Hx6EeehoU53bqm25KzruU6/dA1sEEbIO4Le+973xuefjo+sHE/EDdQHnHEEWmXJZufzj///HDLLbeERYsWhS9+8Yvh2GOPHbomDGfygEx6sKh9c3b7DdNgMrvJt+Xm9HaOhzx5HVU80OLhsPRMqDirUvyeXrIyeUIqA8PCPI7mcpi8rgKMFsDZ0Baoi37gVTdLUxfP6295bbyOH3wuQ7TrYpzFs6mFixcvDo8+2lkxzNu+0R1INlKXoeWKq0rvGPofpqS5FUurSWkefN6+zDnQmbU6ZWlHIk5ZTHhrXsSWkeoQ6yVIxoAVrGIoxeqXAFptMqQdiTfO2wB4O5zPg9H56AcPD+wX0jk84r9m5iPJQ8ITeiTyyfAoX4ZKaRtqWCccOmXCuMmQi0Y8lDc7JpBF/VM6hoJkjIstD3XGB7wbIGmsOnzXu94VrrrqqnQl8y677BJ+/OMfl1edD/VAsg1mDogJYiadLegytLPOOitdepZfuTzUzU+2jG7jdPL84VXHZ6WJh5f8KjrLx7wMYOdm8oc/dZhIg2HT3IiNww8PhkLlggOg0xI2mx0FGB4AHPMy8DEZrVUyOjx1w1vRJjxwmsM59KQ/CRzvysed5ZJ2lEOnl2xC5NtletoCHtkYMegFWiGTwUhtjDuV8wlm8AK2EaBjVq0wNoknyhWONOUR0jYmwAHpJCXiH/LFr3x0Cp76qE2i39TD//7v/04fn/K1An31TW96U/j85z8fuM7cHkjGtpmTTjopHUj2ne98Z1C1bTAGqKmmbV+G1lSWLiaExhoOyyMDoeV28hRXyNgWOoXJq4g4vdlz2Xr41VHoCIClEw147edReeByUPng5WmAS0v6cUUoeQwxTd3AYyCuj3iA8sGpQ6ZPMaLxYFezvqJnpQxjhRyMUrpQMBoFa2To5MpXm2TAZsXyANLUAS8Mz0z10/yA5FE/AA8InPDg4CPN5DireAkX6w8OPrVbMsBbYzu+eDHAB7+VnYRt4n84I+iHP/xhOnIVVfC1wpw5nZeaH0jW4sMxevy4zjdgcxakh7Yb0epYdDY6Dw+5DAQPPqBQ8tTplVZo6egEWo4njjeijkFZApWvtGSoIwuf5EW+5HkIGUPodYyF5ELLjw7NhHOIXoE6tnZMcx00Boj9Nb8ojANiNTlNHIOGDLwa1R284jIIqjN5AG2SDjuYDg/1y9sr+ZTLcE9GSHSUhefGXNWceUuSOMWpO0ZVPIQbO8x74uHAHruXv/zlA5p6/PHHh+OOO24A/jnPeU7C3XHHHYG9eJdeemnAKwKGsicvMcY/zwgPSJXdUEN1WurHA6xOta71paNYWTl/ZSeNHdLyYHRsWjLUwUhjNPA6oBUw5JBREE7tYG7HzuPg+di76PNJaNHKYEleNyFGA6MgAwEPmwfZhMhk+JyYx/diDJOQb9tFucLBhx74IVPfmMn7ytsKPXk6t4h0r2F0PJCsqp7Drde2u04N06btEU4//fQBoqZNmzYAZxEs+syePTvNAz344IPh4IMPDn4gmdVQC3EdYaFhEyLz
zl9XDB2Zh14ejsIqeslHNnE6vKVXGl7FZRSq5ImuLm9d8bSDYYrO1FFnoKNvGz0JeRO3z36yn+jc8ChN3SWjH4NJYFiA8+OtrpQPMLS77NoHknFR+yUzEazjH+Tm9VjXw/TXscgNinzzLSbEiz4np4+/17Vif/EXfxH4MQGNt/Ta177WDyRbVyU20XMrRg4yEDJCmnzWKhhGQysoaR6j6DjIEY81LJKvPNHRKfRNkjqIHYIRF55jJVRT1Qc5tny8A53pYzsseIZEvPHh1ZwK/Bq2KI6xwQN66YFTA6tdQJIVcXgpyGLHtCau4QcnYLKYNCF1T3nG80qeTMRrbgxDML/w4tAZoPknjA/GI7W3kEFdkucS6cp4kSe9MK/G/492PDOXJp5UQPwj2nwCXPmbevhf//VfacVLwzZOqeCkxAceeGBYB5Jpnm9T129l+zEQMhIyMJaQDqJOIjyrW3RC+NSZebhzfskV31DCqvKtHDoz5fJjWCPAS1OHE06eBWl5HsShZS8QHomAzmtxugaaq5jlwYiW0Bo/0nnnB0cdwVsDprpTHxkf6Zu0fvCAVxsIq8qgHDupT1pQh1f+ph5yJtfJJ5+c9tzxTSV3gz3rWc9Kv+HsyfM5oOzJspPQNosdznqo5fnYORRoyQenjiB+0dNRbOdW/lBCZKp81SuXQ77e6PrAkqtzAH3drnzNqVgZuTHBE2I4xpBIgIfE5K8mpsmHDqBMfCbyteIFXoaZuMC2h0nvR9BVkal24kHR1m3jipWd6MbwXRfzwGlSnIlltU16T/qI/IBkFkUkuawo5njlb+rhW9/61nQgPXd+LV26NG0GZvWLQ+w3igPJNqT/4HwOCG/FdnK9hS2O+oO3uNzY2DS0uReUG67BdGLLqqIlX+WkTkqnjDjbIcVXNQkNrgo03FIeHg4eFpsU+XaMb8gwQqLDSFnQMNLipFNw4lM+erE8tOEuZRahxWF8qmBd9VslY1PFYWi+8Y1vhK997Wth3rx5A249HeqePPeAsieq7kAyeTGQ54ZDIoTHQ7jusz9P7j7DCMsrWvD51/C88RkaMWehuSANlXibE9dbXXKawmRoCgLbKfFsdFZyE39THt6GNSzyfOwHrGnuJxqPJsDIUR8uJQQwJLkXYo1PkyzlUW4+7CMPOfYlIHoPu9cAmxDrrlx+Rh5I1n3T1w8lR7KOm945D6jKcMh7aKoNk6bwNtFWyU5DhCgYPjoLHUmGQnnqnHTUJkBGFQgvOdAIJ4NBWvEqGU04PB87HKuiRTaAkcD4wDM7YYb3B7lVhmd4Up17JDXgHlCFdjUEq8hapzdo09tWQ6OqMoQbTmdi+ZxhF/tfLKQ64XFknkaTlyFjiByMhU4xpH4yJuQx54PxxajgETEc+7IZxok2b5f1zpAzVMjlDlXOhsI3Zszofvptq15bbbX2Uoe2ZA5VzgZlgKpuxaBhTTdfNOUNRSkMwZY9fG/nQLJZxZnQ6yhI329VsWm1pWoIpmGWhmBpKBdX1QDlaQimoVlehuiui8M1C5bv3iJPtJTHLA0HyOv7MSaPdYMEeQsKYXxsCg0nFwL6Jov4bP5E0Ldg/xBX4dhhzaTyc+JOZFbOMGZ2LkZxDS8VYqCTjqI81R3ZwlscePERVx44PE2MLnwYXcJEU3iQOghfeOqThqix7g4jr4ENxgDV3YrR9JVtU95QVccQbIvt9gpT52xXLtlqbkcy9bBW4cExhKnzfjTcoRPn/BpmQUNHfd607cL1sQMBytPQSZ1MdVIoOtLIUTmWD6PAEr2lpSMmTyQaGOqePKL4sSpAh8SIaM6HFTR5M4kg5uN9aBWqzIt4PCaOd2VYZj2pxBf/QAsvZ0GrPoQYAulQ+oAHI1K1WoU+1EboAOkIfubXkvzC8IiWNls8daQ+yk+C/M+IaaDnBqjpVoymr2yb8oajrbpJaGTKe5Hh4A1rgbctOG18g95OQifDFTsD0OQBafmZHcYqg85EXJ0KGcrL55Nk
eFQPJrvFRx3uP39mp/xiwx70V3z5l+nqHDo+aQyDNgdyrKruvdTFfpJn7wfTUru8GuqYzwml78rIKIDOTlmahFYbqac8IB0VgnGgbnhmKl9yxEc+kAxoDKkfgFeG8VI+ODsMFV4GkXyHgRpgD9CTTz4Zdtpp7XEuohrKaKTnGxHtrRhqiEL7lS0z7B/5yEfChRdemI7taMoTf9shHQLjw8Ouzm/LqMKRT2eqy7P8itMZ6ED5crTyCZMxKxDElaZTyeuRoRQfb3VwwmMoqBcejo6tEC07n6EDb3/QWsDAqLODl/cEHXg8DH5amofGLu/LWFEPOn8dILcp3/JBi1x0Qln6zAK95vVX+eiMH+2hHLy5bsuzZW+scRyFd7/73WnjIff3vfSlLw2MWgSMRnbddddw2GGHpe/D9KW88uvCnntATbdiNH1l25SXnxukxnPDweGHH67kgPDhhx8OUzbfLYx7fv9bMUSojiuPQ50ePHEbYtnpuDIGOjZDwwp5U5JNSAdJ8z+xAwF0YNEpjxDAS0KmygWnYYN90yPP5qVE/INc5HOMBZ001csYF312ofqKj6/iqYOMDpPNgNKil2eDbOUxFMMQWSOgODrFO7o/1gv5tM++HdU2ZGm4hvGQbD45sTTUSZ+uiAYc9VLatkP/t7RHXhrhqrgDmM7GPpgqePOb35xejFV5GxOOr99/97vfhdtvvz1sueWWaSc0d/n9/Oc/f2afB9R0K0bTV7ZNeXUGiAPOOECpDs4777xw/b/PCCtueqj/xYRiKPb0DPBm2NMDFCGPKt4SxodQaUhkUDS8ACeg84IfHw2XOonolKcO3q8OlBE7LkMmGUEN48SPUQLgo7ODB5fkxA4vw6a62DDPow6qx+RiiGONHrx4D3R2CxgfgNWx+YuWpw9MMVAYIepxV/TQqBeyMax53ZnwBlR34qqHxYGnzshQu2WowfP/wstBvNCTD1Af5rjkGY2JhucrX/lKeQ5OIjJ/qoYiJnujia5ZsyYde4zxAV796lcnw7ts2bJgRyPkMVLhWzGO7ai7zgg6oOceUKca1X+5pYLzoAWKcxhSU57o8xBlvOhFL8rRZfpXv/pVmLnDXZVXM5dEMSIPyOLyON4JD7secnlA6szyjCwfb/B8bkNlKU9v+ZxOcjFc6nTItvykxQdeMsHXgeTafHAykHgJGBrVS+219Hkc4zN5y80T2npADHuYdEcWBkCyJFtydGiZ0oS0awBd/D8QznpLoTDwakOSUxgk6kObMJUYUZ4ZPjXYmG7FWLlyRViyZEm48847U9PtH17e9K0c3vCGN/RDcdohesGBGMpoRMI2aAO0++67p8apsjR0hx12CBMnThzWF7iSN9RQb0u57ZKjtyxp4vJClE+oTmVxiuutq3RTWFeW7VQYiipDp1UwyadO0FqPhTgiQtk2AAAlBUlEQVQ4DvJiWEJacyKUgbEAWBnToV7gmIgWHSFtItRQjPj3L70t4fSFPbJpT92clzUe1riq/k2hPDPpXaHVE/zCUxd+gMKU6MGfsWNHlcPBNotftvDReJnDzSE3KpTBB6f8muC73/1u+I//+I/yxpqhjEYkf4M2QHxly9mzJ5xwQpgWD0qyN1805alxQwlHTRgXxsY3cJjVmcORDDrynvHyPjqS5lXoNDmAgw7gAabzwAvg9uvBV8cAD852MtLqxBp2pHSsF52cTs/Miy1fcejEg2yAPOTzdiePNoDTKhf1AlSm4vCwdycH8FrxQiYGCl4t0yNfno3aqzbhXZAPPat8DMf4hmxGLAS51EtGRm3SKpjqofYoTWhxMqji50WQ4rHthLw4KIv/F7VdtOA3dth12t7h0Oi9/PIXv1jnptIHOaOdxaP99tsv8Q9lNKKCN2gD1PSVbVOeGjeUcOWDc8Oyp25PrDIcPLDMMWg1RXMTdfKh04NuafSWBUe+PCTh6aSKi09p5iXomAwNgLo6YPTEY+nAIUN58DMM6zeXFBmsERItnhBA
58SwyEAkZExbT0GGh9WktK8oEpEvuRgp0aSd2tH4cJ7Q9T+6NYlL9Yr6Rj9qo8qjHsKrbokp/oEWnOoqvAyMndyX7nMPVjz8P1BmLkv5m2r40Y9+NB3D+n//939h7733LtXQNFIpiWoiG4wBqroVgzo3fWXblFfT3kHRS8OSwMWEj4c5YfdZk0r60VO2CivjJC9APAc+3xCeTq00IR5V6kyxk8h7WhUf8BxYyQG/OspnpQcQnfJ0wFjOqzReDWXpcxLViXzykGdx4NlXA/DdGZ1THVPGye7szmlkbCkTg6broWcniYXnEePa5wMaudDOjnHKw/hw0D2T1PfGutDxpSfoBbnREd6GlkZGifxUv+JFooUA8FX08tpsHrSbMjDnwyLN1VdfHU9TnBSeeOKJpI5tt902DGc0ssEYoKb/3KavbJvymmTW5W21/c5hwvQDw9S4EraZuSkB+jGh/+YrvSF5UJVnceIBlz/MGCV1dNWFCVN1VHjSmzh2GkB5mlS1b2grO9FFI6P6SDbzPngiyIcGjySlC4KyvMIwQpMP5fBc5O1oKKg03hHfn10f5VEWZzgz10M9VSdCwE4Yw0f9tU9odjRMyIkj4FJn4oNX9NpgCI46UFf4mEeSt6UPeZP+I12qRwzVVngFkquyFCp/Uw/PPPPMdPazhl3Sx0MPPeTnAUkZbYTshF7yPzM7HtBV/T2gXL71DJTHm1seiDyNKjp5KPBBR1peDmnkLI95dR4QZVTJRQZ5OewQjwjBW8H7wEuZFwnsEAxZrC7J68FIKC5Z6tCkue0idexoPADimkSmnHPiD0CGZFE3jK5w5GtIdW+kw/joyh+MUlk+hrkwjKKfDbMBaK8v6oIxsvz6P1E91FbDXpYFjcNADVStmFmqoY5GnhEekG3oSMe5F2yL5+wVwk1z+g1VdCIiHQCgI+ktqc4BHpwmd0kDXAAI0CnEj8GRgSKPODItzqYVJwRY1q8qnw9YZ3zzd4kGWgwDwHdl7LNRBxOvjAI04Gy+4uQB4umkQrn6RRqvgwlmDJOlQ4bkyvMQLnkdMV9bFvCwdJTHlFNfmm5kRfYbjnx2uN2sumHgaKcgGb5Yd7wy4vLOZhcEMpSqB2hbR9IyWsLLQyTPoTsNDGU04gYo0+2axUvjHNCCkF/NLKNCp05v5uhl0Hkt4HlYHHMN4DSZDa28E2torAzi8MnQ5HlKUweVVcqMfMynkMa7wdhpLuWSYmJVBpD2MEELrfb4YhCUb+MqUzwYUjo1h9Jr6IJReSTi4AcnUJpQk+7CIQcgTT35XgvjgvHZPdZX51hzHjXbAQT3R1qO/bCAjmcVq3laoUMuoFUwDNOMYh7P1hEahrvIEF4heQ4jpwE3QDW6ZRJ6mslTJ9eGQrKEM2T9ojbfxhNv5gH1Y4wJOs9gRmiATAxP4SFhIOwQTV6a5ZEBEE5plSu8rZtoCLmWR2nqS0eHRzjx2TRx0VBHGWfhkMNd9Hg9VcAqmmhtvsUhV+VgzJFJPqtuAlsn4Qjr8JbG4+1pwA1QhS5ZBauDcl6ihoAHPYcqnGjsUIyOAkCvjiO6hMdozekMwSzexiVDK1tVeRaXx1NdMSJ5hklThowUaHVwGT9DmtoCPrUpZlg+dXarH8UxbnhYeEI6VI0Dz7oByYU2lRuNEMC2AMlvqmsi3gD+jI2fgVij2VaVtp64eRjVlrBhynEDlCmQ84C0CoYREKjj5J1P+TleaYWiUyhDYstgSIRHQFm8xQF5CMxNMOTSvhbbySRT8xd4O5QLqN7kMayQfPLA2Xkem7ZxaAXgBWxAZDWKjYXURzyWRitpbCYEmFuZHUNLI++MeR3mqfB+7MWEWqKHH2B4afnBaV6JuICytaSuOZ29TvlTZafVM+HRDXJpD3NZ6vhfPask98gIaMANUKZUVsEqP0Y1no3enrk3BF4dP715o2xCPi7NDYbexLZ4aMTHnAjGQ3R0UuKSQwfkDjKAjgNAo44pPn0gq0nWhFdb
jDFJbYlpGT46JqtlFjCWdFTVQR+ikqbdlI8ca9Q0HJIhQJ7KIA6PaNIO7zhHc0nEW3qW6K1RuDeWofYgA1C5tJ86MqFNKAMjI8nVy+CRrzzCHPCWqvA5naeHpwE3QF3qT53cklfh5MVYOnVYi6Mzl0bCZnQZp+NWlS/2PI8Ox88aB9ESil51Zde0cJZOe23Aaa+POr3kywhCQ2e3+ezZoQxoBWWZMQ/9afJZ+Xhah07vGNl7/rgw1UvtEQ3tUrnar4RcHQ9LnHwZPPERUieMDXUlzk/4FPE//TTAgWRcVLjjjjv2ww/lQDI3QP1U2EmMnRL3/2RXYvGGldHQsAkDkse16mTF9vOKimGdNT6Sa3k0dLK4PI5c5LDMr05MBxPe0stjoB0CcNBSlupIJ2W1iw4pD0hthI/VJ5V1T7wLDDpWruDn/B15IioD78Z2+tTRi+ElHR5Q2RgeTma8M3oveDz6tgwaDM/eu26Tjne9vPCAwAPUh3JpD9BPboGjHtYYQke9wctgMTydGr/jo2y7oRFah44GFi9eHI488shw4oknhg996EOlWoZ6PLIboFKFayPLbro3JbRZUEvmMhoK5SHwEPPwCi9JSisEr7gmn1VGSscJZqW1NC5ZiddMQksOeDvhXGXMoJHRIC4Al+QUQzIMhQwUnVOgsmiv5NBmTQ6LhxtLZbTES93gI+TzEnZiQ8+mRwDjI/nII07Z9xs8/LMj7ZXxB+/pl5+Y9gsxKc22g2RckBnbwxyO6o4scDJwGFrNqWEs5ZnJEJFP/JHYNgB9OKzVwA033JAMD4eSWRjO8cgbvAFasWJFcvfUYM5nYcOTYChun3irQnsoffoqviCyXgJxgdx+zphR5ySPh148eUi+vAobaoIZejoVoA5Dui96J6KxZSXC4g908KiOqofqaYdg4OrSeR7iJYM4ngzDNEAy2Gej83xSRpEnWdTNDtOSpxJxMhKiIyRPbbTlUhbnCQnIS15YNDTE8V7mxxCAFpw8Isq28bRxMdJoOKgQXts+0g4h/OVf/mU49dRTwxVXXNFPHRvtgWS0kpPVZs2aVTb4uc99bjoWEsRQ3b5S2CARdWKR5Wl9j6R5DdERirYulGFQKF7R52k6B93OdiI6tDqp6AmtDOLQpc4Wdwm3BZonQZ7t5Osi37bF1pm6ajNhLo+2zLjtsTQnNHnLHdNQibqAx2ho6KT6afiHnihP+iKedlAXBcjboS2A+IvsjSqYO+fRcPfdd4dTTjllQLte85rXBH5VQD8cPz7eNXfllf2yN9oDyfB+brvttjB79uxywktHPA7H7eunvYpEGnLF3dCDgVz9nC43DHapOqe1HS/Psx2GPNEKz9wF921pKJTzK02ns/MpdDJ1ONEMFtKmHJKXUEzY5nlVaerdBjDsoj0YiQ8c+4JwdtwpnQxL1AeQvKB1qFcbdRoJGWPHjk57odqWvf3kuCARDcmee+45QPTkyZMH4ISApwo22gPJbr311mR49thjj8B1IBzZIRiO2ycZbYXyAPR2zeXWGaqcToYlx9elkTu7LjPD01nf/trp4fsRL+ODAWGY0g3QNk3WQm+Nj7wM7Z3pRl4TjfVMcjrqgTGUh4LxwQj9Q5yvAUe9cmNrZVhDCq2ALQXiF05lKL2xhNtut328wWK3fpPIw2nbRnsg2cyZM9NtBNxkMWPGjMDwi4OuDzrooCGdQ8utGJywWAfczDphzviwYtVD6UwgTa5Crwlny6uHWR1aeZqQZn5nUpyYtfMZokkTr8Xkr3AYA8qEj53IdDbVQXnWYFB+bvTqjBidTcdjqLx17WDspZEXY3llgHUAmeQTSkcKbR5xW3/qSPsGG4LBgzEUYIS4WBHQ/h1W1K6MRknGER7pRnWxbSj/j4ohmGSz3Mwzw4UGVXDUUUeFk046qSprk8FtFAeSVf1vcRcR1/ZwBCTwiU98IhxzzDHhrrvuSmeTbL311iWbTuufP39+aLoVg7uN6uCiiy4Kdy18
OIzbN17JfFO10bG86gT2mArymShWx1IHsHzEMTIaUikvGZQiQZwOI4NDJ2cnNCEgo5d4YucSaJJV6aoQGXRQazDUKavolSfjAw1GQsMg8YDja3gAY0IHtx3f8ovH1t8aBOV3G7JXiONdbZvqeFUnm6//L4sjPip+DvHOd76zn/dtaaqGMTZ/U4hvtAeSsdeAn+CMM85IHtAtt9wy5FsxXve610ncgJD5pnt+rq1rA7JLhDqkhlbqRApLwiJS93DndHpD53ilrcGyZak+0NXJsJ0b44V3wNyU9gepU1q5Klf1J8R4YVxkfIhLD3bopPJUN4XyciSbMC/TyrF0ilNvyQenOpwdDZ7mhK6LceRq2IheoGMntHjYSHnZtQ900lFmFYyOq65HH330RnUrRlU7h4MbzvHIG/Qy/CWXXBKYFONiOIAJaFxhXL7huH1Nyh69x+T0KQYfpGr4A73d7KcOqU4leeDB2SEYQy3LK9o2hmDp26m4siVvKNWzZqKXzqdOixHBUyKdt0VpZOXtU2eGD3mSKXka9qSOXjQ098hUhyK7LJ80fBjEpiEYdBg8rUBqwyJ1hV9zQny+gV7wTslL7YrtBqd2MSQVaAhGWxyaNfDjH/94AMFGeSDZU089FU477bQ0/8O9TF/96lfDEUccka7mGY7bN0B7BrHmgfnpZtR8CGY7psjrcHgq+l6MkI6LX2Xp2xiC2V3JqlNdaDu+DJYdElE30uqcyLH1JU1nVgeVPBkhaDX8UR48ApUlIyO8LQ8ccuwkMjiVkXiL3dMqQyF82pfEPiG8G05lVH2RA+TldbCdv+RRhnZC2zyPD66Bje5Asre97W3p/un9998/LF26NOyyyy7pbnhUMRy3r0mV9kjWabPiXFAFYDyA5MXEkDRxhSnT/Lk3TiznYHdCa6c1n3FIJvHlkUlp5oI4nlWbAzBy2gGt+lAGxsV6buAA+NlzJHng8DbodJJjaezxrNAKNCcFH50eGZafskUDD2Wy61gAPR6icOQD1AsDB//smLZ1faQoy9bPlgG/yqVe53z+56DS8a54RHg3lMlmUUINZTGK8tA0n8dEO9dPY4hSPEnyPyOlgQ16CMZw65xzzkmT0AsWLBgwuTxUt28wZY6dEm+GnJN9DGaYWNkC9DW6PB7etuByQ6QVNDqJ4muu6kwcy/ggL3WMYmVMnURfs5MPrfCprMKwqT7QAHROysrByidPlw6q4yPTDkXyzyrgoYPLm8EA0XG5yaIONCGveRs6tvWk7CmLtk1WnsqTwaBcC5aP+ki+hmO6BhpviW+9AHk59qRF8FwnJICmlzB69Kiw1YS1W0/aqsv4LWK330AOBNqgDZAUPnbs2AHGR3lDcfvEWxVyJjQfo+44Z0oyJFU0GsJYz4M3NnhwdPSqb7ksvf3MQ2XQuXUMBzilbRwcoLIUT8j4h84I2LJIi89+LMvKkd7yoredWzj4ARk/jBTGAJl0atGpviqrw7W2bNIaMilPMpVGFvxsQ6jSIXToWp+k5HzIV/nUU9dAq53yeDRcQwcOvdPAM8IArU/16ExojmTdIhoUgfVU1DE0nCFNXKG8FjpToim8miSriFcOweLwQPTw2iEZhkE3ZKhOKl/nENEp64Zg8NthDTLolGloEuPIghcagI4q+QnBn0ijkxLxHLQDW3SUQdwaMeRhZPBKAIwDOMoCiJftjMZT/OAll7pYmfDZdF4uaX7IYKIZ/tzTQYaMj4wTOAAvCkOGt+YwshpwA5TpVx7Q1DC9c0Vzls9wR50Hg6M3uCadhePhJ0/pTEx5tKq8B/IxIJqj0FtcBiJ13NhB9eang6nMRFt4RsQxEnhC1qCQpiNKPvXDi9FcDLLEQ12SgSmMBmmBPCyOS1VcX7Yn/kgoPDyUSTnURat2+hJd+bYtDFHhZyXMLscjI62OxeNA0KstAzkMO8FhNOTdULaFQ567Y3gw4jjulaM9+Jre7t7G6FAGk+BufKzmRi7uBijTrTygR+bc
FqY9NnASWnM8sKU3dHzjWyMCTp6QDbNiyre7xdMRxa+hmLwA5RECGBpN/obC+KT5j7jyw/xPPn8jo6k6I4MOiiHCqCVZsQOT5m57vIN8Hol2qlPTiZHJ3A5lkUcaHjtBTD3BE6pjMxGt8mVgqdc+8UjW6+IcGvzcXqG2c4wqS+9zo3HBEMGj9iAH2WW5sQ0qDzrmfKgzBgfjwxnTmlexq23ygraNGzStUUK+w1oNtH36BH3EoQUNqLMgysYlGly/XzzbJwc6P1DFn9Oq41q8OpHFdROXURPt/efPHDBXQx71gjanV574bWjriYfBT/wKLX1THN6hAgeaYTSZE3p6ycpSjDVCIDG8eEaEGqKVxJt4hNMndt1113DYYYeFgw8+OK7T1C/UdKsq94AyTXEe0Ljpu8WrmftP5GqohZEgzltXHUhxhYiUZyEaDZdUnA6lJ4080dNhJZ88TRojmzhhAlM+XgFv+TR3EePWA+kQd4Yn0GgOBzz02p+k1Tm8IerMEGRhcWiYZBBq6KMhmPbbKE9DIfFQJvUTIFceELLIB0o9FUOwVNfC2yNf5aZ6VQzBGAZqCKbdziy7s5LFkAwPSIZHHpBWvDA06EKAB4RhUr7wm3I4UqdPuAeUPVX2UHrrsUAm40PcdirSgHDQwYsxyYcxHcqONyH50Mi7IIQfXjqlaBQn5KeyJA8cwxR1aOGbQuuNiA45QJ23wRwJP7wJwO4mTojsj+RpyJSXqXbCZud8rBh42GUN0EYZI9HY+RoMogAdSSafXNw++8n06QVxPCLmhPB21FaF4DBc7gFJkyHY0ydYef7IRz6S9uTxveZwwD2gTHt4QGO3mxSYhJZXIBJ5QXghVR1dOOjk8SiUDIXMmcjzsXLloVAGHUjeDJ3OfoyqspBnvQp41OlVlsI8T3yWvvSwxJSF6tAyCMkjyWhsUvJkNFSmaOykep0s8NplLd3TlirQt13koSMm02VI8rmdK2c8EF596B7lzmvKEeRDM+HXZzg27gOavGX7e5Fm33Vb+NUvf9nvZFG161Of+lTgl8NwDh3LZdm0GyCrjSKeltwbDiSzHdayC08nUdzmV8VlfMjLDUROb2mtfLwCQV3HpHPpDS9a0lYOeKVzObQpDfGKeRh1amTIyOAZ6Wt4lYE8ZOEBYYRUppWvMvP6SUaOl0zl56HaCp0MF8YIOTLcKl8GVTLgzXHK21jC/Z7//PR9ZX6yIe1jz10VDOfQsSp5wlWXptxNMLRDsLpPMfi4FMhXodLbmcPXiyEYXg5DKEIgj2u/UMqMf/B2GI5BjydEB9IQTnnyiFQWvKoPcTq6eEgLZhcRm8chXPo0groRZ/gH0FEtLdc83x+HhXgs6rx0Via+0QN1vr6or+qIHORpVUohOBkChmAClUk9VAZ54O0cDThkCWgHdaVc4pqMZ4WOeRyMJTKoLyGyiVvgKI/r73g80eLdycBamo0lzkfdo+MxI5vH7yu7heEcOtZUhhugJu3U5OmNXZNdounUAsXLsOFueGiYnLMej+SMRJjKK4xkLt8aT+jkfeBNyKDAQ17dcDOXSTrXIfwC8jBMwjEUZiMjRhd8rpcqD0lemWQSik7GiLQMEcaHOSEMD3NADv01MFKnT7gB6q/nYFfB8jkgkerh1nyN8ITwkE8nqguhYxUs70gMUeQ9wMubWmnlaS6FTpTXLw2RDA/lCMQnecIT6rgQ+HUaUr4RUcZFclLHjfUl1C7nvI62DOg4v5oOThnyaOStoC+ViRzaJyOl78iSZxLrmE9EI5sVO9WNEByytZJFeUwss89H3g00AnD85Anl80Wi21TDkTp9wlfBhvBE0THUOSx7jlM6Dy1PW3HKsHNBMpKDyYdP9cMjUFpzJ4Pxy6uoo9NQCWOATJVBKF6Vb8vE+NIGfqIjHzndtE08GBXi8HG7qmRQ3/xjU+g4R0i7pGWo6tq2KeHt6RPPfvazAx+Hf+ELXxi2CtwANaiQuYqqnzpGzqqOQYeC
jzRhHUg2+cR561t6pW0eOH7yICSbsvAUBOrUuTzlK4RPngM40vyYUO4GrBdRRY8sAIOCTOiFy+lVJjS0UcZQK27kI6dbQEd4QMgjzgoZsnLdSR500LNEz+qYvCflb+ohp09geLiY8Gc/+1nQMcjD0YsboC61x3BJP3XuJlYNrxRW0TbliV40ecfjjW6BTpW/0ckXv6VtMz7UTkpnF+QGSd6L8m0IX67/Onp0pPkcqxvqzE9L7VVt0JyQLdvjIS3dT5q09siS4epkVNxINLydRMOtwQbEzxGwb3zjG8MeU6fFWdWols2qb0IYVeD7Vq9JtR81Zq0dFy7xx30chIuXLAljxo4JW241MaxaubrTYuTngBxkwhdXKhIUZQTlFWWNijSLn467siPdhC3XdmZ4yjqQKMqhzn3EJT/GE07yIyntgHfZ0mVhzai+MGGL8UjoB9CMoX4RVheyVZ74++mDciI9Za9YuSJdrzRx/IRUFjJSnYpH0PLneGhp65pYP+RZWL16VVj0VDywf/KkVDfVSzw84mnlJ7IVVU50wkNPmxRK9qood/Z996Y61y1Pi7bt8Mwzz0xDnN12G/g9YlVZDz/8cNhu++3DFl2sbPE8rli+PDz66NqVxCqZ6wPnBijT8h133BHWrOkYlixryMnTTz897LfffuEtb3nLkGVUMX79618PEyZMCO95z3uqsoeM++53v5tuHfnYxz42ZBlVjD/96U/Dr3/96/ClL32pKnvIOGR+73vfC9/+9reHLKOKkUsK+P7pppvidznrGdh3w714O+/c3RnVyQBtt13l5sK86pwuumzZsnTjTJ63vtO+CpZpnLvH2gYO1p86Ne6tnj69VdE77LBDmDhxYutyd9ppp/TWb7u+f/jDHwLue9tyH3rooTQf0bZcOqm9DLPV/7xBhPF/wK9baLvt3ZY7XLq1Y4fhSnJ+14BrwDWwjhpwA7SOCnNy14BroD0NuAFqT5cuyTXgGlhHDbgBWkeFOblrwDXQngbcALWnS5fkGnANrKMGfBVsHRU2FPJ99903HWU5FN4mHrbEczhU2zBt2rS0vN+2XFYCuWSybdg+7n/hiNC2Yeutt07Hj7Yt1+Wt1YDvA1qrC4+5BlwD61kDPgRbzwr34lwDroG1GnADtFYXHnMNuAbWswbcAK1nhXtxrgHXwFoNuAFaqwuPuQZcA+tZA26A1rPCvTjXgGtgrQbcAK3VRSuxFStWBL421o8PGi1wte2DDz5oUY1xvsy/8847K2kef/zxsHBh1SGrITTlSdg999yTPjpVmlD1Vrhq1SqbPajcJ598MiyJxz1UQVOdBtNLnVzVU2Fe38HkVtXTcetRA5wH5NCeBg444AAO+il/8ev6UvgZZ5zRF/es9MX9MH0HHXRQXzxyocyri5x22ml9L3nJS/plL1q0qO/II4/si9fk9o0fP77vQx/6UF80VImmKc8K+e1vf9sXb0Xoi8c4lOho6Mp6qw2f/vSnu5IbT8lLddprr7364hk2fX/1V3/VR12AwerUpJcmuU31pdwmueQ79F4DofdV2HhqEN+2ffH4hr7Zs2f3RS8g/eKbOTUwnlmTOuYDDzzQB+64445Lv7rWz5s3r++EE05I8nIDdOqpp/a97W1v64veVd99993XR6e/7LLLkqimPAgwVN/85jf74jUrydhYA3TBBRf0/emf/mlZd9qwcuXKruTGQ8v7MJbIp15HHHFE37/+678OyjuYXprkNtV3MLmpYv6n5xpwA9Tif0E876Zvl112SRLjUKyf5L/927/t+/CHP1zibr755uS9yHMpM4rI3/zN3/Qdf/zxfeecc84ADyhekdKHByP4zGc+00dHBZryyL/66quT93XttdcOMEAf//jH+0455RTI+vL6N8mlDfG84L54Lk/i5U88hK3v9a9/fUo38TbpZTC5TfVtkltW0iM914DPAbU43J05c2a68O3www9PB2TF4VjgEC7g/vvvD3ziINhjjz3SfAtz
G1Xwta99LZx77rlhm2226ZcdPZLwxz/+cYAscE15EhK9qXDDDTeEF77whUKV4Y033hhmzJgR9tlnn1T/6GWFp59+elC5HHfKdb5xSJhkMQ/2gx/8IEQvaFDeJr00yaWguvqS1ySXfIcNQwNugFr8f4ivk3TM5cUXXxw4pe+QQw4JxxxzTGAitOlq26oqxLmdKnSaBI6eQeA7JcFWW8Wra+bPb8wTbdO3Y3xTxZnY0TsL0cMKs2bNCtHL6Equ5GN8MFyc5vfBD35wUN5u9ZLLpby6+pLXrVxoHXqnATdALer+xBNPDD/84Q/DjjvumH5xEjR5K7fcckto62pb5AB4JoKnnnoqHfnalCfapvC8884Lf/d3f5eu7I2T5OG9731vuPzyy1Pd4asq08qjHq95zWtCnHQOV1xxRbpnfLA6daOXKrmUW1df8rqRC51DbzXgBqhF/XOrxjXXXFNKZAgxZsyYEOdA0o9hgYC4znQWrpsQDwa+XBbDu6a8wWQzfGPY98QTT5Sk1P9Zz3pWV3IZSsaVuXSI+k9+8pPya/rB6oRu8rZYvdTJbaovDRhMbtlIj/RWAz2fhdqIKhBvZuhj2T2+sftYEWNF6hWveEVq4XXXXZeW35l8jp5E37HHHtv3gQ98YNDWf//73x8wCc0Eaxza9cU9QH3x5oa+aHz6fvWrXyVZTXm2MCaZ45PXbxn+da97XZooZ/L3kUce6WNLQbxpoiu5f/7nf57qNGfOnL65c+emXxwWDso7mF6a5DbVdzC5Vhce750GfBWsRd3HTXB973vf+/riBHNfHIb1veAFL+i7++67yxLiRG3aexPnR/riUCUZojKzJlJlgKKXkpa54zCjb8qUKWkFSuxNeaIhrDJA8RqYvqOOOqpvzz337IvX/fS9613vSkvq0DfJjZPvyZhh0OzvsMMOg7WRl/w6vQwmt6m+TXLJc9gwNODnAY2AA8puXK6wZZI0B3ZG82vjdkmGS8ipujSvKS+vU55md3XcpFh52Nlw5DbxDkcvTfUdjtxcL55uXwNugNrXqUt0DbgGutSAT0J3qSgncw24BtrXgBug9nXqEl0DroEuNeAGqEtFOZlrwDXQvgbcALWvU5foGnANdKkBN0BdKsrJXAOugfY14AaofZ26RNeAa6BLDbgB6lJRTuYacA20rwE3QO3r1CW6BlwDXWrADVCXinIy14BroH0NuAFqX6cu0TXgGuhSA26AulSUk7kGXAPta8ANUPs6dYmuAddAlxpwA9SlopzMNeAaaF8DboDa16lLdA24BrrUgBugLhXlZK4B10D7GnAD1L5OXaJrwDXQpQbcAHWpKCdzDbgG2teAG6D2deoSXQOugS414AaoS0U5mWvANdC+BtwAta9Tl+gacA10qQE3QF0qyslcA66B9jXgBqh9nbpE14BroEsNuAHqUlFO5hpwDbSvATdA7evUJboGXANdasANUJeKcjLXgGugfQ24AWpfpy7RNeAa6FIDboC6VJSTuQZcA+1rwA1Q+zp1ia4B10CXGnAD1KWinMw14BpoXwNugNrXqUt0DbgGutSAG6AuFeVkrgHXQPsacAPUvk5domvANdClBtwAdakoJ3MNuAba14AboPZ16hJdA66BLjXgBqhLRTmZa8A10L4G3AC1r1OX6BpwDXSpATdAXSrKyVwDroH2NeAGqH2dukTXgGugSw24AepSUU7mGnANtK8BN0Dt69QlugZcA11qwA1Ql4pyMteAa6B9DbgBal+nLtE14BroUgNugLpUlJO5BlwD7WvADVD7OnWJrgHXQJcacAPUpaKczDXgGmhfA26A2tepS3QNuAa61IAboC4V5WSuAddA+xpwA9S+Tl2ia8A10KUG3AB1qSgncw24BtrXgBug9nXqEl0DroEuNeAGqEtFOZlrwDXQvgbcALWvU5foGnANdKkBN0BdKsrJXAOugfY14AaofZ26RNeAa6BLDbgB6lJRTuYacA20rwE3QO3r1CW6BlwD
XWrADVCXinIy14BroH0NuAFqX6cu0TXgGuhSA26AulSUk7kGXAPta8ANUPs6dYmuAddAlxr4//l9ebw4BTixAAAAAElFTkSuQmCC" /><!-- --></p>
-
-
-
-<!-- code folding -->
-
-
-<!-- dynamically load mathjax for compatibility with self-contained -->
-<script>
-  (function () {
-    var script = document.createElement("script");
-    script.type = "text/javascript";
-    script.src  = "https://mathjax.rstudio.com/latest/MathJax.js?config=TeX-AMS-MML_HTMLorMML";
-    document.getElementsByTagName("head")[0].appendChild(script);
-  })();
-</script>
-
-</body>
-</html>
diff --git a/vignettes/lct_example.R b/vignettes/lct_example.R
deleted file mode 100644
index 2fa5314..0000000
--- a/vignettes/lct_example.R
+++ /dev/null
@@ -1,121 +0,0 @@
-## ----setup, include=FALSE-----------------------------------------------------
-knitr::opts_chunk$set(echo = TRUE)
-
-## ----set_up, eval=FALSE-------------------------------------------------------
-#  nthreads <- as.integer(4)
-#  data_dir <- "./"
-
-## ----libraries, eval=FALSE----------------------------------------------------
-#  require("kalis")
-#  require("R.utils")
-#  require("data.table")
-#  require("fastcluster")
-#  require("Matrix")
-#  require("viridisLite")
-#  require("kgp")
-
-## ----declare_run_parameters, eval=FALSE---------------------------------------
-#  # Declare LS Model Parameters
-#  #########################################
-#  neg_log10_Ne <- 10
-#  neg_log10_mu <- 4
-#  
-#  # Declare Target Locus
-#  #########################################
-#  gene <- "lct"
-#  gene_target_pos <- 136608646 # rs4988235 in hg19 coordinates
-#  pos <- fread(paste0(data_dir, gene, ".legend.gz"))$position
-#  target_idx <- match(TRUE, pos >= gene_target_pos)
-#  
-#  # run kalis
-#  #########################################
-#  
-#  CacheHaplotypes(haps = paste0(data_dir, gene, ".hap.gz"))
-#  
-#  diff_map <- diff(fread(paste0(data_dir, gene, ".map"))[[3]])
-#  pars <- Parameters(rho = CalcRho(diff_map, s = 10^-neg_log10_Ne), mu = 10^-neg_log10_mu)
-#  fwd <- MakeForwardTable(pars)
-#  bck <- MakeBackwardTable(pars)
-#  
-#  Forward(fwd, pars, target_idx, nthreads = nthreads)
-#  Backward(bck, pars, target_idx, nthreads = nthreads)
-#  
-#  M <- DistMat(fwd, bck, type = "raw", nthreads = nthreads)
-
-## ----helper_functions, eval=FALSE---------------------------------------------
-#  plot_mat <- function(x, file, raster = TRUE, rel_scale = TRUE) {
-#  
-#    temp_col_scale <- rev(viridisLite::viridis(100))
-#  
-#    if(!rel_scale){
-#      mx <- ceiling(max(x, na.rm = TRUE))
-#      if(mx > 100) { stop("the max entry of x cannot exceed 100 for this plot's color scale") }
-#      temp_col_scale <- temp_col_scale[1:mx]
-#    }
-#  
-#    cairo_pdf(file)
-#    print(lattice::levelplot(x[, ncol(x):1],
-#                             useRaster = raster,
-#                             col.regions = grDevices::colorRampPalette(temp_col_scale)(100),
-#                             yaxt = "n", xaxt = "n", xlab = "", ylab = "", xaxt = "n"))
-#    dev.off()
-#  }
-#  
-#  interp_hapmap <- function(path,bp){
-#    d <- data.table::fread(path)
-#    approx(d$`Position(bp)`, d$`Map(cM)`, xout = bp, method = "linear", rule = 2)$y
-#  }
-#  
-#  dip2hapidx <- function(x){
-#    x <- 2*x
-#    c(rbind(x-1, x))
-#  }
-
-## ----make_plot,eval=FALSE-----------------------------------------------------
-#  # Load sample population information
-#  #########################################
-#  cluster_by <- "isAFR"
-#  id <- fread(paste0(data_dir, gene, ".sample"))$sample
-#  init_order_samples <- order(id)
-#  samples <- merge(data.table("id" = id), kgp3, by = "id")
-#  if(nrow(samples) != length(id)) { stop("some samples have been removed by merging with kgp3") }
-#  if(!all.equal(init_order_samples, order(samples$id))) { stop("some samples have been moved out of the order in lct.sample") }
-#  samples[,isAFR := ifelse(reg == "AFR", "AFR", "not_AFR")]
-#  
-#  # Symmeterize & Scale Distance Matrix at LCT
-#  ###############################################
-#  M <- (0.5/(neg_log10_mu*log(10))) * (M + t(M))
-#  
-#  # Permute & Cluster Distance Matrix
-#  ###################################################################
-#  diploid_perm <- order(samples$reg, samples$pop, samples$id)
-#  psamples <- samples[diploid_perm,]
-#  
-#  haploid_perm <- dip2hapidx(diploid_perm)
-#  
-#  pM <- M[, haploid_perm][haploid_perm,]
-#  
-#  hap_groups <- table(psamples[[cluster_by]])
-#  hap_groups <- hap_groups[unique(psamples[[cluster_by]])]
-#  
-#  baseline_idx <- c(0, cumsum(2*hap_groups)[-length(hap_groups)])
-#  names(baseline_idx) <- names(hap_groups)
-#  
-#  order_M <- as.list(hap_groups)
-#  names(order_M) <- names(hap_groups)
-#  
-#  for(i in 1:length(hap_groups)){
-#    current_pop_samples <- which(psamples[[cluster_by]] == names(hap_groups)[i])
-#    current_pop_haplotypes <- dip2hapidx(current_pop_samples)
-#    sM <- pM[current_pop_haplotypes, current_pop_haplotypes]
-#    order_M[[names(hap_groups)[i]]] <- baseline_idx[names(hap_groups)[i]] + fastcluster::hclust(as.dist(sM), method="average")$order
-#  }
-#  
-#  order_M <- unlist(order_M)
-#  cM <- pM[, order_M][order_M,]
-#  
-#  
-#  # Plot clustered Distance Matrix
-#  #########################################
-#  plot_mat(cM, paste0(data_dir, gene, "_dist_mat.pdf"))
-
diff --git a/vignettes/lct_example.html b/vignettes/lct_example.html
deleted file mode 100644
index a97c52a..0000000
--- a/vignettes/lct_example.html
+++ /dev/null
@@ -1,532 +0,0 @@
-<!DOCTYPE html>
-
-<html>
-
-<head>
-
-<meta charset="utf-8" />
-<meta name="generator" content="pandoc" />
-<meta http-equiv="X-UA-Compatible" content="IE=EDGE" />
-
-<meta name="viewport" content="width=device-width, initial-scale=1" />
-
-<meta name="author" content="Ryan R. Christ and Louis J. M. Aslett" />
-
-<meta name="date" content="2023-12-11" />
-
-<title>Reproducing kalis Paper LCT Example</title>
-
-<script>// Pandoc 2.9 adds attributes on both header and div. We remove the former (to
-// be compatible with the behavior of Pandoc < 2.8).
-document.addEventListener('DOMContentLoaded', function(e) {
-  var hs = document.querySelectorAll("div.section[class*='level'] > :first-child");
-  var i, h, a;
-  for (i = 0; i < hs.length; i++) {
-    h = hs[i];
-    if (!/^h[1-6]$/i.test(h.tagName)) continue;  // it should be a header h1-h6
-    a = h.attributes;
-    while (a.length > 0) h.removeAttribute(a[0].name);
-  }
-});
-</script>
-
-<style type="text/css">
-code{white-space: pre-wrap;}
-span.smallcaps{font-variant: small-caps;}
-span.underline{text-decoration: underline;}
-div.column{display: inline-block; vertical-align: top; width: 50%;}
-div.hanging-indent{margin-left: 1.5em; text-indent: -1.5em;}
-ul.task-list{list-style: none;}
-</style>
-
-
-
-<style type="text/css">
-code {
-white-space: pre;
-}
-.sourceCode {
-overflow: visible;
-}
-</style>
-<style type="text/css" data-origin="pandoc">
-pre > code.sourceCode { white-space: pre; position: relative; }
-pre > code.sourceCode > span { display: inline-block; line-height: 1.25; }
-pre > code.sourceCode > span:empty { height: 1.2em; }
-.sourceCode { overflow: visible; }
-code.sourceCode > span { color: inherit; text-decoration: inherit; }
-div.sourceCode { margin: 1em 0; }
-pre.sourceCode { margin: 0; }
-@media screen {
-div.sourceCode { overflow: auto; }
-}
-@media print {
-pre > code.sourceCode { white-space: pre-wrap; }
-pre > code.sourceCode > span { text-indent: -5em; padding-left: 5em; }
-}
-pre.numberSource code
-{ counter-reset: source-line 0; }
-pre.numberSource code > span
-{ position: relative; left: -4em; counter-increment: source-line; }
-pre.numberSource code > span > a:first-child::before
-{ content: counter(source-line);
-position: relative; left: -1em; text-align: right; vertical-align: baseline;
-border: none; display: inline-block;
--webkit-touch-callout: none; -webkit-user-select: none;
--khtml-user-select: none; -moz-user-select: none;
--ms-user-select: none; user-select: none;
-padding: 0 4px; width: 4em;
-color: #aaaaaa;
-}
-pre.numberSource { margin-left: 3em; border-left: 1px solid #aaaaaa; padding-left: 4px; }
-div.sourceCode
-{ }
-@media screen {
-pre > code.sourceCode > span > a:first-child::before { text-decoration: underline; }
-}
-code span.al { color: #ff0000; font-weight: bold; } 
-code span.an { color: #60a0b0; font-weight: bold; font-style: italic; } 
-code span.at { color: #7d9029; } 
-code span.bn { color: #40a070; } 
-code span.bu { color: #008000; } 
-code span.cf { color: #007020; font-weight: bold; } 
-code span.ch { color: #4070a0; } 
-code span.cn { color: #880000; } 
-code span.co { color: #60a0b0; font-style: italic; } 
-code span.cv { color: #60a0b0; font-weight: bold; font-style: italic; } 
-code span.do { color: #ba2121; font-style: italic; } 
-code span.dt { color: #902000; } 
-code span.dv { color: #40a070; } 
-code span.er { color: #ff0000; font-weight: bold; } 
-code span.ex { } 
-code span.fl { color: #40a070; } 
-code span.fu { color: #06287e; } 
-code span.im { color: #008000; font-weight: bold; } 
-code span.in { color: #60a0b0; font-weight: bold; font-style: italic; } 
-code span.kw { color: #007020; font-weight: bold; } 
-code span.op { color: #666666; } 
-code span.ot { color: #007020; } 
-code span.pp { color: #bc7a00; } 
-code span.sc { color: #4070a0; } 
-code span.ss { color: #bb6688; } 
-code span.st { color: #4070a0; } 
-code span.va { color: #19177c; } 
-code span.vs { color: #4070a0; } 
-code span.wa { color: #60a0b0; font-weight: bold; font-style: italic; } 
-</style>
-<script>
-// apply pandoc div.sourceCode style to pre.sourceCode instead
-(function() {
-  var sheets = document.styleSheets;
-  for (var i = 0; i < sheets.length; i++) {
-    if (sheets[i].ownerNode.dataset["origin"] !== "pandoc") continue;
-    try { var rules = sheets[i].cssRules; } catch (e) { continue; }
-    var j = 0;
-    while (j < rules.length) {
-      var rule = rules[j];
-      // check if there is a div.sourceCode rule
-      if (rule.type !== rule.STYLE_RULE || rule.selectorText !== "div.sourceCode") {
-        j++;
-        continue;
-      }
-      var style = rule.style.cssText;
-      // check if color or background-color is set
-      if (rule.style.color === '' && rule.style.backgroundColor === '') {
-        j++;
-        continue;
-      }
-      // replace div.sourceCode by a pre.sourceCode rule
-      sheets[i].deleteRule(j);
-      sheets[i].insertRule('pre.sourceCode{' + style + '}', j);
-    }
-  }
-})();
-</script>
-
-
-
-
-<style type="text/css">body {
-background-color: #fff;
-margin: 1em auto;
-max-width: 700px;
-overflow: visible;
-padding-left: 2em;
-padding-right: 2em;
-font-family: "Open Sans", "Helvetica Neue", Helvetica, Arial, sans-serif;
-font-size: 14px;
-line-height: 1.35;
-}
-#TOC {
-clear: both;
-margin: 0 0 10px 10px;
-padding: 4px;
-width: 400px;
-border: 1px solid #CCCCCC;
-border-radius: 5px;
-background-color: #f6f6f6;
-font-size: 13px;
-line-height: 1.3;
-}
-#TOC .toctitle {
-font-weight: bold;
-font-size: 15px;
-margin-left: 5px;
-}
-#TOC ul {
-padding-left: 40px;
-margin-left: -1.5em;
-margin-top: 5px;
-margin-bottom: 5px;
-}
-#TOC ul ul {
-margin-left: -2em;
-}
-#TOC li {
-line-height: 16px;
-}
-table {
-margin: 1em auto;
-border-width: 1px;
-border-color: #DDDDDD;
-border-style: outset;
-border-collapse: collapse;
-}
-table th {
-border-width: 2px;
-padding: 5px;
-border-style: inset;
-}
-table td {
-border-width: 1px;
-border-style: inset;
-line-height: 18px;
-padding: 5px 5px;
-}
-table, table th, table td {
-border-left-style: none;
-border-right-style: none;
-}
-table thead, table tr.even {
-background-color: #f7f7f7;
-}
-p {
-margin: 0.5em 0;
-}
-blockquote {
-background-color: #f6f6f6;
-padding: 0.25em 0.75em;
-}
-hr {
-border-style: solid;
-border: none;
-border-top: 1px solid #777;
-margin: 28px 0;
-}
-dl {
-margin-left: 0;
-}
-dl dd {
-margin-bottom: 13px;
-margin-left: 13px;
-}
-dl dt {
-font-weight: bold;
-}
-ul {
-margin-top: 0;
-}
-ul li {
-list-style: circle outside;
-}
-ul ul {
-margin-bottom: 0;
-}
-pre, code {
-background-color: #f7f7f7;
-border-radius: 3px;
-color: #333;
-white-space: pre-wrap; 
-}
-pre {
-border-radius: 3px;
-margin: 5px 0px 10px 0px;
-padding: 10px;
-}
-pre:not([class]) {
-background-color: #f7f7f7;
-}
-code {
-font-family: Consolas, Monaco, 'Courier New', monospace;
-font-size: 85%;
-}
-p > code, li > code {
-padding: 2px 0px;
-}
-div.figure {
-text-align: center;
-}
-img {
-background-color: #FFFFFF;
-padding: 2px;
-border: 1px solid #DDDDDD;
-border-radius: 3px;
-border: 1px solid #CCCCCC;
-margin: 0 5px;
-}
-h1 {
-margin-top: 0;
-font-size: 35px;
-line-height: 40px;
-}
-h2 {
-border-bottom: 4px solid #f7f7f7;
-padding-top: 10px;
-padding-bottom: 2px;
-font-size: 145%;
-}
-h3 {
-border-bottom: 2px solid #f7f7f7;
-padding-top: 10px;
-font-size: 120%;
-}
-h4 {
-border-bottom: 1px solid #f7f7f7;
-margin-left: 8px;
-font-size: 105%;
-}
-h5, h6 {
-border-bottom: 1px solid #ccc;
-font-size: 105%;
-}
-a {
-color: #0033dd;
-text-decoration: none;
-}
-a:hover {
-color: #6666ff; }
-a:visited {
-color: #800080; }
-a:visited:hover {
-color: #BB00BB; }
-a[href^="http:"] {
-text-decoration: underline; }
-a[href^="https:"] {
-text-decoration: underline; }
-
-code > span.kw { color: #555; font-weight: bold; } 
-code > span.dt { color: #902000; } 
-code > span.dv { color: #40a070; } 
-code > span.bn { color: #d14; } 
-code > span.fl { color: #d14; } 
-code > span.ch { color: #d14; } 
-code > span.st { color: #d14; } 
-code > span.co { color: #888888; font-style: italic; } 
-code > span.ot { color: #007020; } 
-code > span.al { color: #ff0000; font-weight: bold; } 
-code > span.fu { color: #900; font-weight: bold; } 
-code > span.er { color: #a61717; background-color: #e3d2d2; } 
-</style>
-
-
-
-
-</head>
-
-<body>
-
-
-
-
-<h1 class="title toc-ignore">Reproducing kalis Paper LCT Example</h1>
-<h4 class="author">Ryan R. Christ and Louis J. M. Aslett</h4>
-<h4 class="date">11 December 2023</h4>
-
-
-
-<div id="overview-accompanying-data" class="section level1">
-<h1>Overview &amp; Accompanying Data</h1>
-<p>This vignette reproduces the distance matrix included in the initial
-paper introducing our R package kalis. We infer the haplotype structure
-at the lactase gene (LCT) in 1000 Genomes Phase 3 data.</p>
-<p>Four data files are required. One is the recombination map
-<code>lct.map</code> that accompanies this vignette, although another
-recombination map of the user’s choosing may be used. Three files
-encoding the required 1000 Genomes haplotypes, <code>lct.hap.gz</code> ,
-<code>lct.legend.gz</code>, and <code>lct.sample</code>. All four files
-can be found in the <code>example</code> folder at Github repository <a href="https://github.com/louisaslett/kalis-bmc">louisaslett/kalis-bmc</a>.
-If the user would like to reconstruct these files directly from 1000
-Genomes data, we we provide instructions for doing so using
-<code>bcftools</code> at the end of this vignette.</p>
-</div>
-<div id="run-kalis-in-r" class="section level1">
-<h1>Run kalis in R</h1>
-<p>Start by declaring the number of cores available for kalis to use in
-this example (<code>nthreads</code>) and the data directory that should
-be used, <code>data_dir</code>. This data directory must contain the
-recombination map <code>lct.map</code>, <code>lct.hap.gz</code> ,
-<code>lct.legend.gz</code>, and <code>lct.sample</code>.</p>
-<div class="sourceCode" id="cb1"><pre class="sourceCode r"><code class="sourceCode r"><span id="cb1-1"><a href="#cb1-1" tabindex="-1"></a>nthreads <span class="ot">&lt;-</span> <span class="fu">as.integer</span>(<span class="dv">4</span>)</span>
-<span id="cb1-2"><a href="#cb1-2" tabindex="-1"></a>data_dir <span class="ot">&lt;-</span> <span class="st">&quot;./&quot;</span></span></code></pre></div>
-<p>No further changes should be needed to the following for
-replication.</p>
-<p>We load our required libraries for this vignette.</p>
-<div class="sourceCode" id="cb2"><pre class="sourceCode r"><code class="sourceCode r"><span id="cb2-1"><a href="#cb2-1" tabindex="-1"></a><span class="fu">require</span>(<span class="st">&quot;kalis&quot;</span>)</span>
-<span id="cb2-2"><a href="#cb2-2" tabindex="-1"></a><span class="fu">require</span>(<span class="st">&quot;R.utils&quot;</span>)</span>
-<span id="cb2-3"><a href="#cb2-3" tabindex="-1"></a><span class="fu">require</span>(<span class="st">&quot;data.table&quot;</span>)</span>
-<span id="cb2-4"><a href="#cb2-4" tabindex="-1"></a><span class="fu">require</span>(<span class="st">&quot;fastcluster&quot;</span>)</span>
-<span id="cb2-5"><a href="#cb2-5" tabindex="-1"></a><span class="fu">require</span>(<span class="st">&quot;Matrix&quot;</span>) </span>
-<span id="cb2-6"><a href="#cb2-6" tabindex="-1"></a><span class="fu">require</span>(<span class="st">&quot;viridisLite&quot;</span>)</span>
-<span id="cb2-7"><a href="#cb2-7" tabindex="-1"></a><span class="fu">require</span>(<span class="st">&quot;kgp&quot;</span>)</span></code></pre></div>
-<p>Now we’re ready to run kalis.</p>
-<div class="sourceCode" id="cb3"><pre class="sourceCode r"><code class="sourceCode r"><span id="cb3-1"><a href="#cb3-1" tabindex="-1"></a><span class="co"># Declare LS Model Parameters</span></span>
-<span id="cb3-2"><a href="#cb3-2" tabindex="-1"></a><span class="do">#########################################</span></span>
-<span id="cb3-3"><a href="#cb3-3" tabindex="-1"></a>neg_log10_Ne <span class="ot">&lt;-</span> <span class="dv">10</span></span>
-<span id="cb3-4"><a href="#cb3-4" tabindex="-1"></a>neg_log10_mu <span class="ot">&lt;-</span> <span class="dv">4</span></span>
-<span id="cb3-5"><a href="#cb3-5" tabindex="-1"></a></span>
-<span id="cb3-6"><a href="#cb3-6" tabindex="-1"></a><span class="co"># Declare Target Locus</span></span>
-<span id="cb3-7"><a href="#cb3-7" tabindex="-1"></a><span class="do">#########################################</span></span>
-<span id="cb3-8"><a href="#cb3-8" tabindex="-1"></a>gene <span class="ot">&lt;-</span> <span class="st">&quot;lct&quot;</span></span>
-<span id="cb3-9"><a href="#cb3-9" tabindex="-1"></a>gene_target_pos <span class="ot">&lt;-</span> <span class="dv">136608646</span> <span class="co"># rs4988235 in hg19 coordinates</span></span>
-<span id="cb3-10"><a href="#cb3-10" tabindex="-1"></a>pos <span class="ot">&lt;-</span> <span class="fu">fread</span>(<span class="fu">paste0</span>(data_dir, gene, <span class="st">&quot;.legend.gz&quot;</span>))<span class="sc">$</span>position</span>
-<span id="cb3-11"><a href="#cb3-11" tabindex="-1"></a>target_idx <span class="ot">&lt;-</span> <span class="fu">match</span>(<span class="cn">TRUE</span>, pos <span class="sc">&gt;=</span> gene_target_pos)</span>
-<span id="cb3-12"><a href="#cb3-12" tabindex="-1"></a></span>
-<span id="cb3-13"><a href="#cb3-13" tabindex="-1"></a><span class="co"># run kalis</span></span>
-<span id="cb3-14"><a href="#cb3-14" tabindex="-1"></a><span class="do">#########################################</span></span>
-<span id="cb3-15"><a href="#cb3-15" tabindex="-1"></a></span>
-<span id="cb3-16"><a href="#cb3-16" tabindex="-1"></a><span class="fu">CacheHaplotypes</span>(<span class="at">haps =</span> <span class="fu">paste0</span>(data_dir, gene, <span class="st">&quot;.hap.gz&quot;</span>))</span>
-<span id="cb3-17"><a href="#cb3-17" tabindex="-1"></a></span>
-<span id="cb3-18"><a href="#cb3-18" tabindex="-1"></a>diff_map <span class="ot">&lt;-</span> <span class="fu">diff</span>(<span class="fu">fread</span>(<span class="fu">paste0</span>(data_dir, gene, <span class="st">&quot;.map&quot;</span>))[[<span class="dv">3</span>]])</span>
-<span id="cb3-19"><a href="#cb3-19" tabindex="-1"></a>pars <span class="ot">&lt;-</span> <span class="fu">Parameters</span>(<span class="at">rho =</span> <span class="fu">CalcRho</span>(diff_map, <span class="at">s =</span> <span class="dv">10</span><span class="sc">^-</span>neg_log10_Ne), <span class="at">mu =</span> <span class="dv">10</span><span class="sc">^-</span>neg_log10_mu)</span>
-<span id="cb3-20"><a href="#cb3-20" tabindex="-1"></a>fwd <span class="ot">&lt;-</span> <span class="fu">MakeForwardTable</span>(pars)</span>
-<span id="cb3-21"><a href="#cb3-21" tabindex="-1"></a>bck <span class="ot">&lt;-</span> <span class="fu">MakeBackwardTable</span>(pars)</span>
-<span id="cb3-22"><a href="#cb3-22" tabindex="-1"></a></span>
-<span id="cb3-23"><a href="#cb3-23" tabindex="-1"></a><span class="fu">Forward</span>(fwd, pars, target_idx, <span class="at">nthreads =</span> nthreads)</span>
-<span id="cb3-24"><a href="#cb3-24" tabindex="-1"></a><span class="fu">Backward</span>(bck, pars, target_idx, <span class="at">nthreads =</span> nthreads)</span>
-<span id="cb3-25"><a href="#cb3-25" tabindex="-1"></a></span>
-<span id="cb3-26"><a href="#cb3-26" tabindex="-1"></a>M <span class="ot">&lt;-</span> <span class="fu">DistMat</span>(fwd, bck, <span class="at">type =</span> <span class="st">&quot;raw&quot;</span>, <span class="at">nthreads =</span> nthreads)</span></code></pre></div>
-<p>Note <code>M</code> may be plotted directly by calling
-<code>plot(M)</code>.</p>
-</div>
-<div id="post-processing-remake-paper-figure" class="section level1">
-<h1>Post-processing remake paper figure</h1>
-<p>Here we provide post-processing code to reproduce the heatmap in our
-paper from the distance matrix <code>M</code>. We start with a few
-helper functions.</p>
-<div class="sourceCode" id="cb4"><pre class="sourceCode r"><code class="sourceCode r"><span id="cb4-1"><a href="#cb4-1" tabindex="-1"></a>plot_mat <span class="ot">&lt;-</span> <span class="cf">function</span>(x, file, <span class="at">raster =</span> <span class="cn">TRUE</span>, <span class="at">rel_scale =</span> <span class="cn">TRUE</span>) {</span>
-<span id="cb4-2"><a href="#cb4-2" tabindex="-1"></a></span>
-<span id="cb4-3"><a href="#cb4-3" tabindex="-1"></a>  temp_col_scale <span class="ot">&lt;-</span> <span class="fu">rev</span>(viridisLite<span class="sc">::</span><span class="fu">viridis</span>(<span class="dv">100</span>))</span>
-<span id="cb4-4"><a href="#cb4-4" tabindex="-1"></a></span>
-<span id="cb4-5"><a href="#cb4-5" tabindex="-1"></a>  <span class="cf">if</span>(<span class="sc">!</span>rel_scale){</span>
-<span id="cb4-6"><a href="#cb4-6" tabindex="-1"></a>    mx <span class="ot">&lt;-</span> <span class="fu">ceiling</span>(<span class="fu">max</span>(x, <span class="at">na.rm =</span> <span class="cn">TRUE</span>))</span>
-<span id="cb4-7"><a href="#cb4-7" tabindex="-1"></a>    <span class="cf">if</span>(mx <span class="sc">&gt;</span> <span class="dv">100</span>) { <span class="fu">stop</span>(<span class="st">&quot;the max entry of x cannot exceed 100 for this plot&#39;s color scale&quot;</span>) }</span>
-<span id="cb4-8"><a href="#cb4-8" tabindex="-1"></a>    temp_col_scale <span class="ot">&lt;-</span> temp_col_scale[<span class="dv">1</span><span class="sc">:</span>mx]</span>
-<span id="cb4-9"><a href="#cb4-9" tabindex="-1"></a>  }</span>
-<span id="cb4-10"><a href="#cb4-10" tabindex="-1"></a></span>
-<span id="cb4-11"><a href="#cb4-11" tabindex="-1"></a>  <span class="fu">cairo_pdf</span>(file)</span>
-<span id="cb4-12"><a href="#cb4-12" tabindex="-1"></a>  <span class="fu">print</span>(lattice<span class="sc">::</span><span class="fu">levelplot</span>(x[, <span class="fu">ncol</span>(x)<span class="sc">:</span><span class="dv">1</span>],</span>
-<span id="cb4-13"><a href="#cb4-13" tabindex="-1"></a>                           <span class="at">useRaster =</span> raster,</span>
-<span id="cb4-14"><a href="#cb4-14" tabindex="-1"></a>                           <span class="at">col.regions =</span> grDevices<span class="sc">::</span><span class="fu">colorRampPalette</span>(temp_col_scale)(<span class="dv">100</span>),</span>
-<span id="cb4-15"><a href="#cb4-15" tabindex="-1"></a>                           <span class="at">yaxt =</span> <span class="st">&quot;n&quot;</span>, <span class="at">xaxt =</span> <span class="st">&quot;n&quot;</span>, <span class="at">xlab =</span> <span class="st">&quot;&quot;</span>, <span class="at">ylab =</span> <span class="st">&quot;&quot;</span>, <span class="at">xaxt =</span> <span class="st">&quot;n&quot;</span>))</span>
-<span id="cb4-16"><a href="#cb4-16" tabindex="-1"></a>  <span class="fu">dev.off</span>()</span>
-<span id="cb4-17"><a href="#cb4-17" tabindex="-1"></a>}</span>
-<span id="cb4-18"><a href="#cb4-18" tabindex="-1"></a></span>
-<span id="cb4-19"><a href="#cb4-19" tabindex="-1"></a>interp_hapmap <span class="ot">&lt;-</span> <span class="cf">function</span>(path,bp){</span>
-<span id="cb4-20"><a href="#cb4-20" tabindex="-1"></a>  d <span class="ot">&lt;-</span> data.table<span class="sc">::</span><span class="fu">fread</span>(path)</span>
-<span id="cb4-21"><a href="#cb4-21" tabindex="-1"></a>  <span class="fu">approx</span>(d<span class="sc">$</span><span class="st">`</span><span class="at">Position(bp)</span><span class="st">`</span>, d<span class="sc">$</span><span class="st">`</span><span class="at">Map(cM)</span><span class="st">`</span>, <span class="at">xout =</span> bp, <span class="at">method =</span> <span class="st">&quot;linear&quot;</span>, <span class="at">rule =</span> <span class="dv">2</span>)<span class="sc">$</span>y</span>
-<span id="cb4-22"><a href="#cb4-22" tabindex="-1"></a>}</span>
-<span id="cb4-23"><a href="#cb4-23" tabindex="-1"></a></span>
-<span id="cb4-24"><a href="#cb4-24" tabindex="-1"></a>dip2hapidx <span class="ot">&lt;-</span> <span class="cf">function</span>(x){</span>
-<span id="cb4-25"><a href="#cb4-25" tabindex="-1"></a>  x <span class="ot">&lt;-</span> <span class="dv">2</span><span class="sc">*</span>x</span>
-<span id="cb4-26"><a href="#cb4-26" tabindex="-1"></a>  <span class="fu">c</span>(<span class="fu">rbind</span>(x<span class="dv">-1</span>, x))</span>
-<span id="cb4-27"><a href="#cb4-27" tabindex="-1"></a>}</span></code></pre></div>
-<p>Now we can cluster <code>M</code> separately for African and
-non-African haplotypes.</p>
-<div class="sourceCode" id="cb5"><pre class="sourceCode r"><code class="sourceCode r"><span id="cb5-1"><a href="#cb5-1" tabindex="-1"></a><span class="co"># Load sample population information</span></span>
-<span id="cb5-2"><a href="#cb5-2" tabindex="-1"></a><span class="do">#########################################</span></span>
-<span id="cb5-3"><a href="#cb5-3" tabindex="-1"></a>cluster_by <span class="ot">&lt;-</span> <span class="st">&quot;isAFR&quot;</span></span>
-<span id="cb5-4"><a href="#cb5-4" tabindex="-1"></a>id <span class="ot">&lt;-</span> <span class="fu">fread</span>(<span class="fu">paste0</span>(data_dir, gene, <span class="st">&quot;.sample&quot;</span>))<span class="sc">$</span>sample</span>
-<span id="cb5-5"><a href="#cb5-5" tabindex="-1"></a>init_order_samples <span class="ot">&lt;-</span> <span class="fu">order</span>(id)</span>
-<span id="cb5-6"><a href="#cb5-6" tabindex="-1"></a>samples <span class="ot">&lt;-</span> <span class="fu">merge</span>(<span class="fu">data.table</span>(<span class="st">&quot;id&quot;</span> <span class="ot">=</span> id), kgp3, <span class="at">by =</span> <span class="st">&quot;id&quot;</span>)</span>
-<span id="cb5-7"><a href="#cb5-7" tabindex="-1"></a><span class="cf">if</span>(<span class="fu">nrow</span>(samples) <span class="sc">!=</span> <span class="fu">length</span>(id)) { <span class="fu">stop</span>(<span class="st">&quot;some samples have been removed by merging with kgp3&quot;</span>) }</span>
-<span id="cb5-8"><a href="#cb5-8" tabindex="-1"></a><span class="cf">if</span>(<span class="sc">!</span><span class="fu">all.equal</span>(init_order_samples, <span class="fu">order</span>(samples<span class="sc">$</span>id))) { <span class="fu">stop</span>(<span class="st">&quot;some samples have been moved out of the order in lct.sample&quot;</span>) }</span>
-<span id="cb5-9"><a href="#cb5-9" tabindex="-1"></a>samples[,isAFR <span class="sc">:=</span> <span class="fu">ifelse</span>(reg <span class="sc">==</span> <span class="st">&quot;AFR&quot;</span>, <span class="st">&quot;AFR&quot;</span>, <span class="st">&quot;not_AFR&quot;</span>)]</span>
-<span id="cb5-10"><a href="#cb5-10" tabindex="-1"></a></span>
-<span id="cb5-11"><a href="#cb5-11" tabindex="-1"></a><span class="co"># Symmeterize &amp; Scale Distance Matrix at LCT</span></span>
-<span id="cb5-12"><a href="#cb5-12" tabindex="-1"></a><span class="do">###############################################</span></span>
-<span id="cb5-13"><a href="#cb5-13" tabindex="-1"></a>M <span class="ot">&lt;-</span> (<span class="fl">0.5</span><span class="sc">/</span>(neg_log10_mu<span class="sc">*</span><span class="fu">log</span>(<span class="dv">10</span>))) <span class="sc">*</span> (M <span class="sc">+</span> <span class="fu">t</span>(M))</span>
-<span id="cb5-14"><a href="#cb5-14" tabindex="-1"></a></span>
-<span id="cb5-15"><a href="#cb5-15" tabindex="-1"></a><span class="co"># Permute &amp; Cluster Distance Matrix</span></span>
-<span id="cb5-16"><a href="#cb5-16" tabindex="-1"></a><span class="do">###################################################################</span></span>
-<span id="cb5-17"><a href="#cb5-17" tabindex="-1"></a>diploid_perm <span class="ot">&lt;-</span> <span class="fu">order</span>(samples<span class="sc">$</span>reg, samples<span class="sc">$</span>pop, samples<span class="sc">$</span>id)</span>
-<span id="cb5-18"><a href="#cb5-18" tabindex="-1"></a>psamples <span class="ot">&lt;-</span> samples[diploid_perm,]</span>
-<span id="cb5-19"><a href="#cb5-19" tabindex="-1"></a></span>
-<span id="cb5-20"><a href="#cb5-20" tabindex="-1"></a>haploid_perm <span class="ot">&lt;-</span> <span class="fu">dip2hapidx</span>(diploid_perm)</span>
-<span id="cb5-21"><a href="#cb5-21" tabindex="-1"></a></span>
-<span id="cb5-22"><a href="#cb5-22" tabindex="-1"></a>pM <span class="ot">&lt;-</span> M[, haploid_perm][haploid_perm,]</span>
-<span id="cb5-23"><a href="#cb5-23" tabindex="-1"></a></span>
-<span id="cb5-24"><a href="#cb5-24" tabindex="-1"></a>hap_groups <span class="ot">&lt;-</span> <span class="fu">table</span>(psamples[[cluster_by]])</span>
-<span id="cb5-25"><a href="#cb5-25" tabindex="-1"></a>hap_groups <span class="ot">&lt;-</span> hap_groups[<span class="fu">unique</span>(psamples[[cluster_by]])]</span>
-<span id="cb5-26"><a href="#cb5-26" tabindex="-1"></a></span>
-<span id="cb5-27"><a href="#cb5-27" tabindex="-1"></a>baseline_idx <span class="ot">&lt;-</span> <span class="fu">c</span>(<span class="dv">0</span>, <span class="fu">cumsum</span>(<span class="dv">2</span><span class="sc">*</span>hap_groups)[<span class="sc">-</span><span class="fu">length</span>(hap_groups)])</span>
-<span id="cb5-28"><a href="#cb5-28" tabindex="-1"></a><span class="fu">names</span>(baseline_idx) <span class="ot">&lt;-</span> <span class="fu">names</span>(hap_groups)</span>
-<span id="cb5-29"><a href="#cb5-29" tabindex="-1"></a></span>
-<span id="cb5-30"><a href="#cb5-30" tabindex="-1"></a>order_M <span class="ot">&lt;-</span> <span class="fu">as.list</span>(hap_groups)</span>
-<span id="cb5-31"><a href="#cb5-31" tabindex="-1"></a><span class="fu">names</span>(order_M) <span class="ot">&lt;-</span> <span class="fu">names</span>(hap_groups)</span>
-<span id="cb5-32"><a href="#cb5-32" tabindex="-1"></a></span>
-<span id="cb5-33"><a href="#cb5-33" tabindex="-1"></a><span class="cf">for</span>(i <span class="cf">in</span> <span class="dv">1</span><span class="sc">:</span><span class="fu">length</span>(hap_groups)){</span>
-<span id="cb5-34"><a href="#cb5-34" tabindex="-1"></a>  current_pop_samples <span class="ot">&lt;-</span> <span class="fu">which</span>(psamples[[cluster_by]] <span class="sc">==</span> <span class="fu">names</span>(hap_groups)[i])</span>
-<span id="cb5-35"><a href="#cb5-35" tabindex="-1"></a>  current_pop_haplotypes <span class="ot">&lt;-</span> <span class="fu">dip2hapidx</span>(current_pop_samples)</span>
-<span id="cb5-36"><a href="#cb5-36" tabindex="-1"></a>  sM <span class="ot">&lt;-</span> pM[current_pop_haplotypes, current_pop_haplotypes]</span>
-<span id="cb5-37"><a href="#cb5-37" tabindex="-1"></a>  order_M[[<span class="fu">names</span>(hap_groups)[i]]] <span class="ot">&lt;-</span> baseline_idx[<span class="fu">names</span>(hap_groups)[i]] <span class="sc">+</span> fastcluster<span class="sc">::</span><span class="fu">hclust</span>(<span class="fu">as.dist</span>(sM), <span class="at">method=</span><span class="st">&quot;average&quot;</span>)<span class="sc">$</span>order</span>
-<span id="cb5-38"><a href="#cb5-38" tabindex="-1"></a>}</span>
-<span id="cb5-39"><a href="#cb5-39" tabindex="-1"></a></span>
-<span id="cb5-40"><a href="#cb5-40" tabindex="-1"></a>order_M <span class="ot">&lt;-</span> <span class="fu">unlist</span>(order_M)</span>
-<span id="cb5-41"><a href="#cb5-41" tabindex="-1"></a>cM <span class="ot">&lt;-</span> pM[, order_M][order_M,]</span>
-<span id="cb5-42"><a href="#cb5-42" tabindex="-1"></a></span>
-<span id="cb5-43"><a href="#cb5-43" tabindex="-1"></a></span>
-<span id="cb5-44"><a href="#cb5-44" tabindex="-1"></a><span class="co"># Plot clustered Distance Matrix </span></span>
-<span id="cb5-45"><a href="#cb5-45" tabindex="-1"></a><span class="do">#########################################</span></span>
-<span id="cb5-46"><a href="#cb5-46" tabindex="-1"></a><span class="fu">plot_mat</span>(cM, <span class="fu">paste0</span>(data_dir, gene, <span class="st">&quot;_dist_mat.pdf&quot;</span>))</span></code></pre></div>
-</div>
-<div id="reconstructing-lct-files-directly-from-1000-genomes-data-with-bcftools" class="section level1">
-<h1>Reconstructing LCT files directly from 1000 Genomes data with
-bcftools</h1>
-<p>Download a phased VCF of Chromosome 2 from the 1000 Genomes website,
-<code>https://www.internationalgenome.org/</code>. Below, we assume that
-VCF has name <code>chr2.vcf.gz</code>. The 1000 Genomes Project
-periodically makes updates to the VCFs available. We used
-<code>ALLchr2phase3_shapeit2_mvncall_integrated_v5a20130502genotypes.vcf.gz</code>
-in our analysis. That data was in hg19 coordinates, so throughout this
-vignette, we work entirely in hg19 coordinates.</p>
-<p>Please be mindful that some modification of the recombination map and
-target locus index will be necessary if working with data based on a
-different build.</p>
-<p>If <code>bcftools</code> is not already installed, first install
-<code>bcftools</code> from
-<code>https://samtools.github.io/bcftools/</code>. Then from a bash
-terminal, run</p>
-<div class="sourceCode" id="cb6"><pre class="sourceCode bash"><code class="sourceCode bash"><span id="cb6-1"><a href="#cb6-1" tabindex="-1"></a><span class="ex">bcftools</span> view <span class="at">--regions</span> 2:136608646-136608646 <span class="at">--types</span> snps <span class="at">--min-ac</span> 2:minor <span class="at">-Ou</span> <span class="at">--threads</span> 1 chr2.vcf.gz <span class="kw">|</span> <span class="ex">bcftools</span> convert <span class="at">-h</span> lct <span class="at">--threads</span> 1</span></code></pre></div>
-<p>Note, both of the above commands take a <code>--threads</code>
-argument. Here, we’ve set it to <code>1</code> but this can increased to
-the number of available cores to increase the execution speed. See the
-<code>bcftools</code> documentation for more details.</p>
-</div>
-
-
-
-<!-- code folding -->
-
-
-<!-- dynamically load mathjax for compatibility with self-contained -->
-<script>
-  (function () {
-    var script = document.createElement("script");
-    script.type = "text/javascript";
-    script.src  = "https://mathjax.rstudio.com/latest/MathJax.js?config=TeX-AMS-MML_HTMLorMML";
-    document.getElementsByTagName("head")[0].appendChild(script);
-  })();
-</script>
-
-</body>
-</html>

From 6faf7a765810dadece8c2755d8033b13e318a946 Mon Sep 17 00:00:00 2001
From: Louis Aslett <louis.aslett@durham.ac.uk>
Date: Tue, 1 Oct 2024 17:56:41 +0100
Subject: [PATCH 31/43] Eliminate some dev testing code from MakeUpdateCache
 (still tracked in general_checkpoint_solver branch)

---
 R/Iterator.R | 42 +-----------------------------------------
 1 file changed, 1 insertion(+), 41 deletions(-)

diff --git a/R/Iterator.R b/R/Iterator.R
index 60e4046..538ca48 100644
--- a/R/Iterator.R
+++ b/R/Iterator.R
@@ -338,47 +338,10 @@ calc_tables <- function(propagation.cost,max.num.checkpoints, use.R = FALSE){
 }
 
 
-MakeUpdateCache <- function(sch, use.pi, cost.list = NULL, targets.idx = NULL){
+MakeUpdateCache <- function(sch, use.pi, targets.idx = NULL){
 
   force(targets.idx)
 
-  track.cost <- FALSE
-
-  if(!is.null(cost.list)){
-
-    mem.copy.cost = cost.list$mem.copy.cost
-    disk.read.cost = cost.list$disk.read.cost
-    disk.write.cost = cost.list$disk.write.cost
-    num.ram.ckpts = cost.list$num.ram.ckpts
-    num.disk.ckpts = cost.list$num.disk.ckpts
-    K <- num.ram.ckpts + num.disk.ckpts
-    track.cost <- TRUE
-    cost <- 0
-
-    transfer.cost <- function(to_k,from_k){
-      from_ram <- from_k <= num.ram.ckpts
-      to_ram <- to_k <= num.ram.ckpts
-
-      if(from_ram & to_ram){
-        return(mem.copy.cost)
-      }
-
-      if(!from_ram & to_ram){
-        return(disk.read.cost)
-      }
-    }
-
-    write.cost <- function(k){
-      if(k <= num.ram.ckpts ){
-        return(0)
-      }else{
-        return(disk.write.cost)
-      }
-    }
-
-  }
-
-
   exhausted <- FALSE
   current.ins <- leading.ins <- 1
   ancestor <- 1
@@ -415,10 +378,8 @@ MakeUpdateCache <- function(sch, use.pi, cost.list = NULL, targets.idx = NULL){
         akk <- sch$k[ancestor]
 
         if(akk != 0){
-          if(track.cost){ cost <<- cost + transfer.cost(kk,akk) }
           CopyTable(cache[[ kk ]],cache[[ akk ]])
         }else{
-          if(track.cost){ cost <<- cost + transfer.cost(kk,0) }
           if(use.pi){
             ResetTable(cache[[kk]]) # Pi could also be the baseline table here for the entire interval
           }else{
@@ -427,7 +388,6 @@ MakeUpdateCache <- function(sch, use.pi, cost.list = NULL, targets.idx = NULL){
         }
 
         # advance cache table from ancestor to current checkpoint destination
-        if(track.cost){ cost <<- cost + sum( d[ (sch$i[ancestor] + 1) : sch$i[current.ins] ])}
         if(!is.null(targets.idx)){
           Forward(cache[[kk]],pars,targets.idx[sch$i[current.ins]],nthreads)
         } else {

From 20794ef014c41eaae05e10b57c05c547c8647409 Mon Sep 17 00:00:00 2001
From: Louis Aslett <louis.aslett@durham.ac.uk>
Date: Tue, 1 Oct 2024 18:16:03 +0100
Subject: [PATCH 32/43] Include vignette building in installation instructions

---
 README.md | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/README.md b/README.md
index 5a65285..07effd4 100644
--- a/README.md
+++ b/README.md
@@ -13,7 +13,7 @@ For now, the current development version can be installed using the [remotes](ht
 
 ```
 install.packages("remotes")
-remotes::install_github("louisaslett/kalis")
+remotes::install_github("louisaslett/kalis", build_vignettes = TRUE)
 ```
 
 Note that kalis uses various low-level optimisations meaning that you should ensure the compiler is targeting your local CPU architecture.
@@ -21,7 +21,8 @@ The simplest way to do this is to pass configure variables setting the correct `
 
 ```
 remotes::install_github("louisaslett/kalis",
-  configure.vars = c(kalis = "PKG_CFLAGS='-march=native -mtune=native -O3'"))
+  configure.vars = c(kalis = "PKG_CFLAGS='-march=native -mtune=native -O3'"),
+  build_vignettes = TRUE)
 ```
 
 If you do not have the correct flags set, kalis will fall back to an implementation which does not use the special vector instruction set architecture of your CPU and will provide a warning when you load the package in your R session.

From 1c9543a10bb7c11dcb37fee50e992087e4d7b4f6 Mon Sep 17 00:00:00 2001
From: Louis Aslett <louis.aslett@durham.ac.uk>
Date: Wed, 2 Oct 2024 18:43:33 +0100
Subject: [PATCH 33/43] First batch of documentation fixes, some TODO items
 remain in these.

---
 R/CladeMat.R                   | 39 ++++++++++++++++++++++++++--
 R/Clades.R                     | 40 +++++++++++++++++++++++------
 R/TableCache.R                 | 46 +++++++++++++++++++---------------
 man/CladeMat.Rd                | 38 ++++++++++++++++++++++++++--
 man/Clades.Rd                  | 27 +++++++++++++++-----
 man/CreateForwardTableCache.Rd | 21 ++++++++++------
 man/FillTableCache.Rd          | 14 ++---------
 7 files changed, 168 insertions(+), 57 deletions(-)

diff --git a/R/CladeMat.R b/R/CladeMat.R
index 2e1a601..ad8c6a7 100644
--- a/R/CladeMat.R
+++ b/R/CladeMat.R
@@ -1,7 +1,42 @@
-#' Fast Clade Matrix Construction
+#' Fast clade matrix construction
+#'
+#' Constructs a clade matrix using forward and backward tables.
+#' The clade matrix captures genetic relatedness information in the distances from the Li & Stephens model that is not captured in the called clades.
+#'
+#' `CladeMat()` uses the forward and backward tables to construct the corresponding clade matrix which can then be tested, for example using a standard quadratic form score statistic.
+#'
+#' @references
+#' Christ, R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies." bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
+#'
+#' @param fwd
+#'        a `kalisForwardTable` object, as returned by [MakeForwardTable()] and propagated to a target variant by [Forward()].
+#'        This table must be at the same variant location as argument `bck`.
+#' @param bck
+#'        a `kalisBackwardTable` object, as returned by [MakeBackwardTable()] and propagated to a target variant by [Backward()].
+#'        This table must be at the same variant location as argument `fwd`.
+#' @param M
+#'        a matrix with half as many rows and columns as the corresponding forward/backward tables.
+#'        This matrix is overwritten in place with the clade matrix result for performance reasons.
+#' @param unit.dist
+#'        TODO
+#' @param thresh
+#'        TODO
+#' @param max1var
+#'        TODO
+#' @param nthreads
+#'        the number of CPU cores to use.
+#'        By default uses the `parallel` package to detect the number of physical cores.
+#'
+#' @return
+#' TODO: this returns from C the list containing neighbourhood, similarity and total clades info, but need full details and list structure.
+#'
+#' @examples
+#' # TODO
+#'
+#'
 #' @export CladeMat
 CladeMat <- function(fwd, bck, M, unit.dist, thresh = 0.2, max1var = FALSE,
-                    nthreads = min(parallel::detectCores(logical = FALSE), fwd$to_recipient-fwd$from_recipient+1)){
+                     nthreads = min(parallel::detectCores(logical = FALSE), fwd$to_recipient-fwd$from_recipient+1)){
 
   # input checks
   #########################
diff --git a/R/Clades.R b/R/Clades.R
index 0a29988..53c1d33 100644
--- a/R/Clades.R
+++ b/R/Clades.R
@@ -199,14 +199,38 @@ PruneCladeMat <- function(M, neigh, sprigs, prune = "singleton.info", from.recip
 #' Probabilistic Clades
 #'
 #' Utility for calling probabilistic clades at, in between, or excluding variants.
-#' @param fwd a forward table as returned by [MakeForwardTable()]
-#' @param bck a backward table as returned by [MakeBackwardTable()]
-#' @param pars a `kalisParameters` object, as returned by [Parameters()].
-#' @param beta.theta.opts a list; see Details for [DistMat()].
-#' @param safety.checks a logical, should safety checks be applied to the distances?  See [DistMat()].
-#' @param neighbors a logical, should nearest neighbors be pre-calculated?  See [Neighbors()].
-#' @param use.forking a logical, should forked processes be used?
-#' @param nthreads the number of CPU cores to use. Currently, no parallelism is used.
+#'
+#' TODO longer description
+#'
+#' @references
+#' Christ, R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies." bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
+#'
+#' @param fwd
+#'        a `kalisForwardTable` object, as returned by [MakeForwardTable()] and propagated to a target variant by [Forward()].
+#'        This table must be at the same variant location as argument `bck`.
+#' @param bck
+#'        a `kalisBackwardTable` object, as returned by [MakeBackwardTable()] and propagated to a target variant by [Backward()].
+#'        This table must be at the same variant location as argument `fwd`.
+#' @param pars
+#'        a `kalisParameters` object, as returned by [Parameters()].
+#' @param beta.theta.opts
+#'        a list; see Details in [DistMat()] documentation page.
+#' @param safety.checks
+#'        a logical, should safety checks be applied to the distances?
+#'        See [DistMat()].
+#' @param neighbors
+#'        a logical, should nearest neighbors be pre-calculated?
+#'        See [Neighbors()].
+#' @param use.forking
+#'        a logical, should forked processes be used?
+#' @param forking.chunk.size
+#'        TODO
+#' @param mc.preschedule
+#'        TODO
+#' @param nthreads
+#'        the number of CPU cores to use.
+#'        By default no parallelism is used.
+#'
 #' @return
 #'   a `kalisClades` object encoding probabilistic clade calls
 #'
diff --git a/R/TableCache.R b/R/TableCache.R
index 5de70dc..98287f1 100644
--- a/R/TableCache.R
+++ b/R/TableCache.R
@@ -16,16 +16,27 @@
 #' To use the cache, then instead of using the [Forward()] function,
 #' use [ForwardUsingTableCache()].
 #'
-#' @param pars a `kalisParameters` object, as returned by [Parameters()].
-#' @param size the maximum amount of RAM (in GB) to devote to this cache.
-#' @param from_recipient first recipient haplotype if creating a partial forward
-#'   table cache.  By default includes from the first recipient haplotype.
-#' @param to_recipient last recipient haplotype if creating a partial forward
-#'   table cache.  By default includes to the last recipient haplotype.
+#' @references
+#' Christ, R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies." bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
+#'
+#' @param pars
+#'        a `kalisParameters` object, as returned by [Parameters()].
+#' @param size
+#'        the maximum amount of RAM (in GB) to devote to this cache.
+#'        By default, 1GB.
+#' @param from_recipient
+#'        first recipient haplotype if creating a partial forward table cache.
+#'        By default includes from the first recipient haplotype.
+#' @param to_recipient
+#'        last recipient haplotype if creating a partial forward table cache.
+#'        By default includes to the last recipient haplotype.
+#' @param max.tables
+#'        positive integer indicating the maximum number of tables to use in the cache.
+#'        Both this and `size` will be honoured, so the number of tables may be smaller than this.
+#'        By default, equals \eqn{\lfloor\log_2(L)\rfloor}.
 #'
 #' @return
-#'   A list of forward tables representing a cache and ready to be filled is
-#'   returned.
+#'   A list of forward tables representing a cache and ready to be filled is returned.
 #'
 #' @seealso
 #'   [MakeForwardTable()] to make a forward table;
@@ -128,18 +139,13 @@ CreateForwardTableCache <- function(pars, size = 1, from_recipient = 1, to_recip
 #' To use the cache, then instead of using the [Forward()] function,
 #' use [ForwardUsingTableCache()].
 #'
-#' @param cache a cache of forward tables as generated by
-#'   [CreateForwardTableCache()]
-#' @param pars a `kalisParameters` object, as returned by [Parameters()].
-#' @param from the first locus which the geometrically spaced cache should be
-#'   built from.
-#'   By default the whole sequence length will be cached so this defaults to 1.
-#' @param to the last locus up to which the geometrically spaced cache should be
-#'   built.
-#'   By default the whole sequence length will be cached so this defaults to
-#'   `Inf`.
-#' @param nthreads the number of CPU cores to use.
-#'   By default no parallelism is used.
+#' @param cache
+#'        a cache of forward tables as generated by [CreateForwardTableCache()].
+#' @param pars
+#'        a `kalisParameters` object, as returned by [Parameters()].
+#' @param nthreads
+#'        the number of CPU cores to use.
+#'        By default uses the `parallel` package to detect the number of physical cores.
 #'
 #' @return
 #' There is nothing returned.
diff --git a/man/CladeMat.Rd b/man/CladeMat.Rd
index 7eed863..86af088 100644
--- a/man/CladeMat.Rd
+++ b/man/CladeMat.Rd
@@ -2,7 +2,7 @@
 % Please edit documentation in R/CladeMat.R
 \name{CladeMat}
 \alias{CladeMat}
-\title{Fast Clade Matrix Construction}
+\title{Fast clade matrix construction}
 \usage{
 CladeMat(
   fwd,
@@ -15,6 +15,40 @@ CladeMat(
     fwd$from_recipient + 1)
 )
 }
+\arguments{
+\item{fwd}{a \code{kalisForwardTable} object, as returned by \code{\link[=MakeForwardTable]{MakeForwardTable()}} and propagated to a target variant by \code{\link[=Forward]{Forward()}}.
+This table must be at the same variant location as argument \code{bck}.}
+
+\item{bck}{a \code{kalisBackwardTable} object, as returned by \code{\link[=MakeBackwardTable]{MakeBackwardTable()}} and propagated to a target variant by \code{\link[=Backward]{Backward()}}.
+This table must be at the same variant location as argument \code{fwd}.}
+
+\item{M}{a matrix with half as many rows and columns as the corresponding forward/backward tables.
+This matrix is overwritten in place with the clade matrix result for performance reasons.}
+
+\item{unit.dist}{TODO}
+
+\item{thresh}{TODO}
+
+\item{max1var}{TODO}
+
+\item{nthreads}{the number of CPU cores to use.
+By default uses the \code{parallel} package to detect the number of physical cores.}
+}
+\value{
+TODO: this returns from C the list containing neighbourhood, similarity and total clades info, but need full details and list structure.
+}
 \description{
-Fast Clade Matrix Construction
+Constructs a clade matrix using forward and backward tables.
+The clade matrix captures genetic relatedness information in the distances from the Li & Stephens model that is not captured in the called clades.
+}
+\details{
+\code{CladeMat()} uses the forward and backward tables to construct the corresponding clade matrix which can then be tested, for example using a standard quadratic form score statistic.
+}
+\examples{
+# TODO
+
+
+}
+\references{
+Christ, R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies." bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
 }
diff --git a/man/Clades.Rd b/man/Clades.Rd
index b5552c5..8e8dee7 100644
--- a/man/Clades.Rd
+++ b/man/Clades.Rd
@@ -18,21 +18,30 @@ Clades(
 )
 }
 \arguments{
-\item{fwd}{a forward table as returned by \code{\link[=MakeForwardTable]{MakeForwardTable()}}}
+\item{fwd}{a \code{kalisForwardTable} object, as returned by \code{\link[=MakeForwardTable]{MakeForwardTable()}} and propagated to a target variant by \code{\link[=Forward]{Forward()}}.
+This table must be at the same variant location as argument \code{bck}.}
 
-\item{bck}{a backward table as returned by \code{\link[=MakeBackwardTable]{MakeBackwardTable()}}}
+\item{bck}{a \code{kalisBackwardTable} object, as returned by \code{\link[=MakeBackwardTable]{MakeBackwardTable()}} and propagated to a target variant by \code{\link[=Backward]{Backward()}}.
+This table must be at the same variant location as argument \code{fwd}.}
 
 \item{pars}{a \code{kalisParameters} object, as returned by \code{\link[=Parameters]{Parameters()}}.}
 
-\item{beta.theta.opts}{a list; see Details for \code{\link[=DistMat]{DistMat()}}.}
+\item{beta.theta.opts}{a list; see Details in \code{\link[=DistMat]{DistMat()}} documentation page.}
 
-\item{safety.checks}{a logical, should safety checks be applied to the distances?  See \code{\link[=DistMat]{DistMat()}}.}
+\item{safety.checks}{a logical, should safety checks be applied to the distances?
+See \code{\link[=DistMat]{DistMat()}}.}
 
-\item{neighbors}{a logical, should nearest neighbors be pre-calculated?  See \code{\link[=Neighbors]{Neighbors()}}.}
+\item{neighbors}{a logical, should nearest neighbors be pre-calculated?
+See \code{\link[=Neighbors]{Neighbors()}}.}
 
 \item{use.forking}{a logical, should forked processes be used?}
 
-\item{nthreads}{the number of CPU cores to use. Currently, no parallelism is used.}
+\item{forking.chunk.size}{TODO}
+
+\item{mc.preschedule}{TODO}
+
+\item{nthreads}{the number of CPU cores to use.
+By default no parallelism is used.}
 }
 \value{
 a \code{kalisClades} object encoding probabilistic clade calls
@@ -40,3 +49,9 @@ a \code{kalisClades} object encoding probabilistic clade calls
 \description{
 Utility for calling probabilistic clades at, in between, or excluding variants.
 }
+\details{
+TODO longer description
+}
+\references{
+Christ, R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies." bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
+}
diff --git a/man/CreateForwardTableCache.Rd b/man/CreateForwardTableCache.Rd
index 865844d..4914e47 100644
--- a/man/CreateForwardTableCache.Rd
+++ b/man/CreateForwardTableCache.Rd
@@ -15,17 +15,21 @@ CreateForwardTableCache(
 \arguments{
 \item{pars}{a \code{kalisParameters} object, as returned by \code{\link[=Parameters]{Parameters()}}.}
 
-\item{size}{the maximum amount of RAM (in GB) to devote to this cache.}
+\item{size}{the maximum amount of RAM (in GB) to devote to this cache.
+By default, 1GB.}
 
-\item{from_recipient}{first recipient haplotype if creating a partial forward
-table cache.  By default includes from the first recipient haplotype.}
+\item{from_recipient}{first recipient haplotype if creating a partial forward table cache.
+By default includes from the first recipient haplotype.}
 
-\item{to_recipient}{last recipient haplotype if creating a partial forward
-table cache.  By default includes to the last recipient haplotype.}
+\item{to_recipient}{last recipient haplotype if creating a partial forward table cache.
+By default includes to the last recipient haplotype.}
+
+\item{max.tables}{positive integer indicating the maximum number of tables to use in the cache.
+Both this and \code{size} will be honoured, so the number of tables may be smaller than this.
+By default, equals \eqn{\lfloor\log_2(L)\rfloor}.}
 }
 \value{
-A list of forward tables representing a cache and ready to be filled is
-returned.
+A list of forward tables representing a cache and ready to be filled is returned.
 }
 \description{
 Create an in-memory cache for forward tables to improve efficiency when
@@ -71,6 +75,9 @@ for(l in L:1) {
 }
 }
 
+}
+\references{
+Christ, R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies." bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
 }
 \seealso{
 \code{\link[=MakeForwardTable]{MakeForwardTable()}} to make a forward table;
diff --git a/man/FillTableCache.Rd b/man/FillTableCache.Rd
index dc3865a..531682a 100644
--- a/man/FillTableCache.Rd
+++ b/man/FillTableCache.Rd
@@ -12,22 +12,12 @@ FillTableCache(
 )
 }
 \arguments{
-\item{cache}{a cache of forward tables as generated by
-\code{\link[=CreateForwardTableCache]{CreateForwardTableCache()}}}
+\item{cache}{a cache of forward tables as generated by \code{\link[=CreateForwardTableCache]{CreateForwardTableCache()}}.}
 
 \item{pars}{a \code{kalisParameters} object, as returned by \code{\link[=Parameters]{Parameters()}}.}
 
 \item{nthreads}{the number of CPU cores to use.
-By default no parallelism is used.}
-
-\item{from}{the first locus which the geometrically spaced cache should be
-built from.
-By default the whole sequence length will be cached so this defaults to 1.}
-
-\item{to}{the last locus up to which the geometrically spaced cache should be
-built.
-By default the whole sequence length will be cached so this defaults to
-\code{Inf}.}
+By default uses the \code{parallel} package to detect the number of physical cores.}
 }
 \value{
 There is nothing returned.

From 4d751e357f8fd3b7f332b638b5229bc80a24d107 Mon Sep 17 00:00:00 2001
From: Louis Aslett <louis.aslett@durham.ac.uk>
Date: Wed, 2 Oct 2024 18:44:10 +0100
Subject: [PATCH 34/43] Update to description file with ORCIDs, first kalis
 paper, and bug reports URL.

---
 DESCRIPTION | 28 ++++++++++++++++------------
 1 file changed, 16 insertions(+), 12 deletions(-)

diff --git a/DESCRIPTION b/DESCRIPTION
index f4c25b9..de10ad6 100644
--- a/DESCRIPTION
+++ b/DESCRIPTION
@@ -3,23 +3,27 @@ Type: Package
 Title: High Performance Li & Stephens Local Ancestry Inference
 Version: 2.0.0
 Authors@R: c(person("Louis", "Aslett", role = c("aut", "cre"),
-                    email = "louis.aslett@durham.ac.uk"),
+                    email = "louis.aslett@durham.ac.uk",
+                    comment = c(ORCID = "0000-0003-2211-233X")),
              person("Ryan", "Christ", role = "aut",
-                    email = "rchrist@wustl.edu"))
+                    email = "rchrist@wustl.edu",
+                    comment = c(ORCID = "0000-0002-2049-3389")))
 Author: Louis Aslett [aut, cre],
   Ryan Christ [aut]
 Maintainer: Louis Aslett <louis.aslett@durham.ac.uk>
-Description: kalis provides a high performance implementation of the Li &
-  Stephens model <https://www.ncbi.nlm.nih.gov/pubmed/14704198> for local
-  ancestry inference (local referring to a region of the genome). For a set of N
-  phased haplotypes, kalis computes the posterior marginal probability of each
-  haplotype copying every other haplotype by running N hidden Markov models in
-  parallel. This yields an N x N distance matrix that summarizes the recent
-  local ancestry at each variant of interest. The package provides functionality
-  for specifying a recombination map, site-specific mutation rates, and
-  differing prior copying probabilities for each recipient haplotype. Extensive
-  use is made of low level threading and CPU vector instructions.
+Description: kalis <doi:10.1186/s12859-024-05688-8> provides a high performance 
+  implementation of the Li & Stephens model <doi:10.1093/genetics/165.4.2213> 
+  for local ancestry inference (local referring to a region of the genome). For 
+  a set of N phased haplotypes, kalis computes the posterior marginal
+  probability of each haplotype copying every other haplotype by running N
+  hidden Markov models in parallel. This yields an N x N distance matrix that
+  summarizes the recent local ancestry at each variant of interest. The package
+  provides functionality for specifying a recombination map, site-specific
+  mutation rates, and differing prior copying probabilities for each recipient
+  haplotype. Extensive use is made of low level threading and CPU vector
+  instructions.
 License: GPL (>= 3)
+BugReports: https://github.com/louisaslett/kalis/issues
 URL: https://kalis.louisaslett.com/, https://github.com/louisaslett/kalis
 LazyData: TRUE
 Depends: R (>= 3.5.0)

From e4243e2bd45c3e28642b0b0d092cb4f05d00e37c Mon Sep 17 00:00:00 2001
From: Louis Aslett <louis.aslett@durham.ac.uk>
Date: Wed, 2 Oct 2024 21:29:11 +0100
Subject: [PATCH 35/43] Second batch of documentation fixes, many TODOs remain.

---
 R/CalcTraces.R                  | 26 ++++++++++++++++
 R/Clades.R                      | 42 ++++++++++++++++++++++++--
 R/Iterator.R                    | 53 +++++++++++++++++++++++++++------
 R/Probs.R                       | 16 ++++++++--
 man/CalcTraces.Rd               | 42 ++++++++++++++++++++++++++
 man/ForwardIterator.Rd          | 44 ++++++++++++++++++++++-----
 man/PruneCladeMat.Rd            | 25 ++++++++++++++--
 man/Sprigs.Rd                   | 19 ++++++++++--
 man/plot.kalisDistanceMatrix.Rd | 15 ++++++++--
 9 files changed, 253 insertions(+), 29 deletions(-)
 create mode 100644 man/CalcTraces.Rd

diff --git a/R/CalcTraces.R b/R/CalcTraces.R
index aa8b32c..e64a807 100644
--- a/R/CalcTraces.R
+++ b/R/CalcTraces.R
@@ -1,3 +1,29 @@
+#' Title TODO
+#'
+#' Short Description TODO
+#'
+#' Long Description TODO
+#'
+#' @param M
+#'        TODO
+#' @param tX
+#'        TODO
+#' @param tQ
+#'        TODO
+#' @param J
+#'        TODO
+#' @param from_recipient
+#'        TODO
+#' @param nthreads
+#'        the number of CPU cores to use.
+#'        By default uses the `parallel` package to detect the number of physical cores.
+#'
+#' @return
+#' TODO
+#'
+#' @examples
+#' # TODO
+#'
 #' @export
 CalcTraces <- function(M, tX, tQ, J,
                        from_recipient = 1L,
diff --git a/R/Clades.R b/R/Clades.R
index 53c1d33..46d3b1c 100644
--- a/R/Clades.R
+++ b/R/Clades.R
@@ -17,7 +17,23 @@ get_neigh_seq <- function(x, i, return.lengths = FALSE){
   }
 }
 
-#' Sprigs
+#' Title TODO
+#'
+#' Short Description TODO
+#'
+#' Long Description TODO
+#'
+#' @param x
+#'        TODO
+#' @param old.sprigs
+#'        TODO
+#'
+#' @return
+#' TODO
+#'
+#' @examples
+#' # TODO
+#'
 #' @export Sprigs
 Sprigs <- function(x, old.sprigs = FALSE){
 
@@ -117,7 +133,29 @@ UpdateMatrixInPlace <- function(M,row.idx,col.idx,x){
 # test <- matrix(as.double(1:144),12,12)
 # UpdateMatrixInPlace(test,c(5,12,12),c(1,3,5),as.double(c(100,200,300)))
 
-#' PruneCladeMat
+#' Title TODO
+#'
+#' Short Description TODO
+#'
+#' Long Description TODO
+#'
+#' @param M
+#'        TODO
+#' @param neigh
+#'        TODO
+#' @param sprigs
+#'        TODO
+#' @param prune
+#'        TODO
+#' @param from.recipient
+#'        TODO
+#'
+#' @return
+#' TODO
+#'
+#' @examples
+#' # TODO
+#'
 #' @export PruneCladeMat
 PruneCladeMat <- function(M, neigh, sprigs, prune = "singleton.info", from.recipient = 1L){
 
diff --git a/R/Iterator.R b/R/Iterator.R
index 538ca48..5c89738 100644
--- a/R/Iterator.R
+++ b/R/Iterator.R
@@ -1,18 +1,53 @@
 #' Build an efficient iterator over loci
 #'
-#' Create a `kalisForwardIterator` for propagating a forward table iteratively over target loci using a table cache and optimal checkpointing.
+#' Create a `kalisForwardIterator` for propagating a forward table iteratively over target variants using a table cache and optimal checkpointing.
 #'
 #' See example.
 #'
+#' @references
+#' Christ, R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies." bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
 #'
-#' @param ram.ckpts an integer specifying the number of checkpoints to store in RAM
-#' @param targets a vector of loci to iterate over (starting with the most downstream target)
-#' @param base.fwd.table a `kalisForwardTable` either at the most upstream target, or if the targets are evenly spaced, one interval upstream of the most upstream target.
-#' `NULL` (the default) is interpretted as the prior `Pi`, see [Parameters()]
-#' @param disk.ckpts an integer specifying the number of checkpoints to store on disk
-#' @param disk.dir a path to a directory where a temporary folder may be made to store checkpoints on disk
-#' @param force.unif a logical, if `TRUE` iterate over targets as if they were uniformly spaced. WARNING: DO NOT use this in conjunction with the targets method, still experimental. With `force.unif = TRUE`, the resulting iterator appear to be targeting the first length(targets) variants with all methods, but in fact will be silently iterating over the original targets.
-#' @seealso [MakeForwardTable()] to create a `kalisForwardTable`.
+#' @param pars
+#'        a `kalisParameters` object, as returned by [Parameters()].
+#' @param ram.ckpts
+#'        an integer specifying the number of checkpoints to store in RAM.
+#' @param targets
+#'        a vector of variants to iterate over (starting with the most downstream target).
+#' @param base.fwd.table
+#'        a `kalisForwardTable` either at the most upstream target, or if the targets are evenly spaced, one interval upstream of the most upstream target.
+#'        If `NULL` (the default), this is interpreted as the prior `Pi`, see [Parameters()].
+#' @param disk.ckpts
+#'        an integer specifying the number of checkpoints to store on disk.
+#' @param disk.dir
+#'        a path to a directory where a temporary folder may be made to store checkpoints on disk.
+#' @param from_recipient
+#'        first recipient haplotype included in the tables of the cache, if creating a partial forward table.
+#'        By default all are included from the first recipient haplotype.
+#'        Haplotypes are indexed from 1.
+#' @param to_recipient
+#'        last recipient haplotype included in the tables of the cache, if creating a partial forward table.
+#'        By default all are included up to the last recipient haplotype.
+#'        Haplotypes are indexed from 1.
+#' @param lookup.tables
+#'        TODO
+#' @param cache
+#'        a `kalisCheckpointTable` object, as returned by [CreateForwardTableCache()] or this function.
+#'        By default `NULL`, which causes this function to create a new cache.
+#' @param save.cache
+#'        TODO
+#' @param exact
+#'        TODO
+#' @param force.unif
+#'        a logical, if `TRUE` iterate over targets as if they were uniformly spaced.
+#'        WARNING: DO NOT use this in conjunction with the targets method, still experimental.
+#'        With `force.unif = TRUE`, the resulting iterator will appear to be targeting the first `length(targets)` variants with all methods, but in fact will be silently iterating over the original targets.
+#'
+#' @return
+#' TODO
+#'
+#' @seealso
+#' [MakeForwardTable()] to create a `kalisForwardTable`;
+#' [CreateForwardTableCache()] to create a cache which can be used with this function.
 #'
 #' @examples
 #' \dontrun{
diff --git a/R/Probs.R b/R/Probs.R
index 152a8ef..a97303e 100644
--- a/R/Probs.R
+++ b/R/Probs.R
@@ -315,13 +315,23 @@ input_checks_for_probs_and_dist_mat <-  function(fwd,bck,beta.theta.opts = NULL)
 
 
 
-#' Plotting function for a kalisDistanceMatrix object
+#' Plotting function for a distance matrix
 #'
 #' Clusters the given distance matrix and generates a heatmap to display it.
 #'
-#' @param d a kalisDistanceMatrix
+#' @param x
+#'        a distance matrix, such as returned by [DistMat()].
+#' @param cluster.method
+#'        the agglomeration method to be used, which is passed to the [fastcluster::hclust()] function.
+#'        This must be (an unambiguous abbreviation of) one of "single", "complete", "average", "mcquitty", "ward.D", "ward.D2", "centroid" or "median".
+#' @param ...
+#'        further arguments to be passed on to the underlying [lattice::levelplot()] plotting function.
 #'
-#' @return There is nothing returned.
+#' @return
+#' No return value, called for side effects.
+#'
+#' @examples
+#' # TODO
 #'
 #' @export
 plot.kalisDistanceMatrix <- function(x, cluster.method = "average", ...) {
diff --git a/man/CalcTraces.Rd b/man/CalcTraces.Rd
new file mode 100644
index 0000000..cf94dec
--- /dev/null
+++ b/man/CalcTraces.Rd
@@ -0,0 +1,42 @@
+% Generated by roxygen2: do not edit by hand
+% Please edit documentation in R/CalcTraces.R
+\name{CalcTraces}
+\alias{CalcTraces}
+\title{Title TODO}
+\usage{
+CalcTraces(
+  M,
+  tX,
+  tQ,
+  J,
+  from_recipient = 1L,
+  nthreads = min(parallel::detectCores(logical = FALSE), ncol(M))
+)
+}
+\arguments{
+\item{M}{TODO}
+
+\item{tX}{TODO}
+
+\item{tQ}{TODO}
+
+\item{J}{TODO}
+
+\item{from_recipient}{TODO}
+
+\item{nthreads}{the number of CPU cores to use.
+By default uses the \code{parallel} package to detect the number of physical cores.}
+}
+\value{
+TODO
+}
+\description{
+Short Description TODO
+}
+\details{
+Long Description TODO
+}
+\examples{
+# TODO
+
+}
diff --git a/man/ForwardIterator.Rd b/man/ForwardIterator.Rd
index 9c2cb82..e16d46f 100644
--- a/man/ForwardIterator.Rd
+++ b/man/ForwardIterator.Rd
@@ -21,21 +21,45 @@ ForwardIterator(
 )
 }
 \arguments{
-\item{ram.ckpts}{an integer specifying the number of checkpoints to store in RAM}
+\item{pars}{a \code{kalisParameters} object, as returned by \code{\link[=Parameters]{Parameters()}}.}
 
-\item{targets}{a vector of loci to iterate over (starting with the most downstream target)}
+\item{ram.ckpts}{an integer specifying the number of checkpoints to store in RAM.}
+
+\item{targets}{a vector of variants to iterate over (starting with the most downstream target).}
 
 \item{base.fwd.table}{a \code{kalisForwardTable} either at the most upstream target, or if the targets are evenly spaced, one interval upstream of the most upstream target.
-\code{NULL} (the default) is interpretted as the prior \code{Pi}, see \code{\link[=Parameters]{Parameters()}}}
+If \code{NULL} (the default), this is interpreted as the prior \code{Pi}, see \code{\link[=Parameters]{Parameters()}}.}
+
+\item{disk.ckpts}{an integer specifying the number of checkpoints to store on disk.}
+
+\item{disk.dir}{a path to a directory where a temporary folder may be made to store checkpoints on disk.}
+
+\item{from_recipient}{first recipient haplotype included in the tables of the cache, if creating a partial forward table.
+By default all are included from the first recipient haplotype.
+Haplotypes are indexed from 1.}
+
+\item{to_recipient}{last recipient haplotype included in the tables of the cache, if creating a partial forward table.
+By default all are included up to the last recipient haplotype.
+Haplotypes are indexed from 1.}
 
-\item{disk.ckpts}{an integer specifying the number of checkpoints to store on disk}
+\item{lookup.tables}{TODO}
 
-\item{disk.dir}{a path to a directory where a temporary folder may be made to store checkpoints on disk}
+\item{cache}{a \code{kalisCheckpointTable} object, as returned by \code{\link[=CreateForwardTableCache]{CreateForwardTableCache()}} or this function.
+By default \code{NULL}, which causes this function to create a new cache.}
 
-\item{force.unif}{a logical, if \code{TRUE} iterate over targets as if they were uniformly spaced. WARNING: DO NOT use this in conjunction with the targets method, still experimental. With \code{force.unif = TRUE}, the resulting iterator appear to be targeting the first length(targets) variants with all methods, but in fact will be silently iterating over the original targets.}
+\item{save.cache}{TODO}
+
+\item{exact}{TODO}
+
+\item{force.unif}{a logical, if \code{TRUE} iterate over targets as if they were uniformly spaced.
+WARNING: DO NOT use this in conjunction with the targets method, still experimental.
+With \code{force.unif = TRUE}, the resulting iterator will appear to be targeting the first \code{length(targets)} variants with all methods, but in fact will be silently iterating over the original targets.}
+}
+\value{
+TODO
 }
 \description{
-Create a \code{kalisForwardIterator} for propagating a forward table iteratively over target loci using a table cache and optimal checkpointing.
+Create a \code{kalisForwardIterator} for propagating a forward table iteratively over target variants using a table cache and optimal checkpointing.
 }
 \details{
 See example.
@@ -55,7 +79,11 @@ for(t in targets(Iter)){
 }
 }
 
+}
+\references{
+Christ, R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies." bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
 }
 \seealso{
-\code{\link[=MakeForwardTable]{MakeForwardTable()}} to create a \code{kalisForwardTable}.
+\code{\link[=MakeForwardTable]{MakeForwardTable()}} to create a \code{kalisForwardTable};
+\code{\link[=CreateForwardTableCache]{CreateForwardTableCache()}} to create a cache which can be used with this function.
 }
diff --git a/man/PruneCladeMat.Rd b/man/PruneCladeMat.Rd
index 2cd1b48..e194061 100644
--- a/man/PruneCladeMat.Rd
+++ b/man/PruneCladeMat.Rd
@@ -2,10 +2,31 @@
 % Please edit documentation in R/Clades.R
 \name{PruneCladeMat}
 \alias{PruneCladeMat}
-\title{PruneCladeMat}
+\title{Title TODO}
 \usage{
 PruneCladeMat(M, neigh, sprigs, prune = "singleton.info", from.recipient = 1L)
 }
+\arguments{
+\item{M}{TODO}
+
+\item{neigh}{TODO}
+
+\item{sprigs}{TODO}
+
+\item{prune}{TODO}
+
+\item{from.recipient}{TODO}
+}
+\value{
+TODO
+}
 \description{
-PruneCladeMat
+Short Description TODO
+}
+\details{
+Long Description TODO
+}
+\examples{
+# TODO
+
 }
diff --git a/man/Sprigs.Rd b/man/Sprigs.Rd
index c7afd3b..01cec11 100644
--- a/man/Sprigs.Rd
+++ b/man/Sprigs.Rd
@@ -2,10 +2,25 @@
 % Please edit documentation in R/Clades.R
 \name{Sprigs}
 \alias{Sprigs}
-\title{Sprigs}
+\title{Title TODO}
 \usage{
 Sprigs(x, old.sprigs = FALSE)
 }
+\arguments{
+\item{x}{TODO}
+
+\item{old.sprigs}{TODO}
+}
+\value{
+TODO
+}
 \description{
-Sprigs
+Short Description TODO
+}
+\details{
+Long Description TODO
+}
+\examples{
+# TODO
+
 }
diff --git a/man/plot.kalisDistanceMatrix.Rd b/man/plot.kalisDistanceMatrix.Rd
index 4fe9413..5246eb4 100644
--- a/man/plot.kalisDistanceMatrix.Rd
+++ b/man/plot.kalisDistanceMatrix.Rd
@@ -2,16 +2,25 @@
 % Please edit documentation in R/Probs.R
 \name{plot.kalisDistanceMatrix}
 \alias{plot.kalisDistanceMatrix}
-\title{Plotting function for a kalisDistanceMatrix object}
+\title{Plotting function for a distance matrix}
 \usage{
 \method{plot}{kalisDistanceMatrix}(x, cluster.method = "average", ...)
 }
 \arguments{
-\item{d}{a kalisDistanceMatrix}
+\item{x}{a distance matrix, such as returned by \code{\link[=DistMat]{DistMat()}}.}
+
+\item{cluster.method}{the agglomeration method to be used, which is passed to the \code{\link[fastcluster:hclust]{fastcluster::hclust()}} function.
+This must be (an unambiguous abbreviation of) one of "single", "complete", "average", "mcquitty", "ward.D", "ward.D2", "centroid" or "median".}
+
+\item{...}{further arguments to be passed on to the underlying \code{\link[lattice:levelplot]{lattice::levelplot()}} plotting function.}
 }
 \value{
-There is nothing returned.
+No return value, called for side effects.
 }
 \description{
 Clusters the given distance matrix and generates a heatmap to display it.
 }
+\examples{
+# TODO
+
+}

From a6015ba6391f189f290c1f414d3e7bfa740c9075 Mon Sep 17 00:00:00 2001
From: Louis Aslett <louis.aslett@durham.ac.uk>
Date: Wed, 2 Oct 2024 21:54:09 +0100
Subject: [PATCH 36/43] Remove exit() call from CladeMat() C function.

---
 src/R_CladeMat.c | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/src/R_CladeMat.c b/src/R_CladeMat.c
index 8512caa..b89cf75 100644
--- a/src/R_CladeMat.c
+++ b/src/R_CladeMat.c
@@ -744,8 +744,9 @@ SEXP CladeMat(SEXP Rfwd,
   int** neigh;
   neigh = malloc(sizeof(int*)*p);
   if(neigh == NULL) {
-    printf("Failed allocating neigh!\n");
-    exit(1);
+    REprintf("Error: failed allocating neigh!\n");
+    UNPROTECT(4);
+    KALIS_RETURN
   }
   SEXP RES_NNEIGH = PROTECT(Rf_allocVector(INTSXP, p+1));
   int* n_neigh = INTEGER(RES_NNEIGH);

From 047287bd4afc2005c64f2faefe6dd4d109db0522 Mon Sep 17 00:00:00 2001
From: Louis Aslett <louis.aslett@durham.ac.uk>
Date: Wed, 2 Oct 2024 21:59:18 +0100
Subject: [PATCH 37/43] Allocation checks not required for R_alloc (see Writing
 R Extensions)

---
 src/R_MatAndMul.c       | 4 ----
 src/R_MatAndMulBtwVar.c | 4 ----
 2 files changed, 8 deletions(-)

diff --git a/src/R_MatAndMul.c b/src/R_MatAndMul.c
index 61b1521..466a967 100644
--- a/src/R_MatAndMul.c
+++ b/src/R_MatAndMul.c
@@ -308,10 +308,6 @@ void MatAndMul_A(double* restrict res,
     pthread_attr_setdetachstate(&attr, PTHREAD_CREATE_JOINABLE);
 
     double *res_perth = (double*) R_alloc(r*(nthreads+1), sizeof(double));
-    if (res_perth == NULL) {
-      printf("Failed allocating res_perth!\n");
-      exit(1);
-    }
 
     size_t num_perth = c/nthreads;
     size_t rag_end   = c%nthreads;
diff --git a/src/R_MatAndMulBtwVar.c b/src/R_MatAndMulBtwVar.c
index 44d04fa..431e246 100644
--- a/src/R_MatAndMulBtwVar.c
+++ b/src/R_MatAndMulBtwVar.c
@@ -374,10 +374,6 @@ void MatAndMulBtwVar_A(double* restrict res,
     pthread_attr_setdetachstate(&attr, PTHREAD_CREATE_JOINABLE);
 
     double *res_perth = (double*) R_alloc(r*(nthreads+1), sizeof(double));
-    if (res_perth == NULL) {
-      printf("Failed allocating res_perth!\n");
-      exit(1);
-    }
 
     size_t num_perth = c/nthreads;
     size_t rag_end   = c%nthreads;

From cc97b9498b82421852cbf27e57117a0c0644e378 Mon Sep 17 00:00:00 2001
From: ryanchrist <ryan.christ7@gmail.com>
Date: Tue, 12 Nov 2024 10:56:44 -0600
Subject: [PATCH 38/43] documenting new kalis v2 functions

---
 R/CalcTraces.R    | 18 +++++++++---------
 R/CladeMat.R      |  8 ++++----
 R/FB.R            |  4 ++--
 man/Backward.Rd   |  2 +-
 man/CalcTraces.Rd | 18 +++++++++---------
 man/CladeMat.Rd   |  8 ++++----
 man/Forward.Rd    |  2 +-
 7 files changed, 30 insertions(+), 30 deletions(-)

diff --git a/R/CalcTraces.R b/R/CalcTraces.R
index e64a807..2262f15 100644
--- a/R/CalcTraces.R
+++ b/R/CalcTraces.R
@@ -1,25 +1,25 @@
-#' Title TODO
+#' Fast Calculation of Matrix Trace and Hilbert Schmidt Norm
 #'
-#' Short Description TODO
+#' Provides multithreaded calculation of trace and Hilbert Schmidt Norm of a matrix PMP (where P is a projection matrix) without explicitly forming PMP.
 #'
-#' Long Description TODO
+#' P here is assumed to have the form I-QQ' for some matrix Q of orthogonal columns
 #'
 #' @param M
-#'        TODO
+#'        a real symmetric R matrix
 #' @param tX
-#'        TODO
+#'        `t((Q %*% (J%*%Q)) - (M %*% Q))`
 #' @param tQ
-#'        TODO
+#'        `t(Q)`
 #' @param J
-#'        TODO
+#'        `crossprod(Q, M)`
 #' @param from_recipient
-#'        TODO
+#'        haplotype index at which to start trace calculation -- useful for distributed computation (experimental feature, more documentation to come TODO)
 #' @param nthreads
 #'        the number of CPU cores to use.
 #'        By default uses the `parallel` package to detect the number of physical cores.
 #'
 #' @return
-#' TODO
+#' a list containing three elements, the first is the trace `tr(PMP)`, the second is the *squared* Hilbert Schmidt Norm of PMP `tr((PMP)'PMP)`, the third is the diag of `PMP`.
 #'
 #' @examples
 #' # TODO
diff --git a/R/CladeMat.R b/R/CladeMat.R
index ad8c6a7..c6982d0 100644
--- a/R/CladeMat.R
+++ b/R/CladeMat.R
@@ -18,17 +18,17 @@
 #'        a matrix with half the number of rows and columns as the corresponding forward/backward tables.
 #'        This matrix is overwritten in place with the clade matrix result for performance reasons.
 #' @param unit.dist
-#'        TODO
+#'        the change in distance that is expected to correspond to a single mutation (typically \eqn{-log(\mu)}) for the LS model)
 #' @param thresh
-#'        TODO
+#'        a regularization parameter: differences distances must exceed this threshold (in `unit.dist` units) in order to used in forming the local relatedness matrix. Defaults to `0.2`.
 #' @param max1var
-#'        TODO
+#'        a logical regularization parameter. When TRUE, differences in distances exceeding 1 `unit.dist` are set to 1 (so that any edge in the latent ancestral tree with multiple mutations on them are treated as if only one mutation was on it).
 #' @param nthreads
 #'        the number of CPU cores to use.
 #'        By default uses the `parallel` package to detect the number of physical cores.
 #'
 #' @return
-#' TODO: this returns from C the list containing neighbourhood, similarity and total clades info, but need full details and list structure.
+#' A list, the first element contains a list of tied nearest neighbors (one for each haplotype). Other elements return other information to allow for efficient removal of singletons and sprigs by [PruneCladeMat()].
 #'
 #' @examples
 #' # TODO
diff --git a/R/FB.R b/R/FB.R
index 51476d3..5d3116b 100644
--- a/R/FB.R
+++ b/R/FB.R
@@ -6,7 +6,7 @@
 #' `Forward` implements the forward algorithm to advance the Li and Stephens rescaled hidden Markov model forward probabilities to a new target variant.
 #' Naturally, this can only propagate a table to variants downstream of its current position.
 #'
-#' For mathematical details please see Section 2 of the kalis paper (TODO: ref).
+#' For mathematical details please see Section 2 of the kalis paper (https://doi.org/10.1186/s12859-024-05688-8).
 #' Note that the precise formulation of the forward equation is determined by whether the flag `use.spiedel` is set in the parameters provided in `pars`.
 #'
 #' @param fwd a `kalisForwardTable` object, as returned by
@@ -111,7 +111,7 @@ Forward <- function(fwd,
 #' variant.
 #' Naturally, this can only propagate a table to variants upstream of its current position.
 #'
-#' For mathematical details please see Section 2 of the kalis paper (TODO: ref).
+#' For mathematical details please see Section 2 of the kalis paper (https://doi.org/10.1186/s12859-024-05688-8).
 #' Note that the precise formulation of the backward equation is determined by whether the flag `use.spiedel` is set in the parameters provided in `pars`.
 #'
 #' **Beta-theta space**
diff --git a/man/Backward.Rd b/man/Backward.Rd
index 761619b..7cc3256 100644
--- a/man/Backward.Rd
+++ b/man/Backward.Rd
@@ -45,7 +45,7 @@ The table is updated in-place.
 variant.
 Naturally, this can only propagate a table to variants upstream of its current position.
 
-For mathematical details please see Section 2 of the kalis paper (TODO: ref).
+For mathematical details please see Section 2 of the kalis paper (https://doi.org/10.1186/s12859-024-05688-8).
 Note that the precise formulation of the backward equation is determined by whether the flag \code{use.spiedel} is set in the parameters provided in \code{pars}.
 
 \strong{Beta-theta space}
diff --git a/man/CalcTraces.Rd b/man/CalcTraces.Rd
index cf94dec..db508ef 100644
--- a/man/CalcTraces.Rd
+++ b/man/CalcTraces.Rd
@@ -2,7 +2,7 @@
 % Please edit documentation in R/CalcTraces.R
 \name{CalcTraces}
 \alias{CalcTraces}
-\title{Title TODO}
+\title{Fast Calculation of Matrix Trace and Hilbert Schmidt Norm}
 \usage{
 CalcTraces(
   M,
@@ -14,27 +14,27 @@ CalcTraces(
 )
 }
 \arguments{
-\item{M}{TODO}
+\item{M}{a real symmetric R matrix}
 
-\item{tX}{TODO}
+\item{tX}{\code{t((Q \%*\% (J\%*\%Q)) - (M \%*\% Q))}}
 
-\item{tQ}{TODO}
+\item{tQ}{\code{t(Q)}}
 
-\item{J}{TODO}
+\item{J}{\code{crossprod(Q, M)}}
 
-\item{from_recipient}{TODO}
+\item{from_recipient}{haplotype index at which to start trace calculation -- useful for distributed computation (experimental feature, more documentation to come TODO)}
 
 \item{nthreads}{the number of CPU cores to use.
 By default uses the \code{parallel} package to detect the number of physical cores.}
 }
 \value{
-TODO
+a list containing three elements, the first is the trace \code{tr(PMP)}, the second is the \emph{squared} Hilbert Schmidt Norm of PMP \verb{tr((PMP)'PMP)}, the third is the diag of \code{PMP}.
 }
 \description{
-Short Description TODO
+Provides multithreaded calculation of trace and Hilbert Schmidt Norm of a matrix PMP (where P is a projection matrix) without explicitly forming PMP.
 }
 \details{
-Long Description TODO
+P here is assumed to have the form I-QQ' for some matrix Q of orthogonal columns
 }
 \examples{
 # TODO
diff --git a/man/CladeMat.Rd b/man/CladeMat.Rd
index 86af088..70836af 100644
--- a/man/CladeMat.Rd
+++ b/man/CladeMat.Rd
@@ -25,17 +25,17 @@ This table must be at the same variant location as argument \code{fwd}.}
 \item{M}{a matrix with half the number of rows and columns as the corresponding forward/backward tables.
 This matrix is overwritten in place with the clade matrix result for performance reasons.}
 
-\item{unit.dist}{TODO}
+\item{unit.dist}{the change in distance that is expected to correspond to a single mutation (typically \eqn{-log(\mu)}) for the LS model)}
 
-\item{thresh}{TODO}
+\item{thresh}{a regularization parameter: differences distances must exceed this threshold (in \code{unit.dist} units) in order to used in forming the local relatedness matrix. Defaults to \code{0.2}.}
 
-\item{max1var}{TODO}
+\item{max1var}{a logical regularization parameter. When TRUE, differences in distances exceeding 1 \code{unit.dist} are set to 1 (so that any edge in the latent ancestral tree with multiple mutations on them are treated as if only one mutation was on it).}
 
 \item{nthreads}{the number of CPU cores to use.
 By default uses the \code{parallel} package to detect the number of physical cores.}
 }
 \value{
-TODO: this returns from C the list containing neighbourhood, similarity and total clades info, but need full details and list structure.
+A list, the first element contains a list of tied nearest neighbors (one for each haplotype). Other elements return other information to allow for efficient removal of singletons and sprigs by \code{\link[=PruneCladeMat]{PruneCladeMat()}}.
 }
 \description{
 Constructs a clade matrix using forward and backward tables.
diff --git a/man/Forward.Rd b/man/Forward.Rd
index dbb7ceb..aa6aad1 100644
--- a/man/Forward.Rd
+++ b/man/Forward.Rd
@@ -40,7 +40,7 @@ The table is updated in-place.
 \code{Forward} implements the forward algorithm to advance the Li and Stephens rescaled hidden Markov model forward probabilities to a new target variant.
 Naturally, this can only propagate a table to variants downstream of its current position.
 
-For mathematical details please see Section 2 of the kalis paper (TODO: ref).
+For mathematical details please see Section 2 of the kalis paper (https://doi.org/10.1186/s12859-024-05688-8).
 Note that the precise formulation of the forward equation is determined by whether the flag \code{use.spiedel} is set in the parameters provided in \code{pars}.
 }
 \examples{

From 4cde13f7fbbc0e9b8ff2b64563c5d6a2b4f38f15 Mon Sep 17 00:00:00 2001
From: Louis Aslett <louis.aslett@durham.ac.uk>
Date: Wed, 13 Nov 2024 15:22:22 +0000
Subject: [PATCH 39/43] Tweaks to added documentation

---
 R/CalcTraces.R    | 14 ++++++++++----
 R/CladeMat.R      | 11 +++++++----
 R/FB.R            |  9 +++++++--
 man/Backward.Rd   |  5 ++++-
 man/CalcTraces.Rd | 14 ++++++++++----
 man/CladeMat.Rd   | 11 +++++++----
 man/Forward.Rd    |  5 ++++-
 7 files changed, 49 insertions(+), 20 deletions(-)

diff --git a/R/CalcTraces.R b/R/CalcTraces.R
index 2262f15..6248959 100644
--- a/R/CalcTraces.R
+++ b/R/CalcTraces.R
@@ -1,8 +1,8 @@
 #' Fast Calculation of Matrix Trace and Hilbert Schmidt Norm
 #'
-#' Provides multithreaded calculation of trace and Hilbert Schmidt Norm of a matrix PMP (where P is a projection matrix) without explicitly forming PMP.
+#' Provides multithreaded calculation of trace and Hilbert Schmidt Norm of a matrix \eqn{PMP} (where \eqn{P} is a projection matrix and \eqn{M} is real symmetric) without explicitly forming \eqn{PMP}.
 #'
-#' P here is assumed to have the form I-QQ' for some matrix Q of orthogonal columns
+#' \eqn{P} here is assumed to have the form \eqn{I-QQ'} for some matrix \eqn{Q} with orthonormal columns.
 #'
 #' @param M
 #'        a real symmetric R matrix
@@ -13,13 +13,19 @@
 #' @param J
 #'        `crossprod(Q, M)`
 #' @param from_recipient
-#'        haplotype index at which to start trace calculation -- useful for distributed computation (experimental feature, more documentation to come TODO)
+#'        haplotype index at which to start trace calculation --- useful for distributed computation (experimental feature, more documentation to come<!-- TODO -->)
 #' @param nthreads
 #'        the number of CPU cores to use.
 #'        By default uses the `parallel` package to detect the number of physical cores.
 #'
 #' @return
-#' a list containing three elements, the first is the trace `tr(PMP)`, the second is the *squared* Hilbert Schmidt Norm of PMP `tr((PMP)'PMP)`, the third is the diag of `PMP`.
+#' A list containing three elements:
+#'
+#' \describe{
+#'   \item{`trace`}{the trace, \eqn{\mathrm{tr}(PMP)};}
+#'   \item{`hsnorm2`}{the *squared* Hilbert Schmidt Norm of \eqn{PMP}, \eqn{\mathrm{tr}((PMP)'PMP)};}
+#'   \item{`diag`}{the diagonal of \eqn{PMP}.}
+#' }
 #'
 #' @examples
 #' # TODO
diff --git a/R/CladeMat.R b/R/CladeMat.R
index c6982d0..d00d4b6 100644
--- a/R/CladeMat.R
+++ b/R/CladeMat.R
@@ -18,17 +18,20 @@
 #'        a matrix with half the number of rows and columns as the corresponding forward/backward tables.
 #'        This matrix is overwritten in place with the clade matrix result for performance reasons.
 #' @param unit.dist
-#'        the change in distance that is expected to correspond to a single mutation (typically \eqn{-log(\mu)}) for the LS model)
+#'        the change in distance that is expected to correspond to a single mutation (typically \eqn{-\log(\mu)} for the LS model)
 #' @param thresh
-#'        a regularization parameter: differences distances must exceed this threshold (in `unit.dist` units) in order to used in forming the local relatedness matrix. Defaults to `0.2`.
+#'        a regularization parameter: <!-- TODO: can't parse this sentence --> differences in distances must exceed this threshold (in `unit.dist` units) in order to be used in forming the local relatedness matrix.
+#'        Defaults to `0.2`.
 #' @param max1var
-#'        a logical regularization parameter. When TRUE, differences in distances exceeding 1 `unit.dist` are set to 1 (so that any edge in the latent ancestral tree with multiple mutations on them are treated as if only one mutation was on it).
+#'        a logical regularization parameter.
+#'        When `TRUE`, differences in distances exceeding 1 `unit.dist` are set to 1 (so that any edge in the latent ancestral tree with multiple mutations on it is treated as if only one mutation were on it).
 #' @param nthreads
 #'        the number of CPU cores to use.
 #'        By default uses the `parallel` package to detect the number of physical cores.
 #'
 #' @return
-#' A list, the first element contains a list of tied nearest neighbors (one for each haplotype). Other elements return other information to allow for efficient removal of singletons and sprigs by [PruneCladeMat()].
+#' A list whose first element contains a list of tied nearest neighbours (one for each haplotype).
+#' Other elements of the returned list are for internal use by [PruneCladeMat()] to allow for efficient removal of singletons and sprigs.
 #'
 #' @examples
 #' # TODO
diff --git a/R/FB.R b/R/FB.R
index 5d3116b..1023c80 100644
--- a/R/FB.R
+++ b/R/FB.R
@@ -6,9 +6,12 @@
 #' `Forward` implements the forward algorithm to advance the Li and Stephens rescaled hidden Markov model forward probabilities to a new target variant.
 #' Naturally, this can only propagate a table to variants downstream of its current position.
 #'
-#' For mathematical details please see Section 2 of the kalis paper (https://doi.org/10.1186/s12859-024-05688-8).
+#' For mathematical details please see Section 2 of the kalis paper (Aslett and Christ, 2024).
 #' Note that the precise formulation of the forward equation is determined by whether the flag `use.spiedel` is set in the parameters provided in `pars`.
 #'
+#' @references
+#' Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", *BMC Bioinformatics*, **25**(1). Available at: \doi{10.1186/s12859-024-05688-8}.
+#'
 #' @param fwd a `kalisForwardTable` object, as returned by
 #'   [MakeForwardTable()].
 #' @param pars a `kalisParameters` object, as returned by
@@ -111,7 +114,7 @@ Forward <- function(fwd,
 #' variant.
 #' Naturally, this can only propagate a table to variants upstream of its current position.
 #'
-#' For mathematical details please see Section 2 of the kalis paper (https://doi.org/10.1186/s12859-024-05688-8).
+#' For mathematical details please see Section 2 of the kalis paper (Aslett and Christ, 2024).
 #' Note that the precise formulation of the backward equation is determined by whether the flag `use.spiedel` is set in the parameters provided in `pars`.
 #'
 #' **Beta-theta space**
@@ -123,6 +126,8 @@ Forward <- function(fwd,
 #' A backward table in beta-theta space (with `beta.theta = TRUE`) can be propagated to an upstream variant without incorporating that variant, thereby moving to beta space (`beta.theta = FALSE`), and vice versa.
 #' However, while a backward table in beta space (`beta.theta = FALSE`) can be updated to incorporate the current variant, a backward table that is already in beta-theta space can not move to beta space without changing variants -- that would involve "forgetting" the current variant (see Examples).
 #'
+#' @references
+#' Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", *BMC Bioinformatics*, **25**(1). Available at: \doi{10.1186/s12859-024-05688-8}.
 #'
 #' @param bck a `kalisBackwardTable` object, as returned by
 #'   [MakeBackwardTable()].
diff --git a/man/Backward.Rd b/man/Backward.Rd
index 7cc3256..021e524 100644
--- a/man/Backward.Rd
+++ b/man/Backward.Rd
@@ -45,7 +45,7 @@ The table is updated in-place.
 variant.
 Naturally, this can only propagate a table to variants upstream of its current position.
 
-For mathematical details please see Section 2 of the kalis paper (https://doi.org/10.1186/s12859-024-05688-8).
+For mathematical details please see Section 2 of the kalis paper (Aslett and Christ, 2024).
 Note that the precise formulation of the backward equation is determined by whether the flag \code{use.spiedel} is set in the parameters provided in \code{pars}.
 
 \strong{Beta-theta space}
@@ -99,6 +99,9 @@ bck
 try(Backward(bck, pars, 125, beta.theta = FALSE))
 bck
 
+}
+\references{
+Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", \emph{BMC Bioinformatics}, \strong{25}(1). Available at: \doi{10.1186/s12859-024-05688-8}.
 }
 \seealso{
 \code{\link[=MakeBackwardTable]{MakeBackwardTable()}} to generate a backward table;
diff --git a/man/CalcTraces.Rd b/man/CalcTraces.Rd
index db508ef..cf45ffe 100644
--- a/man/CalcTraces.Rd
+++ b/man/CalcTraces.Rd
@@ -22,19 +22,25 @@ CalcTraces(
 
 \item{J}{\code{crossprod(Q, M)}}
 
-\item{from_recipient}{haplotype index at which to start trace calculation -- useful for distributed computation (experimental feature, more documentation to come TODO)}
+\item{from_recipient}{haplotype index at which to start trace calculation --- useful for distributed computation (experimental feature, more documentation to come\if{html}{\out{<!-- TODO -->}})}
 
 \item{nthreads}{the number of CPU cores to use.
 By default uses the \code{parallel} package to detect the number of physical cores.}
 }
 \value{
-a list containing three elements, the first is the trace \code{tr(PMP)}, the second is the \emph{squared} Hilbert Schmidt Norm of PMP \verb{tr((PMP)'PMP)}, the third is the diag of \code{PMP}.
+A list containing three elements:
+
+\describe{
+\item{\code{trace}}{the trace, \eqn{\mathrm{tr}(PMP)};}
+\item{\code{hsnorm2}}{the \emph{squared} Hilbert Schmidt Norm of \eqn{PMP}, \eqn{\mathrm{tr}((PMP)'PMP)};}
+\item{\code{diag}}{the diagonal of \eqn{PMP}.}
+}
 }
 \description{
-Provides multithreaded calculation of trace and Hilbert Schmidt Norm of a matrix PMP (where P is a projection matrix) without explicitly forming PMP.
+Provides multithreaded calculation of trace and Hilbert Schmidt Norm of a matrix \eqn{PMP} (where \eqn{P} is a projection matrix and \eqn{M} is real symmetric) without explicitly forming \eqn{PMP}.
 }
 \details{
-P here is assumed to have the form I-QQ' for some matrix Q of orthogonal columns
+\eqn{P} here is assumed to have the form \eqn{I-QQ'} for some matrix \eqn{Q} with orthonormal columns.
 }
 \examples{
 # TODO
diff --git a/man/CladeMat.Rd b/man/CladeMat.Rd
index 70836af..1d7eee6 100644
--- a/man/CladeMat.Rd
+++ b/man/CladeMat.Rd
@@ -25,17 +25,20 @@ This table must be at the same variant location as argument \code{fwd}.}
 \item{M}{a matrix with half the number of rows and columns as the corresponding forward/backward tables.
 This matrix is overwritten in place with the clade matrix result for performance reasons.}
 
-\item{unit.dist}{the change in distance that is expected to correspond to a single mutation (typically \eqn{-log(\mu)}) for the LS model)}
+\item{unit.dist}{the change in distance that is expected to correspond to a single mutation (typically \eqn{-\log(\mu)} for the LS model)}
 
-\item{thresh}{a regularization parameter: differences distances must exceed this threshold (in \code{unit.dist} units) in order to used in forming the local relatedness matrix. Defaults to \code{0.2}.}
+\item{thresh}{a regularization parameter: \if{html}{\out{<!-- TODO: can't parse this sentence -->}} differences in distances must exceed this threshold (in \code{unit.dist} units) in order to be used in forming the local relatedness matrix.
+Defaults to \code{0.2}.}
 
-\item{max1var}{a logical regularization parameter. When TRUE, differences in distances exceeding 1 \code{unit.dist} are set to 1 (so that any edge in the latent ancestral tree with multiple mutations on them are treated as if only one mutation was on it).}
+\item{max1var}{a logical regularization parameter.
+When \code{TRUE}, differences in distances exceeding 1 \code{unit.dist} are set to 1 (so that any edge in the latent ancestral tree with multiple mutations on it is treated as if only one mutation were on it).}
 
 \item{nthreads}{the number of CPU cores to use.
 By default uses the \code{parallel} package to detect the number of physical cores.}
 }
 \value{
-A list, the first element contains a list of tied nearest neighbors (one for each haplotype). Other elements return other information to allow for efficient removal of singletons and sprigs by \code{\link[=PruneCladeMat]{PruneCladeMat()}}.
+A list whose first element contains a list of tied nearest neighbours (one for each haplotype).
+Other elements of the returned list are for internal use by \code{\link[=PruneCladeMat]{PruneCladeMat()}} to allow for efficient removal of singletons and sprigs.
 }
 \description{
 Constructs a clade matrix using forward and backward tables.
diff --git a/man/Forward.Rd b/man/Forward.Rd
index aa6aad1..7784f31 100644
--- a/man/Forward.Rd
+++ b/man/Forward.Rd
@@ -40,7 +40,7 @@ The table is updated in-place.
 \code{Forward} implements the forward algorithm to advance the Li and Stephens rescaled hidden Markov model forward probabilities to a new target variant.
 Naturally, this can only propagate a table to variants downstream of its current position.
 
-For mathematical details please see Section 2 of the kalis paper (https://doi.org/10.1186/s12859-024-05688-8).
+For mathematical details please see Section 2 of the kalis paper (Aslett and Christ, 2024).
 Note that the precise formulation of the forward equation is determined by whether the flag \code{use.spiedel} is set in the parameters provided in \code{pars}.
 }
 \examples{
@@ -68,6 +68,9 @@ fwd
 Forward(fwd, pars, 50)
 fwd
 
+}
+\references{
+Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", \emph{BMC Bioinformatics}, \strong{25}(1). Available at: \doi{10.1186/s12859-024-05688-8}.
 }
 \seealso{
 \code{\link[=MakeForwardTable]{MakeForwardTable()}} to generate a forward table;

From 1ad8095a872fb4c166404540a4377be564cc3eb4 Mon Sep 17 00:00:00 2001
From: Louis Aslett <louis.aslett@durham.ac.uk>
Date: Wed, 13 Nov 2024 15:22:59 +0000
Subject: [PATCH 40/43] Fix pkgdown maths

---
 _pkgdown.yml | 7 ++++++-
 1 file changed, 6 insertions(+), 1 deletion(-)

diff --git a/_pkgdown.yml b/_pkgdown.yml
index 0199daf..fb165dd 100644
--- a/_pkgdown.yml
+++ b/_pkgdown.yml
@@ -1,11 +1,16 @@
 url: https://kalis.louisaslett.com/
 template:
   bootstrap: 5
-  bootswatch: spacelab
   bslib:
+    bootswatch: spacelab
     base_font: {google: "PT Serif"}
     heading_font: {google: "Roboto Slab"}
     code_font: {google: "JetBrains Mono"}
+  includes:
+    in_header: |
+      <link rel="stylesheet" href="https://cdn.jsdelivr.net/npm/katex@0.16.11/dist/katex.min.css" integrity="sha384-nB0miv6/jRmo5UMMR1wu3Gz6NLsoTkbqJghGIsx//Rlm+ZU03BU6SQNC66uf4l5+" crossorigin="anonymous">
+      <script defer src="https://cdn.jsdelivr.net/npm/katex@0.16.11/dist/katex.min.js" integrity="sha384-7zkQWkzuo3B5mTepMUcHkMB5jZaolc2xDwL6VFqjFALcbeS9Ggm/Yr2r3Dy4lfFg" crossorigin="anonymous"></script>
+      <script defer src="https://cdn.jsdelivr.net/npm/katex@0.16.11/dist/contrib/auto-render.min.js" integrity="sha384-43gviWU0YVjaDtb/GhzOouOXtZMP/7XUzwPTstBeZFe/+rCMvRwr4yROQP43s0Xk" crossorigin="anonymous" onload="renderMathInElement(document.body);"></script>
 navbar:
   structure:
     left: [reference,articles,paper]

From a9ed50a7ced217007b42a696f1832d7a3546ad46 Mon Sep 17 00:00:00 2001
From: Louis Aslett <louis.aslett@durham.ac.uk>
Date: Wed, 13 Nov 2024 15:48:03 +0000
Subject: [PATCH 41/43] Add kalis paper to all v1 functions and tidy other
 references in v1 function docs

---
 R/CacheHaplotypes.R             |  9 +++++++++
 R/CacheSummary.R                |  3 +++
 R/IndividualSequenceIO_H5.R     |  3 +++
 R/Parameters.R                  | 25 +++++++++++++------------
 R/Probs.R                       | 14 +++++++++++---
 R/SmallHaps-data.R              |  4 +++-
 R/TableMaker.R                  | 12 ++++++++++++
 man/CacheHaplotypes.Rd          |  3 +++
 man/CacheSummary.Rd             |  3 +++
 man/CalcRho.Rd                  |  8 +++++---
 man/ClearHaplotypeCache.Rd      |  3 +++
 man/CopyTable.Rd                |  3 +++
 man/DistMat.Rd                  |  4 +++-
 man/MakeBackwardTable.Rd        |  3 +++
 man/MakeForwardTable.Rd         |  3 +++
 man/Parameters.Rd               |  8 ++++----
 man/PostProbs.Rd                |  3 +++
 man/QueryCache.Rd               |  3 +++
 man/ResetTable.Rd               |  3 +++
 man/SmallHaps.Rd                |  4 +++-
 man/WriteHaplotypes.Rd          |  3 +++
 man/plot.kalisDistanceMatrix.Rd |  3 +++
 22 files changed, 102 insertions(+), 25 deletions(-)

diff --git a/R/CacheHaplotypes.R b/R/CacheHaplotypes.R
index dcc6b3c..fe5e967 100644
--- a/R/CacheHaplotypes.R
+++ b/R/CacheHaplotypes.R
@@ -48,6 +48,9 @@ assign("L", NA, envir = pkgVars) # must be integer
 #'
 #'
 #'
+#' @references
+#' Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", *BMC Bioinformatics*, **25**(1). Available at: \doi{10.1186/s12859-024-05688-8}.
+#'
 #' @param haps can be the name of a file from which the haplotypes are to be read, or can be an R matrix containing only 0/1s.
 #'   See Details section for supported file types.
 #' @param loci.idx an optional vector of indices specifying the variants to load into the cache, indexed from 1.
@@ -219,6 +222,9 @@ CacheHaplotypes.err <- function(err) {
 #' To achieve higher performance, kalis internally represents haplotypes in an efficient raw binary format in memory which cannot be directly viewed or manipulated in R.
 #' This function enables you to copy whole or partial views of haplotypes/variants out of this low-level format and into a standard R matrix of 0's and 1's.
 #'
+#' @references
+#' Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", *BMC Bioinformatics*, **25**(1). Available at: \doi{10.1186/s12859-024-05688-8}.
+#'
 #' @param loci.idx which variants to retrieve from the cache, specified as a (vector) index.
 #'   This enables specifying variants by offset in the order they were loaded into the cache (from 1 to the number of variants).
 #' @param hap.idx which haplotypes to retrieve from the cache, specified as a (vector) index.
@@ -295,6 +301,9 @@ QueryCache <- function(loci.idx = NULL, hap.idx = NULL) {
 #' In particular, this cache sits outside R's memory management and will never be garbage collected (unless R is quit or the package is unloaded).
 #' Therefore, this function is provided to enable freeing the memory used by this cache.
 #'
+#' @references
+#' Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", *BMC Bioinformatics*, **25**(1). Available at: \doi{10.1186/s12859-024-05688-8}.
+#'
 #' @return Nothing is returned.
 #'
 #' @seealso [CacheHaplotypes()] to create a haplotype cache;
diff --git a/R/CacheSummary.R b/R/CacheSummary.R
index 8c5b77a..c923096 100644
--- a/R/CacheSummary.R
+++ b/R/CacheSummary.R
@@ -1,5 +1,8 @@
 #' Retrieve information about the haplotype cache
 #'
+#' @references
+#' Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", *BMC Bioinformatics*, **25**(1). Available at: \doi{10.1186/s12859-024-05688-8}.
+#'
 #' @return
 #'   `CacheSummary()` prints information about the current state of the kalis cache.
 #'     Also invisibly returns a vector giving the dimensions of the cached haplotype data (num variants, num haplotypes), or `NULL` if the cache is empty.
diff --git a/R/IndividualSequenceIO_H5.R b/R/IndividualSequenceIO_H5.R
index ac3f74c..d6b593c 100644
--- a/R/IndividualSequenceIO_H5.R
+++ b/R/IndividualSequenceIO_H5.R
@@ -11,6 +11,9 @@
 #'
 #' Note that if `hdf5.file` exists but does not contain a dataset named `haps`, then `WriteHaplotypes` will simply create a `haps` dataset within the existing file.
 #'
+#' @references
+#' Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", *BMC Bioinformatics*, **25**(1). Available at: \doi{10.1186/s12859-024-05688-8}.
+#'
 #' @param hdf5.file the name of the file which the haplotypes are to be written to.
 #' @param haps a vector or a matrix where each column is a haplotype to be stored in the file `hdf5.file`.
 #' @param hap.ids a character vector naming haplotypes when writing, or which haplotypes are to be read.
diff --git a/R/Parameters.R b/R/Parameters.R
index 846ef91..187194e 100644
--- a/R/Parameters.R
+++ b/R/Parameters.R
@@ -6,11 +6,16 @@
 #'
 #' **NOTE:** the corresponding haplotype data *must* have already been inserted into the kalis cache by a call to [CacheHaplotypes()], since this function performs checks to confirm the dimensionality matches.
 #'
-#' TODO: add kalis paper cross ref.
 #' See page 3 in Supplemental Information for the original ChromoPainter paper (Lawson et al., 2012) for motivation behind our parameterisation, which is as follows:
 #'
 #' \deqn{\rho = 1 - \exp(-s \times cM^\gamma)}{\rho = 1 - exp(-s * cM^\gamma)}
 #'
+#' For a complete description, see the main kalis paper, Aslett and Christ (2024).
+#'
+#' @references
+#' Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", *BMC Bioinformatics*, **25**(1). Available at: \doi{10.1186/s12859-024-05688-8}.
+#'
+#' Lawson, D.J., Hellenthal, G., Myers, S.R. and Falush, D. (2012). "Inference of population structure using dense haplotype data", *PLoS Genetics*, **8**(1). Available at: \doi{10.1371/journal.pgen.1002453}.
 #'
 #' @param cM a vector specifying the recombination distance between variants in centimorgans.
 #'   Note element i of this vector should be the distance between variants `i` and `i+1` (not `i` and `i-1`), and thus length one less than the number of variants.
@@ -25,10 +30,6 @@
 #'
 #' @seealso [Parameters()] to use the resulting recombination probabilities to construct a `kalisParameters` object.
 #'
-#' @references
-#'   Lawson, D. J., Hellenthal, G., Myers, S., & Falush, D. (2012). Inference of
-#'   population structure using dense haplotype data. *PLoS genetics*, **8**(1).
-#'
 #' @examples
 #' # Load the mini example data and recombination map from the package built-in #' # dataset
 #' data("SmallHaps")
@@ -119,6 +120,13 @@ CalcRho <- function(cM = 0, s = 1, gamma = 1, floor = TRUE) {
 #'
 #' Note that there is a computational cost associated with non-uniform copying probabilities, so it is recommended to leave the default of uniform probabilities when appropriate (**Note:** *do not* specify a uniform matrix when uniform probabilities are intended, since this would end up incurring the computational cost of non-uniform probabilities).
 #'
+#' @references
+#' Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", *BMC Bioinformatics*, **25**(1). Available at: \doi{10.1186/s12859-024-05688-8}.
+#'
+#' Lawson, D.J., Hellenthal, G., Myers, S.R. and Falush, D. (2012). "Inference of population structure using dense haplotype data", *PLoS Genetics*, **8**(1). Available at: \doi{10.1371/journal.pgen.1002453}.
+#'
+#' Speidel, L., Forest, M., Shi, S. and Myers, S.R. (2019). "A method for genome-wide genealogy estimation for thousands of samples", *Nature Genetics*, **51**, p. 1321-1329. Available at: \doi{10.1038/s41588-019-0484-x}.
+#'
 #' @param rho recombination probability vector (must be \eqn{L-1} long).
 #'   See [CalcRho()] for assistance constructing this from a recombination
 #'   map/distances.
@@ -140,13 +148,6 @@ CalcRho <- function(cM = 0, s = 1, gamma = 1, floor = TRUE) {
 #' @seealso [MakeForwardTable()] and [MakeBackwardTable()] which construct table objects which internally reference a parameters environment;
 #'   [Forward()] and [Backward()] which propagate those tables according to the Li and Stephens model.
 #'
-#' @references
-#'   Lawson, D. J., Hellenthal, G., Myers, S., & Falush, D. (2012). Inference of
-#'   population structure using dense haplotype data. *PLoS genetics*, **8**(1).
-#'
-#'   Speidel, L., Forest, M., Shi, S., & Myers, S. (2019). A method for
-#'   genome-wide genealogy estimation for thousands of samples. *Nature Genetics*, **51**(1321–1329).
-#'
 #' @examples
 #' # Load the mini example data and recombination map from the package built-in #' # dataset
 #' data("SmallHaps")
diff --git a/R/Probs.R b/R/Probs.R
index a97303e..77f6024 100644
--- a/R/Probs.R
+++ b/R/Probs.R
@@ -43,6 +43,9 @@
 #' Typically, that is simply \eqn{N \times N}{N x N} for \eqn{N} haplotypes.
 #' However, if kalis is being run in a distributed manner, `M` will be a \eqn{N \times R}{N x R} matrix where \eqn{R} is the number of recipient haplotypes on the current machine.
 #'
+#' @references
+#' Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", *BMC Bioinformatics*, **25**(1). Available at: \doi{10.1186/s12859-024-05688-8}.
+#'
 #' @param fwd a forward table as returned by [MakeForwardTable()] and propagated to a target variant by [Forward()].
 #'   Must be at the same variant as `bck` (unless `bck` is in "beta-theta space" in which case if must be downstream ... see [Backward()] for details).
 #' @param bck a backward table as returned by [MakeBackwardTable()] and propagated to a target variant by [Backward()].
@@ -164,6 +167,11 @@ PostProbs <- function(fwd, bck, unif.on.underflow = FALSE, M = NULL, beta.theta.
 #' Typically, that is simply \eqn{N \times N}{N x N} for \eqn{N} haplotypes.
 #' However, if kalis is being run in a distributed manner, `M` will be a \eqn{N \times R}{N x R} matrix where \eqn{R} is the number of recipient haplotypes on the current machine.
 #'
+#' @references
+#' Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", *BMC Bioinformatics*, **25**(1). Available at: \doi{10.1186/s12859-024-05688-8}.
+#'
+#' Speidel, L., Forest, M., Shi, S. and Myers, S.R. (2019). "A method for genome-wide genealogy estimation for thousands of samples", *Nature Genetics*, **51**, p. 1321-1329. Available at: \doi{10.1038/s41588-019-0484-x}.
+#'
 #' @param fwd a forward table as returned by [MakeForwardTable()] and propagated to a target variant by [Forward()].
 #'   Must be at the same variant as `bck` (unless `bck` is in "beta-theta space" in which case if must be downstream ... see [Backward()] for details).
 #' @param bck a backward table as returned by [MakeBackwardTable()] and propagated to a target variant by [Backward()].
@@ -184,9 +192,6 @@ PostProbs <- function(fwd, bck, unif.on.underflow = FALSE, M = NULL, beta.theta.
 #'
 #'   If you wish to plot this matrix or perform clustering, you may want to symmetrize the matrix first.
 #'
-#' @references
-#'   Speidel, L., Forest, M., Shi, S., & Myers, S. (2019). A method for genome-wide genealogy estimation for thousands of samples. *Nature Genetics*, **51**(1321–1329).
-#'
 #' @seealso
 #'   [PostProbs()] to calculate the posterior marginal probabilities \eqn{p_{ji}}{p_(j,i)};
 #'   [Forward()] to propagate a Forward table to a new variant;
@@ -319,6 +324,9 @@ input_checks_for_probs_and_dist_mat <-  function(fwd,bck,beta.theta.opts = NULL)
 #'
 #' Clusters the given distance matrix and generates a heatmap to display it.
 #'
+#' @references
+#' Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", *BMC Bioinformatics*, **25**(1). Available at: \doi{10.1186/s12859-024-05688-8}.
+#'
 #' @param x
 #'        a distance matrix, such as returned by [DistMat()].
 #' @param cluster.method
diff --git a/R/SmallHaps-data.R b/R/SmallHaps-data.R
index 26dfcfa..fe57838 100644
--- a/R/SmallHaps-data.R
+++ b/R/SmallHaps-data.R
@@ -14,7 +14,9 @@
 #' @keywords datasets
 #'
 #' @references
-#'   Kelleher, J., Etheridge, A. M., & McVean, G. (2016). Efficient coalescent simulation and genealogical analysis for large sample sizes. *PLoS computational biology*, **12**(5).
+#' Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", *BMC Bioinformatics*, **25**(1). Available at: \doi{10.1186/s12859-024-05688-8}.
+#'
+#' Kelleher, J., Etheridge, A.M. and McVean, G. (2016) "Efficient coalescent simulation and genealogical analysis for large sample sizes", *PLoS Computational Biology*, **12**(5). Available at: \doi{10.1371/journal.pcbi.1004842}.
 #'
 #' @examples
 #' data("SmallHaps")
diff --git a/R/TableMaker.R b/R/TableMaker.R
index 8792c21..b5fc56c 100644
--- a/R/TableMaker.R
+++ b/R/TableMaker.R
@@ -10,6 +10,9 @@
 #'
 #' Since each column corresponds to an independent Li and Stephens hidden Markov model (ie for each recipient), it is possible to create a partial forward table object which corresponds to a subset of recipients using the `from_recipient` and `to_recipient` arguments.
 #'
+#' @references
+#' Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", *BMC Bioinformatics*, **25**(1). Available at: \doi{10.1186/s12859-024-05688-8}.
+#'
 #' @param pars a `kalisParameters` object specifying the genetics parameters to be associated with this forward table.
 #'   These parameters can be set up by using the [Parameters()] function.
 #' @param from_recipient first recipient haplotype included if creating a partial forward table.
@@ -130,6 +133,9 @@ print.kalisForwardTable <- function(x, ...) {
 #'
 #' Since each column corresponds to an independent Li and Stephens hidden Markov model (ie for each recipient), it is possible to create a partial backward table object which corresponds to a subset of recipients using the `from_recipient` and `to_recipient` arguments.
 #'
+#' @references
+#' Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", *BMC Bioinformatics*, **25**(1). Available at: \doi{10.1186/s12859-024-05688-8}.
+#'
 #' @param pars a `kalisParameters` object specifying the genetics parameters to be associated with this backward table.
 #'   These parameters can be set up by using the [Parameters()] function.
 #' @param from_recipient first recipient haplotype included if creating a partial backward table.
@@ -249,6 +255,9 @@ print.kalisBackwardTable <- function(x, ...) {
 #'
 #' This function is therefore designed to enable explicit copying of tables.
 #'
+#' @references
+#' Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", *BMC Bioinformatics*, **25**(1). Available at: \doi{10.1186/s12859-024-05688-8}.
+#'
 #' @param to a `kalisForwardTable` or `kalisBackwardTable` object which is to be copied into.
 #' @param from a `kalisForwardTable` or `kalisBackwardTable` object which is to be copied from.
 #'
@@ -340,6 +349,9 @@ CopyTable <- function(to, from) {
 #' It is *much* faster to reset a forward/backward table rather than remove and make a new one.
 #' This function marks a table as reset so that it will be propagated as if freshly allocated.
 #'
+#' @references
+#' Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", *BMC Bioinformatics*, **25**(1). Available at: \doi{10.1186/s12859-024-05688-8}.
+#'
 #' @param tbl a `kalisForwardTable` or `kalisBackwardTable` object
 #'   which is to be reset.
 #'
diff --git a/man/CacheHaplotypes.Rd b/man/CacheHaplotypes.Rd
index b22bed1..98f5f69 100644
--- a/man/CacheHaplotypes.Rd
+++ b/man/CacheHaplotypes.Rd
@@ -143,6 +143,9 @@ CacheHaplotypes(haps)
 data("SmallHaps")
 CacheHaplotypes(SmallHaps)
 
+}
+\references{
+Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", \emph{BMC Bioinformatics}, \strong{25}(1). Available at: \doi{10.1186/s12859-024-05688-8}.
 }
 \seealso{
 \code{\link[=CacheSummary]{CacheSummary()}} for a list detailing the current cache status;
diff --git a/man/CacheSummary.Rd b/man/CacheSummary.Rd
index d53cddd..da7a847 100644
--- a/man/CacheSummary.Rd
+++ b/man/CacheSummary.Rd
@@ -40,3 +40,6 @@ N()
 L()
 
 }
+\references{
+Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", \emph{BMC Bioinformatics}, \strong{25}(1). Available at: \doi{10.1186/s12859-024-05688-8}.
+}
diff --git a/man/CalcRho.Rd b/man/CalcRho.Rd
index 3f87fbd..4714f4b 100644
--- a/man/CalcRho.Rd
+++ b/man/CalcRho.Rd
@@ -30,10 +30,11 @@ This is a utility function to calculate the recombination probabilities rho (the
 
 \strong{NOTE:} the corresponding haplotype data \emph{must} have already been inserted into the kalis cache by a call to \code{\link[=CacheHaplotypes]{CacheHaplotypes()}}, since this function performs checks to confirm the dimensionality matches.
 
-TODO: add kalis paper cross ref.
 See page 3 in Supplemental Information for the original ChromoPainter paper (Lawson et al., 2012) for motivation behind our parameterisation, which is as follows:
 
 \deqn{\rho = 1 - \exp(-s \times cM^\gamma)}{\rho = 1 - exp(-s * cM^\gamma)}
+
+For a complete description, see the main kalis paper, Aslett and Christ (2024).
 }
 \examples{
 # Load the mini example data and recombination map from the package built-in #' # dataset
@@ -49,8 +50,9 @@ rho
 
 }
 \references{
-Lawson, D. J., Hellenthal, G., Myers, S., & Falush, D. (2012). Inference of
-population structure using dense haplotype data. \emph{PLoS genetics}, \strong{8}(1).
+Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", \emph{BMC Bioinformatics}, \strong{25}(1). Available at: \doi{10.1186/s12859-024-05688-8}.
+
+Lawson, D.J., Hellenthal, G., Myers, S.R. and Falush, D. (2012). "Inference of population structure using dense haplotype data", \emph{PLoS Genetics}, \strong{8}(1). Available at: \doi{10.1371/journal.pgen.1002453}.
 }
 \seealso{
 \code{\link[=Parameters]{Parameters()}} to use the resulting recombination probabilities to construct a \code{kalisParameters} object.
diff --git a/man/ClearHaplotypeCache.Rd b/man/ClearHaplotypeCache.Rd
index 7afce6c..9e832b5 100644
--- a/man/ClearHaplotypeCache.Rd
+++ b/man/ClearHaplotypeCache.Rd
@@ -31,6 +31,9 @@ ClearHaplotypeCache()
 # Verify it is gone
 CacheSummary()
 
+}
+\references{
+Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", \emph{BMC Bioinformatics}, \strong{25}(1). Available at: \doi{10.1186/s12859-024-05688-8}.
 }
 \seealso{
 \code{\link[=CacheHaplotypes]{CacheHaplotypes()}} to create a haplotype cache;
diff --git a/man/CopyTable.Rd b/man/CopyTable.Rd
index 1020f2f..a8d044d 100644
--- a/man/CopyTable.Rd
+++ b/man/CopyTable.Rd
@@ -61,6 +61,9 @@ Forward(fwd, pars, 30)
 fwd
 fwd2
 
+}
+\references{
+Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", \emph{BMC Bioinformatics}, \strong{25}(1). Available at: \doi{10.1186/s12859-024-05688-8}.
 }
 \seealso{
 \code{\link[=MakeForwardTable]{MakeForwardTable()}}, \code{\link[=MakeBackwardTable]{MakeBackwardTable()}} to create tables which can be copied into.
diff --git a/man/DistMat.Rd b/man/DistMat.Rd
index ffe3e6c..cf38ad3 100644
--- a/man/DistMat.Rd
+++ b/man/DistMat.Rd
@@ -129,7 +129,9 @@ plot(d)
 
 }
 \references{
-Speidel, L., Forest, M., Shi, S., & Myers, S. (2019). A method for genome-wide genealogy estimation for thousands of samples. \emph{Nature Genetics}, \strong{51}(1321–1329).
+Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", \emph{BMC Bioinformatics}, \strong{25}(1). Available at: \doi{10.1186/s12859-024-05688-8}.
+
+Speidel, L., Forest, M., Shi, S. and Myers, S.R. (2019). "A method for genome-wide genealogy estimation for thousands of samples", \emph{Nature Genetics}, \strong{51}, p. 1321-1329. Available at: \doi{10.1038/s41588-019-0484-x}.
 }
 \seealso{
 \code{\link[=PostProbs]{PostProbs()}} to calculate the posterior marginal probabilities \eqn{p_{ji}}{p_(j,i)};
diff --git a/man/MakeBackwardTable.Rd b/man/MakeBackwardTable.Rd
index 5b78dcb..4718432 100644
--- a/man/MakeBackwardTable.Rd
+++ b/man/MakeBackwardTable.Rd
@@ -62,6 +62,9 @@ bck
 
 # Now ready to run the HMM backward recursions with Backward() ...
 
+}
+\references{
+Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", \emph{BMC Bioinformatics}, \strong{25}(1). Available at: \doi{10.1186/s12859-024-05688-8}.
 }
 \seealso{
 \code{\link[=Backward]{Backward()}} to propagate the newly created \code{kalisBackwardTable};
diff --git a/man/MakeForwardTable.Rd b/man/MakeForwardTable.Rd
index a93c354..9e60ee9 100644
--- a/man/MakeForwardTable.Rd
+++ b/man/MakeForwardTable.Rd
@@ -61,6 +61,9 @@ fwd
 
 # Now ready to run the HMM forward recursions with Forward() ...
 
+}
+\references{
+Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", \emph{BMC Bioinformatics}, \strong{25}(1). Available at: \doi{10.1186/s12859-024-05688-8}.
 }
 \seealso{
 \code{\link[=Forward]{Forward()}} to propagate the newly created \code{kalisForwardTable};
diff --git a/man/Parameters.Rd b/man/Parameters.Rd
index 0b14657..f34bdf7 100644
--- a/man/Parameters.Rd
+++ b/man/Parameters.Rd
@@ -98,11 +98,11 @@ fwd
 
 }
 \references{
-Lawson, D. J., Hellenthal, G., Myers, S., & Falush, D. (2012). Inference of
-population structure using dense haplotype data. \emph{PLoS genetics}, \strong{8}(1).
+Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", \emph{BMC Bioinformatics}, \strong{25}(1). Available at: \doi{10.1186/s12859-024-05688-8}.
 
-Speidel, L., Forest, M., Shi, S., & Myers, S. (2019). A method for
-genome-wide genealogy estimation for thousands of samples. \emph{Nature Genetics}, \strong{51}(1321–1329).
+Lawson, D.J., Hellenthal, G., Myers, S.R. and Falush, D. (2012). "Inference of population structure using dense haplotype data", \emph{PLoS Genetics}, \strong{8}(1). Available at: \doi{10.1371/journal.pgen.1002453}.
+
+Speidel, L., Forest, M., Shi, S. and Myers, S.R. (2019). "A method for genome-wide genealogy estimation for thousands of samples", \emph{Nature Genetics}, \strong{51}, p. 1321-1329. Available at: \doi{10.1038/s41588-019-0484-x}.
 }
 \seealso{
 \code{\link[=MakeForwardTable]{MakeForwardTable()}} and \code{\link[=MakeBackwardTable]{MakeBackwardTable()}} which construct table objects which internally reference a parameters environment;
diff --git a/man/PostProbs.Rd b/man/PostProbs.Rd
index 389927a..8b15103 100644
--- a/man/PostProbs.Rd
+++ b/man/PostProbs.Rd
@@ -104,6 +104,9 @@ Backward(bck, pars, 100)
 p <- PostProbs(fwd, bck)
 d <- DistMat(fwd, bck)
 
+}
+\references{
+Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", \emph{BMC Bioinformatics}, \strong{25}(1). Available at: \doi{10.1186/s12859-024-05688-8}.
 }
 \seealso{
 \code{\link[=DistMat]{DistMat()}} to generate calculate \eqn{d_{ji}}{d_(j,i)} distances directly;
diff --git a/man/QueryCache.Rd b/man/QueryCache.Rd
index dc5de1d..67621a1 100644
--- a/man/QueryCache.Rd
+++ b/man/QueryCache.Rd
@@ -36,6 +36,9 @@ CacheHaplotypes(haps)
 res <- QueryCache(50:150, 10:11)
 all(res == haps[50:150, 10:11])
 
+}
+\references{
+Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", \emph{BMC Bioinformatics}, \strong{25}(1). Available at: \doi{10.1186/s12859-024-05688-8}.
 }
 \seealso{
 \code{\link[=CacheHaplotypes]{CacheHaplotypes()}} to fill the memory cache with haplotype data.
diff --git a/man/ResetTable.Rd b/man/ResetTable.Rd
index 9797a48..024ef5c 100644
--- a/man/ResetTable.Rd
+++ b/man/ResetTable.Rd
@@ -42,6 +42,9 @@ ResetTable(fwd)
 Forward(fwd, pars, 5)
 fwd
 
+}
+\references{
+Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", \emph{BMC Bioinformatics}, \strong{25}(1). Available at: \doi{10.1186/s12859-024-05688-8}.
 }
 \seealso{
 \code{\link[=MakeForwardTable]{MakeForwardTable()}}, \code{\link[=MakeBackwardTable]{MakeBackwardTable()}} to create fresh tables.
diff --git a/man/SmallHaps.Rd b/man/SmallHaps.Rd
index 6ff1916..5b540b1 100644
--- a/man/SmallHaps.Rd
+++ b/man/SmallHaps.Rd
@@ -40,6 +40,8 @@ pars
 
 }
 \references{
-Kelleher, J., Etheridge, A. M., & McVean, G. (2016). Efficient coalescent simulation and genealogical analysis for large sample sizes. \emph{PLoS computational biology}, \strong{12}(5).
+Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", \emph{BMC Bioinformatics}, \strong{25}(1). Available at: \doi{10.1186/s12859-024-05688-8}.
+
+Kelleher, J., Etheridge, A.M. and McVean, G. (2016) "Efficient coalescent simulation and genealogical analysis for large sample sizes", \emph{PLoS Computational Biology}, \strong{12}(5). Available at: \doi{10.1371/journal.pcbi.1004842}.
 }
 \keyword{datasets}
diff --git a/man/WriteHaplotypes.Rd b/man/WriteHaplotypes.Rd
index 5d2d0fe..a27eed8 100644
--- a/man/WriteHaplotypes.Rd
+++ b/man/WriteHaplotypes.Rd
@@ -94,6 +94,9 @@ CacheHaplotypes("~/myhaps.h5")
 all(haps == QueryCache())
 }
 
+}
+\references{
+Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", \emph{BMC Bioinformatics}, \strong{25}(1). Available at: \doi{10.1186/s12859-024-05688-8}.
 }
 \seealso{
 \code{\link[=CacheHaplotypes]{CacheHaplotypes()}} to fill the kalis cache with haplotypes.
diff --git a/man/plot.kalisDistanceMatrix.Rd b/man/plot.kalisDistanceMatrix.Rd
index 5246eb4..9ca8ec3 100644
--- a/man/plot.kalisDistanceMatrix.Rd
+++ b/man/plot.kalisDistanceMatrix.Rd
@@ -24,3 +24,6 @@ Clusters the given distance matrix and generates a heatmap to display it.
 # TODO
 
 }
+\references{
+Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", \emph{BMC Bioinformatics}, \strong{25}(1). Available at: \doi{10.1186/s12859-024-05688-8}.
+}

From 13dbdc4eb143fcb40a6c51cf393c3e433b60d5b0 Mon Sep 17 00:00:00 2001
From: Louis Aslett <louis.aslett@durham.ac.uk>
Date: Wed, 13 Nov 2024 17:19:28 +0000
Subject: [PATCH 42/43] Documentation and exported function review by Ryan
 (pushed by me)

---
 DESCRIPTION                 |   6 +-
 NAMESPACE                   |   7 +-
 R/CladeMat.R                |   2 +-
 R/Clades.R                  | 635 ++++++++++++++++++------------------
 R/Iterator.R                |  44 ++-
 man/CalcCheckpointTables.Rd |  28 ++
 man/CladeMat.Rd             |   2 +-
 man/CladeMat_old.Rd         |  36 --
 man/Clades.Rd               |  57 ----
 man/ForwardIterator.Rd      |  19 +-
 man/Neighbors.Rd            |  21 --
 man/PruneCladeMat.Rd        |  23 +-
 man/Sprigs.Rd               |  17 +-
 man/Sprigs_old.Rd           |  21 --
 14 files changed, 419 insertions(+), 499 deletions(-)
 create mode 100644 man/CalcCheckpointTables.Rd
 delete mode 100644 man/CladeMat_old.Rd
 delete mode 100644 man/Clades.Rd
 delete mode 100644 man/Neighbors.Rd
 delete mode 100644 man/Sprigs_old.Rd

diff --git a/DESCRIPTION b/DESCRIPTION
index de10ad6..9ccd4fc 100644
--- a/DESCRIPTION
+++ b/DESCRIPTION
@@ -39,8 +39,7 @@ Imports:
     grDevices,
     RColorBrewer,
     lobstr,
-    prettyunits,
-    data.table
+    prettyunits
 RoxygenNote: 7.3.2
 Roxygen: list(markdown = TRUE)
 Suggests: 
@@ -51,7 +50,8 @@ Suggests:
     rmarkdown,
     fastcluster,
     lattice,
-    testthat (>= 3.0.0)
+    testthat (>= 3.0.0),
+    data.table
 VignetteBuilder: knitr
 Encoding: UTF-8
 Config/testthat/edition: 3
diff --git a/NAMESPACE b/NAMESPACE
index f280572..9b46aee 100644
--- a/NAMESPACE
+++ b/NAMESPACE
@@ -11,11 +11,10 @@ S3method(targets,kalisIterator)
 export(Backward)
 export(CacheHaplotypes)
 export(CacheSummary)
+export(CalcCheckpointTables)
 export(CalcRho)
 export(CalcTraces)
 export(CladeMat)
-export(CladeMat_old)
-export(Clades)
 export(ClearHaplotypeCache)
 export(CopyTable)
 export(CreateForwardTableCache)
@@ -28,7 +27,6 @@ export(L)
 export(MakeBackwardTable)
 export(MakeForwardTable)
 export(N)
-export(Neighbors)
 export(Parameters)
 export(PostProbs)
 export(PruneCladeMat)
@@ -36,12 +34,9 @@ export(QueryCache)
 export(ReadHaplotypes)
 export(ResetTable)
 export(Sprigs)
-export(Sprigs_old)
 export(WriteHaplotypes)
-export(calc_tables)
 import(checkmate)
 import(dplyr)
-importFrom(data.table,frank)
 importFrom(digest,digest)
 importFrom(glue,glue)
 importFrom(glue,glue_collapse)
diff --git a/R/CladeMat.R b/R/CladeMat.R
index d00d4b6..9af70ed 100644
--- a/R/CladeMat.R
+++ b/R/CladeMat.R
@@ -20,7 +20,7 @@
 #' @param unit.dist
 #'        the change in distance that is expected to correspond to a single mutation (typically \eqn{-\log(\mu)}) for the LS model)
 #' @param thresh
-#'        a regularization parameter: <!-- TODO: can't parse this sentence --> differences distances must exceed this threshold (in `unit.dist` units) in order to used in forming the local relatedness matrix.
+#'        a regularization parameter: differences of distances must exceed this threshold (in `unit.dist` units) in order to cause the introduction of a probabilistic clade.
 #'        Defaults to `0.2`.
 #' @param max1var
 #'        a logical regularization parameter.
diff --git a/R/Clades.R b/R/Clades.R
index 46d3b1c..dc5612b 100644
--- a/R/Clades.R
+++ b/R/Clades.R
@@ -17,19 +17,24 @@ get_neigh_seq <- function(x, i, return.lengths = FALSE){
   }
 }
 
-#' Title TODO
+#' Greedy sprig calling based on nearest neighbourhoods
 #'
-#' Short Description TODO
+#' Infer sprigs (very small clades) within a local phylogeny based on one-directional nearest neighbourhoods assigned to each haplotype
 #'
-#' Long Description TODO
+#' Call maximal cliques within a directed graph where edges correspond to nearest neighbour relationships
 #'
 #' @param x
-#'        TODO
+#'        a list in which each entry is a nearest neighborhood of integers as returned by [CladeMat()]
 #' @param old.sprigs
-#'        TODO
+#'        If TRUE, use an earlier (undocumented) version of maximal clique calling, defaults to FALSE.
 #'
 #' @return
-#' TODO
+#' a list containing:
+#' \describe{
+#'   \item{`assignments`}{a vector of integers such that `assignments[i]` gives the sprig to which haplotype `i` belongs. `NA` if a haplotype was not assigned to a sprig.}
+#'   \item{`to.prune`}{a vector of logicals, `to.prune[i]==TRUE` when haplotype i has been assigned to a sprig}
+#'   \item{`num.sprigs`}{total number of sprigs called, equal to `max(assignments, na.rm = TRUE)`}
+#' }
 #'
 #' @examples
 #' # TODO
@@ -133,33 +138,33 @@ UpdateMatrixInPlace <- function(M,row.idx,col.idx,x){
 # test <- matrix(as.double(1:144),12,12)
 # UpdateMatrixInPlace(test,c(5,12,12),c(1,3,5),as.double(c(100,200,300)))
 
-#' Title TODO
+#' Prune called sprigs or singletons from inferred clade matrix
 #'
-#' Short Description TODO
-#'
-#' Long Description TODO
+#' Use haplotype nearest neighborhoods and other information returned by [CladeMat()] to efficiently remove structure corresponding to singletons or called sprigs from clade matrix 'M'
 #'
 #' @param M
-#'        TODO
+#'        clade matrix such as that updated by [CladeMat()]
 #' @param neigh
-#'        TODO
+#'        a list of nearest neighborhoods as returned by [CladeMat()]
 #' @param sprigs
-#'        TODO
+#'        a sprigs object as returned by [Sprigs()]
 #' @param prune
-#'        TODO
-#' @param from.recipient
-#'        TODO
+#'        a character indicating the type of information to be removed from the [CladeMat()]. See Details.
+#' @param from_recipient
+#'        haplotype index at which to start trace calculation --- useful for distributed computation (experimental feature, more documentation to come<!-- TODO -->)
 #'
 #' @return
-#' TODO
+#' There is nothing returned.
+#'
+#' **NOTE:** for performance reasons, `M` is updated in-place.
 #'
 #' @examples
 #' # TODO
 #'
 #' @export PruneCladeMat
-PruneCladeMat <- function(M, neigh, sprigs, prune = "singleton.info", from.recipient = 1L){
+PruneCladeMat <- function(M, neigh, sprigs, prune = "singleton.info", from_recipient = 1L){
 
-  if(!from.recipient%%2){stop("from.recipient must be odd and encode the index of the first recipient haplotype")}
+  if(!from_recipient%%2){stop("from_recipient must be odd and encode the index of the first recipient haplotype")}
 
   N.recipients <- 2 * ncol(M)
 
@@ -168,7 +173,7 @@ PruneCladeMat <- function(M, neigh, sprigs, prune = "singleton.info", from.recip
     v <- neigh[[2]][[2]] - neigh[[2]][[1]]
     v <- v[seq.int(1,N.recipients,2)] + v[seq.int(2,N.recipients,2)]
     UpdateMatrixInPlace(M,
-                        seq.int(from = (from.recipient+1L)/2L,length.out = ncol(M)),
+                        seq.int(from = (from_recipient+1L)/2L,length.out = ncol(M)),
                         seq.int(from = 1, to = ncol(M)),
                         v)
 
@@ -233,187 +238,179 @@ PruneCladeMat <- function(M, neigh, sprigs, prune = "singleton.info", from.recip
 
 
 
-
-#' Probabilistic Clades
-#'
-#' Utility for calling probabilistic clades at, in between, or excluding variants.
-#'
-#' TODO longer description
-#'
-#' @references
-#' Christ, R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies." bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
-#'
-#' @param fwd
-#'        a `kalisForwardTable` object, as returned by [MakeForwardTable()] and propagated to a target variant by [Forward()].
-#'        This table must be at the same variant location as argument `bck`.
-#' @param bck
-#'        a `kalisBackwardTable` object, as returned by [MakeBackwardTable()] and propagated to a target variant by [Backward()].
-#'        This table must be at the same variant location as argument `fwd`.
-#' @param pars
-#'        a `kalisParameters` object, as returned by [Parameters()].
-#' @param beta.theta.opts
-#'        a list; see Details in [DistMat()] documentation page.
-#' @param safety.checks
-#'        a logical, should safety checks be applied to the distances?
-#'        See [DistMat()].
-#' @param neighbors
-#'        a logical, should nearest neighbors be pre-calculated?
-#'        See [Neighbors()].
-#' @param use.forking
-#'        a logical, should forked processes be used?
-#' @param forking.chunk.size
-#'        TODO
-#' @param mc.preschedule
-#'        TODO
-#' @param nthreads
-#'        the number of CPU cores to use.
-#'        By default no parallelism is used.
-#'
-#' @return
-#'   a `kalisClades` object encoding probabilistic clade calls
-#'
-#' @importFrom data.table frank
-#' @export Clades
-Clades <- function(fwd, bck, pars, beta.theta.opts = NULL,
-                   safety.checks = FALSE, neighbors = FALSE,
-                   #use.bettermc = FALSE,
-                   use.forking = FALSE,
-                   forking.chunk.size = 100L,
-                   mc.preschedule = FALSE, # FALSE is more conservative of memory but means many new forked processes need to be launched so it's slower than TRUE
-                   nthreads = 1L){
-  # currently only outputs a list but should eventually also output a matrix of integers and an attribute list of clades
-
-  unit.mut.dist <- -log(pars$pars$mu)
-
-  M <- DistMat(fwd, bck, beta.theta.opts = beta.theta.opts, nthreads = nthreads)
-
-  if(safety.checks){
-    M[!is.finite(M)] <- 0
-    diag(M) <- NA_real_
-  }
-
-  rank_donors_func <- function(x, type="linear_20", neighbors = FALSE, mac.range = c(NA,NA)){
-    rank_donors_func_res <- as.list(1:length(x))
-    for(j in 1:length(x)){
-      d.ranks <- data.table::frank(M[,x[j]], na.last = FALSE, ties.method = "first")
-      phi <- c(diff(M[order(d.ranks),x[j]]),0)
-      phi[1] <- 0
-      phi <- phi / unit.mut.dist # an N-long vector
-      if(type == "linear_20"){
-        phi[phi > 1] <- 1
-        phi[phi < 0.2] <- 0
-      } else if(type == "step_80"){
-        phi[phi < 0.8] <- 0
-        phi[phi > 0] <- 1
-      }
-
-      if(!is.na(mac.range[1])){phi[1:mac.range[1]] <- 0}
-      if(!is.na(mac.range[2])){phi[mac.range[2]:nrow(fwd$alpha)] <- 0}
-
-      i <- which(phi!=0)
-
-      # compress phi
-      clades <- cbind(i,phi[i]) # if i = integer(0) (no clades called), clades will be a 0 x 2 matrix.
-      attr(d.ranks,"clades") <- clades
-
-      if(neighbors){
-        attr(d.ranks,"neighbors") <- if(nrow(clades)){
-          match(2:clades[1,1],d.ranks)
-        } else {
-          NA_integer_
-        }
-      }
-
-      rank_donors_func_res[[j]] <- d.ranks
-    }
-    rank_donors_func_res
-  }
-
-
-  chunks <- chunk_int(ncol(M), chunk.size = forking.chunk.size)
-
-  if(use.forking){
-    # if(use.bettermc){
-    #   rank.list <- bettermc::mclapply(chunks, rank_donors_func, neighbors = neighbors, mc.preschedule = mc.preschedule, mc.cores=nthreads, mc.share.copy = FALSE)
-    # } else {
-      rank.list <- parallel::mclapply(chunks, rank_donors_func, neighbors = neighbors, mc.preschedule = mc.preschedule, mc.cores=nthreads)
-    #}
-  } else {
-    rank.list <- lapply(chunks, rank_donors_func, neighbors = neighbors) # this matrix is ranked in each column, not scaled by Ne or Mu
-  }
-
-  rank.list <- unlist(rank.list,recursive = FALSE)
-
-  attr(rank.list,"from_recipient") <- fwd$from_recipient
-  attr(rank.list,"to_recipient")   <- fwd$to_recipient
-
-  class(rank.list) <- c("kalisClades","list") # rank.list is a list where each element is a vector of ranks with attributes clades
-
-  rank.list
-}
-
-
-#' Neighbors
-#'
-#' Utility for calling tied nearest neighbors for each recipient haplotype
-#' @param x a `kalisClades` object returned by [Clades()]
-#' @param use.forking a logical, should forked processes be used?
-#' @param nthreads the number of CPU cores to use. Currently, no parallelism is used.
-#' @return
-#'   a `kalisNeighbors` encoding the nearest neighbors for each recipient haplotype
-#'
-#' @export Neighbors
-Neighbors <- function(x,
-                      #use.bettermc = FALSE,
-                      use.forking = FALSE, nthreads = 1L){
-  # currently only supports list x but should support matrix x as well
-
-  if(!is.null(attr(x[[1]],"neighbors"))){
-
-    neighbors <- lapply(x,function(z){attr(z,"neighbors")})
-
-  } else {
-
-
-    call_neighbors <- function(z){
-      # x should be a vector of ranks with attribute "clades"
-      clades <- attr(z,"clades")
-      if(nrow(clades)){
-        match(2:clades[1,1],z)
-      } else {
-        NA_integer_
-      }
-    }
-
-    if(use.forking){
-      # if(use.bettermc){
-      #   neighbors <- bettermc::mclapply(x, call_neighbors, mc.cores = nthreads, mc.share.copy = FALSE)
-      # } else {
-        neighbors <- parallel::mclapply(x, call_neighbors, mc.cores = nthreads)
-      #}
-    } else {
-      neighbors <- lapply(x,call_neighbors)
-    }
-  }
-
-  attr(neighbors,"from_recipient") <- attr(x,"from_recipient")
-  attr(neighbors,"to_recipient")   <- attr(x,"to_recipient")
-  class(neighbors) <- c("kalisNeighbors","list")
-
-  neighbors
-}
+# Predecessor to CladeMat with some extra functionality, kept for future reference.
+# #' Probabilistic Clades
+# #'
+# #' Utility for calling probabilistic clades at, in between, or excluding variants.
+# #'
+# #' ...? longer description
+# #'
+# #' @references
+# #' Christ, R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies." bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
+# #'
+# #' @param fwd
+# #'        a `kalisForwardTable` object, as returned by [MakeForwardTable()] and propagated to a target variant by [Forward()].
+# #'        This table must be at the same variant location as argument `bck`.
+# #' @param bck
+# #'        a `kalisBackwardTable` object, as returned by [MakeBackwardTable()] and propagated to a target variant by [Backward()].
+# #'        This table must be at the same variant location as argument `fwd`.
+# #' @param pars
+# #'        a `kalisParameters` object, as returned by [Parameters()].
+# #' @param beta.theta.opts
+# #'        a list; see Details in [DistMat()] documentation page.
+# #' @param safety.checks
+# #'        a logical, should safety checks be applied to the distances?
+# #'        See [DistMat()].
+# #' @param neighbors
+# #'        a logical, should nearest neighbors be pre-calculated?
+# #'        See [Neighbors()].
+# #' @param use.forking
+# #'        a logical, should forked processes be used?
+# #' @param forking.chunk.size
+# #'        ...?
+# #' @param mc.preschedule
+# #'        ...?
+# #' @param nthreads
+# #'        the number of CPU cores to use.
+# #'        By default no parallelism is used.
+# #'
+# #' @return
+# #'   a `kalisClades` object encoding probabilistic clade calls
+# #'
+# #' @importFrom data.table frank
+# #' @export Clades
+# Clades <- function(fwd, bck, pars, beta.theta.opts = NULL,
+#                    safety.checks = FALSE, neighbors = FALSE,
+#                    #use.bettermc = FALSE,
+#                    use.forking = FALSE,
+#                    forking.chunk.size = 100L,
+#                    mc.preschedule = FALSE, # FALSE is more conservative of memory but means many new forked processes need to be launched so it's slower than TRUE
+#                    nthreads = 1L){
+#   # currently only outputs a list but should eventually also output a matrix of integers and an attribute list of clades
+#
+#   unit.mut.dist <- -log(pars$pars$mu)
+#
+#   M <- DistMat(fwd, bck, beta.theta.opts = beta.theta.opts, nthreads = nthreads)
+#
+#   if(safety.checks){
+#     M[!is.finite(M)] <- 0
+#     diag(M) <- NA_real_
+#   }
+#
+#   rank_donors_func <- function(x, type="linear_20", neighbors = FALSE, mac.range = c(NA,NA)){
+#     rank_donors_func_res <- as.list(1:length(x))
+#     for(j in 1:length(x)){
+#       d.ranks <- data.table::frank(M[,x[j]], na.last = FALSE, ties.method = "first")
+#       phi <- c(diff(M[order(d.ranks),x[j]]),0)
+#       phi[1] <- 0
+#       phi <- phi / unit.mut.dist # an N-long vector
+#       if(type == "linear_20"){
+#         phi[phi > 1] <- 1
+#         phi[phi < 0.2] <- 0
+#       } else if(type == "step_80"){
+#         phi[phi < 0.8] <- 0
+#         phi[phi > 0] <- 1
+#       }
+#
+#       if(!is.na(mac.range[1])){phi[1:mac.range[1]] <- 0}
+#       if(!is.na(mac.range[2])){phi[mac.range[2]:nrow(fwd$alpha)] <- 0}
+#
+#       i <- which(phi!=0)
+#
+#       # compress phi
+#       clades <- cbind(i,phi[i]) # if i = integer(0) (no clades called), clades will be a 0 x 2 matrix.
+#       attr(d.ranks,"clades") <- clades
+#
+#       if(neighbors){
+#         attr(d.ranks,"neighbors") <- if(nrow(clades)){
+#           match(2:clades[1,1],d.ranks)
+#         } else {
+#           NA_integer_
+#         }
+#       }
+#
+#       rank_donors_func_res[[j]] <- d.ranks
+#     }
+#     rank_donors_func_res
+#   }
+#
+#
+#   chunks <- chunk_int(ncol(M), chunk.size = forking.chunk.size)
+#
+#   if(use.forking){
+#     # if(use.bettermc){
+#     #   rank.list <- bettermc::mclapply(chunks, rank_donors_func, neighbors = neighbors, mc.preschedule = mc.preschedule, mc.cores=nthreads, mc.share.copy = FALSE)
+#     # } else {
+#       rank.list <- parallel::mclapply(chunks, rank_donors_func, neighbors = neighbors, mc.preschedule = mc.preschedule, mc.cores=nthreads)
+#     #}
+#   } else {
+#     rank.list <- lapply(chunks, rank_donors_func, neighbors = neighbors) # this matrix is ranked in each column, not scaled by Ne or Mu
+#   }
+#
+#   rank.list <- unlist(rank.list,recursive = FALSE)
+#
+#   attr(rank.list,"from_recipient") <- fwd$from_recipient
+#   attr(rank.list,"to_recipient")   <- fwd$to_recipient
+#
+#   class(rank.list) <- c("kalisClades","list") # rank.list is a list where each element is a vector of ranks with attributes clades
+#
+#   rank.list
+# }
+#
+#
+# #' Neighbors
+# #'
+# #' Utility for calling tied nearest neighbors for each recipient haplotype
+# #' @param x a `kalisClades` object returned by [Clades()]
+# #' @param use.forking a logical, should forked processes be used?
+# #' @param nthreads the number of CPU cores to use. Currently, no parallelism is used.
+# #' @return
+# #'   a `kalisNeighbors` encoding the nearest neighbors for each recipient haplotype
+# #'
+# #' @export Neighbors
+# Neighbors <- function(x,
+#                       #use.bettermc = FALSE,
+#                       use.forking = FALSE, nthreads = 1L){
+#   # currently only supports list x but should support matrix x as well
+#
+#   if(!is.null(attr(x[[1]],"neighbors"))){
+#
+#     neighbors <- lapply(x,function(z){attr(z,"neighbors")})
+#
+#   } else {
+#
+#
+#     call_neighbors <- function(z){
+#       # x should be a vector of ranks with attribute "clades"
+#       clades <- attr(z,"clades")
+#       if(nrow(clades)){
+#         match(2:clades[1,1],z)
+#       } else {
+#         NA_integer_
+#       }
+#     }
+#
+#     if(use.forking){
+#       # if(use.bettermc){
+#       #   neighbors <- bettermc::mclapply(x, call_neighbors, mc.cores = nthreads, mc.share.copy = FALSE)
+#       # } else {
+#         neighbors <- parallel::mclapply(x, call_neighbors, mc.cores = nthreads)
+#       #}
+#     } else {
+#       neighbors <- lapply(x,call_neighbors)
+#     }
+#   }
+#
+#   attr(neighbors,"from_recipient") <- attr(x,"from_recipient")
+#   attr(neighbors,"to_recipient")   <- attr(x,"to_recipient")
+#   class(neighbors) <- c("kalisNeighbors","list")
+#
+#   neighbors
+# }
 
 
-#' Sprigs
-#'
-#' Utility for calling sprigs from probabilistic clades
-#' @param x a `kalisNeighbors` object returned by [Neighbors()], a `kalisClades` object returned by [Clades()] with `neighbors = TRUE`, or a list
-#' @param use.forking a logical, should forked processes be used?
-#' @param nthreads the number of CPU cores to use. Currently, no parallelism is used.
-#' @return
-#'   a `kalisSprigs` object assigning each haplotype to a sprig
-#'
-#' @export Sprigs_old
+# Old sprigs and clademat have many ideas (including adjustments for pop structure)
+# that are not incorporated into new functions -- ideas to come back to
 Sprigs_old <- function(x, use.forking = FALSE, nthreads = 1L, add.self = TRUE){
 
   # this version of Sprigs still has a bit of randomness in it's sprig building between runs on the same input
@@ -493,126 +490,126 @@ Sprigs_old <- function(x, use.forking = FALSE, nthreads = 1L, add.self = TRUE){
   roster
 }
 
-#Testing Sprigs
-# kalis::Sprigs(list(
-#   1:2,
-#   1:2,
-#   3:7,
-#   1:10,
-#   1:10,
-#   1:10,
-#   5:11
-# ))
-
-#' CladeMat OLD
-#'
-#' Utility for contructing a probabilistic clade matrix
-#' @param x a `kalisClades` object returned by [Clades()]
-#' @param ploidy an integer, the ploidy of the organism
-#' @param sprigs.to.prune a `kalisSprigs` object returned by [Sprigs()] encoding sprigs that should be excluded from the matrix returned
-#' @param assemble a logical, if `FALSE` return the clade matrix as a list of columns rather than as a symmetrized matrix
-#' @param use.forking a logical, should forked processes be used?
-#' @param nthreads the number of CPU cores to use. Currently, no parallelism is used.
-#' @return
-#'   a matrix representation of the probabilistic clades provided
-#'
-#' @export CladeMat_old
-CladeMat_old <- function(x, ploidy = 2L, sprigs.to.prune = NULL, assemble = TRUE,
-                         #use.bettermc = FALSE,
-                         use.forking = FALSE, forking.chunk.size = 100L, mc.preschedule = FALSE, nthreads = 1L){
-
-  # prepare sprigs
-  if(is.null(sprigs.to.prune)){sprigs.to.prune <- integer()}
-  sl <- length(sprigs.to.prune)
-  if(sl){sprig.sizes <- tabulate(sprigs.to.prune)}
-
-  n.recipient.samples <- as.integer(length(x)/ploidy)
-
-  chunks <- chunk_int(n.recipient.samples, chunk.size = forking.chunk.size)
-
-  if(ploidy == 1){
-    omega_func <- function(s){
-      omega_func_res <- as.list(1:length(s))
-      for(j in 1:length(s)){
-
-        N <- length(x[[s[j]]])
-
-        idx <- attr(x[[s[j]]],"clades")[,1]
-        phi <- attr(x[[s[j]]],"clades")[,2]
-
-        # prune sprig
-        if(sl && !is.na(sprigs.to.prune[s[j]]) && length(idx) && sprig.sizes[sprigs.to.prune[s[j]]] == idx[1]){
-          idx <- idx[-1]
-          phi <- phi[-1]
-        }
-
-        # we know that phi[N] = 0, so there must always be a 0 appended
-        omega_func_res[[j]] <-  inverse.rle(list("values" =  c(rev(cumsum(rev(phi/idx))),0),
-                                                 "lengths" = diff(c(0,idx,N))))[x[[s[j]]]]
-
-      }
-      omega_func_res
-    }
-
-  } else if(ploidy == 2){
-
-    omega_func <- function(s){
-      omega_func_res <- as.list(1:length(s))
-      for(j in 1:length(s)){
-        N <- length(x[[s[j]]])
-
-        idx <- attr(x[[s[j]*2-1]],"clades")[,1]
-        phi <- attr(x[[s[j]*2-1]],"clades")[,2]
-
-        idx2 <- attr(x[[s[j]*2]],"clades")[,1]
-        phi2 <- attr(x[[s[j]*2]],"clades")[,2]
-
-
-        if(sl && !is.na(sprigs.to.prune[s[j]*2-1]) && length(idx) && sprig.sizes[sprigs.to.prune[s[j]*2-1]] == idx[1]){
-          idx <- idx[-1]
-          phi <- phi[-1]
-        }
-
-        if(sl && !is.na(sprigs.to.prune[s[j]*2]) && length(idx2) && sprig.sizes[sprigs.to.prune[s[j]*2]] == idx2[1]){
-          idx2 <- idx2[-1]
-          phi2 <- phi2[-1]
-        }
-
-        # we know that phi[N] = 0, so there must always be a 0 appended
-        w <- inverse.rle(list("values" =  c(rev(cumsum(rev(phi/idx))),0),
-                              "lengths" = diff(c(0,idx,N))))[x[[s[j]*2-1]]] +
-          inverse.rle(list("values" =  c(rev(cumsum(rev(phi2/idx2))),0),
-                           "lengths" = diff(c(0,idx2,N))))[x[[s[j]*2]]]
-
-        omega_func_res[[j]] <- w[seq(1,N,by=2)] + w[seq(2,N,by=2)]
-      }
-      omega_func_res
-    }
-
-  } else {
-    stop("Relatedness currently only supports ploidy  = 1 or 2")
-  }
-
-  # we don't simplify this list to a matrix at this stage to help preserve memory.
-  if(use.forking){
-    # if(use.bettermc){
-    #   res <- bettermc::mclapply(chunks, omega_func, mc.preschedule = mc.preschedule, mc.cores=nthreads, mc.share.copy = FALSE)
-    # } else {
-      res <- parallel::mclapply(chunks, omega_func, mc.preschedule = mc.preschedule, mc.cores=nthreads)
-    #}
-  } else {
-    res <- lapply(chunks, omega_func)
-  }
-
-  res <- unlist(res, recursive = FALSE)
-
-  if(assemble){
-    res <- do.call(cbind,res)
-    res <- 0.5 * (res + t(res))
-  }
-
-  res
-}
+##Testing Sprigs
+## kalis::Sprigs(list(
+##   1:2,
+##   1:2,
+##   3:7,
+##   1:10,
+##   1:10,
+##   1:10,
+##   5:11
+## ))
+#
+# #' CladeMat OLD
+# #'
+# #' Utility for constructing a probabilistic clade matrix
+# #' @param x a `kalisClades` object returned by [Clades()]
+# #' @param ploidy an integer, the ploidy of the organism
+# #' @param sprigs.to.prune a `kalisSprigs` object returned by [Sprigs()] encoding sprigs that should be excluded from the matrix returned
+# #' @param assemble a logical, if `FALSE` return the clade matrix as a list of columns rather than as a symmetrized matrix
+# #' @param use.forking a logical, should forked processes be used?
+# #' @param nthreads the number of CPU cores to use. Currently, no parallelism is used.
+# #' @return
+# #'   a matrix representation of the probabilistic clades provided
+# #'
+# #' @export CladeMat_old
+#CladeMat_old <- function(x, ploidy = 2L, sprigs.to.prune = NULL, assemble = TRUE,
+#                         #use.bettermc = FALSE,
+#                         use.forking = FALSE, forking.chunk.size = 100L, mc.preschedule = FALSE, nthreads = 1L){
+#
+#  # prepare sprigs
+#  if(is.null(sprigs.to.prune)){sprigs.to.prune <- integer()}
+#  sl <- length(sprigs.to.prune)
+#  if(sl){sprig.sizes <- tabulate(sprigs.to.prune)}
+#
+#  n.recipient.samples <- as.integer(length(x)/ploidy)
+#
+#  chunks <- chunk_int(n.recipient.samples, chunk.size = forking.chunk.size)
+#
+#  if(ploidy == 1){
+#    omega_func <- function(s){
+#      omega_func_res <- as.list(1:length(s))
+#      for(j in 1:length(s)){
+#
+#        N <- length(x[[s[j]]])
+#
+#        idx <- attr(x[[s[j]]],"clades")[,1]
+#        phi <- attr(x[[s[j]]],"clades")[,2]
+#
+#        # prune sprig
+#        if(sl && !is.na(sprigs.to.prune[s[j]]) && length(idx) && sprig.sizes[sprigs.to.prune[s[j]]] == idx[1]){
+#          idx <- idx[-1]
+#          phi <- phi[-1]
+#        }
+#
+#        # we know that phi[N] = 0, so there must always be a 0 appended
+#        omega_func_res[[j]] <-  inverse.rle(list("values" =  c(rev(cumsum(rev(phi/idx))),0),
+#                                                 "lengths" = diff(c(0,idx,N))))[x[[s[j]]]]
+#
+#      }
+#      omega_func_res
+#    }
+#
+#  } else if(ploidy == 2){
+#
+#    omega_func <- function(s){
+#      omega_func_res <- as.list(1:length(s))
+#      for(j in 1:length(s)){
+#        N <- length(x[[s[j]]])
+#
+#        idx <- attr(x[[s[j]*2-1]],"clades")[,1]
+#        phi <- attr(x[[s[j]*2-1]],"clades")[,2]
+#
+#        idx2 <- attr(x[[s[j]*2]],"clades")[,1]
+#        phi2 <- attr(x[[s[j]*2]],"clades")[,2]
+#
+#
+#        if(sl && !is.na(sprigs.to.prune[s[j]*2-1]) && length(idx) && sprig.sizes[sprigs.to.prune[s[j]*2-1]] == idx[1]){
+#          idx <- idx[-1]
+#          phi <- phi[-1]
+#        }
+#
+#        if(sl && !is.na(sprigs.to.prune[s[j]*2]) && length(idx2) && sprig.sizes[sprigs.to.prune[s[j]*2]] == idx2[1]){
+#          idx2 <- idx2[-1]
+#          phi2 <- phi2[-1]
+#        }
+#
+#        # we know that phi[N] = 0, so there must always be a 0 appended
+#        w <- inverse.rle(list("values" =  c(rev(cumsum(rev(phi/idx))),0),
+#                              "lengths" = diff(c(0,idx,N))))[x[[s[j]*2-1]]] +
+#          inverse.rle(list("values" =  c(rev(cumsum(rev(phi2/idx2))),0),
+#                           "lengths" = diff(c(0,idx2,N))))[x[[s[j]*2]]]
+#
+#        omega_func_res[[j]] <- w[seq(1,N,by=2)] + w[seq(2,N,by=2)]
+#      }
+#      omega_func_res
+#    }
+#
+#  } else {
+#    stop("Relatedness currently only supports ploidy  = 1 or 2")
+#  }
+#
+#  # we don't simplify this list to a matrix at this stage to help preserve memory.
+#  if(use.forking){
+#    # if(use.bettermc){
+#    #   res <- bettermc::mclapply(chunks, omega_func, mc.preschedule = mc.preschedule, mc.cores=nthreads, mc.share.copy = FALSE)
+#    # } else {
+#      res <- parallel::mclapply(chunks, omega_func, mc.preschedule = mc.preschedule, mc.cores=nthreads)
+#    #}
+#  } else {
+#    res <- lapply(chunks, omega_func)
+#  }
+#
+#  res <- unlist(res, recursive = FALSE)
+#
+#  if(assemble){
+#    res <- do.call(cbind,res)
+#    res <- 0.5 * (res + t(res))
+#  }
+#
+#  res
+#}
 
 chunk_int <- function(n, chunk.size = 100){
   # subdivide 1:n into chunks of size at most chunk.size
diff --git a/R/Iterator.R b/R/Iterator.R
index 5c89738..061a20f 100644
--- a/R/Iterator.R
+++ b/R/Iterator.R
@@ -1,6 +1,6 @@
 #' Build an efficient iterator over loci
 #'
-#' Create a `kalisForwardIterator` for propagating a forward table iteratively over target variants using a table cache and optimal checkpointing.
+#' Function factory to create a `kalisForwardIterator` for propagating a forward table iteratively over target variants using a table cache and optimal checkpointing.
 #'
 #' See example.
 #'
@@ -29,21 +29,27 @@
 #'        By default all are included upto the last recipient haplotype.
 #'        Haplotypes are indexed from 1.
 #' @param lookup.tables
-#'        TODO
+#'        an optional list as returned by [CalcCheckpointTables()].
 #' @param cache
 #'        a `kalisCheckpointTable` object, as returned by [CreateForwardTableCache()] or this function.
 #'        By default `NULL`, which causes this function to create a new cache.
 #' @param save.cache
-#'        TODO
-#' @param exact
-#'        TODO
+#'        a logical.
+#'        When `TRUE`, the table cache is not relinquished upon exhaustion of the iterator.
+#'        Defaults to `FALSE`.
 #' @param force.unif
 #'        a logical, if `TRUE` iterate over targets as if they were uniformly spaced.
 #'        WARNING: DO NOT use this in conjunction with the targets method, still experimental.
 #'        With `force.unif = TRUE`, the resulting iterator will appear to be targeting the first `length(targets)` variants with all methods, but in fact will be silently iterating over the original targets.
 #'
 #' @return
-#' TODO
+#' A function for iterating over the set of target variants.
+#' The returned function has prototype:
+#'
+#' `function(fwd, pars, t, nthreads = 1)`
+#'
+#' which matches the standard [Forward()] function, but which uses the table cache to speed up propagation to the target variant.
+#' See [Forward()] for an explanation of arguments.
 #'
 #' @seealso
 #' [MakeForwardTable()] to create a `kalisForwardTable`;
@@ -76,7 +82,6 @@ ForwardIterator <- function(pars,
                             lookup.tables = NULL,
                             cache = NULL,
                             save.cache = FALSE,
-                            exact = TRUE,
                             force.unif = FALSE){
 
   force(force.unif)
@@ -169,7 +174,7 @@ ForwardIterator <- function(pars,
 
     if(is.null(lookup.tables)){
       message("Calculating Optimal Checkpoint Schedule")
-      lookup.tables <- calc_tables(propagation.cost,num.available.ckpts)
+      lookup.tables <- CalcCheckpointTables(propagation.cost,num.available.ckpts)
     }
 
     cost.table <- lookup.tables$cost
@@ -338,8 +343,29 @@ plot.kalisIterator <- function(x, ...){
 }
 
 
+#' Calculate Checkpoint Tables
+#'
+#' Calculate look up tables for solving optimal checkpointing problems with dynamic programming.
+#'
+#' @references
+#' Christ, R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies." bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
+#'
+#' @param propagation.cost
+#'        a non-negative vector such that `propagation.cost[i]` gives the relative amount of time or cost required to propagate `i` steps
+#' @param max.num.checkpoints
+#'        the maximum number of checkpoints that should be considered when building the checkpoint table.
+#' @param use.R
+#'        a logical, when TRUE use base R rather than C implementation of table building. Defaults to FALSE.
+#'
+#' @return
+#' a list containing:
+#' \describe{
+#'   \item{`cost`}{the matrix \eqn{F} in Christ et al. (2024)}
+#'   \item{`index`}{the matrix \eqn{H} in Christ et al. (2024)}
+#' }
+#'
 #' @export
-calc_tables <- function(propagation.cost,max.num.checkpoints, use.R = FALSE){
+CalcCheckpointTables <- function(propagation.cost,max.num.checkpoints, use.R = FALSE){
   start <- proc.time()
 
   propagation.cost <- as.numeric(propagation.cost)
diff --git a/man/CalcCheckpointTables.Rd b/man/CalcCheckpointTables.Rd
new file mode 100644
index 0000000..5e772f0
--- /dev/null
+++ b/man/CalcCheckpointTables.Rd
@@ -0,0 +1,28 @@
+% Generated by roxygen2: do not edit by hand
+% Please edit documentation in R/Iterator.R
+\name{CalcCheckpointTables}
+\alias{CalcCheckpointTables}
+\title{Calculate Checkpoint Tables}
+\usage{
+CalcCheckpointTables(propagation.cost, max.num.checkpoints, use.R = FALSE)
+}
+\arguments{
+\item{propagation.cost}{a non-negative vector such that \code{propagation.cost[i]} gives the relative amount of time or cost required to propagate \code{i} steps}
+
+\item{max.num.checkpoints}{the maximum number of checkpoints that should be considered when building the checkpoint table.}
+
+\item{use.R}{a logical, when TRUE use base R rather than C implementation of table building. Defaults to FALSE.}
+}
+\value{
+a list containing:
+\describe{
+\item{\code{cost}}{the matrix \eqn{F} in Christ et al. (2024)}
+\item{\code{index}}{the matrix \eqn{H} in Christ et al. (2024)}
+}
+}
+\description{
+Calculate look up tables for solving optimal checkpointing problems with dynamic programming.
+}
+\references{
+Christ, R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies." bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
+}
diff --git a/man/CladeMat.Rd b/man/CladeMat.Rd
index 1d7eee6..81e8ba5 100644
--- a/man/CladeMat.Rd
+++ b/man/CladeMat.Rd
@@ -27,7 +27,7 @@ This matrix is overwritten in place with the clade matrix result for performance
 
 \item{unit.dist}{the change in distance that is expected to correspond to a single mutation (typically \eqn{-\log(\mu)}) for the LS model)}
 
-\item{thresh}{a regularization parameter: \if{html}{\out{<!-- TODO: can't parse this sentence -->}} differences distances must exceed this threshold (in \code{unit.dist} units) in order to used in forming the local relatedness matrix.
+\item{thresh}{a regularization parameter: differences of distances must exceed this threshold (in \code{unit.dist} units) in order to cause the introduction of a probabilistic clade.
 Defaults to \code{0.2}.}
 
 \item{max1var}{a logical regularization parameter.
diff --git a/man/CladeMat_old.Rd b/man/CladeMat_old.Rd
deleted file mode 100644
index 7695578..0000000
--- a/man/CladeMat_old.Rd
+++ /dev/null
@@ -1,36 +0,0 @@
-% Generated by roxygen2: do not edit by hand
-% Please edit documentation in R/Clades.R
-\name{CladeMat_old}
-\alias{CladeMat_old}
-\title{CladeMat OLD}
-\usage{
-CladeMat_old(
-  x,
-  ploidy = 2L,
-  sprigs.to.prune = NULL,
-  assemble = TRUE,
-  use.forking = FALSE,
-  forking.chunk.size = 100L,
-  mc.preschedule = FALSE,
-  nthreads = 1L
-)
-}
-\arguments{
-\item{x}{a \code{kalisClades} object returned by \code{\link[=Clades]{Clades()}}}
-
-\item{ploidy}{an integer, the ploidy of the organism}
-
-\item{sprigs.to.prune}{a \code{kalisSprigs} object returned by \code{\link[=Sprigs]{Sprigs()}} encoding sprigs that should be excluded from the matrix returned}
-
-\item{assemble}{a logical, if \code{FALSE} return the clade matrix as a list of columns rather than as a symmetrized matrix}
-
-\item{use.forking}{a logical, should forked processes be used?}
-
-\item{nthreads}{the number of CPU cores to use. Currently, no parallelism is used.}
-}
-\value{
-a matrix representation of the probabilistic clades provided
-}
-\description{
-Utility for contructing a probabilistic clade matrix
-}
diff --git a/man/Clades.Rd b/man/Clades.Rd
deleted file mode 100644
index 8e8dee7..0000000
--- a/man/Clades.Rd
+++ /dev/null
@@ -1,57 +0,0 @@
-% Generated by roxygen2: do not edit by hand
-% Please edit documentation in R/Clades.R
-\name{Clades}
-\alias{Clades}
-\title{Probabilistic Clades}
-\usage{
-Clades(
-  fwd,
-  bck,
-  pars,
-  beta.theta.opts = NULL,
-  safety.checks = FALSE,
-  neighbors = FALSE,
-  use.forking = FALSE,
-  forking.chunk.size = 100L,
-  mc.preschedule = FALSE,
-  nthreads = 1L
-)
-}
-\arguments{
-\item{fwd}{a \code{kalisForwardTable} object, as returned by \code{\link[=MakeForwardTable]{MakeForwardTable()}} and propagated to a target variant by \code{\link[=Forward]{Forward()}}.
-This table must be at the same variant location as argument \code{bck}.}
-
-\item{bck}{a \code{kalisBackwardTable} object, as returned by \code{\link[=MakeBackwardTable]{MakeBackwardTable()}} and propagated to a target variant by \code{\link[=Backward]{Backward()}}.
-This table must be at the same variant location as argument \code{fwd}.}
-
-\item{pars}{a \code{kalisParameters} object, as returned by \code{\link[=Parameters]{Parameters()}}.}
-
-\item{beta.theta.opts}{a list; see Details in \code{\link[=DistMat]{DistMat()}} documentation page.}
-
-\item{safety.checks}{a logical, should safety checks be applied to the distances?
-See \code{\link[=DistMat]{DistMat()}}.}
-
-\item{neighbors}{a logical, should nearest neighbors be pre-calculated?
-See \code{\link[=Neighbors]{Neighbors()}}.}
-
-\item{use.forking}{a logical, should forked processes be used?}
-
-\item{forking.chunk.size}{TODO}
-
-\item{mc.preschedule}{TODO}
-
-\item{nthreads}{the number of CPU cores to use.
-By default no parallelism is used.}
-}
-\value{
-a \code{kalisClades} object encoding probabilistic clade calls
-}
-\description{
-Utility for calling probabilistic clades at, in between, or excluding variants.
-}
-\details{
-TODO longer description
-}
-\references{
-Christ, R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies." bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
-}
diff --git a/man/ForwardIterator.Rd b/man/ForwardIterator.Rd
index e16d46f..0c027a8 100644
--- a/man/ForwardIterator.Rd
+++ b/man/ForwardIterator.Rd
@@ -16,7 +16,6 @@ ForwardIterator(
   lookup.tables = NULL,
   cache = NULL,
   save.cache = FALSE,
-  exact = TRUE,
   force.unif = FALSE
 )
 }
@@ -42,24 +41,30 @@ Haplotypes are indexed from 1.}
 By default all are included upto the last recipient haplotype.
 Haplotypes are indexed from 1.}
 
-\item{lookup.tables}{TODO}
+\item{lookup.tables}{an optional list as returned by \code{\link[=CalcCheckpointTables]{CalcCheckpointTables()}}.}
 
 \item{cache}{a \code{kalisCheckpointTable} object, as returned by \code{\link[=CreateForwardTableCache]{CreateForwardTableCache()}} or this function.
 By default \code{NULL}, which causes this function to create a new cache.}
 
-\item{save.cache}{TODO}
-
-\item{exact}{TODO}
+\item{save.cache}{a logical.
+When \code{TRUE}, does not relinquish the table cache upon exhaustion of the iterator.
+Defaults to \code{FALSE}.}
 
 \item{force.unif}{a logical, if \code{TRUE} iterate over targets as if they were uniformly spaced.
 WARNING: DO NOT use this in conjunction with the targets method, still experimental.
 With \code{force.unif = TRUE}, the resulting iterator will appear to be targeting the first \code{length(targets)} variants with all methods, but in fact will be silently iterating over the original targets.}
 }
 \value{
-TODO
+A function for iterating over the set of target variants.
+The returned function has prototype:
+
+\verb{function(fwd, pars, t, nthreads = 1)}
+
+which matches the standard \code{\link[=Forward]{Forward()}} function, but which uses the table cache to speed up propagation to the target variant.
+See \code{\link[=Forward]{Forward()}} for an explanation of arguments.
 }
 \description{
-Create a \code{kalisForwardIterator} for propagating a forward table iteratively over target variants using a table cache and optimal checkpointing.
+Function factory to create a \code{kalisForwardIterator} for propagating a forward table iteratively over target variants using a table cache and optimal checkpointing.
 }
 \details{
 See example.
diff --git a/man/Neighbors.Rd b/man/Neighbors.Rd
deleted file mode 100644
index 63e1695..0000000
--- a/man/Neighbors.Rd
+++ /dev/null
@@ -1,21 +0,0 @@
-% Generated by roxygen2: do not edit by hand
-% Please edit documentation in R/Clades.R
-\name{Neighbors}
-\alias{Neighbors}
-\title{Neighbors}
-\usage{
-Neighbors(x, use.forking = FALSE, nthreads = 1L)
-}
-\arguments{
-\item{x}{a \code{kalisClades} object returned by \code{\link[=Clades]{Clades()}}}
-
-\item{use.forking}{a logical, should forked processes be used?}
-
-\item{nthreads}{the number of CPU cores to use. Currently, no parallelism is used.}
-}
-\value{
-a \code{kalisNeighbors} encoding the nearest neighbors for each recipient haplotype
-}
-\description{
-Utility for calling tied nearest neighbors for each recipient haplotype
-}
diff --git a/man/PruneCladeMat.Rd b/man/PruneCladeMat.Rd
index e194061..9a7b8c9 100644
--- a/man/PruneCladeMat.Rd
+++ b/man/PruneCladeMat.Rd
@@ -2,29 +2,28 @@
 % Please edit documentation in R/Clades.R
 \name{PruneCladeMat}
 \alias{PruneCladeMat}
-\title{Title TODO}
+\title{Prune called sprigs or singletons from inferred clade matrix}
 \usage{
-PruneCladeMat(M, neigh, sprigs, prune = "singleton.info", from.recipient = 1L)
+PruneCladeMat(M, neigh, sprigs, prune = "singleton.info", from_recipient = 1L)
 }
 \arguments{
-\item{M}{TODO}
+\item{M}{clade matrix such as that updated by \code{\link[=CladeMat]{CladeMat()}}}
 
-\item{neigh}{TODO}
+\item{neigh}{a list of nearest neighborhoods as returned by \code{\link[=CladeMat]{CladeMat()}}}
 
-\item{sprigs}{TODO}
+\item{sprigs}{a sprigs object as returned by \code{\link[=Sprigs]{Sprigs()}}}
 
-\item{prune}{TODO}
+\item{prune}{a character indicating the type of information to be removed from the \code{\link[=CladeMat]{CladeMat()}}. See Details.}
 
-\item{from.recipient}{TODO}
+\item{from_recipient}{haplotype index at which to start trace calculation --- useful for distributed computation (experimental feature, more documentation to come\if{html}{\out{<!-- TODO -->}})}
 }
 \value{
-TODO
+There is nothing returned.
+
+\strong{NOTE:} for performance reasons, \code{M} is updated in-place.
 }
 \description{
-Short Description TODO
-}
-\details{
-Long Description TODO
+Use haplotype nearest neighborhoods and other information returned by \code{\link[=CladeMat]{CladeMat()}} to efficiently remove structure corresponding to singletons or called sprigs from clade matrix 'M'
 }
 \examples{
 # TODO
diff --git a/man/Sprigs.Rd b/man/Sprigs.Rd
index 01cec11..b276ab0 100644
--- a/man/Sprigs.Rd
+++ b/man/Sprigs.Rd
@@ -2,23 +2,28 @@
 % Please edit documentation in R/Clades.R
 \name{Sprigs}
 \alias{Sprigs}
-\title{Title TODO}
+\title{Greedy sprig calling based on nearest neighbourhoods}
 \usage{
 Sprigs(x, old.sprigs = FALSE)
 }
 \arguments{
-\item{x}{TODO}
+\item{x}{list of where each entry is a nearest neighborhood of integers as returned by \code{\link[=CladeMat]{CladeMat()}}}
 
-\item{old.sprigs}{TODO}
+\item{old.sprigs}{If TRUE, use an earlier (undocumented) version of maximal clique calling, defaults to FALSE.}
 }
 \value{
-TODO
+a list containing:
+\describe{
+\item{\code{assignments}}{a vector of integers such that \code{assignments[i]} gives the sprig to which haplotype \code{i} belongs. \code{NA} if a haplotype was not assigned to a sprig.}
+\item{\code{to.prune}}{a vector of logicals, \code{to.prune[i]==TRUE} when haplotype i has been assigned to a sprig}
+\item{\code{num.sprigs}}{total number of sprigs calls, equal to \code{max(assignements,rm.na=TRUE)}}
+}
 }
 \description{
-Short Description TODO
+Infer sprigs (very small clades) within a local phylogeny based on one-directional nearest neighbourhoods assigned to each haplotype
 }
 \details{
-Long Description TODO
+Call maximal cliques within a directed graph where edges correspond to nearest neighbour relationships
 }
 \examples{
 # TODO
diff --git a/man/Sprigs_old.Rd b/man/Sprigs_old.Rd
deleted file mode 100644
index 4e76fb2..0000000
--- a/man/Sprigs_old.Rd
+++ /dev/null
@@ -1,21 +0,0 @@
-% Generated by roxygen2: do not edit by hand
-% Please edit documentation in R/Clades.R
-\name{Sprigs_old}
-\alias{Sprigs_old}
-\title{Sprigs}
-\usage{
-Sprigs_old(x, use.forking = FALSE, nthreads = 1L, add.self = TRUE)
-}
-\arguments{
-\item{x}{a \code{kalisNeighbors} object returned by \code{\link[=Neighbors]{Neighbors()}}, a \code{kalisClades} object returned by \code{\link[=Clades]{Clades()}} with \code{neighbors = TRUE}, or a list}
-
-\item{use.forking}{a logical, should forked processes be used?}
-
-\item{nthreads}{the number of CPU cores to use. Currently, no parallelism is used.}
-}
-\value{
-a \code{kalisSprigs} object assigning each haplotype to a sprig
-}
-\description{
-Utility for calling sprigs from probabilistic clades
-}

From 1b029526f4ae690096d3bd5e3be83bf22be63760 Mon Sep 17 00:00:00 2001
From: Louis Aslett <louis.aslett@durham.ac.uk>
Date: Wed, 13 Nov 2024 18:14:19 +0000
Subject: [PATCH 43/43] Final documentation sweep for correct references, and
 other minor tweaks

---
 R/CalcTraces.R                 |   3 +
 R/CladeMat.R                   |   2 +-
 R/Clades.R                     |  27 +++---
 R/Iterator.R                   |  12 +--
 R/Parameters.R                 |   6 +-
 R/Probs.R                      |   2 +-
 R/TableCache.R                 | 147 +++++++++++++++------------------
 README.md                      |  19 ++++-
 man/CalcCheckpointTables.Rd    |  10 ++-
 man/CalcRho.Rd                 |   2 +-
 man/CalcTraces.Rd              |   3 +
 man/CladeMat.Rd                |   2 +-
 man/CreateForwardTableCache.Rd |  22 ++---
 man/DistMat.Rd                 |   2 +-
 man/FillTableCache.Rd          |  27 +++---
 man/ForwardIterator.Rd         |   2 +-
 man/ForwardUsingTableCache.Rd  |  47 ++++-------
 man/Parameters.Rd              |   4 +-
 man/PruneCladeMat.Rd           |   8 +-
 man/Sprigs.Rd                  |  17 ++--
 20 files changed, 183 insertions(+), 181 deletions(-)

diff --git a/R/CalcTraces.R b/R/CalcTraces.R
index 6248959..0c105a7 100644
--- a/R/CalcTraces.R
+++ b/R/CalcTraces.R
@@ -4,6 +4,9 @@
 #'
 #' \eqn{P} here is assumed to have the form \eqn{I-QQ'} for some matrix \eqn{Q} of orthogonal columns.
 #'
+#' @references
+#' Christ, R.R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies", bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
+#'
 #' @param M
 #'        a real symmetric R matrix
 #' @param tX
diff --git a/R/CladeMat.R b/R/CladeMat.R
index 9af70ed..7bda476 100644
--- a/R/CladeMat.R
+++ b/R/CladeMat.R
@@ -6,7 +6,7 @@
 #' `CladeMat()` uses the forward and backward tables to construct the corresponding clade matrix which can then be tested, for example using a standard quadratic form score statistic.
 #'
 #' @references
-#' Christ, R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies." bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
+#' Christ, R.R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies", bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
 #'
 #' @param fwd
 #'        a `kalisForwardTable` object, as returned by [MakeForwardTable()] and propagated to a target variant by [Forward()].
diff --git a/R/Clades.R b/R/Clades.R
index dc5612b..ef6fdcb 100644
--- a/R/Clades.R
+++ b/R/Clades.R
@@ -19,21 +19,24 @@ get_neigh_seq <- function(x, i, return.lengths = FALSE){
 
 #' Greedy sprig calling based on nearest neighbourhoods
 #'
-#' Infer sprigs (very small clades) within a local phylogeny based on one-directional nearest neighbourhoods assigned to each haplotype
+#' Infer sprigs (very small clades) within a local phylogeny based on one-directional nearest neighbourhoods assigned to each haplotype.
 #'
-#' Call maximal cliques within a directed graph where edges correspond to nearest neighbour relationships
+#' Call maximal cliques within a directed graph where edges correspond to nearest neighbour relationships.
+#'
+#' @references
+#' Christ, R.R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies", bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
 #'
 #' @param x
-#'        list of where each entry is a nearest neighborhood of integers as returned by [CladeMat()]
+#'        list of integers where each entry is a nearest neighbourhood as returned by [CladeMat()]
 #' @param old.sprigs
-#'        If TRUE, use an earlier (undocumented) version of maximal clique calling, defaults to FALSE.
+#'        If `TRUE`, use an earlier (undocumented) version of maximal clique calling, defaults to `FALSE`.
 #'
 #' @return
 #' a list containing:
 #' \describe{
-#'   \item{`assignments`}{a vector of integers such that `assignments[i]` gives the sprig to which haplotype `i` belongs. `NA` if a haplotype was not assigned to a sprig.}
-#'   \item{`to.prune`}{a vector of logicals, `to.prune[i]==TRUE` when haplotype i has been assigned to a sprig}
-#'   \item{`num.sprigs`}{total number of sprigs calls, equal to `max(assignements,rm.na=TRUE)`}
+#'   \item{`assignments`}{a vector of integers such that `$assignments[i]` gives the sprig to which haplotype `i` belongs. `NA` if a haplotype was not assigned to a sprig.}
+#'   \item{`to.prune`}{a vector of logicals, `$to.prune[i]==TRUE` when haplotype `i` has been assigned to a sprig}
+#'   \item{`num.sprigs`}{total number of sprigs called, equal to `max($assignments, na.rm = TRUE)`}
 #' }
 #'
 #' @examples
@@ -140,7 +143,10 @@ UpdateMatrixInPlace <- function(M,row.idx,col.idx,x){
 
 #' Prune called sprigs or singletons from inferred clade matrix
 #'
-#' Use haplotype nearest neighborhoods and other information returned by [CladeMat()] to efficiently remove structure corresponding to singletons or called sprigs from clade matrix 'M'
+#' Use haplotype nearest neighbourhoods and other information returned by [CladeMat()] to efficiently remove structure corresponding to singletons or called sprigs from clade matrix 'M'.
+#'
+#' @references
+#' Christ, R.R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies", bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
 #'
 #' @param M
 #'        clade matrix such as that updated by [CladeMat()]
@@ -149,7 +155,8 @@ UpdateMatrixInPlace <- function(M,row.idx,col.idx,x){
 #' @param sprigs
 #'        a sprigs object as returned by [Sprigs()]
 #' @param prune
-#'        a character indicating the type of information to be removed from the [CladeMat()]. See Details.
+#'        a character indicating the type of information to be removed from the [CladeMat()].
+#'        See Details.
 #' @param from_recipient
 #'        haplotype index at which to start trace calculation --- useful for distributed computation (experimental feature, more documentation to come<!-- TODO -->)
 #'
@@ -246,7 +253,7 @@ PruneCladeMat <- function(M, neigh, sprigs, prune = "singleton.info", from_recip
 # #' ...? longer description
 # #'
 # #' @references
-# #' Christ, R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies." bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
+# #' Christ, R.R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies", bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
 # #'
 # #' @param fwd
 # #'        a `kalisForwardTable` object, as returned by [MakeForwardTable()] and propagated to a target variant by [Forward()].
diff --git a/R/Iterator.R b/R/Iterator.R
index 061a20f..4a2984d 100644
--- a/R/Iterator.R
+++ b/R/Iterator.R
@@ -5,7 +5,7 @@
 #' See example.
 #'
 #' @references
-#' Christ, R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies." bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
+#' Christ, R.R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies", bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
 #'
 #' @param pars
 #'        a `kalisParameters` object, as returned by [Parameters()].
@@ -348,17 +348,19 @@ plot.kalisIterator <- function(x, ...){
 #' Calculate look up tables for solving optimal checkpointing problems with dynamic programming.
 #'
 #' @references
-#' Christ, R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies." bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
+#' Christ, R.R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies", bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
 #'
 #' @param propagation.cost
-#'        a non-negative vector such that `propagation.cost[i]` gives the relative amount of time or cost required to propagate `i` steps
+#'        a non-negative vector such that `propagation.cost[i]` gives the relative amount of time or cost required to propagate `i` steps.
 #' @param max.num.checkpoints
 #'        the maximum number of checkpoints that should be considered when building the checkpoint table.
 #' @param use.R
-#'        a logical, when TRUE use base R rather than C implementation of table building. Defaults to FALSE.
+#'        a logical, when `TRUE` use base R rather than C implementation of table building.
+#'        Defaults to `FALSE`.
 #'
 #' @return
-#' a list containing:
+#' A list containing:
+#'
 #' \describe{
 #'   \item{`cost`}{the matrix \eqn{F} in Christ et al. (2024)}
 #'   \item{`index`}{the matrix \eqn{H} in Christ et al. (2024)}
diff --git a/R/Parameters.R b/R/Parameters.R
index 187194e..ecc4693 100644
--- a/R/Parameters.R
+++ b/R/Parameters.R
@@ -15,7 +15,7 @@
 #' @references
 #' Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", *BMC Bioinformatics*, **25**(1). Available at: \doi{10.1186/s12859-024-05688-8}.
 #'
-#' Lawson, D.J., Hellenthal, G., Myers, S. and Falush, D. (2012). "Inference of population structure using dense haplotype data", *PLoS genetics*, **8**(1). Available at: \doi{10.1371/journal.pgen.1002453}.
+#' Lawson, D.J., Hellenthal, G., Myers, S. and Falush, D. (2012) "Inference of population structure using dense haplotype data", *PLoS genetics*, **8**(1). Available at: \doi{10.1371/journal.pgen.1002453}.
 #'
 #' @param cM a vector specifying the recombination distance between variants in centimorgans.
 #'   Note element i of this vector should be the distance between variants `i` and `i+1` (not `i` and `i-1`), and thus length one less than the number of variants.
@@ -123,9 +123,9 @@ CalcRho <- function(cM = 0, s = 1, gamma = 1, floor = TRUE) {
 #' @references
 #' Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", *BMC Bioinformatics*, **25**(1). Available at: \doi{10.1186/s12859-024-05688-8}.
 #'
-#' Lawson, D.J., Hellenthal, G., Myers, S.R. and Falush, D. (2012). "Inference of population structure using dense haplotype data", *PLoS Genetics*, **8**(1). Available at: \doi{10.1371/journal.pgen.1002453}.
+#' Lawson, D.J., Hellenthal, G., Myers, S.R. and Falush, D. (2012) "Inference of population structure using dense haplotype data", *PLoS Genetics*, **8**(1). Available at: \doi{10.1371/journal.pgen.1002453}.
 #'
-#' Speidel, L., Forest, M., Shi, S. and Myers, S.R. (2019). "A method for genome-wide genealogy estimation for thousands of samples", *Nature Genetics*, **51**, p. 1321-1329. Available at: \doi{10.1038/s41588-019-0484-x}.
+#' Speidel, L., Forest, M., Shi, S. and Myers, S.R. (2019) "A method for genome-wide genealogy estimation for thousands of samples", *Nature Genetics*, **51**, p. 1321-1329. Available at: \doi{10.1038/s41588-019-0484-x}.
 #'
 #' @param rho recombination probability vector (must be \eqn{L-1} long).
 #'   See [CalcRho()] for assistance constructing this from a recombination
diff --git a/R/Probs.R b/R/Probs.R
index 77f6024..fd0a30b 100644
--- a/R/Probs.R
+++ b/R/Probs.R
@@ -170,7 +170,7 @@ PostProbs <- function(fwd, bck, unif.on.underflow = FALSE, M = NULL, beta.theta.
 #' @references
 #' Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", *BMC Bioinformatics*, **25**(1). Available at: \doi{10.1186/s12859-024-05688-8}.
 #'
-#' Speidel, L., Forest, M., Shi, S. and Myers, S.R. (2019). "A method for genome-wide genealogy estimation for thousands of samples", *Nature Genetics*, **51**, p. 1321-1329. Available at: \doi{10.1038/s41588-019-0484-x}.
+#' Speidel, L., Forest, M., Shi, S. and Myers, S.R. (2019) "A method for genome-wide genealogy estimation for thousands of samples", *Nature Genetics*, **51**, p. 1321-1329. Available at: \doi{10.1038/s41588-019-0484-x}.
 #'
 #' @param fwd a forward table as returned by [MakeForwardTable()] and propagated to a target variant by [Forward()].
 #'   Must be at the same variant as `bck` (unless `bck` is in "beta-theta space" in which case if must be downstream ... see [Backward()] for details).
diff --git a/R/TableCache.R b/R/TableCache.R
index 98287f1..be31026 100644
--- a/R/TableCache.R
+++ b/R/TableCache.R
@@ -1,23 +1,15 @@
 #' Create cache for forward tables
 #'
-#' Create an in-memory cache for forward tables to improve efficiency when
-#' iterating in reverse along the haplotype sequences.
-#'
-#' If the objective is to run the Li and Stephens hidden Markov model both
-#' forwards and backwards to the same locus (and to do so for every possible
-#' locus), then considerable efficiency can be achieved by first performing a
-#' full scan forwards, filling a geometrically spaced cache whilst doing so.
-#' Then, by working backwards, the backward propagation moves one locus at a
-#' time and the forward propagation can move backwards by moving forward from a
-#' recently cached local table.
-#'
-#' Memory for a cache can be allocated using this function and should then be
-#' filled with [FillTableCache()].
-#' To use the cache, then instead of using the [Forward()] function,
-#' use [ForwardUsingTableCache()].
+#' Create an in-memory cache for forward tables to improve efficiency when iterating in reverse along the haplotype sequences.
+#'
+#' If the objective is to run the Li and Stephens hidden Markov model both forwards and backwards to the same locus (and to do so for every possible locus), then considerable efficiency can be achieved by first performing a full scan forwards, filling a geometrically spaced cache whilst doing so.
+#' Then, by working backwards, the backward propagation moves one locus at a time and the forward propagation can move backwards by moving forward from a recently cached local table.
+#'
+#' Memory for a cache can be allocated using this function and should then be filled with [FillTableCache()].
+#' To use the cache, then instead of using the [Forward()] function, use [ForwardUsingTableCache()].
 #'
 #' @references
-#' Christ, R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies." bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
+#' Christ, R.R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies", bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
 #'
 #' @param pars
 #'        a `kalisParameters` object, as returned by [Parameters()].
@@ -36,13 +28,15 @@
 #'        By default, equals \eqn{\lfloor\log_2(L)\rfloor}.
 #'
 #' @return
-#'   A list of forward tables representing a cache and ready to be filled is returned.
+#' A list of forward tables representing a cache and ready to be filled is returned.
 #'
 #' @seealso
-#'   [MakeForwardTable()] to make a forward table;
-#'   [FillTableCache()] to fill a cache;
-#'   [ForwardUsingTableCache()] to use a cache;
-#'   [Forward()] for forward function without using a cache.
+#' [MakeForwardTable()] to make a forward table;
+#' [FillTableCache()] to fill a cache;
+#' [ForwardUsingTableCache()] to use a cache;
+#' [Forward()] for forward function without using a cache.
+#'
+#' Alternatively, see [ForwardIterator()] to create an iterator which internally creates or uses a table cache.
 #'
 #' @examples
 #' \dontrun{
@@ -122,22 +116,16 @@ CreateForwardTableCache <- function(pars, size = 1, from_recipient = 1, to_recip
 
 #' Fill a forward table cache
 #'
-#' An in-memory cache for forward tables can be filled using this function, for
-#' either the whole sequence length or some sub-sequence.
+#' An in-memory cache for forward tables can be filled using this function, for either the whole sequence length or some sub-sequence.
 #'
-#' If the objective is to run the Li and Stephens hidden Markov model both
-#' forwards and backwards to the same locus (and to do so for every possible
-#' locus), then considerable efficiency can be achieved by first performing a
-#' full scan forwards, filling a geometrically spaced cache whilst doing so.
-#' Then, by working backwards, the backward propagation moves one locus at a
-#' time and the forward propagation can move backwards by moving forward from a
-#' recently cached local table.
+#' If the objective is to run the Li and Stephens hidden Markov model both forwards and backwards to the same locus (and to do so for every possible locus), then considerable efficiency can be achieved by first performing a full scan forwards, filling a geometrically spaced cache whilst doing so.
+#' Then, by working backwards, the backward propagation moves one locus at a time and the forward propagation can move backwards by moving forward from a recently cached local table.
 #'
-#' Memory for a cache can be allocated using
-#' [CreateForwardTableCache()] and should then be filled with this
-#' function.
-#' To use the cache, then instead of using the [Forward()] function,
-#' use [ForwardUsingTableCache()].
+#' Memory for a cache can be allocated using [CreateForwardTableCache()] and should then be filled with this function.
+#' To use the cache, then instead of using the [Forward()] function, use [ForwardUsingTableCache()].
+#'
+#' @references
+#' Christ, R.R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies", bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
 #'
 #' @param cache
 #'        a cache of forward tables as generated by [CreateForwardTableCache()].
@@ -149,13 +137,16 @@ CreateForwardTableCache <- function(pars, size = 1, from_recipient = 1, to_recip
 #'
 #' @return
 #' There is nothing returned.
-#' For performance reasons, `cache` is updated in-place.
+#'
+#' **NOTE:** for performance reasons, `cache` is updated in-place.
 #'
 #' @seealso
-#'   [MakeForwardTable()] to make a forward table;
-#'   [CreateForwardTableCache()] to generate a cache;
-#'   [ForwardUsingTableCache()] to use a cache;
-#'   [Forward()] for forward function without using a cache.
+#' [MakeForwardTable()] to make a forward table;
+#' [CreateForwardTableCache()] to generate a cache;
+#' [ForwardUsingTableCache()] to use a cache;
+#' [Forward()] for forward function without using a cache.
+#'
+#' Alternatively, see [ForwardIterator()] to create an iterator which internally creates or uses a table cache.
 #'
 #' @examples
 #' \dontrun{
@@ -244,52 +235,44 @@ FillTableCache <- function(cache,
 
 #' Use a forward table cache to propagate
 #'
-#' An in-memory cache for forward tables, which has already been filled, can be
-#' used to move more quickly to a specified locus.
-#'
-#' If the objective is to run the Li and Stephens hidden Markov model both
-#' forwards and backwards to the same locus (and to do so for every possible
-#' locus), then considerable efficiency can be achieved by first performing a
-#' full scan forwards, filling a geometrically spaced cache whilst doing so.
-#' Then, by working backwards, the backward propagation moves one locus at a
-#' time and the forward propagation can move backwards by moving forward from a
-#' recently cached local table.
-#'
-#' Memory for a cache can be allocated using
-#' [CreateForwardTableCache()] and should then be filled with
-#' [FillTableCache()].
-#' To use the cache, then instead of using the [Forward()] function,
-#' use this function.
-#'
-#' Note that the `cache` which is passed to this function will be
-#' dynamically updated based on the locus requested: the assumption is that
-#' the cache is used to propagate in reverse so any cache entries for a locus
-#' position past `t` are taken to be no longer needed and that space will
-#' redeployed to more densely fill the cache with earlier locus positions.
-#'
-#' @param fwd a `kalisForwardTable` object, as returned by
-#'   [MakeForwardTable()].
-#' @param pars a `kalisParameters` object, as returned by [Parameters()].
-#' @param cache a cache of forward tables as generated by
-#'   [CreateForwardTableCache()] and filled using
-#'   [FillTableCache()].
-#' @param t a locus position to move the forward table to, starting the forward
-#'   propagation from whatever table in the `cache` variable is immediately
-#'   before locus `t`.
-#'   By default, it simply advances to the previous locus (which is the natural
-#'   direction to move when using the cache).
-#' @param nthreads the number of CPU cores to use.
-#'   By default no parallelism is used.
+#' An in-memory cache for forward tables, which has already been filled, can be used to move more quickly to a specified locus.
+#'
+#' If the objective is to run the Li and Stephens hidden Markov model both forwards and backwards to the same locus (and to do so for every possible locus), then considerable efficiency can be achieved by first performing a full scan forwards, filling a geometrically spaced cache whilst doing so.
+#' Then, by working backwards, the backward propagation moves one locus at a time and the forward propagation can move backwards by moving forward from a recently cached local table.
+#'
+#' Memory for a cache can be allocated using [CreateForwardTableCache()] and should then be filled with [FillTableCache()].
+#' To use the cache, use this function instead of the [Forward()] function.
+#'
+#' Note that the `cache` which is passed to this function will be dynamically updated based on the locus requested: the assumption is that the cache is used to propagate in reverse so any cache entries for a locus position past `t` are taken to be no longer needed and that space will be redeployed to more densely fill the cache with earlier locus positions.
+#'
+#' @references
+#' Christ, R.R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies", bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
+#'
+#' @param fwd
+#'        a `kalisForwardTable` object, as returned by [MakeForwardTable()].
+#' @param pars
+#'        a `kalisParameters` object, as returned by [Parameters()].
+#' @param cache
+#'        a cache of forward tables as generated by [CreateForwardTableCache()] and filled using [FillTableCache()].
+#' @param t
+#'        a locus position to move the forward table to, starting the forward propagation from whatever table in the `cache` variable is immediately before locus `t`.
+#'        By default, it simply advances to the previous locus (which is the natural direction to move when using the cache).
+#' @param nthreads
+#'        the number of CPU cores to use.
+#'        By default no parallelism is used.
 #'
 #' @return
-#'   There is nothing returned.
-#'   For performance reasons, `fwd` is updated in-place.
+#' There is nothing returned.
+#'
+#' **NOTE:** for performance reasons, `fwd` is updated in-place.
 #'
 #' @seealso
-#'   [MakeForwardTable()] to make a forward table;
-#'   [CreateForwardTableCache()] to generate a cache;
-#'   [FillTableCache()] to fill a cache;
-#'   [Forward()] for forward function without using a cache.
+#' [MakeForwardTable()] to make a forward table;
+#' [CreateForwardTableCache()] to generate a cache;
+#' [FillTableCache()] to fill a cache;
+#' [Forward()] for forward function without using a cache.
+#'
+#' Alternatively, see [ForwardIterator()] to create an iterator which internally creates or uses a table cache.
 #'
 #' @examples
 #' \dontrun{
diff --git a/README.md b/README.md
index 07effd4..c274843 100644
--- a/README.md
+++ b/README.md
@@ -29,7 +29,7 @@ If you do not have the correct flags set, kalis will fall back to an implementat
 
 ## Citation
 
-If you make use of this software, please cite:
+If you make use of this software, please cite the primary reference:
 
 > Aslett L. J. M., Christ R. R. (2024). "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R." _BMC Bioinformatics_, *25*(1), 1-18. [doi:10.1186/s12859-024-05688-8](https://doi.org/10.1186/s12859-024-05688-8>).
 
@@ -47,3 +47,20 @@ bibTeX:
   doi = {10.1186/s12859-024-05688-8}
 }
 ```
+
+Some additional functions were added after the above publication to enable checkpointing and clade matrix construction, which are described in:
+
+> Christ, R.R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies", _bioRxiv 2024.09.30.615852_. [doi:10.1101/2024.09.30.615852](https://doi.org/10.1101/2024.09.30.615852).
+
+bibTeX:
+
+```
+@Article{,
+  title = {Clade Distillation for Genome-wide Association Studies},
+  author = {Christ, R. R. and Wang, X. and Aslett, L. J. M. and Steinsaltz, D. and Hall, I.},
+  journal = {bioRxiv},
+  year = {2024},
+  number = {2024.09.30.615852},
+  doi = {10.1101/2024.09.30.615852}
+}
+```
diff --git a/man/CalcCheckpointTables.Rd b/man/CalcCheckpointTables.Rd
index 5e772f0..398d0df 100644
--- a/man/CalcCheckpointTables.Rd
+++ b/man/CalcCheckpointTables.Rd
@@ -7,14 +7,16 @@
 CalcCheckpointTables(propagation.cost, max.num.checkpoints, use.R = FALSE)
 }
 \arguments{
-\item{propagation.cost}{a non-negative vector such that \code{propagation.cost[i]} gives the relative amount of time or cost required to propagate \code{i} steps}
+\item{propagation.cost}{a non-negative vector such that \code{propagation.cost[i]} gives the relative amount of time or cost required to propagate \code{i} steps.}
 
 \item{max.num.checkpoints}{the maximum number of checkpoints that should be considered when building the checkpoint table.}
 
-\item{use.R}{a logical, when TRUE use base R rather than C implementation of table building. Defaults to FALSE.}
+\item{use.R}{a logical, when \code{TRUE} use base R rather than C implementation of table building.
+Defaults to \code{FALSE}.}
 }
 \value{
-a list containing:
+A list containing:
+
 \describe{
 \item{\code{cost}}{the matrix \eqn{F} in Christ et al. (2024)}
 \item{\code{index}}{the matrix \eqn{H} in Christ et al. (2024)}
@@ -24,5 +26,5 @@ a list containing:
 Calculate look up tables for solving optimal checkpointing problems with dynamic programming.
 }
 \references{
-Christ, R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies." bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
+Christ, R.R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies", bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
 }
diff --git a/man/CalcRho.Rd b/man/CalcRho.Rd
index 4714f4b..8259b5d 100644
--- a/man/CalcRho.Rd
+++ b/man/CalcRho.Rd
@@ -52,7 +52,7 @@ rho
 \references{
 Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", \emph{BMC Bioinformatics}, \strong{25}(1). Available at: \doi{10.1186/s12859-024-05688-8}.
 
-Lawson, D.J., Hellenthal, G., Myers, S. and Falush, D. (2012). "Inference of population structure using dense haplotype data", \emph{PLoS genetics}, \strong{8}(1). Available at: \doi{10.1371/journal.pgen.1002453}.
+Lawson, D.J., Hellenthal, G., Myers, S. and Falush, D. (2012) "Inference of population structure using dense haplotype data", \emph{PLoS genetics}, \strong{8}(1). Available at: \doi{10.1371/journal.pgen.1002453}.
 }
 \seealso{
 \code{\link[=Parameters]{Parameters()}} to use the resulting recombination probabilities to construct a \code{kalisParameters} object.
diff --git a/man/CalcTraces.Rd b/man/CalcTraces.Rd
index cf45ffe..c5936e9 100644
--- a/man/CalcTraces.Rd
+++ b/man/CalcTraces.Rd
@@ -46,3 +46,6 @@ Provides multithreaded calculation of trace and Hilbert Schmidt Norm of a matrix
 # TODO
 
 }
+\references{
+Christ, R.R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies", bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
+}
diff --git a/man/CladeMat.Rd b/man/CladeMat.Rd
index 81e8ba5..5987d63 100644
--- a/man/CladeMat.Rd
+++ b/man/CladeMat.Rd
@@ -53,5 +53,5 @@ The clade matrix captures genetic relatedness information in the distances from
 
 }
 \references{
-Christ, R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies." bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
+Christ, R.R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies", bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
 }
diff --git a/man/CreateForwardTableCache.Rd b/man/CreateForwardTableCache.Rd
index 4914e47..b15508d 100644
--- a/man/CreateForwardTableCache.Rd
+++ b/man/CreateForwardTableCache.Rd
@@ -32,22 +32,14 @@ By default, equals \eqn{\lfloor\log_2(L)\rfloor}.}
 A list of forward tables representing a cache and ready to be filled is returned.
 }
 \description{
-Create an in-memory cache for forward tables to improve efficiency when
-iterating in reverse along the haplotype sequences.
+Create an in-memory cache for forward tables to improve efficiency when iterating in reverse along the haplotype sequences.
 }
 \details{
-If the objective is to run the Li and Stephens hidden Markov model both
-forwards and backwards to the same locus (and to do so for every possible
-locus), then considerable efficiency can be achieved by first performing a
-full scan forwards, filling a geometrically spaced cache whilst doing so.
-Then, by working backwards, the backward propagation moves one locus at a
-time and the forward propagation can move backwards by moving forward from a
-recently cached local table.
+If the objective is to run the Li and Stephens hidden Markov model both forwards and backwards to the same locus (and to do so for every possible locus), then considerable efficiency can be achieved by first performing a full scan forwards, filling a geometrically spaced cache whilst doing so.
+Then, by working backwards, the backward propagation moves one locus at a time and the forward propagation can move backwards by moving forward from a recently cached local table.
 
-Memory for a cache can be allocated using this function and should then be
-filled with \code{\link[=FillTableCache]{FillTableCache()}}.
-To use the cache, then instead of using the \code{\link[=Forward]{Forward()}} function,
-use \code{\link[=ForwardUsingTableCache]{ForwardUsingTableCache()}}.
+Memory for a cache can be allocated using this function and should then be filled with \code{\link[=FillTableCache]{FillTableCache()}}.
+To use the cache, use \code{\link[=ForwardUsingTableCache]{ForwardUsingTableCache()}} instead of the \code{\link[=Forward]{Forward()}} function.
 }
 \examples{
 \dontrun{
@@ -77,11 +69,13 @@ for(l in L:1) {
 
 }
 \references{
-Christ, R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies." bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
+Christ, R.R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies", bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
 }
 \seealso{
 \code{\link[=MakeForwardTable]{MakeForwardTable()}} to make a forward table;
 \code{\link[=FillTableCache]{FillTableCache()}} to fill a cache;
 \code{\link[=ForwardUsingTableCache]{ForwardUsingTableCache()}} to use a cache;
 \code{\link[=Forward]{Forward()}} for forward function without using a cache.
+
+Alternatively, see \code{\link[=ForwardIterator]{ForwardIterator()}} to create an iterator which internally creates or uses a table cache.
 }
diff --git a/man/DistMat.Rd b/man/DistMat.Rd
index cf38ad3..8a917c8 100644
--- a/man/DistMat.Rd
+++ b/man/DistMat.Rd
@@ -131,7 +131,7 @@ plot(d)
 \references{
 Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", \emph{BMC Bioinformatics}, \strong{25}(1). Available at: \doi{10.1186/s12859-024-05688-8}.
 
-Speidel, L., Forest, M., Shi, S. and Myers, S.R. (2019). "A method for genome-wide genealogy estimation for thousands of samples", \emph{Nature Genetics}, \strong{51}, p. 1321-1329. Available at: \doi{10.1038/s41588-019-0484-x}.
+Speidel, L., Forest, M., Shi, S. and Myers, S.R. (2019) "A method for genome-wide genealogy estimation for thousands of samples", \emph{Nature Genetics}, \strong{51}, p. 1321-1329. Available at: \doi{10.1038/s41588-019-0484-x}.
 }
 \seealso{
 \code{\link[=PostProbs]{PostProbs()}} to calculate the posterior marginal probabilities \eqn{p_{ji}}{p_(j,i)};
diff --git a/man/FillTableCache.Rd b/man/FillTableCache.Rd
index 531682a..9777548 100644
--- a/man/FillTableCache.Rd
+++ b/man/FillTableCache.Rd
@@ -21,26 +21,18 @@ By default uses the \code{parallel} package to detect the number of physical cor
 }
 \value{
 There is nothing returned.
-For performance reasons, \code{cache} is updated in-place.
+
+\strong{NOTE:} for performance reasons, \code{cache} is updated in-place.
 }
 \description{
-An in-memory cache for forward tables can be filled using this function, for
-either the whole sequence length or some sub-sequence.
+An in-memory cache for forward tables can be filled using this function, for either the whole sequence length or some sub-sequence.
 }
 \details{
-If the objective is to run the Li and Stephens hidden Markov model both
-forwards and backwards to the same locus (and to do so for every possible
-locus), then considerable efficiency can be achieved by first performing a
-full scan forwards, filling a geometrically spaced cache whilst doing so.
-Then, by working backwards, the backward propagation moves one locus at a
-time and the forward propagation can move backwards by moving forward from a
-recently cached local table.
+If the objective is to run the Li and Stephens hidden Markov model both forwards and backwards to the same locus (and to do so for every possible locus), then considerable efficiency can be achieved by first performing a full scan forwards, filling a geometrically spaced cache whilst doing so.
+Then, by working backwards, the backward propagation moves one locus at a time and the forward propagation can move backwards by moving forward from a recently cached local table.
 
-Memory for a cache can be allocated using
-\code{\link[=CreateForwardTableCache]{CreateForwardTableCache()}} and should then be filled with this
-function.
-To use the cache, then instead of using the \code{\link[=Forward]{Forward()}} function,
-use \code{\link[=ForwardUsingTableCache]{ForwardUsingTableCache()}}.
+Memory for a cache can be allocated using \code{\link[=CreateForwardTableCache]{CreateForwardTableCache()}} and should then be filled with this function.
+To use the cache, use \code{\link[=ForwardUsingTableCache]{ForwardUsingTableCache()}} instead of the \code{\link[=Forward]{Forward()}} function.
 }
 \examples{
 \dontrun{
@@ -68,10 +60,15 @@ for(l in L:1) {
 }
 }
 
+}
+\references{
+Christ, R.R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies", bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
 }
 \seealso{
 \code{\link[=MakeForwardTable]{MakeForwardTable()}} to make a forward table;
 \code{\link[=CreateForwardTableCache]{CreateForwardTableCache()}} to generate a cache;
 \code{\link[=ForwardUsingTableCache]{ForwardUsingTableCache()}} to use a cache;
 \code{\link[=Forward]{Forward()}} for forward function without using a cache.
+
+Alternatively, see \code{\link[=ForwardIterator]{ForwardIterator()}} to create an iterator which internally creates or uses a table cache.
 }
diff --git a/man/ForwardIterator.Rd b/man/ForwardIterator.Rd
index 0c027a8..1cbf5aa 100644
--- a/man/ForwardIterator.Rd
+++ b/man/ForwardIterator.Rd
@@ -86,7 +86,7 @@ for(t in targets(Iter)){
 
 }
 \references{
-Christ, R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies." bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
+Christ, R.R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies", bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
 }
 \seealso{
 \code{\link[=MakeForwardTable]{MakeForwardTable()}} to create a \code{kalisForwardTable};
diff --git a/man/ForwardUsingTableCache.Rd b/man/ForwardUsingTableCache.Rd
index 09f1bad..8493328 100644
--- a/man/ForwardUsingTableCache.Rd
+++ b/man/ForwardUsingTableCache.Rd
@@ -14,52 +14,34 @@ ForwardUsingTableCache(
 )
 }
 \arguments{
-\item{fwd}{a \code{kalisForwardTable} object, as returned by
-\code{\link[=MakeForwardTable]{MakeForwardTable()}}.}
+\item{fwd}{a \code{kalisForwardTable} object, as returned by \code{\link[=MakeForwardTable]{MakeForwardTable()}}.}
 
 \item{pars}{a \code{kalisParameters} object, as returned by \code{\link[=Parameters]{Parameters()}}.}
 
-\item{cache}{a cache of forward tables as generated by
-\code{\link[=CreateForwardTableCache]{CreateForwardTableCache()}} and filled using
-\code{\link[=FillTableCache]{FillTableCache()}}.}
+\item{cache}{a cache of forward tables as generated by \code{\link[=CreateForwardTableCache]{CreateForwardTableCache()}} and filled using \code{\link[=FillTableCache]{FillTableCache()}}.}
 
-\item{t}{a locus position to move the forward table to, starting the forward
-propagation from whatever table in the \code{cache} variable is immediately
-before locus \code{t}.
-By default, it simply advances to the previous locus (which is the natural
-direction to move when using the cache).}
+\item{t}{a locus position to move the forward table to, starting the forward propagation from whatever table in the \code{cache} variable is immediately before locus \code{t}.
+By default, it simply advances to the previous locus (which is the natural direction to move when using the cache).}
 
 \item{nthreads}{the number of CPU cores to use.
 By default no parallelism is used.}
 }
 \value{
 There is nothing returned.
-For performance reasons, \code{fwd} is updated in-place.
+
+\strong{NOTE:} for performance reasons, \code{fwd} is updated in-place.
 }
 \description{
-An in-memory cache for forward tables, which has already been filled, can be
-used to move more quickly to a specified locus.
+An in-memory cache for forward tables, which has already been filled, can be used to move more quickly to a specified locus.
 }
 \details{
-If the objective is to run the Li and Stephens hidden Markov model both
-forwards and backwards to the same locus (and to do so for every possible
-locus), then considerable efficiency can be achieved by first performing a
-full scan forwards, filling a geometrically spaced cache whilst doing so.
-Then, by working backwards, the backward propagation moves one locus at a
-time and the forward propagation can move backwards by moving forward from a
-recently cached local table.
+If the objective is to run the Li and Stephens hidden Markov model both forwards and backwards to the same locus (and to do so for every possible locus), then considerable efficiency can be achieved by first performing a full scan forwards, filling a geometrically spaced cache whilst doing so.
+Then, by working backwards, the backward propagation moves one locus at a time and the forward propagation can move backwards by moving forward from a recently cached local table.
 
-Memory for a cache can be allocated using
-\code{\link[=CreateForwardTableCache]{CreateForwardTableCache()}} and should then be filled with
-\code{\link[=FillTableCache]{FillTableCache()}}.
-To use the cache, then instead of using the \code{\link[=Forward]{Forward()}} function,
-use this function.
+Memory for a cache can be allocated using \code{\link[=CreateForwardTableCache]{CreateForwardTableCache()}} and should then be filled with \code{\link[=FillTableCache]{FillTableCache()}}.
+To use the cache, use this function instead of the \code{\link[=Forward]{Forward()}} function.
 
-Note that the \code{cache} which is passed to this function will be
-dynamically updated based on the locus requested: the assumption is that
-the cache is used to propagate in reverse so any cache entries for a locus
-position past \code{t} are taken to be no longer needed and that space will
-redeployed to more densely fill the cache with earlier locus positions.
+Note that the \code{cache} which is passed to this function will be dynamically updated based on the locus requested: the assumption is that the cache is used to propagate in reverse so any cache entries for a locus position past \code{t} are taken to be no longer needed and that space will be redeployed to more densely fill the cache with earlier locus positions.
 }
 \examples{
 \dontrun{
@@ -87,10 +69,15 @@ for(l in L:1) {
 }
 }
 
+}
+\references{
+Christ, R.R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies", bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
 }
 \seealso{
 \code{\link[=MakeForwardTable]{MakeForwardTable()}} to make a forward table;
 \code{\link[=CreateForwardTableCache]{CreateForwardTableCache()}} to generate a cache;
 \code{\link[=FillTableCache]{FillTableCache()}} to fill a cache;
 \code{\link[=Forward]{Forward()}} for forward function without using a cache.
+
+Alternatively, see \code{\link[=ForwardIterator]{ForwardIterator()}} to create an iterator which internally creates or uses a table cache.
 }
diff --git a/man/Parameters.Rd b/man/Parameters.Rd
index f34bdf7..4c34afd 100644
--- a/man/Parameters.Rd
+++ b/man/Parameters.Rd
@@ -100,9 +100,9 @@ fwd
 \references{
 Aslett, L.J.M. and Christ, R.R. (2024) "kalis: a modern implementation of the Li & Stephens model for local ancestry inference in R", \emph{BMC Bioinformatics}, \strong{25}(1). Available at: \doi{10.1186/s12859-024-05688-8}.
 
-Lawson, D.J., Hellenthal, G., Myers, S.R. and Falush, D. (2012). "Inference of population structure using dense haplotype data", \emph{PLoS Genetics}, \strong{8}(1). Available at: \doi{10.1371/journal.pgen.1002453}.
+Lawson, D.J., Hellenthal, G., Myers, S.R. and Falush, D. (2012) "Inference of population structure using dense haplotype data", \emph{PLoS Genetics}, \strong{8}(1). Available at: \doi{10.1371/journal.pgen.1002453}.
 
-Speidel, L., Forest, M., Shi, S. and Myers, S.R. (2019). "A method for genome-wide genealogy estimation for thousands of samples", \emph{Nature Genetics}, \strong{51}, p. 1321-1329. Available at: \doi{10.1038/s41588-019-0484-x}.
+Speidel, L., Forest, M., Shi, S. and Myers, S.R. (2019) "A method for genome-wide genealogy estimation for thousands of samples", \emph{Nature Genetics}, \strong{51}, p. 1321-1329. Available at: \doi{10.1038/s41588-019-0484-x}.
 }
 \seealso{
 \code{\link[=MakeForwardTable]{MakeForwardTable()}} and \code{\link[=MakeBackwardTable]{MakeBackwardTable()}} which construct table objects which internally reference a parameters environment;
diff --git a/man/PruneCladeMat.Rd b/man/PruneCladeMat.Rd
index 9a7b8c9..6c15511 100644
--- a/man/PruneCladeMat.Rd
+++ b/man/PruneCladeMat.Rd
@@ -13,7 +13,8 @@ PruneCladeMat(M, neigh, sprigs, prune = "singleton.info", from_recipient = 1L)
 
 \item{sprigs}{a sprigs object as returned by \code{\link[=Sprigs]{Sprigs()}}}
 
-\item{prune}{a character indicating the type of information to be removed from the \code{\link[=CladeMat]{CladeMat()}}. See Details.}
+\item{prune}{a character indicating the type of information to be removed from the \code{\link[=CladeMat]{CladeMat()}}.
+See Details.}
 
 \item{from_recipient}{haplotype index at which to start trace calculation --- useful for distributed computation (experimental feature, more documentation to come\if{html}{\out{<!-- TODO -->}})}
 }
@@ -23,9 +24,12 @@ There is nothing returned.
 \strong{NOTE:} for performance reasons, \code{M} is updated in-place.
 }
 \description{
-Use haplotype nearest neighborhoods and other information returned by \code{\link[=CladeMat]{CladeMat()}} to efficiently remove structure corresponding to singletons or called sprigs from clade matrix 'M'
+Use haplotype nearest neighbourhoods and other information returned by \code{\link[=CladeMat]{CladeMat()}} to efficiently remove structure corresponding to singletons or called sprigs from clade matrix \code{M}.
 }
 \examples{
 # TODO
 
 }
+\references{
+Christ, R.R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies", bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
+}
diff --git a/man/Sprigs.Rd b/man/Sprigs.Rd
index b276ab0..5536dea 100644
--- a/man/Sprigs.Rd
+++ b/man/Sprigs.Rd
@@ -7,25 +7,28 @@
 Sprigs(x, old.sprigs = FALSE)
 }
 \arguments{
-\item{x}{list of where each entry is a nearest neighborhood of integers as returned by \code{\link[=CladeMat]{CladeMat()}}}
+\item{x}{list of integers where each entry is a nearest neighbourhood as returned by \code{\link[=CladeMat]{CladeMat()}}}
 
-\item{old.sprigs}{If TRUE, use an earlier (undocumented) version of maximal clique calling, defaults to FALSE.}
+\item{old.sprigs}{If \code{TRUE}, use an earlier (undocumented) version of maximal clique calling, defaults to \code{FALSE}.}
 }
 \value{
 a list containing:
 \describe{
-\item{\code{assignments}}{a vector of integers such that \code{assignments[i]} gives the sprig to which haplotype \code{i} belongs. \code{NA} if a haplotype was not assigned to a sprig.}
-\item{\code{to.prune}}{a vector of logicals, \code{to.prune[i]==TRUE} when haplotype i has been assigned to a sprig}
-\item{\code{num.sprigs}}{total number of sprigs calls, equal to \code{max(assignements,rm.na=TRUE)}}
+\item{\code{assignments}}{a vector of integers such that \verb{$assignments[i]} gives the sprig to which haplotype \code{i} belongs. \code{NA} if a haplotype was not assigned to a sprig.}
+\item{\code{to.prune}}{a vector of logicals, \verb{$to.prune[i]==TRUE} when haplotype \code{i} has been assigned to a sprig}
+\item{\code{num.sprigs}}{total number of sprigs called, equal to \verb{max($assignments, na.rm = TRUE)}}
 }
 }
 \description{
-Infer sprigs (very small clades) within a local phylogeny based on one-directional nearest neighbourhoods assigned to each haplotype
+Infer sprigs (very small clades) within a local phylogeny based on one-directional nearest neighbourhoods assigned to each haplotype.
 }
 \details{
-Call maximal cliques within a directed graph where edges correspond to nearest neighbour relationships
+Call maximal cliques within a directed graph where edges correspond to nearest neighbour relationships.
 }
 \examples{
 # TODO
 
 }
+\references{
+Christ, R.R., Wang, X., Aslett, L.J.M., Steinsaltz, D. and Hall, I. (2024) "Clade Distillation for Genome-wide Association Studies", bioRxiv 2024.09.30.615852. Available at: \doi{10.1101/2024.09.30.615852}.
+}