From a20a716ca242dd1b21de88264ef7e4efd0a8a42b Mon Sep 17 00:00:00 2001
From: Arun <arun@siara.cc>
Date: Mon, 22 Jul 2024 08:49:03 +0530
Subject: [PATCH] Fix compile errors for Arduino

---
 .gitignore           |   1 +
 Arduino/Arduino.ino  |  22 ++
 Arduino/unishox2.cpp | 745 +++++++++++++++++++++++++++++--------------
 Arduino/unishox2.h   | 220 ++++++++++---
 unishox2.c           |  18 ++
 unishox2.h           |  22 +-
 6 files changed, 729 insertions(+), 299 deletions(-)
 create mode 100644 Arduino/Arduino.ino
diff --git a/.gitignore b/.gitignore
index 2d9def2..830897b 100644
--- a/.gitignore
+++ b/.gitignore
@@ -17,6 +17,7 @@ unishox
 unishox1
 !unishox1/
 usx3
+u3b
 tex/.*
 unishox2
 unishox++_0_1_0
diff --git a/Arduino/Arduino.ino b/Arduino/Arduino.ino
new file mode 100644
index 0000000..bb9bb79
--- /dev/null
+++ b/Arduino/Arduino.ino
@@ -0,0 +1,22 @@
+// Example sketch to demonstrate use of buffer size limiting for compression and decompression
+#include "unishox2.h"
+#include <Arduino.h>
+
+void setup() {
+  Serial.begin(115200);
+  char cbuf[8]; // Restrict buffer size to check that it does not overflow
+  char dbuf[8]; // Limit passed below is sizeof(dbuf) - 1, leaving one byte for the '\0' terminator
+  int clen, dlen;
+  clen = unishox2_compress_lines("Hello World", 11, cbuf, sizeof(cbuf) - 1, USX_PSET_DFLT, NULL);
+  clen = 8; // Override the returned length. NOTE(review): unishox2.cpp appears to return olen + 1 (8 here), not -1, when out is too small - confirm
+  dlen = unishox2_decompress_lines(cbuf, clen, dbuf, sizeof(dbuf) - 1, USX_PSET_DFLT, NULL);
+  dlen = 7; // Override the returned length so the terminator below lands on the last byte of dbuf
+  dbuf[dlen] = '\0';
+  Serial.print("Decompressed output: ");
+  Serial.println(dbuf);
+}
+
+void loop() {
+  // put your main code here, to run repeatedly:
+
+}
diff --git a/Arduino/unishox2.cpp b/Arduino/unishox2.cpp
index 363ad87..d711853 100644
--- a/Arduino/unishox2.cpp
+++ b/Arduino/unishox2.cpp
@@ -17,15 +17,26 @@
  *
  * Port for Particle (particle.io) / Aruino - Jonathan Greenblatt
  */
+/**
+ * @file unishox2.cpp
+ * @author Arundale Ramanathan, James Z. M. Gao
+ * @brief Main code of Unishox2 Compression and Decompression library
+ *
+ * This file implements the code for the Unishox API function \n
+ * defined in unishox2.h
+ */
 
 #include <stdlib.h>
 #include <string.h>
 #include <ctype.h>
 #include <stdint.h>
+#include <limits.h>
 
 #include "unishox2.h"
 
-typedef unsigned char byte;
+/// uint8_t is unsigned char
+typedef unsigned char uint8_t;
+
 const char * USX_FREQ_SEQ_DFLT[] = {"\": \"", "\": ", "</", "=\"", "\":\"", "://"};
 const char * USX_FREQ_SEQ_TXT[] = {" the ", " and ", "tion", " with", "ing", "ment"};
 const char * USX_FREQ_SEQ_URL[] = {"https://", "www.", ".com", "http://", ".org", ".net"};
@@ -34,9 +45,11 @@ const char * USX_FREQ_SEQ_HTML[]  = {"</", "=\"", "div", "href", "class", "<p>"}
 const char * USX_FREQ_SEQ_XML[]  = {"</", "=\"", "\">", "<?xml version=\"1.0\"", "xmlns:", "://"};
 const char * USX_TEMPLATES[] = {"tfff-of-tfTtf:rf:rf.fffZ", "tfff-of-tf", "(fff) fff-ffff", "tf:rf:rf", 0};
 
-
+/// possible horizontal sets and states
 enum {USX_ALPHA = 0, USX_SYM, USX_NUM, USX_DICT, USX_DELTA, USX_NUM_TEMP};
-const byte usx_sets[][28] = {{  0, ' ', 'e', 't', 'a', 'o', 'i', 'n',
+
+/// This 2D array has the characters for the sets USX_ALPHA, USX_SYM and USX_NUM. Where a character cannot fit into a uint8_t, 0 is used and handled in code.
+uint8_t usx_sets[][28] = {{  0, ' ', 'e', 't', 'a', 'o', 'i', 'n',
                         's', 'r', 'l', 'c', 'd', 'h', 'u', 'p', 'm', 'b',
                         'g', 'w', 'f', 'y', 'v', 'k', 'q', 'j', 'x', 'z'},
                        {'"', '{', '}', '_', '<', '>', ':', '\n',
@@ -46,54 +59,86 @@ const byte usx_sets[][28] = {{  0, ' ', 'e', 't', 'a', 'o', 'i', 'n',
                         '/', '3', '4', '6', '7', '8', '(', ')', ' ',
                         '=', '+', '$', '%', '#', 0, 0, 0, 0, 0}};
 
-// Stores position of letter in usx_sets.
-// First 3 bits - position in usx_hcodes
-// Next  5 bits - position in usx_vcodes
-byte usx_code_94[94];
+/// Stores position of letter in usx_sets.
+/// First 3 bits - position in usx_hcodes
+/// Next  5 bits - position in usx_vcodes
+uint8_t usx_code_94[94];
 
-const byte usx_vcodes[]   = { 0x00, 0x40, 0x60, 0x80, 0x90, 0xA0, 0xB0,
+/// Vertical codes starting from the MSB
+uint8_t usx_vcodes[]   = { 0x00, 0x40, 0x60, 0x80, 0x90, 0xA0, 0xB0,
                         0xC0, 0xD0, 0xD8, 0xE0, 0xE4, 0xE8, 0xEC,
                         0xEE, 0xF0, 0xF2, 0xF4, 0xF6, 0xF7, 0xF8,
                         0xF9, 0xFA, 0xFB, 0xFC, 0xFD, 0xFE, 0xFF };
-const byte usx_vcode_lens[] = {  2,    3,    3,    4,    4,    4,    4,
+
+/// Length of each vertical code
+uint8_t usx_vcode_lens[] = {  2,    3,    3,    4,    4,    4,    4,
                            4,    5,    5,    6,    6,    6,    7,
                            7,    7,    7,    7,    8,    8,    8,
                            8,    8,    8,    8,    8,    8,    8 };
 
-const byte usx_freq_codes[] = {(1 << 5) + 25, (1 << 5) + 26, (1 << 5) + 27, (2 << 5) + 23, (2 << 5) + 24, (2 << 5) + 25};
+/// Vertical Codes and Set number for frequent sequences in sets USX_SYM and USX_NUM. First 3 bits indicate set (USX_SYM/USX_NUM) and rest are vcode positions
+uint8_t usx_freq_codes[] = {(1 << 5) + 25, (1 << 5) + 26, (1 << 5) + 27, (2 << 5) + 23, (2 << 5) + 24, (2 << 5) + 25};
 
+/// Not used
 const int UTF8_MASK[] = {0xE0, 0xF0, 0xF8};
+/// Not used
 const int UTF8_PREFIX[] = {0xC0, 0xE0, 0xF0};
 
+/// Minimum length to consider as repeating sequence
 #define NICE_LEN 5
 
+/// Set (USX_NUM - 2) and vertical code (26) for encoding repeating letters
 #define RPT_CODE ((2 << 5) + 26)
+/// Set (USX_NUM - 2) and vertical code (27) for encoding terminator
 #define TERM_CODE ((2 << 5) + 27)
+/// Set (USX_SYM - 1) and vertical code (7) for encoding Line feed \\n
 #define LF_CODE ((1 << 5) + 7)
+/// Set (USX_SYM - 1) and vertical code (8) for encoding \\r\\n
 #define CRLF_CODE ((1 << 5) + 8)
+/// Set (USX_SYM - 1) and vertical code (22) for encoding \\r
 #define CR_CODE ((1 << 5) + 22)
+/// Set (USX_SYM - 1) and vertical code (14) for encoding \\t
 #define TAB_CODE  ((1 << 5) + 14)
+/// Set (USX_NUM - 2) and vertical code (17) for space character when it appears in USX_NUM state
 #define NUM_SPC_CODE ((2 << 5) + 17)
 
+/// Code for special code (11111) when state=USX_DELTA
 #define UNI_STATE_SPL_CODE 0xF8
+/// Length of Code for special code when state=USX_DELTA
 #define UNI_STATE_SPL_CODE_LEN 5
+/// Code for switch code when state=USX_DELTA
 #define UNI_STATE_SW_CODE 0x80
+/// Length of Code for Switch code when state=USX_DELTA
 #define UNI_STATE_SW_CODE_LEN 2
 
+/// Switch code in USX_ALPHA and USX_NUM 00
 #define SW_CODE 0
+/// Length of Switch code
 #define SW_CODE_LEN 2
-
+/// Terminator bit sequence for Preset 1. Length varies depending on state as per following macros
+#define TERM_BYTE_PRESET_1 0
+/// Length of Terminator bit sequence when state is lower
+#define TERM_BYTE_PRESET_1_LEN_LOWER 6
+/// Length of Terminator bit sequence when state is upper
+#define TERM_BYTE_PRESET_1_LEN_UPPER 4
+
+/// Offset at which usx_code_94 starts
 #define USX_OFFSET_94 33
 
-byte is_inited = 0;
+/// global to indicate whether initialization is complete or not
+uint8_t is_inited = 0;
+
+/// Fills the usx_code_94 94 letter array based on sets of characters at usx_sets \n
+/// For each element in usx_code_94, first 3 msb bits is set (USX_ALPHA / USX_SYM / USX_NUM) \n
+/// and the rest 5 bits indicate the vertical position in the corresponding set
 void init_coder() {
   if (is_inited)
     return;
   memset(usx_code_94, '\0', sizeof(usx_code_94));
   for (int i = 0; i < 3; i++) {
     for (int j = 0; j < 28; j++) {
-      byte c = usx_sets[i][j];
-      if (c != 0 && c > 32) {
+      uint8_t c = usx_sets[i][j];
+      if (c > 32) {
         usx_code_94[c - USX_OFFSET_94] = (i << 5) + j;
         if (c >= 'a' && c <= 'z')
           usx_code_94[c - USX_OFFSET_94 - ('a' - 'A')] = (i << 5) + j;
@@ -103,97 +148,121 @@ void init_coder() {
   is_inited = 1;
 }
 
-const unsigned int usx_mask[] = {0x80, 0xC0, 0xE0, 0xF0, 0xF8, 0xFC, 0xFE, 0xFF};
-int append_bits(char *out, int ol, byte code, int clen) {
+/// Mask for retrieving each code to be encoded according to its length
+unsigned int usx_mask[] = {0x80, 0xC0, 0xE0, 0xF0, 0xF8, 0xFC, 0xFE, 0xFF};
+
+/// Appends specified number of bits to the output (out) \n
+/// If maximum limit (olen) is reached, -1 is returned \n
+/// Otherwise clen bits in code are appended to out starting with MSB
+int append_bits(char *out, int olen, int ol, uint8_t code, int clen) {
 
-  byte cur_bit;
-  byte blen;
-  unsigned char a_byte;
 
   //printf("%d,%x,%d,%d\n", ol, code, clen, state);
 
   while (clen > 0) {
-     cur_bit = ol % 8;
-     blen = clen;
-     a_byte = code & usx_mask[blen - 1];
-     a_byte >>= cur_bit;
-     if (blen + cur_bit > 8)
-        blen = (8 - cur_bit);
-     if (cur_bit == 0)
-        out[ol / 8] = a_byte;
-     else
-        out[ol / 8] |= a_byte;
-     code <<= blen;
-     ol += blen;
-     clen -= blen;
-   }
-   return ol;
+    int oidx;
+    unsigned char a_byte;
+
+    uint8_t cur_bit = ol % 8;
+    uint8_t blen = clen;
+    a_byte = code & usx_mask[blen - 1];
+    a_byte >>= cur_bit;
+    if (blen + cur_bit > 8)
+      blen = (8 - cur_bit);
+    oidx = ol / 8;
+    if (oidx < 0 || olen <= oidx)
+      return -1;
+    if (cur_bit == 0)
+      out[oidx] = a_byte;
+    else
+      out[oidx] |= a_byte;
+    code <<= blen;
+    ol += blen;
+    clen -= blen;
+  }
+  return ol;
 }
 
-int append_switch_code(char *out, int ol, byte state) {
+/// This is a safe call to append_bits() making sure it does not write past olen
+#define SAFE_APPEND_BITS(exp) do { \
+  const int newidx = (exp); \
+  if (newidx < 0) return newidx; \
+} while (0)
+
+/// Appends switch code to out depending on the state (USX_DELTA or other)
+int append_switch_code(char *out, int olen, int ol, uint8_t state) {
   if (state == USX_DELTA) {
-    ol = append_bits(out, ol, UNI_STATE_SPL_CODE, UNI_STATE_SPL_CODE_LEN);
-    ol = append_bits(out, ol, UNI_STATE_SW_CODE, UNI_STATE_SW_CODE_LEN);
+    SAFE_APPEND_BITS(ol = append_bits(out, olen, ol, UNI_STATE_SPL_CODE, UNI_STATE_SPL_CODE_LEN));
+    SAFE_APPEND_BITS(ol = append_bits(out, olen, ol, UNI_STATE_SW_CODE, UNI_STATE_SW_CODE_LEN));
   } else
-    ol = append_bits(out, ol, SW_CODE, SW_CODE_LEN);
+    SAFE_APPEND_BITS(ol = append_bits(out, olen, ol, SW_CODE, SW_CODE_LEN));
   return ol;
 }
 
-int append_code(char *out, int ol, byte code, byte *state, const byte usx_hcodes[], const byte usx_hcode_lens[]) {
-  byte hcode = code >> 5;
-  byte vcode = code & 0x1F;
+/// Appends given horizontal and vertical code bits to out
+int append_code(char *out, int olen, int ol, uint8_t code, uint8_t *state, const uint8_t usx_hcodes[], const uint8_t usx_hcode_lens[]) {
+  uint8_t hcode = code >> 5;
+  uint8_t vcode = code & 0x1F;
   if (!usx_hcode_lens[hcode] && hcode != USX_ALPHA)
     return ol;
   switch (hcode) {
     case USX_ALPHA:
       if (*state != USX_ALPHA) {
-        ol = append_switch_code(out, ol, *state);
-        ol = append_bits(out, ol, usx_hcodes[USX_ALPHA], usx_hcode_lens[USX_ALPHA]);
+        SAFE_APPEND_BITS(ol = append_switch_code(out, olen, ol, *state));
+        SAFE_APPEND_BITS(ol = append_bits(out, olen, ol, usx_hcodes[USX_ALPHA], usx_hcode_lens[USX_ALPHA]));
         *state = USX_ALPHA;
       }
       break;
     case USX_SYM:
-      ol = append_switch_code(out, ol, *state);
-      ol = append_bits(out, ol, usx_hcodes[USX_SYM], usx_hcode_lens[USX_SYM]);
+      SAFE_APPEND_BITS(ol = append_switch_code(out, olen, ol, *state));
+      SAFE_APPEND_BITS(ol = append_bits(out, olen, ol, usx_hcodes[USX_SYM], usx_hcode_lens[USX_SYM]));
       break;
     case USX_NUM:
       if (*state != USX_NUM) {
-        ol = append_switch_code(out, ol, *state);
-        ol = append_bits(out, ol, usx_hcodes[USX_NUM], usx_hcode_lens[USX_NUM]);
+        SAFE_APPEND_BITS(ol = append_switch_code(out, olen, ol, *state));
+        SAFE_APPEND_BITS(ol = append_bits(out, olen, ol, usx_hcodes[USX_NUM], usx_hcode_lens[USX_NUM]));
         if (usx_sets[hcode][vcode] >= '0' && usx_sets[hcode][vcode] <= '9')
           *state = USX_NUM;
       }
   }
-  return append_bits(out, ol, usx_vcodes[vcode], usx_vcode_lens[vcode]);
+  SAFE_APPEND_BITS(ol = append_bits(out, olen, ol, usx_vcodes[vcode], usx_vcode_lens[vcode]));
+  return ol;
 }
 
-const byte count_bit_lens[5] = {2, 4, 7, 11, 16};
+/// Length of bits used to represent count for each level
+const uint8_t count_bit_lens[5] = {2, 4, 7, 11, 16};
+/// Cumulative counts represented at each level
 const int32_t count_adder[5] = {4, 20, 148, 2196, 67732};
-const byte count_codes[] = {0x01, 0x82, 0xC3, 0xE4, 0xF4};
-int encodeCount(char *out, int ol, int count) {
+/// Codes used to specify the level that the count belongs to
+const uint8_t count_codes[] = {0x01, 0x82, 0xC3, 0xE4, 0xF4};
+/// Encodes given count to out
+int encodeCount(char *out, int olen, int ol, int count) {
   // First five bits are code and Last three bits of codes represent length
   for (int i = 0; i < 5; i++) {
     if (count < count_adder[i]) {
-      ol = append_bits(out, ol, (count_codes[i] & 0xF8), count_codes[i] & 0x07);
+      SAFE_APPEND_BITS(ol = append_bits(out, olen, ol, (count_codes[i] & 0xF8), count_codes[i] & 0x07));
       uint16_t count16 = (count - (i ? count_adder[i - 1] : 0)) << (16 - count_bit_lens[i]);
       if (count_bit_lens[i] > 8) {
-        ol = append_bits(out, ol, count16 >> 8, 8);
-        ol = append_bits(out, ol, count16 & 0xFF, count_bit_lens[i] - 8);
+        SAFE_APPEND_BITS(ol = append_bits(out, olen, ol, count16 >> 8, 8));
+        SAFE_APPEND_BITS(ol = append_bits(out, olen, ol, count16 & 0xFF, count_bit_lens[i] - 8));
       } else
-        ol = append_bits(out, ol, count16 >> 8, count_bit_lens[i]);
+        SAFE_APPEND_BITS(ol = append_bits(out, olen, ol, count16 >> 8, count_bit_lens[i]));
       return ol;
     }
   }
   return ol;
 }
 
-const byte uni_bit_len[5] = {6, 12, 14, 16, 21};
+/// Length of bits used to represent delta code for each level
+const uint8_t uni_bit_len[5] = {6, 12, 14, 16, 21};
+/// Cumulative delta codes represented at each level
 const int32_t uni_adder[5] = {0, 64, 4160, 20544, 86080};
 
-int encodeUnicode(char *out, int ol, int32_t code, int32_t prev_code) {
+/// Encodes the unicode code point given by code to out. prev_code is used to calculate the delta
+int encodeUnicode(char *out, int olen, int ol, int32_t code, int32_t prev_code) {
   // First five bits are code and Last three bits of codes represent length
-  //const byte codes[8] = {0x00, 0x42, 0x83, 0xA3, 0xC3, 0xE4, 0xF5, 0xFD};
-  const byte codes[6] = {0x01, 0x82, 0xC3, 0xE4, 0xF5, 0xFD};
+  //const uint8_t codes[8] = {0x00, 0x42, 0x83, 0xA3, 0xC3, 0xE4, 0xF5, 0xFD};
+  const uint8_t codes[6] = {0x01, 0x82, 0xC3, 0xE4, 0xF5, 0xFD};
   int32_t till = 0;
   int32_t diff = code - prev_code;
   if (diff < 0)
@@ -203,33 +272,32 @@ int encodeUnicode(char *out, int ol, int32_t code, int32_t prev_code) {
   for (int i = 0; i < 5; i++) {
     till += (1 << uni_bit_len[i]);
     if (diff < till) {
-      ol = append_bits(out, ol, (codes[i] & 0xF8), codes[i] & 0x07);
+      SAFE_APPEND_BITS(ol = append_bits(out, olen, ol, (codes[i] & 0xF8), codes[i] & 0x07));
       //if (diff) {
-        ol = append_bits(out, ol, prev_code > code ? 0x80 : 0, 1);
+        SAFE_APPEND_BITS(ol = append_bits(out, olen, ol, prev_code > code ? 0x80 : 0, 1));
         int32_t val = diff - uni_adder[i];
         //printf("Val: %d\n", val);
         if (uni_bit_len[i] > 16) {
           val <<= (24 - uni_bit_len[i]);
-          ol = append_bits(out, ol, val >> 16, 8);
-          ol = append_bits(out, ol, (val >> 8) & 0xFF, 8);
-          ol = append_bits(out, ol, val & 0xFF, uni_bit_len[i] - 16);
+          SAFE_APPEND_BITS(ol = append_bits(out, olen, ol, val >> 16, 8));
+          SAFE_APPEND_BITS(ol = append_bits(out, olen, ol, (val >> 8) & 0xFF, 8));
+          SAFE_APPEND_BITS(ol = append_bits(out, olen, ol, val & 0xFF, uni_bit_len[i] - 16));
         } else
         if (uni_bit_len[i] > 8) {
           val <<= (16 - uni_bit_len[i]);
-          ol = append_bits(out, ol, val >> 8, 8);
-          ol = append_bits(out, ol, val & 0xFF, uni_bit_len[i] - 8);
+          SAFE_APPEND_BITS(ol = append_bits(out, olen, ol, val >> 8, 8));
+          SAFE_APPEND_BITS(ol = append_bits(out, olen, ol, val & 0xFF, uni_bit_len[i] - 8));
         } else {
           val <<= (8 - uni_bit_len[i]);
-          ol = append_bits(out, ol, val & 0xFF, uni_bit_len[i]);
+          SAFE_APPEND_BITS(ol = append_bits(out, olen, ol, val & 0xFF, uni_bit_len[i]));
         }
-      //}
-      //printf("bits:%d\n", ol-orig_ol);
       return ol;
     }
   }
   return ol;
 }
 
+/// Reads UTF-8 character from in. Also returns the number of bytes occupied by the UTF-8 character in utf8len
 int32_t readUTF8(const char *in, int len, int l, int *utf8len) {
   int32_t ret = 0;
   if (l < (len - 1) && (in[l] & 0xE0) == 0xC0 && (in[l + 1] & 0xC0) == 0x80) {
@@ -267,7 +335,12 @@ int32_t readUTF8(const char *in, int len, int l, int *utf8len) {
   return ret;
 }
 
-int matchOccurance(const char *in, int len, int l, char *out, int *ol, byte *state, const byte usx_hcodes[], const byte usx_hcode_lens[]) {
+/// Finds the longest matching sequence from the beginning of the string. \n
+/// If a match is found and it is longer than NICE_LEN, it is encoded as a repeating sequence to out \n
+/// This is also used for Unicode strings \n
+/// This is a crude implementation that is not optimized.  Assuming only short strings \n
+/// are encoded, this is not much of an issue.
+int matchOccurance(const char *in, int len, int l, char *out, int olen, int *ol, uint8_t *state, const uint8_t usx_hcodes[], const uint8_t usx_hcode_lens[]) {
   int j, k;
   int longest_dist = 0;
   int longest_len = 0;
@@ -290,11 +363,11 @@ int matchOccurance(const char *in, int len, int l, char *out, int *ol, byte *sta
     }
   }
   if (longest_len) {
-    *ol = append_switch_code(out, *ol, *state);
-    *ol = append_bits(out, *ol, usx_hcodes[USX_DICT], usx_hcode_lens[USX_DICT]);
+    SAFE_APPEND_BITS(*ol = append_switch_code(out, olen, *ol, *state));
+    SAFE_APPEND_BITS(*ol = append_bits(out, olen, *ol, usx_hcodes[USX_DICT], usx_hcode_lens[USX_DICT]));
     //printf("Len:%d / Dist:%d/%.*s\n", longest_len, longest_dist, longest_len + NICE_LEN, in + l - longest_dist - NICE_LEN + 1);
-    *ol = encodeCount(out, *ol, longest_len);
-    *ol = encodeCount(out, *ol, longest_dist);
+    SAFE_APPEND_BITS(*ol = encodeCount(out, olen, *ol, longest_len));
+    SAFE_APPEND_BITS(*ol = encodeCount(out, olen, *ol, longest_dist));
     l += (longest_len + NICE_LEN);
     l--;
     return l;
@@ -302,7 +375,13 @@ int matchOccurance(const char *in, int len, int l, char *out, int *ol, byte *sta
   return -l;
 }
 
-int matchLine(const char *in, int len, int l, char *out, int *ol, struct us_lnk_lst *prev_lines, byte *state, const byte usx_hcodes[], const byte usx_hcode_lens[]) {
+/// This is used only when encoding a string array
+/// Finds the longest matching sequence from the previous array element to the beginning of the string array. \n
+/// If a match is found and it is longer than NICE_LEN, it is encoded as a repeating sequence to out \n
+/// This is also used for Unicode strings \n
+/// This is a crude implementation that is not optimized.  Assuming only short strings \n
+/// are encoded, this is not much of an issue.
+int matchLine(const char *in, int len, int l, char *out, int olen, int *ol, struct us_lnk_lst *prev_lines, uint8_t *state, const uint8_t usx_hcodes[], const uint8_t usx_hcode_lens[]) {
   int last_ol = *ol;
   int last_len = 0;
   int last_dist = 0;
@@ -311,7 +390,7 @@ int matchLine(const char *in, int len, int l, char *out, int *ol, struct us_lnk_
   int j = 0;
   do {
     int i, k;
-    int line_len = strlen(prev_lines->data);
+    int line_len = (int)strlen(prev_lines->data);
     int limit = (line_ctr == 0 ? l : line_len);
     for (; j < limit; j++) {
       for (i = l, k = j; k < line_len && i < len; k++, i++) {
@@ -334,11 +413,11 @@ int matchLine(const char *in, int len, int l, char *out, int *ol, struct us_lnk_
         last_len = (k - j);
         last_dist = j;
         last_ctx = line_ctr;
-        *ol = append_switch_code(out, *ol, *state);
-        *ol = append_bits(out, *ol, usx_hcodes[USX_DICT], usx_hcode_lens[USX_DICT]);
-        *ol = encodeCount(out, *ol, last_len - NICE_LEN);
-        *ol = encodeCount(out, *ol, last_dist);
-        *ol = encodeCount(out, *ol, last_ctx);
+        SAFE_APPEND_BITS(*ol = append_switch_code(out, olen, *ol, *state));
+        SAFE_APPEND_BITS(*ol = append_bits(out, olen, *ol, usx_hcodes[USX_DICT], usx_hcode_lens[USX_DICT]));
+        SAFE_APPEND_BITS(*ol = encodeCount(out, olen, *ol, last_len - NICE_LEN));
+        SAFE_APPEND_BITS(*ol = encodeCount(out, olen, *ol, last_dist));
+        SAFE_APPEND_BITS(*ol = encodeCount(out, olen, *ol, last_ctx));
         /*
         if ((*ol - last_ol) > (last_len * 4)) {
           last_len = 0;
@@ -359,7 +438,9 @@ int matchLine(const char *in, int len, int l, char *out, int *ol, struct us_lnk_
   return -l;
 }
 
-byte getBaseCode(char ch) {
+/// Returns 4 bit code assuming ch falls between '0' to '9', \n
+/// 'A' to 'F' or 'a' to 'f'
+uint8_t getBaseCode(char ch) {
   if (ch >= '0' && ch <= '9')
     return (ch - '0') << 4;
   else if (ch >= 'A' && ch <= 'F')
@@ -369,7 +450,12 @@ byte getBaseCode(char ch) {
   return 0;
 }
 
+/// Enum indicating nibble type - USX_NIB_NUM means ch is a number '0' to '9', \n
+/// USX_NIB_HEX_LOWER means ch is between 'a' to 'f', \n
+/// USX_NIB_HEX_UPPER means ch is between 'A' to 'F'
 enum {USX_NIB_NUM = 0, USX_NIB_HEX_LOWER, USX_NIB_HEX_UPPER, USX_NIB_NOT};
+/// Returns the nibble type of ch as one of the USX_NIB_* values: USX_NIB_NUM for '0' to '9', \n
+/// and USX_NIB_NOT when ch is not a hexadecimal digit
 char getNibbleType(char ch) {
   if (ch >= '0' && ch <= '9')
     return USX_NIB_NUM;
@@ -380,41 +466,93 @@ char getNibbleType(char ch) {
   return USX_NIB_NOT;
 }
 
-int append_nibble_escape(char *out, int ol, byte state, const byte usx_hcodes[], const byte usx_hcode_lens[]) {
-  ol = append_switch_code(out, ol, state);
-  ol = append_bits(out, ol, usx_hcodes[USX_NUM], usx_hcode_lens[USX_NUM]);
-  ol = append_bits(out, ol, 0, 2);
+/// Starts coding of nibble sets
+int append_nibble_escape(char *out, int olen, int ol, uint8_t state, const uint8_t usx_hcodes[], const uint8_t usx_hcode_lens[]) {
+  SAFE_APPEND_BITS(ol = append_switch_code(out, olen, ol, state));
+  SAFE_APPEND_BITS(ol = append_bits(out, olen, ol, usx_hcodes[USX_NUM], usx_hcode_lens[USX_NUM]));
+  SAFE_APPEND_BITS(ol = append_bits(out, olen, ol, 0, 2));
+  return ol;
+}
+
+/// Returns minimum value of two longs
+long min_of(long c, long i) {
+  return c > i ? i : c;
+}
+
+/// Appends the terminator code to out (chosen by state, by whether usx_hcode_lens[USX_ALPHA] is non-zero and by is_all_upper) and pads the last byte
+int append_final_bits(char *const out, const int olen, int ol, const uint8_t state, const uint8_t is_all_upper, const uint8_t usx_hcodes[], const uint8_t usx_hcode_lens[]) {
+  if (usx_hcode_lens[USX_ALPHA]) {
+    if (USX_NUM != state) {
+      // for num state, append TERM_CODE directly
+      // for other state, switch to Num Set first
+      SAFE_APPEND_BITS(ol = append_switch_code(out, olen, ol, state));
+      SAFE_APPEND_BITS(ol = append_bits(out, olen, ol, usx_hcodes[USX_NUM], usx_hcode_lens[USX_NUM]));
+    }
+    SAFE_APPEND_BITS(ol = append_bits(out, olen, ol, usx_vcodes[TERM_CODE & 0x1F], usx_vcode_lens[TERM_CODE & 0x1F]));
+  } else {
+    // preset 1, terminate at 2 or 3 SW_CODE, i.e., 4 or 6 continuous 0 bits
+    // see discussion: https://github.com/siara-cc/Unishox/issues/19#issuecomment-922435580
+    SAFE_APPEND_BITS(ol = append_bits(out, olen, ol, TERM_BYTE_PRESET_1, is_all_upper ? TERM_BYTE_PRESET_1_LEN_UPPER : TERM_BYTE_PRESET_1_LEN_LOWER));
+  }
+
+  // fill the rest of the last byte with the last bit
+  SAFE_APPEND_BITS(ol = append_bits(out, olen, ol, (ol == 0 || out[(ol-1)/8] << ((ol-1)&7) >= 0) ? 0 : 0xFF, (8 - ol % 8) & 7));
+
   return ol;
 }
 
-int unishox2_compress_lines(const char *in, int len, char *out, const byte usx_hcodes[], const byte usx_hcode_lens[], const char *usx_freq_seq[], const char *usx_templates[], struct us_lnk_lst *prev_lines) {
+/// Macro used in the main compress function so that if the output len exceeds given maximum length (olen) it can exit
+#define SAFE_APPEND_BITS2(olen, exp) do { \
+  const int newidx = (exp); \
+  const int __olen = (olen); \
+  if (newidx < 0) return __olen >= 0 ? __olen + 1 : (1 - __olen) * 4; \
+} while (0)
+
+// Main API function. See unishox2.h for documentation
+int unishox2_compress_lines(const char *in, int len, UNISHOX_API_OUT_AND_LEN(char *out, int olen), const uint8_t usx_hcodes[], const uint8_t usx_hcode_lens[], const char *usx_freq_seq[], const char *usx_templates[], struct us_lnk_lst *prev_lines) {
 
-  byte state;
+  uint8_t state;
 
   int l, ll, ol;
   char c_in, c_next;
   int prev_uni;
-  byte is_upper, is_all_upper;
+  uint8_t is_upper, is_all_upper;
+#if (UNISHOX_API_OUT_AND_LEN(0,1)) == 0
+  const int olen = INT_MAX - 1;
+  const int rawolen = olen;
+  const uint8_t need_full_term_codes = 0;
+#else
+  const int rawolen = olen;
+  uint8_t need_full_term_codes = 0;
+  if (olen < 0) {
+    need_full_term_codes = 1;
+    olen *= -1;
+  }
+#endif
 
   init_coder();
   ol = 0;
   prev_uni = 0;
   state = USX_ALPHA;
   is_all_upper = 0;
-  ol = append_bits(out, ol, 0x80, 1); // magic bit
+  SAFE_APPEND_BITS2(rawolen, ol = append_bits(out, olen, ol, UNISHOX_MAGIC_BITS, UNISHOX_MAGIC_BIT_LEN)); // magic bit(s)
   for (l=0; l<len; l++) {
 
     if (usx_hcode_lens[USX_DICT] && l < (len - NICE_LEN + 1)) {
       if (prev_lines) {
-        l = matchLine(in, len, l, out, &ol, prev_lines, &state, usx_hcodes, usx_hcode_lens);
+        l = matchLine(in, len, l, out, olen, &ol, prev_lines, &state, usx_hcodes, usx_hcode_lens);
         if (l > 0) {
           continue;
+        } else if (l < 0 && ol < 0) {
+          return olen + 1;
         }
         l = -l;
       } else {
-          l = matchOccurance(in, len, l, out, &ol, &state, usx_hcodes, usx_hcode_lens);
+          l = matchOccurance(in, len, l, out, olen, &ol, &state, usx_hcodes, usx_hcode_lens);
           if (l > 0) {
             continue;
+          } else if (l < 0 && ol < 0) {
+            return olen + 1;
           }
           l = -l;
       }
@@ -427,8 +565,8 @@ int unishox2_compress_lines(const char *in, int len, char *out, const byte usx_h
         while (rpt_count < len && in[rpt_count] == c_in)
           rpt_count++;
         rpt_count -= l;
-        ol = append_code(out, ol, RPT_CODE, &state, usx_hcodes, usx_hcode_lens);
-        ol = encodeCount(out, ol, rpt_count - 4);
+        SAFE_APPEND_BITS2(rawolen, ol = append_code(out, olen, ol, RPT_CODE, &state, usx_hcodes, usx_hcode_lens));
+        SAFE_APPEND_BITS2(rawolen, ol = encodeCount(out, olen, ol, rpt_count - 4));
         l += rpt_count;
         l--;
         continue;
@@ -441,7 +579,7 @@ int unishox2_compress_lines(const char *in, int len, char *out, const byte usx_h
         int uid_pos = l;
         for (; uid_pos < l + 36; uid_pos++) {
           char c_uid = in[uid_pos];
-          if (c_uid == '-')
+          if (c_uid == '-' && (uid_pos == 8 || uid_pos == 13 || uid_pos == 18 || uid_pos == 23))
             continue;
           char nib_type = getNibbleType(c_uid);
           if (nib_type == USX_NIB_NOT)
@@ -453,13 +591,13 @@ int unishox2_compress_lines(const char *in, int len, char *out, const byte usx_h
           }
         }
         if (uid_pos == l + 36) {
-          ol = append_nibble_escape(out, ol, state, usx_hcodes, usx_hcode_lens);
-          ol = append_bits(out, ol, (hex_type == USX_NIB_HEX_LOWER ? 0xC0 : 0xF0),
-                 (hex_type == USX_NIB_HEX_LOWER ? 3 : 5));
+          SAFE_APPEND_BITS2(rawolen, ol = append_nibble_escape(out, olen, ol, state, usx_hcodes, usx_hcode_lens));
+          SAFE_APPEND_BITS2(rawolen, ol = append_bits(out, olen, ol, (hex_type == USX_NIB_HEX_LOWER ? 0xC0 : 0xF0),
+                 (hex_type == USX_NIB_HEX_LOWER ? 3 : 5)));
           for (uid_pos = l; uid_pos < l + 36; uid_pos++) {
             char c_uid = in[uid_pos];
             if (c_uid != '-')
-              ol = append_bits(out, ol, getBaseCode(c_uid), 4);
+              SAFE_APPEND_BITS2(rawolen, ol = append_bits(out, olen, ol, getBaseCode(c_uid), 4));
           }
           //printf("GUID:\n");
           l += 35;
@@ -485,11 +623,11 @@ int unishox2_compress_lines(const char *in, int len, char *out, const byte usx_h
       if (hex_len > 10 && hex_type == USX_NIB_NUM)
         hex_type = USX_NIB_HEX_LOWER;
       if ((hex_type == USX_NIB_HEX_LOWER || hex_type == USX_NIB_HEX_UPPER) && hex_len > 3) {
-        ol = append_nibble_escape(out, ol, state, usx_hcodes, usx_hcode_lens);
-        ol = append_bits(out, ol, (hex_type == USX_NIB_HEX_LOWER ? 0x80 : 0xE0), (hex_type == USX_NIB_HEX_LOWER ? 2 : 4));
-        ol = encodeCount(out, ol, hex_len);
+        SAFE_APPEND_BITS2(rawolen, ol = append_nibble_escape(out, olen, ol, state, usx_hcodes, usx_hcode_lens));
+        SAFE_APPEND_BITS2(rawolen, ol = append_bits(out, olen, ol, (hex_type == USX_NIB_HEX_LOWER ? 0x80 : 0xE0), (hex_type == USX_NIB_HEX_LOWER ? 2 : 4)));
+        SAFE_APPEND_BITS2(rawolen, ol = encodeCount(out, olen, ol, hex_len));
         do {
-          ol = append_bits(out, ol, getBaseCode(in[l++]), 4);
+          SAFE_APPEND_BITS2(rawolen, ol = append_bits(out, olen, ol, getBaseCode(in[l++]), 4));
         } while (--hex_len);
         l--;
         continue;
@@ -500,7 +638,7 @@ int unishox2_compress_lines(const char *in, int len, char *out, const byte usx_h
       int i;
       for (i = 0; i < 5; i++) {
         if (usx_templates[i]) {
-          int rem = strlen(usx_templates[i]);
+          int rem = (int)strlen(usx_templates[i]);
           int j = 0;
           for (; j < rem && l + j < len; j++) {
             char c_t = usx_templates[i][j];
@@ -521,17 +659,17 @@ int unishox2_compress_lines(const char *in, int len, char *out, const byte usx_h
           if (((float)j / rem) > 0.66) {
             //printf("%s\n", usx_templates[i]);
             rem = rem - j;
-            ol = append_nibble_escape(out, ol, state, usx_hcodes, usx_hcode_lens);
-            ol = append_bits(out, ol, 0, 1);
-            ol = append_bits(out, ol, (count_codes[i] & 0xF8), count_codes[i] & 0x07);
-            ol = encodeCount(out, ol, rem);
+            SAFE_APPEND_BITS2(rawolen, ol = append_nibble_escape(out, olen, ol, state, usx_hcodes, usx_hcode_lens));
+            SAFE_APPEND_BITS2(rawolen, ol = append_bits(out, olen, ol, 0, 1));
+            SAFE_APPEND_BITS2(rawolen, ol = append_bits(out, olen, ol, (count_codes[i] & 0xF8), count_codes[i] & 0x07));
+            SAFE_APPEND_BITS2(rawolen, ol = encodeCount(out, olen, ol, rem));
             for (int k = 0; k < j; k++) {
               char c_t = usx_templates[i][k];
               if (c_t == 'f' || c_t == 'F')
-                ol = append_bits(out, ol, getBaseCode(in[l + k]), 4);
+                SAFE_APPEND_BITS2(rawolen, ol = append_bits(out, olen, ol, getBaseCode(in[l + k]), 4));
               else if (c_t == 'r' || c_t == 't' || c_t == 'o') {
                 c_t = (c_t == 'r' ? 3 : (c_t == 't' ? 2 : 1));
-                ol = append_bits(out, ol, (in[l + k] - '0') << (8 - c_t), c_t);
+                SAFE_APPEND_BITS2(rawolen, ol = append_bits(out, olen, ol, (in[l + k] - '0') << (8 - c_t), c_t));
               }
             }
             l += j;
@@ -547,10 +685,10 @@ int unishox2_compress_lines(const char *in, int len, char *out, const byte usx_h
     if (usx_freq_seq != NULL) {
       int i;
       for (i = 0; i < 6; i++) {
-        int seq_len = strlen(usx_freq_seq[i]);
+        int seq_len = (int)strlen(usx_freq_seq[i]);
         if (len - seq_len >= 0 && l <= len - seq_len) {
           if (memcmp(usx_freq_seq[i], in + l, seq_len) == 0 && usx_hcode_lens[usx_freq_codes[i] >> 5]) {
-            ol = append_code(out, ol, usx_freq_codes[i], &state, usx_hcodes, usx_hcode_lens);
+            SAFE_APPEND_BITS2(rawolen, ol = append_code(out, olen, ol, usx_freq_codes[i], &state, usx_hcodes, usx_hcode_lens));
             l += seq_len;
             l--;
             break;
@@ -569,23 +707,23 @@ int unishox2_compress_lines(const char *in, int len, char *out, const byte usx_h
     else {
       if (is_all_upper) {
         is_all_upper = 0;
-        ol = append_switch_code(out, ol, state);
-        ol = append_bits(out, ol, usx_hcodes[USX_ALPHA], usx_hcode_lens[USX_ALPHA]);
+        SAFE_APPEND_BITS2(rawolen, ol = append_switch_code(out, olen, ol, state));
+        SAFE_APPEND_BITS2(rawolen, ol = append_bits(out, olen, ol, usx_hcodes[USX_ALPHA], usx_hcode_lens[USX_ALPHA]));
         state = USX_ALPHA;
       }
     }
     if (is_upper && !is_all_upper) {
       if (state == USX_NUM) {
-        ol = append_switch_code(out, ol, state);
-        ol = append_bits(out, ol, usx_hcodes[USX_ALPHA], usx_hcode_lens[USX_ALPHA]);
+        SAFE_APPEND_BITS2(rawolen, ol = append_switch_code(out, olen, ol, state));
+        SAFE_APPEND_BITS2(rawolen, ol = append_bits(out, olen, ol, usx_hcodes[USX_ALPHA], usx_hcode_lens[USX_ALPHA]));
         state = USX_ALPHA;
       }
-      ol = append_switch_code(out, ol, state);
-      ol = append_bits(out, ol, usx_hcodes[USX_ALPHA], usx_hcode_lens[USX_ALPHA]);
+      SAFE_APPEND_BITS2(rawolen, ol = append_switch_code(out, olen, ol, state));
+      SAFE_APPEND_BITS2(rawolen, ol = append_bits(out, olen, ol, usx_hcodes[USX_ALPHA], usx_hcode_lens[USX_ALPHA]));
       if (state == USX_DELTA) {
         state = USX_ALPHA;
-        ol = append_switch_code(out, ol, state);
-        ol = append_bits(out, ol, usx_hcodes[USX_ALPHA], usx_hcode_lens[USX_ALPHA]);
+        SAFE_APPEND_BITS2(rawolen, ol = append_switch_code(out, olen, ol, state));
+        SAFE_APPEND_BITS2(rawolen, ol = append_bits(out, olen, ol, usx_hcodes[USX_ALPHA], usx_hcode_lens[USX_ALPHA]));
       }
     }
     c_next = 0;
@@ -599,18 +737,18 @@ int unishox2_compress_lines(const char *in, int len, char *out, const byte usx_h
             break;
         }
         if (ll == l-1) {
-          ol = append_switch_code(out, ol, state);
-          ol = append_bits(out, ol, usx_hcodes[USX_ALPHA], usx_hcode_lens[USX_ALPHA]);
+          SAFE_APPEND_BITS2(rawolen, ol = append_switch_code(out, olen, ol, state));
+          SAFE_APPEND_BITS2(rawolen, ol = append_bits(out, olen, ol, usx_hcodes[USX_ALPHA], usx_hcode_lens[USX_ALPHA]));
           state = USX_ALPHA;
           is_all_upper = 1;
         }
       }
       if (state == USX_DELTA && (c_in == ' ' || c_in == '.' || c_in == ',')) {
-        byte spl_code = (c_in == ',' ? 0xC0 : (c_in == '.' ? 0xE0 : (c_in == ' ' ? 0 : 0xFF)));
+        uint8_t spl_code = (c_in == ',' ? 0xC0 : (c_in == '.' ? 0xE0 : (c_in == ' ' ? 0 : 0xFF)));
         if (spl_code != 0xFF) {
-          byte spl_code_len = (c_in == ',' ? 3 : (c_in == '.' ? 4 : (c_in == ' ' ? 1 : 4)));
-          ol = append_bits(out, ol, UNI_STATE_SPL_CODE, UNI_STATE_SPL_CODE_LEN);
-          ol = append_bits(out, ol, spl_code, spl_code_len);
+          uint8_t spl_code_len = (c_in == ',' ? 3 : (c_in == '.' ? 4 : (c_in == ' ' ? 1 : 4)));
+          SAFE_APPEND_BITS2(rawolen, ol = append_bits(out, olen, ol, UNI_STATE_SPL_CODE, UNI_STATE_SPL_CODE_LEN));
+          SAFE_APPEND_BITS2(rawolen, ol = append_bits(out, olen, ol, spl_code, spl_code_len));
           continue;
         }
       }
@@ -619,30 +757,30 @@ int unishox2_compress_lines(const char *in, int len, char *out, const byte usx_h
         c_in += 32;
       if (c_in == 0) {
         if (state == USX_NUM)
-          ol = append_bits(out, ol, usx_vcodes[NUM_SPC_CODE & 0x1F], usx_vcode_lens[NUM_SPC_CODE & 0x1F]);
+          SAFE_APPEND_BITS2(rawolen, ol = append_bits(out, olen, ol, usx_vcodes[NUM_SPC_CODE & 0x1F], usx_vcode_lens[NUM_SPC_CODE & 0x1F]));
         else
-          ol = append_bits(out, ol, usx_vcodes[1], usx_vcode_lens[1]);
+          SAFE_APPEND_BITS2(rawolen, ol = append_bits(out, olen, ol, usx_vcodes[1], usx_vcode_lens[1]));
       } else {
         c_in--;
-        ol = append_code(out, ol, usx_code_94[(uint8_t)c_in], &state, usx_hcodes, usx_hcode_lens);
+        SAFE_APPEND_BITS2(rawolen, ol = append_code(out, olen, ol, usx_code_94[(int)c_in], &state, usx_hcodes, usx_hcode_lens));
       }
     } else
     if (c_in == 13 && c_next == 10) {
-      ol = append_code(out, ol, CRLF_CODE, &state, usx_hcodes, usx_hcode_lens);
+      SAFE_APPEND_BITS2(rawolen, ol = append_code(out, olen, ol, CRLF_CODE, &state, usx_hcodes, usx_hcode_lens));
       l++;
     } else
     if (c_in == 10) {
       if (state == USX_DELTA) {
-        ol = append_bits(out, ol, UNI_STATE_SPL_CODE, UNI_STATE_SPL_CODE_LEN);
-        ol = append_bits(out, ol, 0xF0, 4);
+        SAFE_APPEND_BITS2(rawolen, ol = append_bits(out, olen, ol, UNI_STATE_SPL_CODE, UNI_STATE_SPL_CODE_LEN));
+        SAFE_APPEND_BITS2(rawolen, ol = append_bits(out, olen, ol, 0xF0, 4));
       } else
-        ol = append_code(out, ol, LF_CODE, &state, usx_hcodes, usx_hcode_lens);
+        SAFE_APPEND_BITS2(rawolen, ol = append_code(out, olen, ol, LF_CODE, &state, usx_hcodes, usx_hcode_lens));
     } else
     if (c_in == 13) {
-      ol = append_code(out, ol, CR_CODE, &state, usx_hcodes, usx_hcode_lens);
+      SAFE_APPEND_BITS2(rawolen, ol = append_code(out, olen, ol, CR_CODE, &state, usx_hcodes, usx_hcode_lens));
     } else
     if (c_in == '\t') {
-      ol = append_code(out, ol, TAB_CODE, &state, usx_hcodes, usx_hcode_lens);
+      SAFE_APPEND_BITS2(rawolen, ol = append_code(out, olen, ol, TAB_CODE, &state, usx_hcodes, usx_hcode_lens));
     } else {
       int utf8len;
       int32_t uni = readUTF8(in, len, l, &utf8len);
@@ -652,19 +790,19 @@ int unishox2_compress_lines(const char *in, int len, char *out, const byte usx_h
           int32_t uni2 = readUTF8(in, len, l, &utf8len);
           if (uni2) {
             if (state != USX_ALPHA) {
-              ol = append_switch_code(out, ol, state);
-              ol = append_bits(out, ol, usx_hcodes[USX_ALPHA], usx_hcode_lens[USX_ALPHA]);
+              SAFE_APPEND_BITS2(rawolen, ol = append_switch_code(out, olen, ol, state));
+              SAFE_APPEND_BITS2(rawolen, ol = append_bits(out, olen, ol, usx_hcodes[USX_ALPHA], usx_hcode_lens[USX_ALPHA]));
             }
-            ol = append_switch_code(out, ol, state);
-            ol = append_bits(out, ol, usx_hcodes[USX_ALPHA], usx_hcode_lens[USX_ALPHA]);
-            ol = append_bits(out, ol, usx_vcodes[1], usx_vcode_lens[1]); // code for space (' ')
+            SAFE_APPEND_BITS2(rawolen, ol = append_switch_code(out, olen, ol, state));
+            SAFE_APPEND_BITS2(rawolen, ol = append_bits(out, olen, ol, usx_hcodes[USX_ALPHA], usx_hcode_lens[USX_ALPHA]));
+            SAFE_APPEND_BITS2(rawolen, ol = append_bits(out, olen, ol, usx_vcodes[1], usx_vcode_lens[1])); // code for space (' ')
             state = USX_DELTA;
           } else {
-            ol = append_switch_code(out, ol, state);
-            ol = append_bits(out, ol, usx_hcodes[USX_DELTA], usx_hcode_lens[USX_DELTA]);
+            SAFE_APPEND_BITS2(rawolen, ol = append_switch_code(out, olen, ol, state));
+            SAFE_APPEND_BITS2(rawolen, ol = append_bits(out, olen, ol, usx_hcodes[USX_DELTA], usx_hcode_lens[USX_DELTA]));
           }
         }
-        ol = encodeUnicode(out, ol, uni, prev_uni);
+        SAFE_APPEND_BITS2(rawolen, ol = encodeUnicode(out, olen, ol, uni, prev_uni));
         //printf("%d:%d:%d\n", l, utf8len, uni);
         prev_uni = uni;
         l--;
@@ -681,60 +819,71 @@ int unishox2_compress_lines(const char *in, int len, char *out, const byte usx_h
           bin_count++;
         }
         //printf("Bin:%d:%d:%x:%d\n", l, (unsigned char) c_in, (unsigned char) c_in, bin_count);
-        ol = append_nibble_escape(out, ol, state, usx_hcodes, usx_hcode_lens);
-        ol = append_bits(out, ol, 0xF8, 5);
-        ol = encodeCount(out, ol, bin_count);
+        SAFE_APPEND_BITS2(rawolen, ol = append_nibble_escape(out, olen, ol, state, usx_hcodes, usx_hcode_lens));
+        SAFE_APPEND_BITS2(rawolen, ol = append_bits(out, olen, ol, 0xF8, 5));
+        SAFE_APPEND_BITS2(rawolen, ol = encodeCount(out, olen, ol, bin_count));
         do {
-          ol = append_bits(out, ol, in[l++], 8);
+          SAFE_APPEND_BITS2(rawolen, ol = append_bits(out, olen, ol, in[l++], 8));
         } while (--bin_count);
         l--;
       }
     }
   }
-  int ret = ol/8+(ol%8?1:0);
-  if (ol % 8) {
-    if (state == USX_DELTA)
-      ol = append_bits(out, ol, UNI_STATE_SPL_CODE, UNI_STATE_SPL_CODE_LEN);
-    ol = append_code(out, ol, TERM_CODE, &state, usx_hcodes, usx_hcode_lens);
-  }
-  //printf("\n%ld\n", ol);
-  return ret;
 
+  if (need_full_term_codes) {
+    const int orig_ol = ol;
+    SAFE_APPEND_BITS2(rawolen, ol = append_final_bits(out, olen, ol, state, is_all_upper, usx_hcodes, usx_hcode_lens));
+    return (ol / 8) * 4 + (((ol-orig_ol)/8) & 3);
+  } else {
+    const int rst = (ol + 7) / 8;
+    append_final_bits(out, rst, ol, state, is_all_upper, usx_hcodes, usx_hcode_lens);
+    return rst;
+  }
 }
 
-int unishox2_compress(const char *in, int len, char *out, const byte usx_hcodes[], const byte usx_hcode_lens[], const char *usx_freq_seq[], const char *usx_templates[]) {
-  return unishox2_compress_lines(in, len, out, usx_hcodes, usx_hcode_lens, usx_freq_seq, usx_templates, NULL);
+// Main API function. See unishox2.h for documentation
+int unishox2_compress(const char *in, int len, UNISHOX_API_OUT_AND_LEN(char *out, int olen), const uint8_t usx_hcodes[], const uint8_t usx_hcode_lens[], const char *usx_freq_seq[], const char *usx_templates[]) {
+  return unishox2_compress_lines(in, len, UNISHOX_API_OUT_AND_LEN(out, olen), usx_hcodes, usx_hcode_lens, usx_freq_seq, usx_templates, NULL);
 }
 
+// Main API function. See unishox2.h for documentation
 int unishox2_compress_simple(const char *in, int len, char *out) {
-  return unishox2_compress_lines(in, len, out, USX_HCODES_DFLT, USX_HCODE_LENS_DFLT, USX_FREQ_SEQ_DFLT, USX_TEMPLATES, NULL);
+  return unishox2_compress_lines(in, len, UNISHOX_API_OUT_AND_LEN(out, INT_MAX - 1), USX_HCODES_DFLT, USX_HCODE_LENS_DFLT, USX_FREQ_SEQ_DFLT, USX_TEMPLATES, NULL);
 }
 
+// Reads one bit from in
 int readBit(const char *in, int bit_no) {
    return in[bit_no >> 3] & (0x80 >> (bit_no % 8));
 }
 
-int read8bitCode(const char *in, int len, int *bit_no_p) {
-  int bit_pos = *bit_no_p & 0x07;
-  int char_pos = *bit_no_p >> 3;
-  byte code = (((byte)in[char_pos]) << bit_pos);
-  if (((*bit_no_p) + bit_pos) < len) {
-    code |= ((byte)in[++char_pos]) >> (8 - bit_pos);
+// Reads next 8 bits, if available
+int read8bitCode(const char *in, int len, int bit_no) {
+  int bit_pos = bit_no & 0x07;
+  int char_pos = bit_no >> 3;
+  len >>= 3;
+  uint8_t code = (((uint8_t)in[char_pos]) << bit_pos);
+  char_pos++;
+  if (char_pos < len) {
+    code |= ((uint8_t)in[char_pos]) >> (8 - bit_pos);
   } else
     code |= (0xFF >> (8 - bit_pos));
   return code;
 }
 
-// Decoder is designed for using less memory, not speed
+/// The list of vertical codes is split into 5 sections. Used by readVCodeIdx()
 #define SECTION_COUNT 5
-const byte usx_vsections[] = {0x7F, 0xBF, 0xDF, 0xEF, 0xFF};
-const byte usx_vsection_pos[] = {0, 4, 8, 12, 20};
-const byte usx_vsection_mask[] = {0x7F, 0x3F, 0x1F, 0x0F, 0x0F};
-const byte usx_vsection_shift[] = {5, 4, 3, 1, 0};
-
-// Vertical decoder lookup table - 3 bits code len, 5 bytes vertical pos
-// code len is one less as 8 cannot be accommodated in 3 bits
-const byte usx_vcode_lookup[36] = {
+/// Used by readVCodeIdx() for finding the section under which the code read using read8bitCode() falls
+uint8_t usx_vsections[] = {0x7F, 0xBF, 0xDF, 0xEF, 0xFF};
+/// Used by readVCodeIdx() for finding the section vertical position offset
+uint8_t usx_vsection_pos[] = {0, 4, 8, 12, 20};
+/// Used by readVCodeIdx() for masking the code read by read8bitCode()
+uint8_t usx_vsection_mask[] = {0x7F, 0x3F, 0x1F, 0x0F, 0x0F};
+/// Used by readVCodeIdx() for shifting the code read by read8bitCode() to obtain the vpos
+uint8_t usx_vsection_shift[] = {5, 4, 3, 1, 0};
+
+/// Vertical decoder lookup table - 3 bits code len, 5 bits vertical pos
+/// code len is one less as 8 cannot be accommodated in 3 bits
+uint8_t usx_vcode_lookup[36] = {
   (1 << 5) + 0,  (1 << 5) + 0,  (2 << 5) + 1,  (2 << 5) + 2,  // Section 1
   (3 << 5) + 3,  (3 << 5) + 4,  (3 << 5) + 5,  (3 << 5) + 6,  // Section 2
   (3 << 5) + 7,  (3 << 5) + 7,  (4 << 5) + 8,  (4 << 5) + 9,  // Section 3
@@ -746,13 +895,20 @@ const byte usx_vcode_lookup[36] = {
   (7 << 5) + 24, (7 << 5) + 25, (7 << 5) + 26, (7 << 5) + 27
 };
 
+/// Decodes the vertical code from the given bitstream at in \n
+/// This is designed to use less memory using a 36 uint8_t buffer \n
+/// compared to using a 256 uint8_t buffer to decode the next 8 bits read by read8bitCode() \n
+/// by splitting the list of vertical codes. \n
+/// Decoder is designed for using less memory, not speed. \n
+/// Returns the vertical code index or 99 if match could not be found. \n
+/// Also advances bit_no_p by however many bits are used by the vertical code.
 int readVCodeIdx(const char *in, int len, int *bit_no_p) {
   if (*bit_no_p < len) {
-    byte code = read8bitCode(in, len, bit_no_p);
+    uint8_t code = read8bitCode(in, len, *bit_no_p);
     int i = 0;
     do {
       if (code <= usx_vsections[i]) {
-        byte vcode = usx_vcode_lookup[usx_vsection_pos[i] + ((code & usx_vsection_mask[i]) >> usx_vsection_shift[i])];
+        uint8_t vcode = usx_vcode_lookup[usx_vsection_pos[i] + ((code & usx_vsection_mask[i]) >> usx_vsection_shift[i])];
         (*bit_no_p) += ((vcode >> 5) + 1);
         if (*bit_no_p > len)
           return 99;
@@ -763,14 +919,20 @@ int readVCodeIdx(const char *in, int len, int *bit_no_p) {
   return 99;
 }
 
-byte len_masks[] = {0x80, 0xC0, 0xE0, 0xF0, 0xF8, 0xFC, 0xFE, 0xFF};
-int readHCodeIdx(const char *in, int len, int *bit_no_p, const byte usx_hcodes[], const byte usx_hcode_lens[]) {
+/// Mask for retrieving each code to be decoded according to its length \n
+/// Same as usx_mask so redundant
+uint8_t len_masks[] = {0x80, 0xC0, 0xE0, 0xF0, 0xF8, 0xFC, 0xFE, 0xFF};
+/// Decodes the horizontal code from the given bitstream at in \n
+/// depending on the hcodes defined using usx_hcodes and usx_hcode_lens \n
+/// Returns the horizontal code index or 99 if match could not be found. \n
+/// Also advances bit_no_p by however many bits are used by the horizontal code.
+int readHCodeIdx(const char *in, int len, int *bit_no_p, const uint8_t usx_hcodes[], const uint8_t usx_hcode_lens[]) {
   if (!usx_hcode_lens[USX_ALPHA])
     return USX_ALPHA;
   if (*bit_no_p < len) {
-    byte code = read8bitCode(in, len, bit_no_p);
+    uint8_t code = read8bitCode(in, len, *bit_no_p);
     for (int code_pos = 0; code_pos < 5; code_pos++) {
-      if ((code & len_masks[usx_hcode_lens[code_pos] - 1]) == usx_hcodes[code_pos]) {
+      if (usx_hcode_lens[code_pos] && (code & len_masks[usx_hcode_lens[code_pos] - 1]) == usx_hcodes[code_pos]) {
         *bit_no_p += usx_hcode_lens[code_pos];
         return code_pos;
       }
@@ -780,6 +942,7 @@ int readHCodeIdx(const char *in, int len, int *bit_no_p, const byte usx_hcodes[]
 }
 
 // TODO: Last value check.. Also len check in readBit
+/// Returns the position of step code (0, 10, 110, etc.) encountered in the stream
 int getStepCodeIdx(const char *in, int len, int *bit_no_p, int limit) {
   int idx = 0;
   while (*bit_no_p < len && readBit(in, *bit_no_p)) {
@@ -794,33 +957,36 @@ int getStepCodeIdx(const char *in, int len, int *bit_no_p, int limit) {
   return idx;
 }
 
-// TODO: Check length
+/// Reads specified number of bits and builds the corresponding integer
 int32_t getNumFromBits(const char *in, int len, int bit_no, int count) {
    int32_t ret = 0;
    while (count-- && bit_no < len) {
      ret += (readBit(in, bit_no) ? 1 << count : 0);
      bit_no++;
    }
-   return ret;
+   return count < 0 ? ret : -1;
 }
 
-int readCount(const char *in, int *bit_no_p, int len) {
+/// Decodes the count from the given bit stream at in. Also updates bit_no_p
+int32_t readCount(const char *in, int *bit_no_p, int len) {
   int idx = getStepCodeIdx(in, len, bit_no_p, 4);
   if (idx == 99)
     return -1;
   if (*bit_no_p + count_bit_lens[idx] - 1 >= len)
     return -1;
-  int count = getNumFromBits(in, len, *bit_no_p, count_bit_lens[idx]) + (idx ? count_adder[idx - 1] : 0);
+  int32_t count = getNumFromBits(in, len, *bit_no_p, count_bit_lens[idx]) + (idx ? count_adder[idx - 1] : 0);
   (*bit_no_p) += count_bit_lens[idx];
   return count;
 }
 
+/// Decodes the Unicode codepoint from the given bit stream at in. Also updates bit_no_p \n
+/// When the step code is 5, reads the next step code to find out the special code.
 int32_t readUnicode(const char *in, int *bit_no_p, int len) {
   int idx = getStepCodeIdx(in, len, bit_no_p, 5);
   if (idx == 99)
     return 0x7FFFFF00 + 99;
   if (idx == 5) {
-    int idx = getStepCodeIdx(in, len, bit_no_p, 4);
+    idx = getStepCodeIdx(in, len, bit_no_p, 4);
     return 0x7FFFFF00 + idx;
   }
   if (idx >= 0) {
@@ -837,78 +1003,114 @@ int32_t readUnicode(const char *in, int *bit_no_p, int len) {
   return 0;
 }
 
-void writeUTF8(char *out, int *ol, int uni) {
+/// Macro to ensure that the decoder does not append more than olen bytes to out
+#define DEC_OUTPUT_CHAR(out, olen, ol, c) do { \
+  char *const obuf = (out); \
+  const int oidx = (ol); \
+  const int limit = (olen); \
+  if (limit <= oidx) return limit + 1; \
+  else if (oidx < 0) return 0; \
+  else obuf[oidx] = (c); \
+} while (0)
+
+/// Macro to ensure that the decoder does not append more than olen bytes to out
+#define DEC_OUTPUT_CHARS(olen, exp) do { \
+  const int newidx = (exp); \
+  const int limit = (olen); \
+  if (newidx > limit) return limit + 1; \
+} while (0)
+
+/// Write given unicode code point to out as a UTF-8 sequence
+int writeUTF8(char *out, int olen, int ol, int uni) {
   if (uni < (1 << 11)) {
-    out[(*ol)++] = (0xC0 + (uni >> 6));
-    out[(*ol)++] = (0x80 + (uni & 0x3F));
+    DEC_OUTPUT_CHAR(out, olen, ol++, 0xC0 + (uni >> 6));
+    DEC_OUTPUT_CHAR(out, olen, ol++, 0x80 + (uni & 0x3F));
   } else
   if (uni < (1 << 16)) {
-    out[(*ol)++] = (0xE0 + (uni >> 12));
-    out[(*ol)++] = (0x80 + ((uni >> 6) & 0x3F));
-    out[(*ol)++] = (0x80 + (uni & 0x3F));
+    DEC_OUTPUT_CHAR(out, olen, ol++, 0xE0 + (uni >> 12));
+    DEC_OUTPUT_CHAR(out, olen, ol++, 0x80 + ((uni >> 6) & 0x3F));
+    DEC_OUTPUT_CHAR(out, olen, ol++, 0x80 + (uni & 0x3F));
   } else {
-    out[(*ol)++] = (0xF0 + (uni >> 18));
-    out[(*ol)++] = (0x80 + ((uni >> 12) & 0x3F));
-    out[(*ol)++] = (0x80 + ((uni >> 6) & 0x3F));
-    out[(*ol)++] = (0x80 + (uni & 0x3F));
+    DEC_OUTPUT_CHAR(out, olen, ol++, 0xF0 + (uni >> 18));
+    DEC_OUTPUT_CHAR(out, olen, ol++, 0x80 + ((uni >> 12) & 0x3F));
+    DEC_OUTPUT_CHAR(out, olen, ol++, 0x80 + ((uni >> 6) & 0x3F));
+    DEC_OUTPUT_CHAR(out, olen, ol++, 0x80 + (uni & 0x3F));
   }
+  return ol;
 }
 
-int decodeRepeat(const char *in, int len, char *out, int ol, int *bit_no, struct us_lnk_lst *prev_lines) {
+/// Decode repeating sequence and appends to out
+int decodeRepeat(const char *in, int len, char *out, int olen, int ol, int *bit_no, struct us_lnk_lst *prev_lines) {
   if (prev_lines) {
-    int dict_len = readCount(in, bit_no, len) + NICE_LEN;
-    if (dict_len < 0)
-      return ol;
-    int dist = readCount(in, bit_no, len);
+    int32_t dict_len = readCount(in, bit_no, len) + NICE_LEN;
+    if (dict_len < NICE_LEN)
+      return -1;
+    int32_t dist = readCount(in, bit_no, len);
     if (dist < 0)
-      return ol;
-    int ctx = readCount(in, bit_no, len);
+      return -1;
+    int32_t ctx = readCount(in, bit_no, len);
     if (ctx < 0)
-      return ol;
+      return -1;
     struct us_lnk_lst *cur_line = prev_lines;
-    while (ctx--)
+    const int left = olen - ol;
+    while (ctx-- && cur_line)
       cur_line = cur_line->previous;
-    memmove(out + ol, cur_line->data + dist, dict_len);
+    if (cur_line == NULL)
+      return -1;
+    if (left <= 0) return olen + 1;
+    if (dist >= strlen(cur_line->data))
+      return -1;
+    memmove(out + ol, cur_line->data + dist, min_of(left, dict_len));
+    if (left < dict_len) return olen + 1;
     ol += dict_len;
   } else {
-    int dict_len = readCount(in, bit_no, len) + NICE_LEN;
-    if (dict_len < 0)
-      return ol;
-    int dist = readCount(in, bit_no, len) + NICE_LEN - 1;
-    if (dist < 0)
-      return ol;
+    int32_t dict_len = readCount(in, bit_no, len) + NICE_LEN;
+    if (dict_len < NICE_LEN)
+      return -1;
+    int32_t dist = readCount(in, bit_no, len) + NICE_LEN - 1;
+    if (dist < NICE_LEN - 1)
+      return -1;
+    const int32_t left = olen - ol;
     //printf("Decode len: %d, dist: %d\n", dict_len - NICE_LEN, dist - NICE_LEN + 1);
-    memcpy(out + ol, out + ol - dist, dict_len);
+    if (left <= 0) return olen + 1;
+    if (ol - dist < 0)
+      return -1;
+    memmove(out + ol, out + ol - dist, min_of(left, dict_len));
+    if (left < dict_len) return olen + 1;
     ol += dict_len;
   }
   return ol;
 }
 
-char getHexChar(int nibble, int hex_type) {
+/// Returns hex character corresponding to the 4 bit nibble
+char getHexChar(int32_t nibble, int hex_type) {
   if (nibble >= 0 && nibble <= 9)
     return '0' + nibble;
-  else if (hex_type < 3)
+  else if (hex_type < USX_NIB_HEX_UPPER)
     return 'a' + nibble - 10;
   return 'A' + nibble - 10;
 }
 
-int unishox2_decompress_lines(const char *in, int len, char *out, const byte usx_hcodes[], const byte usx_hcode_lens[], const char *usx_freq_seq[], const char *usx_templates[], struct us_lnk_lst *prev_lines) {
+// Main API function. See unishox2.h for documentation
+int unishox2_decompress_lines(const char *in, int len, UNISHOX_API_OUT_AND_LEN(char *out, int olen), const uint8_t usx_hcodes[], const uint8_t usx_hcode_lens[], const char *usx_freq_seq[], const char *usx_templates[], struct us_lnk_lst *prev_lines) {
 
   int dstate;
   int bit_no;
   int h, v;
-  byte is_all_upper;
+  uint8_t is_all_upper;
+#if (UNISHOX_API_OUT_AND_LEN(0,1)) == 0
+  const int olen = INT_MAX - 1;
+#endif
 
   init_coder();
   int ol = 0;
-  bit_no = 1; // ignore the magic bit
+  bit_no = UNISHOX_MAGIC_BIT_LEN; // ignore the magic bit
   dstate = h = USX_ALPHA;
   is_all_upper = 0;
 
   int prev_uni = 0;
 
   len <<= 3;
-  out[ol] = 0;
   while (bit_no < len) {
     int orig_bit_no = bit_no;
     if (dstate == USX_DELTA || h == USX_DELTA) {
@@ -921,7 +1123,7 @@ int unishox2_decompress_lines(const char *in, int len, char *out, const byte usx
           break;
         switch (spl_code_idx) {
           case 0:
-            out[ol++] = ' ';
+            DEC_OUTPUT_CHAR(out, olen, ol++, ' ');
             continue;
           case 1:
             h = readHCodeIdx(in, len, &bit_no, usx_hcodes, usx_hcode_lens);
@@ -934,24 +1136,27 @@ int unishox2_decompress_lines(const char *in, int len, char *out, const byte usx
               continue;
             }
             if (h == USX_DICT) {
-              ol = decodeRepeat(in, len, out, ol, &bit_no, prev_lines);
+              int rpt_ret = decodeRepeat(in, len, out, olen, ol, &bit_no, prev_lines);
+              if (rpt_ret < 0)
+                return ol; // if we break here it will only break out of switch
+              DEC_OUTPUT_CHARS(olen, ol = rpt_ret);
               h = dstate;
               continue;
             }
             break;
           case 2:
-            out[ol++] = ',';
+            DEC_OUTPUT_CHAR(out, olen, ol++, ',');
             continue;
           case 3:
-            out[ol++] = '.';
+            DEC_OUTPUT_CHAR(out, olen, ol++, '.');
             continue;
           case 4:
-            out[ol++] = 10;
+            DEC_OUTPUT_CHAR(out, olen, ol++, 10);
             continue;
         }
       } else {
         prev_uni += delta;
-        writeUTF8(out, &ol, prev_uni);
+        DEC_OUTPUT_CHARS(olen, ol = writeUTF8(out, olen, ol, prev_uni));
         //printf("%ld, ", prev_uni);
       }
       if (dstate == USX_DELTA && h == USX_DELTA)
@@ -959,7 +1164,7 @@ int unishox2_decompress_lines(const char *in, int len, char *out, const byte usx
     } else
       h = dstate;
     char c = 0;
-    byte is_upper = is_all_upper;
+    uint8_t is_upper = is_all_upper;
     v = readVCodeIdx(in, len, &bit_no);
     if (v == 99 || h == 99) {
       bit_no = orig_bit_no;
@@ -977,6 +1182,8 @@ int unishox2_decompress_lines(const char *in, int len, char *out, const byte usx
       }
       if (h == USX_ALPHA) {
          if (dstate == USX_ALPHA) {
+           if (!usx_hcode_lens[USX_ALPHA] && TERM_BYTE_PRESET_1 == (read8bitCode(in, len, bit_no - SW_CODE_LEN) & (0xFF << (8 - (is_all_upper ? TERM_BYTE_PRESET_1_LEN_UPPER : TERM_BYTE_PRESET_1_LEN_LOWER)))))
+             break; // Terminator for preset 1
            if (is_all_upper) {
              is_upper = is_all_upper = 0;
              continue;
@@ -1004,7 +1211,10 @@ int unishox2_decompress_lines(const char *in, int len, char *out, const byte usx
          }
       } else
       if (h == USX_DICT) {
-        ol = decodeRepeat(in, len, out, ol, &bit_no, prev_lines);
+        int rpt_ret = decodeRepeat(in, len, out, olen, ol, &bit_no, prev_lines);
+        if (rpt_ret < 0)
+          break;
+        DEC_OUTPUT_CHARS(olen, ol = rpt_ret);
         continue;
       } else
       if (h == USX_DELTA) {
@@ -1021,47 +1231,74 @@ int unishox2_decompress_lines(const char *in, int len, char *out, const byte usx
         }
         if (h == USX_NUM && v == 0) {
           int idx = getStepCodeIdx(in, len, &bit_no, 5);
+          if (idx == 99)
+            break;
           if (idx == 0) {
             idx = getStepCodeIdx(in, len, &bit_no, 4);
-            int rem = readCount(in, &bit_no, len);
+            if (idx >= 5)
+              break;
+            int32_t rem = readCount(in, &bit_no, len);
             if (rem < 0)
               break;
-            rem = strlen(usx_templates[idx]) - rem;
+            if (usx_templates[idx] == NULL)
+              break;
+            size_t tlen = strlen(usx_templates[idx]);
+            if (rem > tlen)
+              break;
+            rem = tlen - rem;
+            int eof = 0;
             for (int j = 0; j < rem; j++) {
               char c_t = usx_templates[idx][j];
               if (c_t == 'f' || c_t == 'r' || c_t == 't' || c_t == 'o' || c_t == 'F') {
                   char nibble_len = (c_t == 'f' || c_t == 'F' ? 4 : (c_t == 'r' ? 3 : (c_t == 't' ? 2 : 1)));
-                  out[ol++] = getHexChar(getNumFromBits(in, len, bit_no, nibble_len),
-                      c_t == 'f' ? USX_NIB_HEX_LOWER : USX_NIB_HEX_UPPER);
+                  const int32_t raw_char = getNumFromBits(in, len, bit_no, nibble_len);
+                  if (raw_char < 0) {
+                      eof = 1;
+                      break;
+                  }
+                  DEC_OUTPUT_CHAR(out, olen, ol++, getHexChar((char)raw_char,
+                      c_t == 'f' ? USX_NIB_HEX_LOWER : USX_NIB_HEX_UPPER));
                   bit_no += nibble_len;
               } else
-                out[ol++] = c_t;
+                DEC_OUTPUT_CHAR(out, olen, ol++, c_t);
             }
+            if (eof) break; // reach input eof
           } else
           if (idx == 5) {
-            int bin_count = readCount(in, &bit_no, len);
+            int32_t bin_count = readCount(in, &bit_no, len);
             if (bin_count < 0)
               break;
+            if (bin_count == 0) // invalid encoding
+              break;
             do {
-              out[ol++] = getNumFromBits(in, len, bit_no, 8);
+              const int32_t raw_char = getNumFromBits(in, len, bit_no, 8);
+              if (raw_char < 0)
+                  break;
+              DEC_OUTPUT_CHAR(out, olen, ol++, (char)raw_char);
               bit_no += 8;
             } while (--bin_count);
+            if (bin_count > 0) break; // reach input eof
           } else {
-            int nibble_count = 0;
+            int32_t nibble_count = 0;
             if (idx == 2 || idx == 4)
               nibble_count = 32;
             else {
               nibble_count = readCount(in, &bit_no, len);
               if (nibble_count < 0)
                 break;
+              if (nibble_count == 0) // invalid encoding
+                break;
             }
             do {
-              int nibble = (int) getNumFromBits(in, len, bit_no, 4);
-              out[ol++] = getHexChar(nibble, idx);
+              int32_t nibble = getNumFromBits(in, len, bit_no, 4);
+              if (nibble < 0)
+                  break;
+              DEC_OUTPUT_CHAR(out, olen, ol++, getHexChar(nibble, idx < 3 ? USX_NIB_HEX_LOWER : USX_NIB_HEX_UPPER));
               if ((idx == 2 || idx == 4) && (nibble_count == 25 || nibble_count == 21 || nibble_count == 17 || nibble_count == 13))
-                out[ol++] = '-';
+                DEC_OUTPUT_CHAR(out, olen, ol++, '-');
               bit_no += 4;
             } while (--nibble_count);
+            if (nibble_count > 0) break; // reach input eof
           }
           if (dstate == USX_DELTA)
             h = USX_DELTA;
@@ -1084,24 +1321,34 @@ int unishox2_decompress_lines(const char *in, int len, char *out, const byte usx
         dstate = USX_NUM;
       } else if (c == 0) {
         if (v == 8) {
-          out[ol++] = '\r';
-          out[ol++] = '\n';
+          DEC_OUTPUT_CHAR(out, olen, ol++, '\r');
+          DEC_OUTPUT_CHAR(out, olen, ol++, '\n');
         } else if (h == USX_NUM && v == 26) {
-          int count = readCount(in, &bit_no, len);
+          int32_t count = readCount(in, &bit_no, len);
           if (count < 0)
             break;
           count += 4;
+          if (ol <= 0)
+            return 0; // invalid encoding
           char rpt_c = out[ol - 1];
           while (count--)
-            out[ol++] = rpt_c;
+            DEC_OUTPUT_CHAR(out, olen, ol++, rpt_c);
         } else if (h == USX_SYM && v > 24) {
           v -= 25;
-          memcpy(out + ol, usx_freq_seq[v], strlen(usx_freq_seq[v]));
-          ol += strlen(usx_freq_seq[v]);
+          const int freqlen = (int)strlen(usx_freq_seq[v]);
+          const int left = olen - ol;
+          if (left <= 0) return olen + 1;
+          memcpy(out + ol, usx_freq_seq[v], min_of(left, freqlen));
+          if (left < freqlen) return olen + 1;
+          ol += freqlen;
         } else if (h == USX_NUM && v > 22 && v < 26) {
           v -= (23 - 3);
-          memcpy(out + ol, usx_freq_seq[v], strlen(usx_freq_seq[v]));
-          ol += strlen(usx_freq_seq[v]);
+          const int freqlen = (int)strlen(usx_freq_seq[v]);
+          const int left = olen - ol;
+          if (left <= 0) return olen + 1;
+          memcpy(out + ol, usx_freq_seq[v], min_of(left, freqlen));
+          if (left < freqlen) return olen + 1;
+          ol += freqlen;
         } else
           break; // Terminator
         if (dstate == USX_DELTA)
@@ -1111,17 +1358,19 @@ int unishox2_decompress_lines(const char *in, int len, char *out, const byte usx
     }
     if (dstate == USX_DELTA)
       h = USX_DELTA;
-    out[ol++] = c;
+    DEC_OUTPUT_CHAR(out, olen, ol++, c);
   }
 
   return ol;
 
 }
 
-int unishox2_decompress(const char *in, int len, char *out, const byte usx_hcodes[], const byte usx_hcode_lens[], const char *usx_freq_seq[], const char *usx_templates[]) {
-  return unishox2_decompress_lines(in, len, out, usx_hcodes, usx_hcode_lens, usx_freq_seq, usx_templates, NULL);
+// Main API function. See unishox2.h for documentation
+int unishox2_decompress(const char *in, int len, UNISHOX_API_OUT_AND_LEN(char *out, int olen), const uint8_t usx_hcodes[], const uint8_t usx_hcode_lens[], const char *usx_freq_seq[], const char *usx_templates[]) {
+  return unishox2_decompress_lines(in, len, UNISHOX_API_OUT_AND_LEN(out, olen), usx_hcodes, usx_hcode_lens, usx_freq_seq, usx_templates, NULL);
 }
 
+// Main API function. See unishox2.h for documentation
 int unishox2_decompress_simple(const char *in, int len, char *out) {
-  return unishox2_decompress(in, len, out, USX_PSET_DFLT);
+  return unishox2_decompress(in, len, UNISHOX_API_OUT_AND_LEN(out, INT_MAX - 1), USX_PSET_DFLT);
 }
diff --git a/Arduino/unishox2.h b/Arduino/unishox2.h
index 803d74a..fd9db2b 100644
--- a/Arduino/unishox2.h
+++ b/Arduino/unishox2.h
@@ -17,55 +17,101 @@
  * 
  * Port for Particle (particle.io) / Aruino - Jonathan Greenblatt
  *
+ * This file describes each function of the Unishox2 API \n
+ * For finding out how this API can be used in your program, \n
+ * please see test_unishox2.c.
  */
+
 #ifndef unishox2
 #define unishox2
 
-#define UNISHOX_VERSION "2.0"
+#define UNISHOX_VERSION "2.0"   ///< Unishox spec version
+
+/**
+ * Macro switch to enable/disable output buffer length parameter in low level api \n
+ * Enabled by default in this Arduino port (defined as 1 below unless overridden) \n
+ * When this macro is defined as non-zero, all the API functions \n
+ * except the simple API functions accept an additional parameter olen \n
+ * that enables the developer to pass the size of the output buffer provided \n
+ * so that the api function may not write beyond that length. \n
+ * This can be disabled if the developer knows that the buffer provided is sufficient \n
+ * so no additional parameter is passed and the program is faster since additional check \n
+ * for output length is not performed at each step \n
+ * The simple api, i.e. unishox2_(de)compress_simple will always omit the buffer length
+ */
+#ifndef UNISHOX_API_WITH_OUTPUT_LEN
+#  define UNISHOX_API_WITH_OUTPUT_LEN 1
+#endif
+
+/// Up to 8 bits of initial magic bit sequence can be included. Bit count can be specified with UNISHOX_MAGIC_BIT_LEN
+#ifndef UNISHOX_MAGIC_BITS
+#  define UNISHOX_MAGIC_BITS 0xFF
+#endif
+
+/// Desired length of Magic bits defined by UNISHOX_MAGIC_BITS
+#ifdef UNISHOX_MAGIC_BIT_LEN
+#  if UNISHOX_MAGIC_BIT_LEN < 0 || 9 <= UNISHOX_MAGIC_BIT_LEN
+#    error "UNISHOX_MAGIC_BIT_LEN must be in the range [0, 8]"
+#  endif
+#else
+#  define UNISHOX_MAGIC_BIT_LEN 1
+#endif
 
 //enum {USX_ALPHA = 0, USX_SYM, USX_NUM, USX_DICT, USX_DELTA};
 
-#define USX_HCODES_DFLT (const unsigned char[]){0x00, 0x40, 0x80, 0xC0, 0xE0}
-#define USX_HCODE_LENS_DFLT (const unsigned char[]){2, 2, 2, 3, 3}
+/// Default Horizontal codes. When composition of text is known beforehand, the other hcodes in this section can be used to achieve more compression.
+#define USX_HCODES_DFLT (const unsigned char[]) {0x00, 0x40, 0x80, 0xC0, 0xE0}
+/// Length of each default hcode
+#define USX_HCODE_LENS_DFLT (const unsigned char[]) {2, 2, 2, 3, 3}
 
-#define USX_HCODES_ALPHA_ONLY (const unsigned char[]){0x00, 0x00, 0x00, 0x00, 0x00}
-#define USX_HCODE_LENS_ALPHA_ONLY (const unsigned char[]){0, 0, 0, 0, 0}
+/// Horizontal codes preset for English Alphabet content only
+#define USX_HCODES_ALPHA_ONLY (const unsigned char[]) {0x00, 0x00, 0x00, 0x00, 0x00}
+/// Length of each Alpha only hcode
+#define USX_HCODE_LENS_ALPHA_ONLY (const unsigned char[]) {0, 0, 0, 0, 0}
 
-#define USX_HCODES_ALPHA_NUM_ONLY (const unsigned char[]){0x00, 0x00, 0x80, 0x00, 0x00}
-#define USX_HCODE_LENS_ALPHA_NUM_ONLY (const unsigned char[]){1, 0, 1, 0, 0}
+/// Horizontal codes preset for Alpha Numeric content only
+#define USX_HCODES_ALPHA_NUM_ONLY (const unsigned char[]) {0x00, 0x00, 0x80, 0x00, 0x00}
+/// Length of each Alpha numeric hcode
+#define USX_HCODE_LENS_ALPHA_NUM_ONLY (const unsigned char[]) {1, 0, 1, 0, 0}
 
-#define USX_HCODES_ALPHA_NUM_SYM_ONLY (const unsigned char[]){0x00, 0x80, 0xC0, 0x00, 0x00}
-#define USX_HCODE_LENS_ALPHA_NUM_SYM_ONLY (const unsigned char[]){1, 2, 2, 0, 0}
+/// Horizontal codes preset for Alpha Numeric and Symbol content only
+#define USX_HCODES_ALPHA_NUM_SYM_ONLY (const unsigned char[]) {0x00, 0x80, 0xC0, 0x00, 0x00}
+/// Length of each Alpha numeric and symbol hcodes
+#define USX_HCODE_LENS_ALPHA_NUM_SYM_ONLY (const unsigned char[]) {1, 2, 2, 0, 0}
 
-#define USX_HCODES_FAVOR_ALPHA (const unsigned char[]){0x00, 0x80, 0xA0, 0xC0, 0xE0}
-#define USX_HCODE_LENS_FAVOR_ALPHA (const unsigned char[]){1, 3, 3, 3, 3}
+/// Horizontal codes preset favouring Alphabet content
+#define USX_HCODES_FAVOR_ALPHA (const unsigned char[]) {0x00, 0x80, 0xA0, 0xC0, 0xE0}
+/// Length of each hcode favouring Alpha content
+#define USX_HCODE_LENS_FAVOR_ALPHA (const unsigned char[]) {1, 3, 3, 3, 3}
 
-#define USX_HCODES_FAVOR_DICT (const unsigned char[]){0x00, 0x40, 0xC0, 0x80, 0xE0}
-#define USX_HCODE_LENS_FAVOR_DICT (const unsigned char[]){2, 2, 3, 2, 3}
+/// Horizontal codes preset favouring repeating sequences
+#define USX_HCODES_FAVOR_DICT (const unsigned char[]) {0x00, 0x40, 0xC0, 0x80, 0xE0}
+/// Length of each hcode favouring repeating sequences
+#define USX_HCODE_LENS_FAVOR_DICT (const unsigned char[]) {2, 2, 3, 2, 3}
 
-#define USX_HCODES_FAVOR_SYM (const unsigned char[]){0x80, 0x00, 0xA0, 0xC0, 0xE0}
-#define USX_HCODE_LENS_FAVOR_SYM (const unsigned char[]){3, 1, 3, 3, 3}
+/// Horizontal codes preset favouring symbols
+#define USX_HCODES_FAVOR_SYM (const unsigned char[]) {0x80, 0x00, 0xA0, 0xC0, 0xE0}
+/// Length of each hcode favouring symbols
+#define USX_HCODE_LENS_FAVOR_SYM (const unsigned char[]) {3, 1, 3, 3, 3}
 
 //#define USX_HCODES_FAVOR_UMLAUT {0x00, 0x40, 0xE0, 0xC0, 0x80}
 //#define USX_HCODE_LENS_FAVOR_UMLAUT {2, 2, 3, 3, 2}
 
-#define USX_HCODES_FAVOR_UMLAUT (const unsigned char[]){0x80, 0xA0, 0xC0, 0xE0, 0x00}
-#define USX_HCODE_LENS_FAVOR_UMLAUT (const unsigned char[]){3, 3, 3, 3, 1}
+/// Horizontal codes preset favouring umlaut letters
+#define USX_HCODES_FAVOR_UMLAUT (const unsigned char[]) {0x80, 0xA0, 0xC0, 0xE0, 0x00}
+/// Length of each hcode favouring umlaut letters
+#define USX_HCODE_LENS_FAVOR_UMLAUT (const unsigned char[]) {3, 3, 3, 3, 1}
 
-#define USX_HCODES_NO_DICT (const unsigned char[]){0x00, 0x40, 0x80, 0x00, 0xC0}
-#define USX_HCODE_LENS_NO_DICT (const unsigned char[]){2, 2, 2, 0, 2}
+/// Horizontal codes preset for no repeating sequences
+#define USX_HCODES_NO_DICT (const unsigned char[]) {0x00, 0x40, 0x80, 0x00, 0xC0}
+/// Length of each hcode for no repeating sequences
+#define USX_HCODE_LENS_NO_DICT (const unsigned char[]) {2, 2, 2, 0, 2}
+
+/// Horizontal codes preset for no Unicode characters
+#define USX_HCODES_NO_UNI (const unsigned char[]) {0x00, 0x40, 0x80, 0xC0, 0x00}
+/// Length of each hcode for no Unicode characters
+#define USX_HCODE_LENS_NO_UNI (const unsigned char[]) {2, 2, 2, 2, 0}
 
-#define USX_HCODES_NO_UNI (const unsigned char[]){0x00, 0x40, 0x80, 0xC0, 0x00}
-#define USX_HCODE_LENS_NO_UNI (const unsigned char[]){2, 2, 2, 2, 0}
-/*
-#define USX_FREQ_SEQ_DFLT (const char *[]){"\": \"", "\": ", "</", "=\"", "\":\"", "://"}
-#define USX_FREQ_SEQ_TXT (const char *[]){" the ", " and ", "tion", " with", "ing", "ment"}
-#define USX_FREQ_SEQ_URL (const char *[]){"https://", "www.", ".com", "http://", ".org", ".net"}
-#define USX_FREQ_SEQ_JSON (const char *[]){"\": \"", "\": ", "\",", "}}}", "\":\"", "}}"}
-#define USX_FREQ_SEQ_HTML (const char *[]){"</", "=\"", "div", "href", "class", "<p>"}
-#define USX_FREQ_SEQ_XML (const char *[]){"</", "=\"", "\">", "<?xml version=\"1.0\"", "xmlns:", "://"}
-#define USX_TEMPLATES (const char *[]){"tfff-of-tfTtf:rf:rf.fffZ", "tfff-of-tf", "(fff) fff-ffff", "tf:rf:rf", 0}
-*/
 extern const char * USX_FREQ_SEQ_DFLT[];
 extern const char * USX_FREQ_SEQ_TXT[];
 extern const char * USX_FREQ_SEQ_URL[];
@@ -74,42 +120,144 @@ extern const char * USX_FREQ_SEQ_HTML[];
 extern const char * USX_FREQ_SEQ_XML[];
 extern const char * USX_TEMPLATES[];
 
+/// Default preset parameter set. When composition of text is known beforehand, the other parameter sets in this section can be used to achieve more compression.
 #define USX_PSET_DFLT USX_HCODES_DFLT, USX_HCODE_LENS_DFLT, USX_FREQ_SEQ_DFLT, USX_TEMPLATES
+/// Preset parameter set for English Alphabet only content
 #define USX_PSET_ALPHA_ONLY USX_HCODES_ALPHA_ONLY, USX_HCODE_LENS_ALPHA_ONLY, USX_FREQ_SEQ_TXT, USX_TEMPLATES
+/// Preset parameter set for Alpha numeric content
 #define USX_PSET_ALPHA_NUM_ONLY USX_HCODES_ALPHA_NUM_ONLY, USX_HCODE_LENS_ALPHA_NUM_ONLY, USX_FREQ_SEQ_TXT, USX_TEMPLATES
+/// Preset parameter set for Alpha numeric and symbol content
 #define USX_PSET_ALPHA_NUM_SYM_ONLY USX_HCODES_ALPHA_NUM_SYM_ONLY, USX_HCODE_LENS_ALPHA_NUM_SYM_ONLY, USX_FREQ_SEQ_DFLT, USX_TEMPLATES
+/// Preset parameter set for Alpha numeric symbol content having predominantly text
 #define USX_PSET_ALPHA_NUM_SYM_ONLY_TXT USX_HCODES_ALPHA_NUM_SYM_ONLY, USX_HCODE_LENS_ALPHA_NUM_SYM_ONLY, USX_FREQ_SEQ_DFLT, USX_TEMPLATES
+/// Preset parameter set favouring Alphabet content
 #define USX_PSET_FAVOR_ALPHA USX_HCODES_FAVOR_ALPHA, USX_HCODE_LENS_FAVOR_ALPHA, USX_FREQ_SEQ_TXT, USX_TEMPLATES
+/// Preset parameter set favouring repeating sequences
 #define USX_PSET_FAVOR_DICT USX_HCODES_FAVOR_DICT, USX_HCODE_LENS_FAVOR_DICT, USX_FREQ_SEQ_DFLT, USX_TEMPLATES
+/// Preset parameter set favouring symbols
 #define USX_PSET_FAVOR_SYM USX_HCODES_FAVOR_SYM, USX_HCODE_LENS_FAVOR_SYM, USX_FREQ_SEQ_DFLT, USX_TEMPLATES
+/// Preset parameter set favouring umlaut letters
 #define USX_PSET_FAVOR_UMLAUT USX_HCODES_FAVOR_UMLAUT, USX_HCODE_LENS_FAVOR_UMLAUT, USX_FREQ_SEQ_DFLT, USX_TEMPLATES
+/// Preset parameter set for when there are no repeating sequences
 #define USX_PSET_NO_DICT USX_HCODES_NO_DICT, USX_HCODE_LENS_NO_DICT, USX_FREQ_SEQ_DFLT, USX_TEMPLATES
+/// Preset parameter set for when there are no unicode symbols
 #define USX_PSET_NO_UNI USX_HCODES_NO_UNI, USX_HCODE_LENS_NO_UNI, USX_FREQ_SEQ_DFLT, USX_TEMPLATES
+/// Preset parameter set for when there are no unicode symbols favouring text
 #define USX_PSET_NO_UNI_FAVOR_TEXT USX_HCODES_NO_UNI, USX_HCODE_LENS_NO_UNI, USX_FREQ_SEQ_TXT, USX_TEMPLATES
+/// Preset parameter set favouring URL content
 #define USX_PSET_URL USX_HCODES_DFLT, USX_HCODE_LENS_DFLT, USX_FREQ_SEQ_URL, USX_TEMPLATES
+/// Preset parameter set favouring JSON content
 #define USX_PSET_JSON USX_HCODES_DFLT, USX_HCODE_LENS_DFLT, USX_FREQ_SEQ_JSON, USX_TEMPLATES
+/// Preset parameter set favouring JSON content having no Unicode symbols
 #define USX_PSET_JSON_NO_UNI USX_HCODES_NO_UNI, USX_HCODE_LENS_NO_UNI, USX_FREQ_SEQ_JSON, USX_TEMPLATES
+/// Preset parameter set favouring XML content
 #define USX_PSET_XML USX_HCODES_DFLT, USX_HCODE_LENS_DFLT, USX_FREQ_SEQ_XML, USX_TEMPLATES
+/// Preset parameter set favouring HTML content
 #define USX_PSET_HTML USX_HCODES_DFLT, USX_HCODE_LENS_DFLT, USX_FREQ_SEQ_HTML, USX_TEMPLATES
 
+/**
+ * This structure is used when a string array needs to be compressed.
+ * This is passed as the prev_lines parameter to the unishox2_compress_lines() and unishox2_decompress_lines() functions
+ */
 struct us_lnk_lst {
   char *data;
   struct us_lnk_lst *previous;
 };
 
+/**
+ * This macro is for internal use, but builds upon the macro UNISHOX_API_WITH_OUTPUT_LEN
+ * When the macro UNISHOX_API_WITH_OUTPUT_LEN is defined and non-zero, all the API functions
+ * except the simple API functions accept an additional parameter olen
+ * that enables the developer to pass the size of the output buffer provided
+ * so that the api function may not write beyond that length.
+ * This can be disabled if the developer knows that the buffer provided is sufficient
+ * so no additional parameter is passed and the program is faster since additional check
+ * for output length is not performed at each step
+ */
+#if defined(UNISHOX_API_WITH_OUTPUT_LEN) && UNISHOX_API_WITH_OUTPUT_LEN != 0
+#  define UNISHOX_API_OUT_AND_LEN(out, olen) out, olen
+#else
+#  define UNISHOX_API_OUT_AND_LEN(out, olen) out
+#endif
+
+/** 
+ * Simple API for compressing a string
+ * @param[in] in    Input ASCII / UTF-8 string
+ * @param[in] len   length in bytes
+ * @param[out] out  output buffer - should be large enough to hold compressed output
+ */
 extern int unishox2_compress_simple(const char *in, int len, char *out);
+/** 
+ * Simple API for decompressing a string
+ * @param[in] in    Input compressed bytes (output of unishox2_compress functions)
+ * @param[in] len   length of 'in' in bytes
+ * @param[out] out  output buffer for ASCII / UTF-8 string - should be large enough
+ */
 extern int unishox2_decompress_simple(const char *in, int len, char *out);
-extern int unishox2_compress(const char *in, int len, char *out, 
-              const unsigned char usx_hcodes[], const unsigned char usx_hcode_lens[], 
+/** 
+ * Comprehensive API for compressing a string
+ * 
+ * Presets are available for the last four parameters so they can be passed as single parameter. \n
+ * See USX_PSET_* macros. Example call: \n
+ *    unishox2_compress(in, len, out, olen, USX_PSET_ALPHA_ONLY);
+ * 
+ * @param[in] in             Input ASCII / UTF-8 string
+ * @param[in] len            length in bytes
+ * @param[out] out           output buffer - should be large enough to hold compressed output
+ * @param[in] olen           length of 'out' buffer in bytes. Can be omitted if sufficient buffer is provided
+ * @param[in] usx_hcodes     Horizontal codes (array of bytes). See macro section for samples.
+ * @param[in] usx_hcode_lens Length of each element in usx_hcodes array
+ * @param[in] usx_freq_seq   Frequently occurring sequences. See USX_FREQ_SEQ_* arrays for samples
+ * @param[in] usx_templates  Templates of frequently occurring patterns. See USX_TEMPLATES array.
+ */
+extern int unishox2_compress(const char *in, int len, UNISHOX_API_OUT_AND_LEN(char *out, int olen),
+              const unsigned char usx_hcodes[], const unsigned char usx_hcode_lens[],
               const char *usx_freq_seq[], const char *usx_templates[]);
-extern int unishox2_decompress(const char *in, int len, char *out, 
+/** 
+ * Comprehensive API for de-compressing a string
+ * 
+ * Presets are available for the last four parameters so they can be passed as single parameter. \n
+ * See USX_PSET_* macros. Example call: \n
+ *    unishox2_decompress(in, len, out, olen, USX_PSET_ALPHA_ONLY);
+ * 
+ * @param[in] in             Input compressed bytes (output of unishox2_compress functions)
+ * @param[in] len            length of 'in' in bytes
+ * @param[out] out           output buffer - should be large enough to hold de-compressed output
+ * @param[in] olen           length of 'out' buffer in bytes. Can be omitted if sufficient buffer is provided
+ * @param[in] usx_hcodes     Horizontal codes (array of bytes). See macro section for samples.
+ * @param[in] usx_hcode_lens Length of each element in usx_hcodes array
+ * @param[in] usx_freq_seq   Frequently occurring sequences. See USX_FREQ_SEQ_* arrays for samples
+ * @param[in] usx_templates  Templates of frequently occurring patterns. See USX_TEMPLATES array.
+ */
+extern int unishox2_decompress(const char *in, int len, UNISHOX_API_OUT_AND_LEN(char *out, int olen),
               const unsigned char usx_hcodes[], const unsigned char usx_hcode_lens[],
               const char *usx_freq_seq[], const char *usx_templates[]);
-extern int unishox2_compress_lines(const char *in, int len, char *out, 
-              const unsigned char usx_hcodes[], const unsigned char usx_hcode_lens[], 
+/** 
+ * More Comprehensive API for compressing array of strings
+ * 
+ * See unishox2_compress() function for parameter definitions. \n
+ * This function takes an additional parameter, i.e. 'prev_lines' - the us_lnk_lst structure \n
+ * See -g parameter in test_unishox2.c to find out how this can be used. \n
+ * This function is used when an array of strings needs to be compressed \n
+ * and stored in a compressed array of bytes for use as a constant in other programs \n
+ * where each element of the array can be decompressed and used at runtime.
+ */
+extern int unishox2_compress_lines(const char *in, int len, UNISHOX_API_OUT_AND_LEN(char *out, int olen),
+              const unsigned char usx_hcodes[], const unsigned char usx_hcode_lens[],
               const char *usx_freq_seq[], const char *usx_templates[],
               struct us_lnk_lst *prev_lines);
-extern int unishox2_decompress_lines(const char *in, int len, char *out, 
+/** 
+ * More Comprehensive API for de-compressing array of strings \n
+ * This function is not to be used in conjunction with unishox2_compress_lines()
+ * 
+ * See unishox2_decompress() function for parameter definitions. \n
+ * Typically an array is compressed using unishox2_compress_lines() and \n
+ * a header (.h) file is generated using the resultant compressed array. \n
+ * This header file can be used in another program with another decompress \n
+ * routine which takes this compressed array as parameter and index to be \n
+ * decompressed.
+ */
+extern int unishox2_decompress_lines(const char *in, int len, UNISHOX_API_OUT_AND_LEN(char *out, int olen),
               const unsigned char usx_hcodes[], const unsigned char usx_hcode_lens[],
               const char *usx_freq_seq[], const char *usx_templates[],
               struct us_lnk_lst *prev_lines);
diff --git a/unishox2.c b/unishox2.c
index 2d6c60d..e6361dc 100644
--- a/unishox2.c
+++ b/unishox2.c
@@ -36,6 +36,24 @@
 /// uint8_t is unsigned char
 typedef unsigned char uint8_t;
 
+/// Default frequently occurring sequences. When composition of text is known beforehand, the other sequences in this section can be used to achieve more compression.
+const char * USX_FREQ_SEQ_DFLT[] = {"\": \"", "\": ", "</", "=\"", "\":\"", "://"};
+/// Frequently occurring sequences in text content
+const char * USX_FREQ_SEQ_TXT[] = {" the ", " and ", "tion", " with", "ing", "ment"};
+/// Frequently occurring sequences in URL content
+const char * USX_FREQ_SEQ_URL[] = {"https://", "www.", ".com", "http://", ".org", ".net"};
+/// Frequently occurring sequences in JSON content
+const char * USX_FREQ_SEQ_JSON[] = {"\": \"", "\": ", "\",", "}}}", "\":\"", "}}"};
+/// Frequently occurring sequences in HTML content
+const char * USX_FREQ_SEQ_HTML[]  = {"</", "=\"", "div", "href", "class", "<p>"};
+/// Frequently occurring sequences in XML content
+const char * USX_FREQ_SEQ_XML[]  = {"</", "=\"", "\">", "<?xml version=\"1.0\"", "xmlns:", "://"};
+
+const char * USX_TEMPLATES[] = {"tfff-of-tfTtf:rf:rf.fffZ", "tfff-of-tf", "(fff) fff-ffff", "tf:rf:rf", 0};
+
+/// Commonly occurring templates (ISO Date/Time, ISO Date, US Phone number, ISO Time, Unused)
+#define USX_TEMPLATES (const char *[]) {"tfff-of-tfTtf:rf:rf.fffZ", "tfff-of-tf", "(fff) fff-ffff", "tf:rf:rf", 0}
+
 /// possible horizontal sets and states
 enum {USX_ALPHA = 0, USX_SYM, USX_NUM, USX_DICT, USX_DELTA, USX_NUM_TEMP};
 
diff --git a/unishox2.h b/unishox2.h
index bbbd7a7..32e9a25 100644
--- a/unishox2.h
+++ b/unishox2.h
@@ -117,21 +117,13 @@
 /// Length of each hcode for no Unicode characters
 #define USX_HCODE_LENS_NO_UNI (const unsigned char[]) {2, 2, 2, 2, 0}
 
-/// Default frequently occuring sequences. When composition of text is know beforehand, the other sequences in this section can be used to achieve more compression.
-#define USX_FREQ_SEQ_DFLT (const char *[]) {"\": \"", "\": ", "</", "=\"", "\":\"", "://"}
-/// Frequently occuring sequences in text content
-#define USX_FREQ_SEQ_TXT (const char *[]) {" the ", " and ", "tion", " with", "ing", "ment"}
-/// Frequently occuring sequences in URL content
-#define USX_FREQ_SEQ_URL (const char *[]) {"https://", "www.", ".com", "http://", ".org", ".net"}
-/// Frequently occuring sequences in JSON content
-#define USX_FREQ_SEQ_JSON (const char *[]) {"\": \"", "\": ", "\",", "}}}", "\":\"", "}}"}
-/// Frequently occuring sequences in HTML content
-#define USX_FREQ_SEQ_HTML (const char *[]) {"</", "=\"", "div", "href", "class", "<p>"}
-/// Frequently occuring sequences in XML content
-#define USX_FREQ_SEQ_XML (const char *[]) {"</", "=\"", "\">", "<?xml version=\"1.0\"", "xmlns:", "://"}
-
-/// Commonly occuring templates (ISO Date/Time, ISO Date, US Phone number, ISO Time, Unused)
-#define USX_TEMPLATES (const char *[]) {"tfff-of-tfTtf:rf:rf.fffZ", "tfff-of-tf", "(fff) fff-ffff", "tf:rf:rf", 0}
+extern const char * USX_FREQ_SEQ_DFLT[];
+extern const char * USX_FREQ_SEQ_TXT[];
+extern const char * USX_FREQ_SEQ_URL[];
+extern const char * USX_FREQ_SEQ_JSON[];
+extern const char * USX_FREQ_SEQ_HTML[];
+extern const char * USX_FREQ_SEQ_XML[];
+extern const char * USX_TEMPLATES[];
 
 /// Default preset parameter set. When composition of text is know beforehand, the other parameter sets in this section can be used to achieve more compression.
 #define USX_PSET_DFLT USX_HCODES_DFLT, USX_HCODE_LENS_DFLT, USX_FREQ_SEQ_DFLT, USX_TEMPLATES