From ac8f8329af5c750eb8cdad168a7cf9165f8afdfe Mon Sep 17 00:00:00 2001
From: Hudson Cooper <hncooper96@gmail.com>
Date: Thu, 20 Jun 2024 18:09:53 -0700
Subject: [PATCH 01/14] make _state structured data rather than a string

---
 guidance/models/_model.py       | 60 ++++++++++++++-------------------
 guidance/models/_model_state.py | 57 +++++++++++++++++++++++++++++++
 2 files changed, 83 insertions(+), 34 deletions(-)
 create mode 100644 guidance/models/_model_state.py
diff --git a/guidance/models/_model.py b/guidance/models/_model.py
index bdde3f2c0..5ee4d1a65 100644
--- a/guidance/models/_model.py
+++ b/guidance/models/_model.py
@@ -38,6 +38,8 @@
         "Failed to load guidance.cpp, falling back to Python mirror implementations..."
     )
     from .. import _cpp as cpp
+
+from ._model_state import ModelState, Text, Object
 from ._guidance_engine_metrics import GuidanceEngineMetrics
 from .._utils import softmax, CaptureEvents
 from .._parser import EarleyCommitParser, Parser
@@ -857,7 +859,7 @@ def __init__(self, engine, echo=True, **kwargs):
         self._variables = {}  # these are the state variables stored with the model
         self._variables_log_probs = {}  # these are the state variables stored with the model
         self._cache_state = {}  # mutable caching state used to save computation
-        self._state = ""  # the current bytes that represent the state of the model
+        self._state = ModelState()  # the structured state of the model: an ordered sequence of Objects (see _model_state.py)
         self._event_queue = None  # TODO: these are for streaming results in code, but that needs implemented
         self._event_parent = None
         self._last_display = 0  # used to track the last display call to enable throttling
@@ -881,27 +883,6 @@ def active_role_end(self):
 
         return select(parts)
 
-    def _html(self):
-        """Generate HTML that displays the model object."""
-        display_out = self._state
-        for context in reversed(self.opened_blocks):
-            display_out += self.opened_blocks[context][1]
-        display_out = html.escape(display_out)
-        display_out = nodisp_pattern.sub("", display_out)
-        display_out = html_pattern.sub(lambda x: html.unescape(x.group(1)), display_out)
-        display_out = image_pattern.sub(
-            lambda x: '<img src="data:image/png;base64,'
-            + base64.b64encode(self[x.groups(1)[0]]).decode()
-            + '" style="max-width: 400px; vertical-align: middle; margin: 4px;">',
-            display_out,
-        )
-        display_out = (
-            "<pre style='margin: 0px; padding: 0px; vertical-align: middle; padding-left: 8px; margin-left: -8px; border-radius: 0px; border-left: 1px solid rgba(127, 127, 127, 0.2); white-space: pre-wrap; font-family: ColfaxAI, Arial; font-size: 15px; line-height: 23px;'>"
-            + display_out
-            + "</pre>"
-        )
-        return display_out
-
     def _send_to_event_queue(self, value):
         """For streaming in code.
 
@@ -938,7 +919,7 @@ def copy(self):
 
         return new_lm
 
-    def _inplace_append(self, value, force_silent=False):
+    def _inplace_append(self, obj: Object, force_silent: bool = False):
         """This is the base way to add content to the current LM object that is being constructed.
 
         All updates to the model state should eventually use this function.
@@ -951,7 +932,7 @@ def _inplace_append(self, value, force_silent=False):
         """
 
         # update the byte state
-        self._state += str(value)  # TODO: make _state to be bytes not a string
+        self._state.append(obj)
 
         # see if we should update the display
         if not force_silent:
@@ -977,7 +958,7 @@ def _update_display(self, throttle=True):
 
             if ipython_is_imported:
                 clear_output(wait=True)
-                display(HTML(self._html()))
+                display(HTML(self._state._html()))
             else:
                 pprint(self._state)
 
@@ -1000,9 +981,9 @@ def _repr_html_(self):
             clear_output(wait=True)
         return self._html()
 
-    def _current_prompt(self):
+    def _current_prompt(self) -> str:
         """The current prompt in bytes (which is the state without the context close tags)."""
-        return format_pattern.sub("", self._state)
+        return str(self._state)
 
     def __str__(self):
         """A string representation of the current model object (that includes context closers)."""
@@ -1075,7 +1056,9 @@ def __add__(self, value):
 
                 # we have no embedded objects
                 if len(parts) == 1:
-                    lm._inplace_append(value)
+                    lm._inplace_append(
+                        Text(text=value)
+                    )
                     out = lm
 
                 # if we have embedded objects we have to convert the string to a grammar tree
@@ -1119,7 +1102,8 @@ def __add__(self, value):
                     )
 
         # this flushes the display
-        out._inplace_append("")
+        # TODO: directly call _update_display?
+        out._inplace_append(Text(text=""))
 
         return out
 
@@ -1328,11 +1312,19 @@ def _run_stateless(self, stateless_function, temperature=0.0, top_p=1.0, n=1):
                 if len(chunk.new_bytes) > 0:
                     generated_value += new_text
                     if chunk.is_generated:
-                        lm += f"<||_html:<span style='background-color: rgba({165*(1-chunk.new_bytes_prob) + 0}, {165*chunk.new_bytes_prob + 0}, 0, {0.15}); border-radius: 3px;' title='{chunk.new_bytes_prob}'>_||>"
-                    lm += new_text
-                    if chunk.is_generated:
-                        lm += "<||_html:</span>_||>"
-
+                        self._inplace_append(
+                            Text(
+                                text = new_text,
+                                # TODO: this will be slightly wrong if we have a delayed byte string
+                                probability = chunk.new_bytes_prob
+                            )
+                        )
+                    else:
+                        self._inplace_append(
+                            Text(
+                                text = new_text,
+                            )
+                        )
                 # last_is_generated = chunk.is_generated
 
                 if len(chunk.capture_groups) > 0:
diff --git a/guidance/models/_model_state.py b/guidance/models/_model_state.py
new file mode 100644
index 000000000..b3f61e2a7
--- /dev/null
+++ b/guidance/models/_model_state.py
@@ -0,0 +1,57 @@
+from __future__ import annotations
+from dataclasses import dataclass
+from typing import Optional
+import base64
+import html
+
+@dataclass
+class Object:
+    def _html(self) -> str:
+        raise NotImplementedError
+
+    def __str__(self) -> str:
+        raise NotImplementedError
+
+
+@dataclass
+class Text(Object):
+    text: str
+    probability: Optional[float] = None
+
+    def __str__(self) -> str:
+        return self.text
+
+    def _html(self) -> str:
+        escaped_text = html.escape(self.text)
+        if self.probability is not None:
+            style = f"background-color: rgba({165*(1-self.probability) + 0}, {165*self.probability + 0}, 0, {0.15}); border-radius: 3px;"
+            return f"<span style='{style}' title='{self.probability}'>{escaped_text}</span>"
+        return escaped_text
+
+
+@dataclass
+class Image(Object):
+    id: str
+    data: bytes
+
+    def __str__(self) -> str:
+        raise NotImplementedError
+    
+    def _html(self) -> str:
+        return f"""<img src="data:image/png;base64,'{base64.b64encode(self.data).decode()}'" style="max-width: 400px; vertical-align: middle; margin: 4px;">"""
+
+
+class ModelState(list[Object]):
+    # TODO: opened blocks
+    def __str__(self) -> str:
+        out = ""
+        for obj in self:
+            out += str(obj)
+        return out
+
+    def _html(self) -> str:
+        out = "<pre style='margin: 0px; padding: 0px; vertical-align: middle; padding-left: 8px; margin-left: -8px; border-radius: 0px; border-left: 1px solid rgba(127, 127, 127, 0.2); white-space: pre-wrap; font-family: ColfaxAI, Arial; font-size: 15px; line-height: 23px;'>"
+        for obj in self:
+            out += obj._html()
+        out += "</pre>"
+        return out

From 75ffd29c2c6a90692367aff5419af624e6626ed7 Mon Sep 17 00:00:00 2001
From: Hudson Cooper <hncooper96@gmail.com>
Date: Thu, 20 Jun 2024 18:37:32 -0700
Subject: [PATCH 02/14] copy ModelState (shallow list copy) in Model.copy

---
 guidance/models/_model.py       |  1 +
 guidance/models/_model_state.py | 40 ++++++++++++++++++++++++++++-----
 2 files changed, 36 insertions(+), 5 deletions(-)

diff --git a/guidance/models/_model.py b/guidance/models/_model.py
index 5ee4d1a65..4fdc9779a 100644
--- a/guidance/models/_model.py
+++ b/guidance/models/_model.py
@@ -905,6 +905,7 @@ def copy(self):
         new_lm._variables = self._variables.copy()
         new_lm._variables_log_probs = self._variables_log_probs.copy()
         new_lm.opened_blocks = self.opened_blocks.copy()
+        new_lm._state = self._state.copy()
 
         # create a new clean event queue
         new_lm._event_queue = None  # we start with no event queue because nobody is listening to us yet
diff --git a/guidance/models/_model_state.py b/guidance/models/_model_state.py
index b3f61e2a7..075b975c4 100644
--- a/guidance/models/_model_state.py
+++ b/guidance/models/_model_state.py
@@ -1,9 +1,10 @@
 from __future__ import annotations
 from dataclasses import dataclass
-from typing import Optional
+from typing import Optional, overload
 import base64
 import html
 
+
 @dataclass
 class Object:
     def _html(self) -> str:
@@ -36,22 +37,51 @@ class Image(Object):
 
     def __str__(self) -> str:
         raise NotImplementedError
-    
+
     def _html(self) -> str:
         return f"""<img src="data:image/png;base64,'{base64.b64encode(self.data).decode()}'" style="max-width: 400px; vertical-align: middle; margin: 4px;">"""
 
 
-class ModelState(list[Object]):
+class ModelState:
+    def __init__(self) -> None:
+        self.objects: list[Object] = []
+
+    def copy(self) -> ModelState:
+        new = ModelState()
+        new.objects = self.objects.copy()
+        return new
+
+    @overload
+    def __getitem__(self, index: int) -> Object: ...
+
+    @overload
+    def __getitem__(self, index: slice) -> ModelState: ...
+
+    def __getitem__(self, index):
+        if isinstance(index, int):
+            return self.objects[index]
+        elif isinstance(index, slice):
+            new = ModelState()
+            new.objects = self.objects[index]
+            return new
+        raise TypeError(f"Index must be int or slice, not {type(index)}")
+
+    def append(self, obj: Object) -> None:
+        self.objects.append(obj)
+
+    def __len__(self) -> int:
+        return len(self.objects)
+
     # TODO: opened blocks
     def __str__(self) -> str:
         out = ""
-        for obj in self:
+        for obj in self.objects:
             out += str(obj)
         return out
 
     def _html(self) -> str:
         out = "<pre style='margin: 0px; padding: 0px; vertical-align: middle; padding-left: 8px; margin-left: -8px; border-radius: 0px; border-left: 1px solid rgba(127, 127, 127, 0.2); white-space: pre-wrap; font-family: ColfaxAI, Arial; font-size: 15px; line-height: 23px;'>"
-        for obj in self:
+        for obj in self.objects:
             out += obj._html()
         out += "</pre>"
         return out

From 1ca3a33310c51eb3cb8c8b49cf4d75b51e506b4f Mon Sep 17 00:00:00 2001
From: Hudson Cooper <hncooper96@gmail.com>
Date: Fri, 21 Jun 2024 12:59:43 -0700
Subject: [PATCH 03/14] RoleBlock type

---
 guidance/library/_role.py | 12 ++++++++++--
 1 file changed, 10 insertions(+), 2 deletions(-)

diff --git a/guidance/library/_role.py b/guidance/library/_role.py
index 843ed904e..dea510deb 100644
--- a/guidance/library/_role.py
+++ b/guidance/library/_role.py
@@ -1,5 +1,5 @@
 from .._guidance import guidance
-from ._block import block
+from ._block import ContextBlock
 from ._set_attribute import set_attribute
 
 nodisp_start = "<||_#NODISP_||>"
@@ -7,6 +7,13 @@
 span_start = "<||_html:<span style='background-color: rgba(255, 180, 0, 0.3); border-radius: 3px;'>_||>"
 span_end = "<||_html:</span>_||>"
 
+
+class RoleBlock(ContextBlock):
+    def __init__(self, role_name, opener, closer, name=None):
+        super().__init__(opener, closer, name=name)
+        self.role_name = role_name
+
+
 @guidance
 def role_opener(lm, role_name, **kwargs):
     indent = getattr(lm, "indent_roles", True)
@@ -73,7 +80,8 @@ def role_closer(lm, role_name, **kwargs):
 # TODO HN: Add a docstring to better describe arbitrary role functions
 def role(role_name, text=None, **kwargs):
     if text is None:
-        return block(
+        return RoleBlock(
+            role_name=role_name,
             opener=role_opener(role_name, **kwargs),
             closer=role_closer(role_name, **kwargs),
         )

From 5d86bd128aa1aea395bb25663ae950efd102c4f9 Mon Sep 17 00:00:00 2001
From: Hudson Cooper <hncooper96@gmail.com>
Date: Fri, 21 Jun 2024 13:04:55 -0700
Subject: [PATCH 04/14] Role{Opener,Closer} Object types

---
 guidance/library/_role.py       | 39 +-----------------------
 guidance/models/_model.py       | 53 +++++++++++++++++++++++++++------
 guidance/models/_model_state.py | 40 +++++++++++++++++++++++++
 3 files changed, 85 insertions(+), 47 deletions(-)

diff --git a/guidance/library/_role.py b/guidance/library/_role.py
index dea510deb..692af78ec 100644
--- a/guidance/library/_role.py
+++ b/guidance/library/_role.py
@@ -16,19 +16,6 @@ def __init__(self, role_name, opener, closer, name=None):
 
 @guidance
 def role_opener(lm, role_name, **kwargs):
-    indent = getattr(lm, "indent_roles", True)
-
-
-    # Block start container (centers elements)
-    if indent:
-        lm += f"<||_html:<div style='display: flex; border-bottom: 1px solid rgba(127, 127, 127, 0.2);  justify-content: center; align-items: center;'><div style='flex: 0 0 80px; opacity: 0.5;'>{role_name.lower()}</div><div style='flex-grow: 1; padding: 5px; padding-top: 10px; padding-bottom: 10px; margin-top: 0px; white-space: pre-wrap; margin-bottom: 0px;'>_||>"
-
-    # Start of either debug or HTML no disp block
-    if indent:
-        lm += nodisp_start
-    else:
-        lm += span_start
-    
     # TODO [HN]: Temporary change while I instrument chat_template in transformers only.
     # Eventually have all models use chat_template.
     if hasattr(lm, "get_role_start"):
@@ -39,44 +26,20 @@ def role_opener(lm, role_name, **kwargs):
         raise Exception(
             f"You need to use a chat model in order the use role blocks like `with {role_name}():`! Perhaps you meant to use the {type(lm).__name__}Chat class?"
         )
-
-    # End of either debug or HTML no disp block
-    if indent:
-        lm += nodisp_end
-    else:
-        lm += span_end
-
     return lm
 
 
 @guidance
 def role_closer(lm, role_name, **kwargs):
-    indent = getattr(lm, "indent_roles", True)
-    # Start of either debug or HTML no disp block
-    if indent:
-        lm += nodisp_start
-    else:
-        lm += span_start
-
     # TODO [HN]: Temporary change while I instrument chat_template in transformers only.
     # Eventually have all models use chat_template.
     if hasattr(lm, "get_role_end"):
         lm += lm.get_role_end(role_name)
     elif hasattr(lm, "chat_template"):
         lm += lm.chat_template.get_role_end(role_name)
-
-    # End of either debug or HTML no disp block
-    if indent:
-        lm += nodisp_end
-    else:
-        lm += span_end
-
-    # End of top container
-    if indent:
-        lm += "<||_html:</div></div>_||>"
-
     return lm
 
+
 # TODO HN: Add a docstring to better describe arbitrary role functions
 def role(role_name, text=None, **kwargs):
     if text is None:
diff --git a/guidance/models/_model.py b/guidance/models/_model.py
index 4fdc9779a..1ea7d674e 100644
--- a/guidance/models/_model.py
+++ b/guidance/models/_model.py
@@ -39,7 +39,7 @@
     )
     from .. import _cpp as cpp
 
-from ._model_state import ModelState, Text, Object
+from ._model_state import ModelState, Text, Object, RoleOpener, RoleCloser
 from ._guidance_engine_metrics import GuidanceEngineMetrics
 from .._utils import softmax, CaptureEvents
 from .._parser import EarleyCommitParser, Parser
@@ -988,10 +988,23 @@ def _current_prompt(self) -> str:
 
     def __str__(self):
         """A string representation of the current model object (that includes context closers)."""
-        out = self._current_prompt()
+        # Import in function to guard against circular import
+        from ..library._role import RoleBlock
+        lm = self.copy()
         for context in reversed(self.opened_blocks):
-            out += format_pattern.sub("", self.opened_blocks[context][1])
-        return out
+            _, close_text = self.opened_blocks[context]
+            assert close_text is not None
+            if isinstance(context, RoleBlock):
+                lm._inplace_append(
+                    RoleCloser(
+                        role_name=context.role_name,
+                        text=close_text,
+                        indent=getattr(lm, "indent_roles", True)
+                    )
+                )
+            else:
+                lm += close_text
+        return str(lm._state)
 
     def __add__(self, value):
         """Adding is the primary mechanism for extending model state.
@@ -1001,6 +1014,8 @@ def __add__(self, value):
         value : guidance grammar
             The grammar used to extend the current model.
         """
+        # Import in function to guard against circular import
+        from ..library._role import RoleBlock
 
         # create the new lm object we will return
         # (we need to do this since Model objects are immutable)
@@ -1030,17 +1045,37 @@ def __add__(self, value):
             # close any newly closed contexts
             for (pos, close_text), context in old_blocks:
                 if context.name is not None:
-                    lm._variables[context.name] = format_pattern.sub(
-                        "", lm._state[pos:]
+                    # Capture
+                    lm._variables[context.name] = str(lm._state[pos:])
+                if isinstance(context, RoleBlock):
+                    lm._inplace_append(
+                        RoleCloser(
+                            role_name=context.role_name,
+                            text=close_text,
+                            indent=getattr(lm, "indent_roles", True)
+                        )
                     )
-                lm += context.closer
+                else:
+                    lm += close_text
 
             # apply any newly opened contexts (new from this object's perspective)
             for context in new_blocks:
-                lm += context.opener
+                if isinstance(context, RoleBlock):
+                    with grammar_only():
+                        tmp = lm + context.opener
+                    open_text = str(tmp._state[len(lm._state):])  # get the new state added by calling the opener
+                    lm._inplace_append(
+                        RoleOpener(
+                            role_name=context.role_name,
+                            text=open_text,
+                            indent=getattr(lm, "indent_roles", True)
+                        )
+                    )
+                else:
+                    lm += context.opener
                 with grammar_only():
                     tmp = lm + context.closer
-                close_text = tmp._state[len(lm._state):]  # get the new state added by calling the closer
+                close_text = str(tmp._state[len(lm._state):])  # get the new state added by calling the closer
                 lm.opened_blocks[context] = (len(lm._state), close_text)
 
                 # clear out names that we override
diff --git a/guidance/models/_model_state.py b/guidance/models/_model_state.py
index 075b975c4..3b35ea400 100644
--- a/guidance/models/_model_state.py
+++ b/guidance/models/_model_state.py
@@ -42,6 +42,46 @@ def _html(self) -> str:
         return f"""<img src="data:image/png;base64,'{base64.b64encode(self.data).decode()}'" style="max-width: 400px; vertical-align: middle; margin: 4px;">"""
 
 
+@dataclass
+class RoleOpener(Object):
+    role_name: str
+    text: str
+    indent: bool
+
+    def _html(self) -> str:  # HTML for a role opener: labelled flex container when indented, highlighted raw text otherwise
+        out = ""
+        if self.indent:
+            out += f"<div style='display: flex; border-bottom: 1px solid rgba(127, 127, 127, 0.2);  justify-content: center; align-items: center;'><div style='flex: 0 0 80px; opacity: 0.5;'>{html.escape(self.role_name.lower())}</div><div style='flex-grow: 1; padding: 5px; padding-top: 10px; padding-bottom: 10px; margin-top: 0px; white-space: pre-wrap; margin-bottom: 0px;'>"
+        else:
+            out += "<span style='background-color: rgba(255, 180, 0, 0.3); border-radius: 3px;'>"
+            out += html.escape(self.text)  # role text may contain '<' or '&'; escape so it is shown, not parsed as markup
+            out += "</span>"
+        return out
+
+    def __str__(self) -> str:
+        return self.text
+
+
+@dataclass()
+class RoleCloser(Object):
+    role_name: str
+    text: str
+    indent: bool
+
+    def _html(self) -> str:  # HTML for a role closer: closes the opener's two divs when indented, highlighted raw text otherwise
+        out = ""
+        if self.indent:
+            out += "</div></div>"
+        else:
+            out += "<span style='background-color: rgba(255, 180, 0, 0.3); border-radius: 3px;'>"
+            out += html.escape(self.text)  # role text may contain '<' or '&'; escape so it is shown, not parsed as markup
+            out += "</span>"
+        return out
+
+    def __str__(self) -> str:
+        return self.text
+
+
 class ModelState:
     def __init__(self) -> None:
         self.objects: list[Object] = []

From 423489c85c806620de74c68bd12466d9f5569fd9 Mon Sep 17 00:00:00 2001
From: Hudson Cooper <hncooper96@gmail.com>
Date: Fri, 21 Jun 2024 13:05:30 -0700
Subject: [PATCH 05/14] Fix _repr_html_

---
 guidance/models/_model.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/guidance/models/_model.py b/guidance/models/_model.py
index 1ea7d674e..f63c29229 100644
--- a/guidance/models/_model.py
+++ b/guidance/models/_model.py
@@ -980,7 +980,7 @@ def reset(self, clear_variables=True):
     def _repr_html_(self):
         if ipython_is_imported:
             clear_output(wait=True)
-        return self._html()
+        return self._state._html()
 
     def _current_prompt(self) -> str:
         """The current prompt in bytes (which is the state without the context close tags)."""

From 86b99042ae9329158a2aeea61300346eacdb3f91 Mon Sep 17 00:00:00 2001
From: Hudson Cooper <hncooper96@gmail.com>
Date: Fri, 21 Jun 2024 13:08:54 -0700
Subject: [PATCH 06/14] Be a bit more careful about close_text

---
 guidance/models/_model.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/guidance/models/_model.py b/guidance/models/_model.py
index f63c29229..26cdd3241 100644
--- a/guidance/models/_model.py
+++ b/guidance/models/_model.py
@@ -1031,7 +1031,7 @@ def __add__(self, value):
                     new_blocks.append(context)
 
                     # mark this so we don't re-add when computing the opener or closer (even though we don't know the close text yet)
-                    lm.opened_blocks[context] = (0, "")
+                    lm.opened_blocks[context] = (0, None)
 
             # find what old blocks need to be removed
             old_blocks = []
@@ -1044,6 +1044,7 @@ def __add__(self, value):
 
             # close any newly closed contexts
             for (pos, close_text), context in old_blocks:
+                assert close_text is not None
                 if context.name is not None:
                     # Capture
                     lm._variables[context.name] = str(lm._state[pos:])

From d88dfb2d091e521edd267bff7a7c54d39e1edcf5 Mon Sep 17 00:00:00 2001
From: Hudson Cooper <hncooper96@gmail.com>
Date: Fri, 21 Jun 2024 13:18:11 -0700
Subject: [PATCH 07/14] fix and simplify model.__str__ impl

---
 guidance/models/_model.py | 18 +++---------------
 1 file changed, 3 insertions(+), 15 deletions(-)

diff --git a/guidance/models/_model.py b/guidance/models/_model.py
index 26cdd3241..b3ea55b29 100644
--- a/guidance/models/_model.py
+++ b/guidance/models/_model.py
@@ -988,23 +988,11 @@ def _current_prompt(self) -> str:
 
     def __str__(self):
         """A string representation of the current model object (that includes context closers)."""
-        # Import in function to guard against circular import
-        from ..library._role import RoleBlock
-        lm = self.copy()
+        out = str(self._state)
         for context in reversed(self.opened_blocks):
             _, close_text = self.opened_blocks[context]
-            assert close_text is not None
-            if isinstance(context, RoleBlock):
-                lm._inplace_append(
-                    RoleCloser(
-                        role_name=context.role_name,
-                        text=close_text,
-                        indent=getattr(lm, "indent_roles", True)
-                    )
-                )
-            else:
-                lm += close_text
-        return str(lm._state)
+            out += close_text
+        return out
 
     def __add__(self, value):
         """Adding is the primary mechanism for extending model state.

From 6b13846c19d2f2a5aea7f69d9de9071cfcc58009 Mon Sep 17 00:00:00 2001
From: Hudson Cooper <hncooper96@gmail.com>
Date: Fri, 21 Jun 2024 13:18:31 -0700
Subject: [PATCH 08/14] Kill unnecessary tag strings

---
 guidance/library/_role.py | 5 -----
 1 file changed, 5 deletions(-)

diff --git a/guidance/library/_role.py b/guidance/library/_role.py
index 692af78ec..737d86a56 100644
--- a/guidance/library/_role.py
+++ b/guidance/library/_role.py
@@ -2,11 +2,6 @@
 from ._block import ContextBlock
 from ._set_attribute import set_attribute
 
-nodisp_start = "<||_#NODISP_||>"
-nodisp_end = "<||_/NODISP_||>"
-span_start = "<||_html:<span style='background-color: rgba(255, 180, 0, 0.3); border-radius: 3px;'>_||>"
-span_end = "<||_html:</span>_||>"
-
 
 class RoleBlock(ContextBlock):
     def __init__(self, role_name, opener, closer, name=None):

From 8d510924f9f07aa20bbe361d291502c9000d662a Mon Sep 17 00:00:00 2001
From: Hudson Cooper <hncooper96@gmail.com>
Date: Fri, 21 Jun 2024 13:18:51 -0700
Subject: [PATCH 09/14] No more format_pattern

---
 guidance/models/_model.py | 8 +++-----
 1 file changed, 3 insertions(+), 5 deletions(-)

diff --git a/guidance/models/_model.py b/guidance/models/_model.py
index b3ea55b29..4b36435b4 100644
--- a/guidance/models/_model.py
+++ b/guidance/models/_model.py
@@ -64,7 +64,6 @@
 
 # define some constants we will reuse many times
 _null_grammar = string("")
-format_pattern = re.compile(r"<\|\|_.*?_\|\|>", flags=re.DOTALL)
 nodisp_pattern = re.compile(
     r"&lt;\|\|_#NODISP_\|\|&gt;.*?&lt;\|\|_/NODISP_\|\|&gt;", flags=re.DOTALL
 )
@@ -877,7 +876,7 @@ def active_role_end(self):
         # add any active non-empty role ends. Ignore role ends that are spaces
         parts = []
         for _, role_end_str in self.opened_blocks.values():
-            role_end_str = format_pattern.sub("", role_end_str)
+            role_end_str = role_end_str
             if len(role_end_str) > 0 and not re.fullmatch(r"\s+", role_end_str):
                 parts.append(role_end_str)
 
@@ -1156,9 +1155,8 @@ def __getitem__(self, key):
         else:
             for context in list(reversed(self.opened_blocks)):
                 if context.name == key:
-                    return format_pattern.sub(
-                        "", self._state[self.opened_blocks[context][0] :]
-                    )
+                    pos, _ = self.opened_blocks[context]
+                    return str(self._state[pos:])
 
         raise KeyError(f"Model does not contain the variable '{key}'")
 

From 88b4a9c2b5c103682598df934cca0f9b3456fa5d Mon Sep 17 00:00:00 2001
From: Hudson Cooper <hncooper96@gmail.com>
Date: Fri, 21 Jun 2024 13:27:36 -0700
Subject: [PATCH 10/14] Remove old patterns

---
 guidance/models/_model.py | 7 -------
 1 file changed, 7 deletions(-)

diff --git a/guidance/models/_model.py b/guidance/models/_model.py
index 4b36435b4..366403987 100644
--- a/guidance/models/_model.py
+++ b/guidance/models/_model.py
@@ -64,13 +64,6 @@
 
 # define some constants we will reuse many times
 _null_grammar = string("")
-nodisp_pattern = re.compile(
-    r"&lt;\|\|_#NODISP_\|\|&gt;.*?&lt;\|\|_/NODISP_\|\|&gt;", flags=re.DOTALL
-)
-html_pattern = re.compile(r"&lt;\|\|_html:(.*?)_\|\|&gt;", flags=re.DOTALL)
-image_pattern = re.compile(r"&lt;\|_image:(.*?)\|&gt;")
-
-
 
 
 class EngineCallResponse:

From 55b91620140d72a0a16797229a23be735de36128 Mon Sep 17 00:00:00 2001
From: Hudson Cooper <hncooper96@gmail.com>
Date: Fri, 21 Jun 2024 13:37:11 -0700
Subject: [PATCH 11/14] immutability and slots

---
 guidance/models/_model_state.py | 12 +++++++-----
 1 file changed, 7 insertions(+), 5 deletions(-)

diff --git a/guidance/models/_model_state.py b/guidance/models/_model_state.py
index 3b35ea400..72cd02940 100644
--- a/guidance/models/_model_state.py
+++ b/guidance/models/_model_state.py
@@ -5,7 +5,7 @@
 import html
 
 
-@dataclass
+@dataclass(frozen=True, slots=True)
 class Object:
     def _html(self) -> str:
         raise NotImplementedError
@@ -14,7 +14,7 @@ def __str__(self) -> str:
         raise NotImplementedError
 
 
-@dataclass
+@dataclass(frozen=True, slots=True)
 class Text(Object):
     text: str
     probability: Optional[float] = None
@@ -30,7 +30,7 @@ def _html(self) -> str:
         return escaped_text
 
 
-@dataclass
+@dataclass(frozen=True, slots=True)
 class Image(Object):
     id: str
     data: bytes
@@ -42,7 +42,7 @@ def _html(self) -> str:
         return f"""<img src="data:image/png;base64,'{base64.b64encode(self.data).decode()}'" style="max-width: 400px; vertical-align: middle; margin: 4px;">"""
 
 
-@dataclass
+@dataclass(frozen=True, slots=True)
 class RoleOpener(Object):
     role_name: str
     text: str
@@ -62,7 +62,7 @@ def __str__(self) -> str:
         return self.text
 
 
-@dataclass()
+@dataclass(frozen=True, slots=True)
 class RoleCloser(Object):
     role_name: str
     text: str
@@ -83,6 +83,8 @@ def __str__(self) -> str:
 
 
 class ModelState:
+    __slots__ = ["objects"]
+
     def __init__(self) -> None:
         self.objects: list[Object] = []
 

From b9fb115e2ffeaaa06e8c372f71324190782d8386 Mon Sep 17 00:00:00 2001
From: Hudson Cooper <hncooper96@gmail.com>
Date: Tue, 25 Jun 2024 12:31:18 -0700
Subject: [PATCH 12/14] Object-typed closers

---
 guidance/models/_model.py | 38 +++++++++++++++++++++-----------------
 1 file changed, 21 insertions(+), 17 deletions(-)

diff --git a/guidance/models/_model.py b/guidance/models/_model.py
index 366403987..c8ddeb59b 100644
--- a/guidance/models/_model.py
+++ b/guidance/models/_model.py
@@ -11,7 +11,7 @@
 
 
 from pprint import pprint
-from typing import Dict, TYPE_CHECKING
+from typing import Dict, Optional, TYPE_CHECKING
 
 
 import numpy as np
@@ -844,7 +844,7 @@ def __init__(self, engine, echo=True, **kwargs):
         self.echo = echo
         self.token_count = 0  # tracks how many tokens our byte state represents
         self.max_display_rate = 0.2  # this controls how frequently we are allowed to redraw the display (in seconds)
-        self.opened_blocks = {}  # what context blocks have been opened but not closed
+        self.opened_blocks: dict["ContextBlock", tuple[int, Optional[Object]]] = {}  # open (not yet closed) context blocks -> (state position at open, closer Object or None while it is still being computed)
         # self.compute_log_probs = compute_log_probs
 
         # private attributes
@@ -982,8 +982,9 @@ def __str__(self):
         """A string representation of the current model object (that includes context closers)."""
         out = str(self._state)
         for context in reversed(self.opened_blocks):
-            _, close_text = self.opened_blocks[context]
-            out += close_text
+            _, closer = self.opened_blocks[context]
+            if closer is not None:
+                out += str(closer)
         return out
 
     def __add__(self, value):
@@ -1023,28 +1024,22 @@ def __add__(self, value):
                     del lm.opened_blocks[context]
 
             # close any newly closed contexts
-            for (pos, close_text), context in old_blocks:
-                assert close_text is not None
+            for (pos, closer), context in old_blocks:
+                assert closer is not None
                 if context.name is not None:
                     # Capture
                     lm._variables[context.name] = str(lm._state[pos:])
-                if isinstance(context, RoleBlock):
-                    lm._inplace_append(
-                        RoleCloser(
-                            role_name=context.role_name,
-                            text=close_text,
-                            indent=getattr(lm, "indent_roles", True)
-                        )
-                    )
-                else:
-                    lm += close_text
+                lm._inplace_append(closer)
 
             # apply any newly opened contexts (new from this object's perspective)
             for context in new_blocks:
                 if isinstance(context, RoleBlock):
+                    # Apply the opener (a grammar)
                     with grammar_only():
+                        # TODO: be careful about the temp lm's display? (e.g. with silent())
                         tmp = lm + context.opener
                     open_text = str(tmp._state[len(lm._state):])  # get the new state added by calling the opener
+                    # Add that new state as text in a RoleOpener
                     lm._inplace_append(
                         RoleOpener(
                             role_name=context.role_name,
@@ -1055,9 +1050,18 @@ def __add__(self, value):
                 else:
                     lm += context.opener
                 with grammar_only():
+                    # TODO: be careful about the temp lm's display? (e.g. with silent())
                     tmp = lm + context.closer
                 close_text = str(tmp._state[len(lm._state):])  # get the new state added by calling the closer
-                lm.opened_blocks[context] = (len(lm._state), close_text)
+                if isinstance(context, RoleBlock):
+                    closer = RoleCloser(
+                        role_name=context.role_name,
+                        text=close_text,
+                        indent=getattr(lm, "indent_roles", True)
+                    )
+                else:
+                    closer = Text(text=close_text)
+                lm.opened_blocks[context] = (len(lm._state), closer)
 
                 # clear out names that we override
                 if context.name is not None:

From 7ab695b3285a38d38f3677dc2605bba4fead744c Mon Sep 17 00:00:00 2001
From: Hudson Cooper <hncooper96@gmail.com>
Date: Tue, 25 Jun 2024 12:31:34 -0700
Subject: [PATCH 13/14] Use closers in html

---
 guidance/models/_model.py | 12 ++++++++++--
 1 file changed, 10 insertions(+), 2 deletions(-)

diff --git a/guidance/models/_model.py b/guidance/models/_model.py
index c8ddeb59b..8a5b41340 100644
--- a/guidance/models/_model.py
+++ b/guidance/models/_model.py
@@ -951,7 +951,7 @@ def _update_display(self, throttle=True):
 
             if ipython_is_imported:
                 clear_output(wait=True)
-                display(HTML(self._state._html()))
+                display(HTML(self._html()))
             else:
                 pprint(self._state)
 
@@ -969,10 +969,18 @@ def reset(self, clear_variables=True):
             self._variables_log_probs = {}
         return self
 
+    def _html(self):
+        out = self._state._html()
+        for context in reversed(self.opened_blocks):
+            _, closer = self.opened_blocks[context]
+            if closer is not None:
+                out += closer._html()
+        return out
+
     def _repr_html_(self):
         if ipython_is_imported:
             clear_output(wait=True)
-        return self._state._html()
+        return self._html()
 
     def _current_prompt(self) -> str:
         """The current prompt in bytes (which is the state without the context close tags)."""

From c6af474b1208bf4de985752a4dc84044b64d0793 Mon Sep 17 00:00:00 2001
From: Hudson Cooper <hncooper96@gmail.com>
Date: Tue, 25 Jun 2024 14:15:20 -0700
Subject: [PATCH 14/14] Remove active_role_end

The existing implementation didn't pop the selected role off the
opened_blocks dict, so a role could be closed twice. Fixing that would
need a stateful implementation that can modify the Model object more
directly, so remove it for now.
---
 guidance/_grammar.py      |  4 ----
 guidance/library/_gen.py  |  4 ++--
 guidance/models/_model.py | 17 -----------------
 3 files changed, 2 insertions(+), 23 deletions(-)

diff --git a/guidance/_grammar.py b/guidance/_grammar.py
index 7500b54a3..8b63df031 100644
--- a/guidance/_grammar.py
+++ b/guidance/_grammar.py
@@ -966,10 +966,6 @@ def _re_with_temperature(grammar, temperature, visited_set):
 #     return ModelVariable(name)
 
 
-def active_role_end() -> ModelVariable:
-    return ModelVariable("active_role_end")
-
-
 def eos_token() -> ModelVariable:
     return ModelVariable("eos_token")
 
diff --git a/guidance/library/_gen.py b/guidance/library/_gen.py
index 71b969e8c..775843103 100644
--- a/guidance/library/_gen.py
+++ b/guidance/library/_gen.py
@@ -8,7 +8,7 @@
 from ._any_char import any_char
 from .._grammar import capture
 from ._regex import regex as regex_grammar
-from .._grammar import token_limit, eos_token, active_role_end, with_temperature
+from .._grammar import token_limit, eos_token, with_temperature
 from ._tool import Tool
 from ._block import block
 
@@ -129,7 +129,7 @@ def gen(
         if isinstance(stop, str):
             stop = [stop]
         if regex is None:
-            stop = stop + [select([eos_token(), active_role_end()])]
+            stop = stop + [eos_token()]
 
         if stop_regex is None:
             stop_regex = []
diff --git a/guidance/models/_model.py b/guidance/models/_model.py
index 8a5b41340..bbe44adb2 100644
--- a/guidance/models/_model.py
+++ b/guidance/models/_model.py
@@ -857,23 +857,6 @@ def __init__(self, engine, echo=True, **kwargs):
         self._last_display = 0  # used to track the last display call to enable throttling
         self._last_event_stream = 0  # used to track the last event streaming call to enable throttling
 
-    @property
-    def active_role_end(self):
-        """The default end patterns we should use for `gen` calls.
-        TODO: move this logic into the gen call...we can do with if we allow model_variables to run functions.
-
-        These patterns are computed dynamically by the model object because they can depend on
-        what the current open roles are, which is something
-        """
-
-        # add any active non-empty role ends. Ignore role ends that are spaces
-        parts = []
-        for _, role_end_str in self.opened_blocks.values():
-            role_end_str = role_end_str
-            if len(role_end_str) > 0 and not re.fullmatch(r"\s+", role_end_str):
-                parts.append(role_end_str)
-
-        return select(parts)
 
     def _send_to_event_queue(self, value):
         """For streaming in code.