From d00ac3de4947868ecb00f8a0c7652ccdacb493d8 Mon Sep 17 00:00:00 2001
From: Jordan Wu <101218661+jordan-definitive@users.noreply.github.com>
Date: Tue, 5 Aug 2025 14:52:12 -0700
Subject: [PATCH 01/16] fix: make `HarmonyEncoding` usable concurrently

the `conversation_has_function_tools` atomic bool makes `HarmonyEncoding` stateful
---
 python/openai_harmony/__init__.py | 19 ++++++-
 src/encoding.rs                   | 91 ++++++++++++++++++++++---------
 src/py_module.rs                  | 20 ++++++-
 src/registry.rs                   |  3 +-
 src/tests.rs                      |  2 +-
 src/wasm_module.rs                | 29 +++++++++-
 6 files changed, 130 insertions(+), 34 deletions(-)
diff --git a/python/openai_harmony/__init__.py b/python/openai_harmony/__init__.py
index 3485864..13b5fdd 100644
--- a/python/openai_harmony/__init__.py
+++ b/python/openai_harmony/__init__.py
@@ -425,6 +425,10 @@ class RenderConversationConfig(BaseModel):
     auto_drop_analysis: bool = True
 
 
+class RenderOptions(BaseModel):
+    conversation_has_function_tools: bool = False
+
+
 class HarmonyEncoding:
     """High-level wrapper around the Rust ``PyHarmonyEncoding`` class."""
 
@@ -498,9 +502,20 @@ class HarmonyEncoding:
             config=config_dict,
         )
 
-    def render(self, message: Message) -> List[int]:
+    def render(
+        self, message: Message, render_options: Optional[RenderOptions] = None
+    ) -> List[int]:
         """Render a single message into tokens."""
-        return self._inner.render(message_json=message.to_json())
+        if render_options is None:
+            render_options_dict = {"conversation_has_function_tools": False}
+        else:
+            render_options_dict = {
+                "conversation_has_function_tools": render_options.conversation_has_function_tools
+            }
+
+        return self._inner.render(
+            message_json=message.to_json(), render_options=render_options_dict
+        )
 
     # -- Parsing -------------------------------------------------------
 
diff --git a/src/encoding.rs b/src/encoding.rs
index c58e8b8..afe1fce 100644
--- a/src/encoding.rs
+++ b/src/encoding.rs
@@ -5,10 +5,7 @@ use crate::{
 use anyhow::Context as _;
 use std::{
     collections::{HashMap, HashSet},
-    sync::{
-        atomic::{AtomicBool, Ordering},
-        Arc,
-    },
+    sync::Arc,
     vec,
 };
 
@@ -92,7 +89,6 @@ pub struct HarmonyEncoding {
     pub(crate) format_token_mapping: HashMap<FormattingToken, String>,
     pub(crate) stop_formatting_tokens: HashSet<FormattingToken>,
     pub(crate) stop_formatting_tokens_for_assistant_actions: HashSet<FormattingToken>,
-    pub(crate) conversation_has_function_tools: Arc<AtomicBool>,
 }
 
 impl std::fmt::Debug for HarmonyEncoding {
@@ -191,8 +187,9 @@ impl HarmonyEncoding {
                 }
             })
         });
-        self.conversation_has_function_tools
-            .store(has_function_tools, Ordering::Relaxed);
+        let render_options = RenderOptions {
+            conversation_has_function_tools: has_function_tools,
+        };
         let last_assistant_is_final = messages
             .iter()
             .rev()
@@ -217,9 +214,7 @@ impl HarmonyEncoding {
                     && first_final_idx.is_some_and(|first| *idx < first)
                     && msg.channel.as_deref() == Some("analysis"))
             })
-            .try_for_each(|(_, msg)| self.render_into(msg, into));
-        self.conversation_has_function_tools
-            .store(false, Ordering::Relaxed);
+            .try_for_each(|(_, msg)| self.render_into(msg, into, Some(&render_options)));
         result?;
         Ok(())
     }
@@ -305,18 +300,27 @@ impl HarmonyEncoding {
     }
 
     /// Render a single message into tokens.
-    pub fn render(&self, message: &Message) -> anyhow::Result<Vec<Rank>> {
+    pub fn render(
+        &self,
+        message: &Message,
+        render_options: Option<&RenderOptions>,
+    ) -> anyhow::Result<Vec<Rank>> {
         let mut out = vec![];
-        Render::<Message>::render(self, message, &mut out)?;
+        Render::<Message>::render(self, message, &mut out, render_options)?;
         Ok(out)
     }
 
     /// Render a single message into the provided buffer.
-    pub fn render_into<B>(&self, message: &Message, into: &mut B) -> anyhow::Result<()>
+    pub fn render_into<B>(
+        &self,
+        message: &Message,
+        into: &mut B,
+        render_options: Option<&RenderOptions>,
+    ) -> anyhow::Result<()>
     where
         B: Extend<Rank>,
     {
-        Render::<Message>::render(self, message, into)
+        Render::<Message>::render(self, message, into, render_options)
     }
 }
 
@@ -772,14 +776,29 @@ impl HarmonyEncoding {
     }
 }
 
+#[derive(Clone, Copy, Debug, Default)]
+pub struct RenderOptions {
+    pub conversation_has_function_tools: bool,
+}
+
 trait Render<T: ?Sized> {
-    fn render<B>(&self, item: &T, into: &mut B) -> anyhow::Result<()>
+    fn render<B>(
+        &self,
+        item: &T,
+        into: &mut B,
+        render_options: Option<&RenderOptions>,
+    ) -> anyhow::Result<()>
     where
         B: Extend<Rank>;
 }
 
 impl Render<Message> for HarmonyEncoding {
-    fn render<B>(&self, message: &Message, into: &mut B) -> anyhow::Result<()>
+    fn render<B>(
+        &self,
+        message: &Message,
+        into: &mut B,
+        render_options: Option<&RenderOptions>,
+    ) -> anyhow::Result<()>
     where
         B: Extend<Rank>,
     {
@@ -836,7 +855,7 @@ impl Render<Message> for HarmonyEncoding {
                     message.author.role
                 );
             }
-            Render::<Content>::render(self, content, into)?;
+            Render::<Content>::render(self, content, into, render_options)?;
         }
 
         // If there is a tool call we should render a tool call token
@@ -851,15 +870,22 @@ impl Render<Message> for HarmonyEncoding {
 
 // Dispatch Content variants to their specific Render implementations
 impl Render<Content> for HarmonyEncoding {
-    fn render<B>(&self, content: &Content, into: &mut B) -> anyhow::Result<()>
+    fn render<B>(
+        &self,
+        content: &Content,
+        into: &mut B,
+        render_options: Option<&RenderOptions>,
+    ) -> anyhow::Result<()>
     where
         B: Extend<Rank>,
     {
         match content {
-            Content::Text(text) => Render::<TextContent>::render(self, text, into),
-            Content::SystemContent(sys) => Render::<SystemContent>::render(self, sys, into),
+            Content::Text(text) => Render::<TextContent>::render(self, text, into, render_options),
+            Content::SystemContent(sys) => {
+                Render::<SystemContent>::render(self, sys, into, render_options)
+            }
             Content::DeveloperContent(dev) => {
-                Render::<crate::chat::DeveloperContent>::render(self, dev, into)
+                Render::<crate::chat::DeveloperContent>::render(self, dev, into, render_options)
             }
         }
     }
@@ -867,7 +893,12 @@ impl Render<Content> for HarmonyEncoding {
 
 // Render plain text content
 impl Render<TextContent> for HarmonyEncoding {
-    fn render<B>(&self, text: &TextContent, into: &mut B) -> anyhow::Result<()>
+    fn render<B>(
+        &self,
+        text: &TextContent,
+        into: &mut B,
+        _render_options: Option<&RenderOptions>,
+    ) -> anyhow::Result<()>
     where
         B: Extend<Rank>,
     {
@@ -877,7 +908,12 @@ impl Render<TextContent> for HarmonyEncoding {
 
 // Render system-specific content (model identity, instructions, effort)
 impl Render<SystemContent> for HarmonyEncoding {
-    fn render<B>(&self, sys: &SystemContent, into: &mut B) -> anyhow::Result<()>
+    fn render<B>(
+        &self,
+        sys: &SystemContent,
+        into: &mut B,
+        render_options: Option<&RenderOptions>,
+    ) -> anyhow::Result<()>
     where
         B: Extend<Rank>,
     {
@@ -923,7 +959,7 @@ impl Render<SystemContent> for HarmonyEncoding {
                 if channel_config.channel_required {
                     channels_header.push_str(" Channel must be included for every message.");
                 }
-                if self.conversation_has_function_tools.load(Ordering::Relaxed) {
+                if render_options.is_some_and(|o| o.conversation_has_function_tools) {
                     channels_header.push('\n');
                     channels_header.push_str(
                         "Calls to these tools must go to the commentary channel: 'functions'.",
@@ -940,7 +976,12 @@ impl Render<SystemContent> for HarmonyEncoding {
 
 // Render developer-specific content (instructions, tools)
 impl Render<crate::chat::DeveloperContent> for HarmonyEncoding {
-    fn render<B>(&self, dev: &crate::chat::DeveloperContent, into: &mut B) -> anyhow::Result<()>
+    fn render<B>(
+        &self,
+        dev: &crate::chat::DeveloperContent,
+        into: &mut B,
+        _render_options: Option<&RenderOptions>,
+    ) -> anyhow::Result<()>
     where
         B: Extend<Rank>,
     {
diff --git a/src/py_module.rs b/src/py_module.rs
index e7bb9e5..c5c7b0a 100644
--- a/src/py_module.rs
+++ b/src/py_module.rs
@@ -178,13 +178,29 @@ impl PyHarmonyEncoding {
     }
 
     /// Render a single message into tokens.
-    fn render(&self, message_json: &str) -> PyResult<Vec<u32>> {
+    fn render(
+        &self,
+        message_json: &str,
+        render_options: Option<Bound<'_, PyDict>>,
+    ) -> PyResult<Vec<u32>> {
         let message: crate::chat::Message = serde_json::from_str(message_json).map_err(|e| {
             PyErr::new::<pyo3::exceptions::PyValueError, _>(format!("invalid message JSON: {e}"))
         })?;
 
+        let rust_options = if let Some(options_dict) = render_options {
+            let conversation_has_function_tools = options_dict
+                .get_item("conversation_has_function_tools")?
+                .and_then(|v| v.extract().ok())
+                .unwrap_or(false);
+            Some(crate::encoding::RenderOptions {
+                conversation_has_function_tools,
+            })
+        } else {
+            None
+        };
+
         self.inner
-            .render(&message)
+            .render(&message, rust_options.as_ref())
             .map_err(|e| PyErr::new::<pyo3::exceptions::PyRuntimeError, _>(e.to_string()))
     }
 
diff --git a/src/registry.rs b/src/registry.rs
index 6d8a98f..d1ffd2e 100644
--- a/src/registry.rs
+++ b/src/registry.rs
@@ -1,6 +1,6 @@
 use std::{
     collections::{HashMap, HashSet},
-    sync::{atomic::AtomicBool, Arc},
+    sync::Arc,
 };
 
 use crate::{
@@ -76,7 +76,6 @@ pub fn load_harmony_encoding(name: HarmonyEncodingName) -> anyhow::Result<Harmon
                     FormattingToken::EndMessageDoneSampling,
                     FormattingToken::EndMessageAssistantToTool,
                 ]),
-                conversation_has_function_tools: Arc::new(AtomicBool::new(false)),
             })
         }
     }
diff --git a/src/tests.rs b/src/tests.rs
index d6b8504..d072d73 100644
--- a/src/tests.rs
+++ b/src/tests.rs
@@ -525,7 +525,7 @@ fn test_render_and_render_conversation_roundtrip() {
     let encoding = load_harmony_encoding(HarmonyEncodingName::HarmonyGptOss).unwrap();
     let msg = Message::from_role_and_content(Role::User, "Hello");
     let convo = Conversation::from_messages([msg.clone()]);
-    let tokens_msg = encoding.render(&msg).unwrap();
+    let tokens_msg = encoding.render(&msg, None).unwrap();
     let tokens_convo = encoding.render_conversation(&convo, None).unwrap();
     assert_eq!(tokens_msg, tokens_convo);
     let tokens_completion = encoding
diff --git a/src/wasm_module.rs b/src/wasm_module.rs
index b1c4490..1b96a4f 100644
--- a/src/wasm_module.rs
+++ b/src/wasm_module.rs
@@ -18,6 +18,9 @@ extern "C" {
 
     #[wasm_bindgen(typescript_type = "RenderConversationConfig")]
     pub type JsRenderConversationConfig;
+
+    #[wasm_bindgen(typescript_type = "RenderOptions")]
+    pub type JsRenderOptions;
 }
 
 #[wasm_bindgen(typescript_custom_section)]
@@ -127,12 +130,34 @@ impl JsHarmonyEncoding {
     }
 
     #[wasm_bindgen]
-    pub fn render(&self, message: JsMessage) -> Result<Vec<u32>, JsValue> {
+    pub fn render(
+        &self,
+        message: JsMessage,
+        render_options: JsRenderOptions,
+    ) -> Result<Vec<u32>, JsValue> {
         let message: JsValue = message.into();
         let message: crate::chat::Message = serde_wasm_bindgen::from_value(message)
             .map_err(|e| JsValue::from_str(&format!("invalid message JSON: {e}")))?;
+
+        #[derive(Deserialize)]
+        struct RenderOptions {
+            conversation_has_function_tools: Option<bool>,
+        }
+        let render_options: JsValue = render_options.into();
+        let rust_options = if render_options.is_undefined() || render_options.is_null() {
+            None
+        } else {
+            let cfg: RenderOptions = serde_wasm_bindgen::from_value(render_options)
+                .map_err(|e| JsValue::from_str(&format!("invalid render options: {e}")))?;
+            Some(crate::encoding::RenderOptions {
+                conversation_has_function_tools: cfg
+                    .conversation_has_function_tools
+                    .unwrap_or(false),
+            })
+        };
+
         self.inner
-            .render(&message)
+            .render(&message, rust_options.as_ref())
             .map_err(|e| JsValue::from_str(&e.to_string()))
     }
 

From 9528c7b4a00a3307fd9685fc1328aee11c3d9c90 Mon Sep 17 00:00:00 2001
From: Scott Lessans <scl@openai.com>
Date: Tue, 5 Aug 2025 17:13:26 -0700
Subject: [PATCH 02/16] version bump

---
 Cargo.lock | 2 +-
 Cargo.toml | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/Cargo.lock b/Cargo.lock
index 6b774e8..ce97b77 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -1317,7 +1317,7 @@ checksum = "42f5e15c9953c5e4ccceeb2e7382a716482c34515315f7b03532b8b4e8393d2d"
 
 [[package]]
 name = "openai-harmony"
-version = "0.0.2"
+version = "0.0.3"
 dependencies = [
  "anyhow",
  "base64",
diff --git a/Cargo.toml b/Cargo.toml
index 12ebc27..25d070c 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "openai-harmony"
-version = "0.0.2"
+version = "0.0.3"
 edition = "2021"
 license = "Apache-2.0"
 repository = "https://github.com/openai/harmony"

From 1eb285b8745c574c7ecc6f880f452dae1fc194c8 Mon Sep 17 00:00:00 2001
From: dkqjrm <dkqjrm@naver.com>
Date: Wed, 6 Aug 2025 09:31:41 +0900
Subject: [PATCH 03/16] fix: correct typo in docs/format.md

Fix duplicate text in safety warning where 'You should We recommend' should be just 'We recommend'.
---
 docs/format.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/docs/format.md b/docs/format.md
index a03aae8..7ec0113 100644
--- a/docs/format.md
+++ b/docs/format.md
@@ -305,7 +305,7 @@ And the actual answer is:
 ```
 
 **Important:**  
-The model has not been trained to the same safety standards in the chain-of-thought as it has for final output. You should We recommend not to show the chain-of-thought to your users as they might contain harmful content. [Learn more in the model card](https://openai.com/index/gpt-oss-model-card/).
+The model has not been trained to the same safety standards in the chain-of-thought as it has for final output. We recommend not showing the chain-of-thought to your users, as it might contain harmful content. [Learn more in the model card](https://openai.com/index/gpt-oss-model-card/).
 
 #### Handling reasoning output in subsequent sampling
 

From a01b5e66ffa471528f28f6133b5c5b804381202c Mon Sep 17 00:00:00 2001
From: axion66 <ssongjinseob@gmail.com>
Date: Tue, 5 Aug 2025 22:05:51 -0400
Subject: [PATCH 04/16] docs: improve repo layout and checks

---
 README.md     | 2 +-
 run_checks.sh | 3 ++-
 2 files changed, 3 insertions(+), 2 deletions(-)

diff --git a/README.md b/README.md
index d9c5f13..5b460ca 100644
--- a/README.md
+++ b/README.md
@@ -149,7 +149,7 @@ through thin [`pyo3`](https://pyo3.rs/) bindings.
 │   ├── tests.rs          # Canonical Rust test-suite
 │   └── py_module.rs      # PyO3 bindings ⇒ compiled as openai_harmony.*.so
 │
-├── harmony/              # Pure-Python wrapper around the binding
+├── python/openai_harmony/ # Pure-Python wrapper around the binding
 │   └── __init__.py       # Dataclasses + helper API mirroring chat.rs
 │
 ├── tests/                # Python test-suite (1-to-1 port of tests.rs)
diff --git a/run_checks.sh b/run_checks.sh
index 2b9d439..c945094 100755
--- a/run_checks.sh
+++ b/run_checks.sh
@@ -5,4 +5,5 @@ set -e
 cargo fmt --check
 cargo clippy --all-targets --all-features -- -D warnings
 cargo test --all-targets --all-features
-
+mypy python/openai_harmony
+ruff check .

From 85e43ea7f821a78ac56ed4e35955b25b2217fb69 Mon Sep 17 00:00:00 2001
From: axion66 <ssongjinseob@gmail.com>
Date: Tue, 5 Aug 2025 22:07:51 -0400
Subject: [PATCH 05/16] dep

---
 run_checks.sh | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/run_checks.sh b/run_checks.sh
index c945094..2b9d439 100755
--- a/run_checks.sh
+++ b/run_checks.sh
@@ -5,5 +5,4 @@ set -e
 cargo fmt --check
 cargo clippy --all-targets --all-features -- -D warnings
 cargo test --all-targets --all-features
-mypy python/openai_harmony
-ruff check .
+

From 0c9c61c35cc21962a10666bcfe941045fcc0b2e4 Mon Sep 17 00:00:00 2001
From: Yuan-Man <68322456+Yuan-ManX@users.noreply.github.com>
Date: Wed, 6 Aug 2025 10:28:12 +0800
Subject: [PATCH 06/16] Update harmony format

---
 README.md | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/README.md b/README.md
index d9c5f13..d9672e2 100644
--- a/README.md
+++ b/README.md
@@ -20,7 +20,9 @@ Current date: 2025-06-28
 Reasoning: high
 
 # Valid channels: analysis, commentary, final. Channel must be included for every message.
-Calls to these tools must go to the commentary channel: 'functions'.<|end|><|start|>developer<|message|># Instructions
+Calls to these tools must go to the commentary channel: 'functions'.<|end|>
+
+<|start|>developer<|message|># Instructions
 
 Always respond in riddles
 

From c0f2f407e0f1693916b280b03413131bb61ac5ee Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Marvin=20Gie=C3=9Fing?= <marvin.giessing@gmail.com>
Date: Wed, 6 Aug 2025 09:13:19 +0200
Subject: [PATCH 07/16] Enable PowerPC arch

---
 .github/workflows/CI.yml | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/.github/workflows/CI.yml b/.github/workflows/CI.yml
index 45b5516..4fcb76f 100644
--- a/.github/workflows/CI.yml
+++ b/.github/workflows/CI.yml
@@ -48,6 +48,8 @@ jobs:
             target: aarch64
           - runner: ubuntu-22.04
             target: armv7
+          - runner: ubuntu-22.04
+            target: ppc64le
     steps:
       - uses: actions/checkout@v4
       - uses: actions/setup-python@v5

From bd5ed13085bb82bd35c8f98ca5d6d12c4c5e99d7 Mon Sep 17 00:00:00 2001
From: Simon Willison <swillison@gmail.com>
Date: Fri, 8 Aug 2025 04:58:53 -0700
Subject: [PATCH 08/16] Add 'DeveloperContent' to __all__

For better import *
---
 python/openai_harmony/__init__.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/python/openai_harmony/__init__.py b/python/openai_harmony/__init__.py
index 13b5fdd..33afbd7 100644
--- a/python/openai_harmony/__init__.py
+++ b/python/openai_harmony/__init__.py
@@ -708,6 +708,7 @@ __all__ = [
     "Author",
     "Content",
     "TextContent",
+    "DeveloperContent",
     "ToolDescription",
     "SystemContent",
     "Message",

From 8a4645f0f9d9c20a8ecd3381dbb88ce5f56084cc Mon Sep 17 00:00:00 2001
From: Dmytro Dzhulgakov <dzhulgakov@users.noreply.github.com>
Date: Fri, 8 Aug 2025 17:50:17 -0700
Subject: [PATCH 09/16] Fix tokenization of <|constrain|> content type in
 rendering (#47)

---
 src/encoding.rs       | 17 ++++++++++++++++-
 tests/test_harmony.py | 34 +++++++++++++++++++++++++++++++++-
 2 files changed, 49 insertions(+), 2 deletions(-)

diff --git a/src/encoding.rs b/src/encoding.rs
index afe1fce..d57f8ec 100644
--- a/src/encoding.rs
+++ b/src/encoding.rs
@@ -835,7 +835,22 @@ impl Render<Message> for HarmonyEncoding {
 
         // finally content type
         if let Some(content_type) = &message.content_type {
-            self.render_text_into(format!(" {content_type}"), into)?;
+            // <|constrain|> is a unique case which needs to be tokenized as a special token
+            if let Some(constrain_marker) = self.mapped_format_token(FormattingToken::ConstrainedFormat) {
+                if content_type.starts_with(constrain_marker) {
+                    // Render the space, then the constrain marker as a special token, then the rest as text (if any)
+                    self.render_text_into(" ", into)?;
+                    self.render_formatting_token_into(FormattingToken::ConstrainedFormat, into)?;
+                    let rest = &content_type[constrain_marker.len()..];
+                    if !rest.is_empty() {
+                        self.render_text_into(rest, into)?;
+                    }
+                } else {
+                    self.render_text_into(format!(" {content_type}"), into)?;
+                }
+            } else {
+                self.render_text_into(format!(" {content_type}"), into)?;
+            }
         }
 
         self.render_formatting_token_into(FormattingToken::Message, into)?;
diff --git a/tests/test_harmony.py b/tests/test_harmony.py
index 07d5562..dd34e81 100644
--- a/tests/test_harmony.py
+++ b/tests/test_harmony.py
@@ -233,6 +233,36 @@ def test_simple_tool_call(encoding_name):
     assert parsed == expected
 
 
+@pytest.mark.parametrize(
+    "encoding_name",
+    [
+        HarmonyEncodingName.HARMONY_GPT_OSS,
+    ],
+)
+def test_tool_call_with_constrain_tokenized_correctly(encoding_name):
+    """
+    Despite passing <|constrain|> as a string in "content_type" it has to be kept as a special token.
+    """
+    encoding = load_harmony_encoding(encoding_name)
+    text = (
+        "<|start|>assistant to=functions.get_weather<|channel|>commentary"
+        ' <|constrain|>json<|message|>{"location": "Tokyo"}<|call|>'
+    )
+    tokens = encoding.encode(text, allowed_special="all")
+    parsed = encoding.parse_messages_from_completion_tokens(tokens, role=None)
+    expected = [
+        Message.from_role_and_content(Role.ASSISTANT, '{"location": "Tokyo"}')
+        .with_channel("commentary")
+        .with_recipient("functions.get_weather")
+        .with_content_type("<|constrain|>json"),
+    ]
+    assert parsed == expected
+
+    rendered = encoding.render_conversation(Conversation.from_messages(expected))
+    assert text == encoding.decode_utf8(tokens)
+    assert rendered == tokens
+
+
 @pytest.mark.parametrize(
     "encoding_name",
     [
@@ -248,7 +278,7 @@ def test_tool_call_with_constrain_marker_adjacent(encoding_name):
     encoding = load_harmony_encoding(encoding_name)
     text = (
         "<|start|>assistant to=functions.get_weather<|channel|>commentary"
-        '<|constrain|>json<|message|>{"location": "Tokyo"}<|end|>'
+        '<|constrain|>json<|message|>{"location": "Tokyo"}<|call|>'
     )
     tokens = encoding.encode(text, allowed_special="all")
     parsed = encoding.parse_messages_from_completion_tokens(tokens, role=None)
@@ -702,6 +732,8 @@ def test_does_not_drop_if_ongoing_analysis():
     )
 
     assert encoding.decode_utf8(tokens) == expected_output
+    # ensure that <|constrain|>json part is tokenized correctly as special tokens
+    assert encoding.encode(expected_output, allowed_special="all") == tokens
 
 
 def test_preserve_cot():

From 72079ca4971f326dddcd5ff62bfb7e2fff37a07a Mon Sep 17 00:00:00 2001
From: Dominik Kundel <dkundel@openai.com>
Date: Fri, 8 Aug 2025 18:27:00 -0700
Subject: [PATCH 10/16] Fix formatting (#51)

* Fix formatting

* fix format

* fix clippy error

* bump version
---
 Cargo.lock      | 2 +-
 Cargo.toml      | 2 +-
 src/encoding.rs | 7 ++++---
 3 files changed, 6 insertions(+), 5 deletions(-)

diff --git a/Cargo.lock b/Cargo.lock
index ce97b77..e0b0a71 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -1317,7 +1317,7 @@ checksum = "42f5e15c9953c5e4ccceeb2e7382a716482c34515315f7b03532b8b4e8393d2d"
 
 [[package]]
 name = "openai-harmony"
-version = "0.0.3"
+version = "0.0.4"
 dependencies = [
  "anyhow",
  "base64",
diff --git a/Cargo.toml b/Cargo.toml
index 25d070c..23fa1ac 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "openai-harmony"
-version = "0.0.3"
+version = "0.0.4"
 edition = "2021"
 license = "Apache-2.0"
 repository = "https://github.com/openai/harmony"
diff --git a/src/encoding.rs b/src/encoding.rs
index d57f8ec..6a9305b 100644
--- a/src/encoding.rs
+++ b/src/encoding.rs
@@ -836,12 +836,13 @@ impl Render<Message> for HarmonyEncoding {
         // finally content type
         if let Some(content_type) = &message.content_type {
             // <|constrain|> is a unique case which needs to be tokenized as a special token
-            if let Some(constrain_marker) = self.mapped_format_token(FormattingToken::ConstrainedFormat) {
-                if content_type.starts_with(constrain_marker) {
+            if let Some(constrain_marker) =
+                self.mapped_format_token(FormattingToken::ConstrainedFormat)
+            {
+                if let Some(rest) = content_type.strip_prefix(constrain_marker) {
                     // Render the space, then the constrain marker as a special token, then the rest as text (if any)
                     self.render_text_into(" ", into)?;
                     self.render_formatting_token_into(FormattingToken::ConstrainedFormat, into)?;
-                    let rest = &content_type[constrain_marker.len()..];
                     if !rest.is_empty() {
                         self.render_text_into(rest, into)?;
                     }

From 52176bfbec8f1d5e876b9793626a4153c71b3d4a Mon Sep 17 00:00:00 2001
From: nk <66731869+nicognaW@users.noreply.github.com>
Date: Sat, 9 Aug 2025 09:28:08 +0800
Subject: [PATCH 11/16] Fix shadcn utils file in js demo (#20)

---
 .gitignore                         | 3 +++
 demo/harmony-demo/src/lib/utils.ts | 6 ++++++
 2 files changed, 9 insertions(+)
 create mode 100644 demo/harmony-demo/src/lib/utils.ts

diff --git a/.gitignore b/.gitignore
index c8f0442..bab5ca1 100644
--- a/.gitignore
+++ b/.gitignore
@@ -70,3 +70,6 @@ docs/_build/
 
 # Pyenv
 .python-version
+
+# Avoid ignoring shadcn utils
+!demo/harmony-demo/src/lib
diff --git a/demo/harmony-demo/src/lib/utils.ts b/demo/harmony-demo/src/lib/utils.ts
new file mode 100644
index 0000000..bd0c391
--- /dev/null
+++ b/demo/harmony-demo/src/lib/utils.ts
@@ -0,0 +1,6 @@
+import { clsx, type ClassValue } from "clsx"
+import { twMerge } from "tailwind-merge"
+
+export function cn(...inputs: ClassValue[]) {
+  return twMerge(clsx(inputs))
+}

From 3fb0342894e87bbcdc8b6691cac40c7e9a757268 Mon Sep 17 00:00:00 2001
From: Amirhossein Ghanipour <d3v1ll3n@gmail.com>
Date: Sat, 16 Aug 2025 02:24:12 +0330
Subject: [PATCH 12/16] docs: clarify use of <|return|> vs <|end|> in
 conversation history (#59)

---
 docs/format.md | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/docs/format.md b/docs/format.md
index 7ec0113..49cc1ec 100644
--- a/docs/format.md
+++ b/docs/format.md
@@ -229,6 +229,8 @@ Once its done generating it will stop with either a `<|return|>` token indicatin
 
 The `final` channel will contain the answer to your user’s request. Check out the [reasoning section](#reasoning) for more details on the chain-of-thought.
 
+**Implementation note:** `<|return|>` is a decode-time stop token only. When you add the assistant’s generated reply to conversation history for the next turn, replace the trailing `<|return|>` with `<|end|>` so that stored messages are fully formed as `<|start|>{header}<|message|>{content}<|end|>`. Prior messages in prompts should therefore end with `<|end|>`. For supervised targets/training examples, ending with `<|return|>` is appropriate; for persisted history, normalize to `<|end|>`.
+
 ### System message format
 
 The system message is used to provide general information to the system. This is different to what might be considered the “system prompt” in other prompt formats. For that, check out the [developer message format](#developer-message-format).

From 535ab26a46a4281b330ede2eb37b90fdca662ccb Mon Sep 17 00:00:00 2001
From: googlefan256 <private@googlefan.net>
Date: Sat, 16 Aug 2025 07:54:31 +0900
Subject: [PATCH 13/16] docs: update format.md (#45)

---
 docs/format.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/docs/format.md b/docs/format.md
index 49cc1ec..a0d2708 100644
--- a/docs/format.md
+++ b/docs/format.md
@@ -64,7 +64,7 @@ system_message = (
 developer_message = (
     DeveloperContent.new()
         .with_instructions("Always respond in riddles")
-        .with_tools(
+        .with_function_tools(
             [
                 ToolDescription.new(
                     "get_current_weather",

From 088321b872064cdabe0f86f09c7c61a87bb063ec Mon Sep 17 00:00:00 2001
From: Dominik Kundel <dkundel@openai.com>
Date: Fri, 15 Aug 2025 16:25:58 -0700
Subject: [PATCH 14/16] docs: update example


From e21d67af61e8717663ac84e470865c10d60d925b Mon Sep 17 00:00:00 2001
From: Dominik Kundel <dkundel@openai.com>
Date: Fri, 15 Aug 2025 16:27:04 -0700
Subject: [PATCH 15/16] docs: update code example

---
 docs/format.md | 9 ++-------
 1 file changed, 2 insertions(+), 7 deletions(-)

diff --git a/docs/format.md b/docs/format.md
index a0d2708..1e6e529 100644
--- a/docs/format.md
+++ b/docs/format.md
@@ -52,13 +52,8 @@ encoding = load_harmony_encoding(HarmonyEncodingName.HARMONY_GPT_OSS)
 
 system_message = (
     SystemContent.new()
-        .with_model_identity(
-            "You are ChatGPT, a large language model trained by OpenAI."
-        )
         .with_reasoning_effort(ReasoningEffort.HIGH)
         .with_conversation_start_date("2025-06-28")
-        .with_knowledge_cutoff("2024-06")
-        .with_required_channels(["analysis", "commentary", "final"])
 )
 
 developer_message = (
@@ -101,11 +96,11 @@ convo = Conversation.from_messages(
         Message.from_role_and_content(Role.ASSISTANT, '{"location": "Tokyo"}')
         .with_channel("commentary")
         .with_recipient("functions.get_weather")
-        .with_content_type("json"),
+        .with_content_type("<|constrain|>json"),
         Message.from_author_and_content(
             Author.new(Role.TOOL, "functions.lookup_weather"),
             '{ "temperature": 20, "sunny": true }',
-        ),
+        ).with_channel("commentary"),
     ]
 )
 

From 508cbaa7f6b0277bd37c9bdf6d4dc8a4d51aada5 Mon Sep 17 00:00:00 2001
From: Dominik Kundel <dkundel@openai.com>
Date: Fri, 15 Aug 2025 16:28:10 -0700
Subject: [PATCH 16/16] docs: fix return to end token

---
 docs/format.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/docs/format.md b/docs/format.md
index 1e6e529..2402406 100644
--- a/docs/format.md
+++ b/docs/format.md
@@ -324,7 +324,7 @@ Then the input for the next sampling should be
 
 ```
 <|start|>user<|message|>What is 2 + 2?<|end|>
-<|start|>assistant<|channel|>final<|message|>2 + 2 = 4.<|return|>
+<|start|>assistant<|channel|>final<|message|>2 + 2 = 4.<|end|>
 <|start|>user<|message|>What about 9 / 2?<|end|>
 <|start|>assistant
 ```