Merge branch 'main' into main

2025-08-23 10:17:08 -04:00 · 2025-08-05 21:31:34 +03:00 · 2025-08-05 21:31:34 +03:00 · eb86106b69
commit eb86106b69
parent 57afd6f60b 64bca4cf32
6 changed files with 27 additions and 20 deletions
--- a/.github/workflows/CI.yml
+++ b/.github/workflows/CI.yml
@@ -28,14 +28,10 @@ jobs:
            target: x86_64
          - runner: ubuntu-22.04
            target: x86
-          # - runner: ubuntu-22.04
+          - runner: ubuntu-22.04
-          #   target: aarch64
+            target: aarch64
          - runner: ubuntu-22.04
            target: armv7
-          # - runner: ubuntu-22.04
-          #   target: s390x
-          # - runner: ubuntu-22.04
-          #   target: ppc64le
    steps:
      - uses: actions/checkout@v4
      - uses: actions/setup-python@v5
@@ -43,6 +39,9 @@ jobs:
          python-version: 3.x
      - name: Build wheels
        uses: PyO3/maturin-action@v1
+        env:
+          # Ensure ring's ARM assembly sees an explicit architecture on aarch64 (glibc)
+          CFLAGS_aarch64_unknown_linux_gnu: -D__ARM_ARCH=8
        with:
          target: ${{ matrix.platform.target }}
          args: --release --out dist --find-interpreter
@@ -74,6 +73,9 @@ jobs:
          python-version: 3.x
      - name: Build wheels
        uses: PyO3/maturin-action@v1
+        env:
+          # Ensure ring's ARM assembly sees an explicit architecture on aarch64 (musl)
+          CFLAGS_aarch64_unknown_linux_musl: -D__ARM_ARCH=8
        with:
          target: ${{ matrix.platform.target }}
          args: --release --out dist --find-interpreter
@@ -104,7 +106,7 @@ jobs:
        uses: PyO3/maturin-action@v1
        with:
          target: ${{ matrix.platform.target }}
-          args: -F python-binding --release --out dist --find-interpreter
+          args: --release --out dist --find-interpreter
          sccache: ${{ !startsWith(github.ref, 'refs/tags/') }}
      - name: Upload wheels
        uses: actions/upload-artifact@v4
@@ -130,7 +132,7 @@ jobs:
        uses: PyO3/maturin-action@v1
        with:
          target: ${{ matrix.platform.target }}
-          args: -F python-binding --release --out dist --find-interpreter
+          args: --release --out dist --find-interpreter
          sccache: ${{ !startsWith(github.ref, 'refs/tags/') }}
      - name: Upload wheels
        uses: actions/upload-artifact@v4
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -42,7 +42,10 @@ reqwest = { version = "0.12.5", default-features = false, features = [
 ] }
 futures = "0.3"
 clap = { version = "4", features = ["derive"] }
-pyo3 = { version = "0.25.0", optional = true, features = ["extension-module"] }
+pyo3 = { version = "0.25.0", optional = true, features = [
+    "extension-module",
+    "abi3-py38",
+] }
 wasm-bindgen = { version = "0.2.100", optional = true, features = [
    "serde-serialize",
 ] }
--- a/README.md
+++ b/README.md
@@ -10,9 +10,9 @@
 The [gpt-oss models][gpt-oss] were trained on the [harmony response format][harmony-format] for defining conversation structures, generating reasoning output and structuring function calls. If you are not using gpt-oss directly but through an API or a provider like HuggingFace, Ollama, or vLLM, you will not have to be concerned about this as your inference solution will handle the formatting. If you are building your own inference solution, this guide will walk you through the prompt format. The format is designed to mimic the OpenAI Responses API, so if you have used that API before, this format should hopefully feel familiar to you. gpt-oss should not be used without using the harmony format as it will not work correctly.
-The format enables the model to output to multiple different channels for chain of thought, and tool calling premables along with regular responses. It also enables specifying various tool namespaces, and structured outputs along with a clear instruction hierarchy. [Check out the guide][harmony-format] to learn more about the format itself.
+The format enables the model to output to multiple different channels for chain of thought, and tool calling preambles along with regular responses. It also enables specifying various tool namespaces, and structured outputs along with a clear instruction hierarchy. [Check out the guide][harmony-format] to learn more about the format itself.
-```
+```text
 <|start|>system<|message|>You are ChatGPT, a large language model trained by OpenAI.
 Knowledge cutoff: 2024-06
 Current date: 2025-06-28
@@ -114,11 +114,11 @@ openai-harmony = { git = "https://github.com/openai/harmony" }
 ```rust
 use openai_harmony::chat::{Message, Role, Conversation};
 use openai_harmony::{HarmonyEncodingName, load_harmony_encoding};
 fn main() -> anyhow::Result<()> {
    let enc = load_harmony_encoding(HarmonyEncodingName::HarmonyGptOss)?;
-    let convo = Conversation::from_messages([
+    let convo =
-        Message::from_role_and_content(Role::User, "Hello there!"),
+        Conversation::from_messages([Message::from_role_and_content(Role::User, "Hello there!")]);
-    ]);
    let tokens = enc.render_conversation_for_completion(&convo, Role::Assistant, None)?;
    println!("{:?}", tokens);
    Ok(())
@@ -130,7 +130,7 @@ fn main() -> anyhow::Result<()> {
 The majority of the rendering and parsing is built in Rust for performance and exposed to Python
 through thin [`pyo3`](https://pyo3.rs/) bindings.
-```
+```text
 ┌──────────────────┐      ┌───────────────────────────┐
 │  Python code     │      │  Rust core (this repo)    │
 │  (dataclasses,   │────► │  • chat / encoding logic  │
@@ -140,7 +140,7 @@ through thin [`pyo3`](https://pyo3.rs/) bindings.
 ### Repository layout
-```
+```text
 .
 ├── src/                  # Rust crate
 │   ├── chat.rs           # High-level data-structures (Role, Message, …)
@@ -177,10 +177,10 @@ source .venv/bin/activate
 # Install maturin and test dependencies
 pip install maturin pytest mypy ruff  # tailor to your workflow
 # Compile the Rust crate *and* install the Python package in editable mode
-maturin develop -F python-binding --release
+maturin develop --release
 ```
-`maturin develop -F python-binding` builds _harmony_ with Cargo, produces a native extension
+`maturin develop` builds _harmony_ with Cargo, produces a native extension
 (`openai_harmony.<abi>.so`) and places it in your virtualenv next to the pure-
 Python wrapper – similar to `pip install -e .` for pure Python projects.
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -19,7 +19,7 @@ readme = "README.md"
 demo = ["uvicorn", "fastapi"]
 [tool.maturin]
-features = ["pyo3/extension-module"]
+features = ["python-binding", "pyo3/extension-module"]
 module-name = "openai_harmony"
 python-source = "python"
--- a/src/lib.rs
+++ b/src/lib.rs
@@ -1,3 +1,5 @@
+#![doc = include_str!("../README.md")]
 pub mod chat;
 mod encoding;
 mod registry;
--- a/test_python.sh
+++ b/test_python.sh
@@ -1,5 +1,5 @@
 #!/usr/bin/env bash
 set -e
 source .venv/bin/activate
-maturin develop -F python-binding --release 
+maturin develop --release 
 pytest "$@"