noperator · June 23, 2026 16:47
diff --git a/README.md b/README.md
diff --git a/fruits.py b/fruits.py
 #!/usr/bin/env python3
 import json
 from openai import OpenAI

 # Client for a local OpenAI-compatible server; the API key is a placeholder.
 client = OpenAI(base_url="http://localhost:8000/v1", api_key="-")

 # Use the first model the server lists. Fail with a clear message when the
 # list is empty instead of surfacing a bare IndexError.
 available_models = client.models.list().data
 if not available_models:
    raise RuntimeError("Server reported no models.")
 model = available_models[0].id

 # Marker that closes the structured region. It is also passed as a stop
 # string, so generation halts once the structured region has been closed.
 END = "ekYyhUMDCGhE65J5"

 # JSON Schema for the structured region: an object with exactly one key,
 # "fruit", whose value is one of three fixed strings.
 schema = {
    "type": "object",
    "properties": {
        "fruit": {
            "type": "string",
            "enum": ["apple", "banana", "orange"],
        }
    },
    "required": ["fruit"],
    "additionalProperties": False,
 }

 # "</think>" is both the trigger and the begin tag of the single structure;
 # the structure's body is tied to `schema` and it is closed by END.
 resp = client.chat.completions.create(
    model=model,
    messages=[
        {
            "role": "user",
            "content": "Pick one fruit. Keep your reasoning brief.",
        }
    ],
    temperature=0,
    max_tokens=1024,
    stop=[END],
    response_format={
        "type": "structural_tag",
        "structures": [
            {
                "begin": "</think>",
                "schema": schema,
                "end": END,
            }
        ],
        "triggers": ["</think>"],
    },
 )

 text = resp.choices[0].message.content
 print("RAW:")
 print(text)

 # The message content is optional in the response; without this guard the
 # substring test below would fail with an opaque TypeError on None.
 if text is None:
    raise RuntimeError("Response contained no message content.")

 if "</think>" not in text:
    raise RuntimeError(
        "Model never emitted </think>; structural constraint never activated."
    )

 # Everything after the first "</think>" is the structured region.
 after = text.split("</think>", 1)[1]

 # With stop=[END], vLLM usually removes END from returned text.
 # This split keeps the parser safe if behavior/config changes.
 json_text = after.split(END, 1)[0].strip()

 print("\nJSON TEXT:")
 print(json_text)

 parsed = json.loads(json_text)

 # Explicit checks instead of `assert` statements so the validation still
 # runs under `python -O`; AssertionError is kept as the exception type.
 if not isinstance(parsed, dict):
    raise AssertionError(f"expected a JSON object, got {type(parsed).__name__}")
 if set(parsed.keys()) != {"fruit"}:
    raise AssertionError(f"unexpected keys: {sorted(parsed.keys())}")
 if parsed["fruit"] not in schema["properties"]["fruit"]["enum"]:
    raise AssertionError(f"fruit not in enum: {parsed['fruit']!r}")

 print("\nparsed:", parsed)
 print("OK")
	#!/usr/bin/env python3
	import json
	from openai import OpenAI

	# Client for a local OpenAI-compatible server; the API key is a placeholder.
	client = OpenAI(base_url="http://localhost:8000/v1", api_key="-")

	# Use the first model the server lists. Fail with a clear message when the
	# list is empty instead of surfacing a bare IndexError.
	available_models = client.models.list().data
	if not available_models:
	    raise RuntimeError("Server reported no models.")
	model = available_models[0].id

	# Marker that closes the structured region. It is also passed as a stop
	# string, so generation halts once the structured region has been closed.
	END = "ekYyhUMDCGhE65J5"

	# JSON Schema for the structured region: an object with exactly one key,
	# "fruit", whose value is one of three fixed strings.
	schema = {
	    "type": "object",
	    "properties": {
	        "fruit": {
	            "type": "string",
	            "enum": ["apple", "banana", "orange"],
	        }
	    },
	    "required": ["fruit"],
	    "additionalProperties": False,
	}

	# "</think>" is both the trigger and the begin tag of the single structure;
	# the structure's body is tied to `schema` and it is closed by END.
	resp = client.chat.completions.create(
	    model=model,
	    messages=[
	        {
	            "role": "user",
	            "content": "Pick one fruit. Keep your reasoning brief.",
	        }
	    ],
	    temperature=0,
	    max_tokens=1024,
	    stop=[END],
	    response_format={
	        "type": "structural_tag",
	        "structures": [
	            {
	                "begin": "</think>",
	                "schema": schema,
	                "end": END,
	            }
	        ],
	        "triggers": ["</think>"],
	    },
	)

	text = resp.choices[0].message.content
	print("RAW:")
	print(text)

	# The message content is optional in the response; without this guard the
	# substring test below would fail with an opaque TypeError on None.
	if text is None:
	    raise RuntimeError("Response contained no message content.")

	if "</think>" not in text:
	    raise RuntimeError(
	        "Model never emitted </think>; structural constraint never activated."
	    )

	# Everything after the first "</think>" is the structured region.
	after = text.split("</think>", 1)[1]

	# With stop=[END], vLLM usually removes END from returned text.
	# This split keeps the parser safe if behavior/config changes.
	json_text = after.split(END, 1)[0].strip()

	print("\nJSON TEXT:")
	print(json_text)

	parsed = json.loads(json_text)

	# Explicit checks instead of `assert` statements so the validation still
	# runs under `python -O`; AssertionError is kept as the exception type.
	if not isinstance(parsed, dict):
	    raise AssertionError(f"expected a JSON object, got {type(parsed).__name__}")
	if set(parsed.keys()) != {"fruit"}:
	    raise AssertionError(f"unexpected keys: {sorted(parsed.keys())}")
	if parsed["fruit"] not in schema["properties"]["fruit"]["enum"]:
	    raise AssertionError(f"fruit not in enum: {parsed['fruit']!r}")

	print("\nparsed:", parsed)
	print("OK")
No results found