SimpleTIR: End-to-End Reinforcement Learning for Multi-Turn Tool-Integrated Reasoning
Paper
•
2509.02479
•
Published
•
74
Open language models for South-East Asia
blocks between responses.
from HelpingAI import HAI  # pip install HelpingAI==1.1.1
from rich import print
# Example: stream a chat completion from the Dhanishtha-2.0-preview model and
# echo the text to the terminal as it arrives.

# Placeholder key: substitute a real HelpingAI API key before running.
hai = HAI(api_key="hl-***********************")

response = hai.chat.completions.create(
    model="Dhanishtha-2.0-preview",
    # NOTE(review): the formula is flattened from rendered math (exponent and
    # grouping are not explicit) -- confirm the intended integrand.
    messages=[{"role": "user", "content": "What is the value of ∫0∞𝑥3/𝑥−1𝑑𝑥 ?"}],
    stream=True,
    hide_think=False,  # Hide or show the model's thinking
)

for chunk in response:
    piece = chunk.choices[0].delta.content
    # A chunk may carry no text (presumably role-only or final chunks, as in
    # OpenAI-style streams -- confirm); skip it so "None" is never printed.
    if piece:
        print(piece, end="", flush=True)