while not env.is_done():
llm_response = agent.step(obs.question).msgs[0].content
agent.reset() # clear context window
action = Action(llm_response=llm_response)
result = await env.step(action)
next_obs, reward, done, info = result
obs = next_obs
print("\nAgent Move:", action.llm_response)
print("Observation:")
print(next_obs.question)
print("Reward:", reward)
print("Done:", done)
print("Info:", info)