"""Stream a chat completion from a local generation endpoint and print it.

The script POSTs a short conversation to ``url`` and prints every text
fragment found in the ``data: ``-prefixed lines of the streamed response,
stopping when a ``data: [DONE]`` line is received.
"""

import json

import requests

# Conversation sent to the endpoint (content strings are sent verbatim).
messages = [
    {"role": "user", "content": "helo"},
    {"role": "assistant", "content": "Hello! How can I assist you today?"},
    {
        "role": "user",
        "content": "who are you and give me a breif description of who created you ",
    },
]
model = "grok-3-mini"
# The original literal carried a stray leading space before the scheme.
url = "http://127.0.0.1:8000/api/v1/generate"

_DATA_PREFIX = "data: "
_DONE_MARKER = "data: [DONE]"
# (connect, read) timeouts in seconds, so a stalled server cannot block the
# script forever. The read timeout applies to each wait for more data.
_TIMEOUT = (5, 120)


def _extract_text(data_line):
    """Return the text fragment carried by one ``data: `` line.

    Args:
        data_line: A decoded response line that starts with ``data: ``.

    Returns:
        The value of ``choices[0]["text"]`` from the JSON payload, or
        ``None`` when the payload is not valid JSON or does not have that
        shape.
    """
    try:
        event = json.loads(data_line[len(_DATA_PREFIX):])
    except json.JSONDecodeError:
        # Malformed events are skipped rather than aborting the stream.
        return None

    if not isinstance(event, dict):
        return None
    choices = event.get("choices")
    if not isinstance(choices, list) or not choices:
        return None
    first_choice = choices[0]
    if not isinstance(first_choice, dict):
        return None
    return first_choice.get("text")


def main():
    """Send the conversation and print the streamed reply as it arrives."""
    payload = {"messages": messages, "model": model}

    # The context manager releases the connection even when we stop reading
    # early at the [DONE] marker or an exception is raised mid-stream.
    with requests.post(
        url, json=payload, stream=True, timeout=_TIMEOUT
    ) as response:
        if response.status_code != 200:
            print(f"Request failed with status code {response.status_code}")
            return

        for raw_line in response.iter_lines():
            if not raw_line:
                continue
            line = raw_line.decode("utf-8")
            if line.startswith(_DONE_MARKER):
                break
            if not line.startswith(_DATA_PREFIX):
                continue
            text = _extract_text(line)
            if text is not None:
                # Flush so each fragment is visible as soon as it is received.
                print(text, end="", flush=True)

        # Finish the streamed output with a newline.
        print()


if __name__ == "__main__":
    main()