3, 2, 1… Your inference is ready
# Quick-start: send one chat-completion request and print the JSON reply.
import requests

# Chat-completions endpoint the request is POSTed to.
url = "https://api.tandemn.com/api/v1/chat/completions"

# Replace <your-api-key> with your actual API key before running.
headers = {
    "Authorization": "Bearer <your-api-key>",
    "Content-Type": "application/json",
}

# Request payload: the model to run and the conversation so far.
data = {
    "model": "casperhansen/llama-3.3-70b-instruct-awq",
    "messages": [
        {"role": "user", "content": "Hello! Can you explain quantum computing?"},
    ],
}

# requests has no default timeout; without one a stalled connection would
# block forever. The value is generous because the call waits on the server
# to produce the completion.
response = requests.post(url, headers=headers, json=data, timeout=120)

# Surface 4xx/5xx responses as requests.HTTPError instead of trying to
# decode an error page as if it were a successful completion.
response.raise_for_status()

print(response.json())