LLM
FP8
Context Length: 131072
LLM
FP8
Context Length: 131072

Control Bar

API

"""Send one chat-completion request and print the decoded JSON reply."""

import requests

url = "https://api.hyperbolic.xyz/v1/chat/completions"

# NOTE: "<api-key>" is a placeholder; substitute a real key before running.
headers = {
    "Content-Type": "application/json",
    "Authorization": "Bearer <api-key>",
}

# Request payload: a single user message plus the generation settings.
data = {
    "messages": [
        {
            "role": "user",
            "content": "What can I do in SF?",
        }
    ],
    "model": "meta-llama/Meta-Llama-3.1-405B-Instruct",
    "max_tokens": 512,
    "temperature": 0.7,
    "top_p": 0.9,
}

# requests applies no timeout by default, so without one a stalled
# connection would block this script forever.  The tuple is
# (connect timeout, read timeout) in seconds; the read limit is generous
# because generating a completion can take a while.
response = requests.post(url, headers=headers, json=data, timeout=(10, 120))
print(response.json())