post
POST /v1/chat/completions HTTP/1.1
Host: sn1.api.macrocosmos.ai
Content-Type: application/json
Accept: */*
Content-Length: 395

{
  "uids": [
    1,
    2,
    3
  ],
  "messages": [
    {
      "content": "Tell me about neural networks",
      "role": "user"
    }
  ],
  "seed": 42,
  "task": "InferenceTask",
  "model": "hugging-quants/Meta-Llama-3.1-70B-Instruct-AWQ-INT4",
  "test_time_inference": true,
  "mixture": true,
  "sampling_parameters": {
    "do_sample": true,
    "max_new_tokens": 512,
    "temperature": 0.7,
    "top_k": 50,
    "top_p": 0.95
  },
  "inference_mode": "Reasoning-Fast",
  "json_format": true,
  "stream": true
}
{
  "id": "ca0b8681-7b78-4234-8868-71ad1ebfa9ed",
  "choices": [
    {
      "finish_reason": "stop",
      "index": 0,
      "logprobs": null,
      "message": {
        "content": "Neural networks are a type of machine learning model inspired by the human brain's structure. They consist of interconnected nodes arranged in layers, including input, hidden, and output layers. These networks learn by adjusting weights during training using optimization algorithms. Neural networks find applications in image recognition, speech processing, and many other domains requiring pattern recognition and prediction capabilities.",
        "refusal": null,
        "role": "assistant",
        "audio": null,
        "function_call": null,
        "tool_calls": null
      }
    }
  ],
  "created": 1743016348,
  "model": "hugging-quants/Meta-Llama-3.1-70B-Instruct-AWQ-INT4",
  "object": "chat.completion",
  "service_tier": null,
  "system_fingerprint": null,
  "usage": null
}