parameters.json 408 B

{
  "MAX_NEW_TOKEN" : 256,
  "CONCURRENT_LEVELS" : [1, 2, 4, 8, 16, 32, 64],
  "THRESHOLD_TPS" : 7,
  "MODEL_PATH" : "meta-llama/your-model-path",
  "RANDOM_PROMPT_LENGTH" : 25,
  "TEMPERATURE" : 0.6,
  "TOP_P" : 0.9,
  "MODEL_ENDPOINTS" : "https://your-endpoint.inference.ai.azure.com/v1/chat/completions",
  "API_KEY" : "your-auth-key",
  "SYS_PROMPT" : "You are a helpful assistant."
}