parameters.json 398 B

123456789101112
  1. {
  2. "MAX_NEW_TOKEN" : 256,
  3. "CONCURRENT_LEVELS" : [1, 2, 4, 8, 16, 32, 64],
  4. "THRESHOLD_TPS" : 7,
  5. "TOKENIZER_PATH" : "../../tokenizer",
  6. "RANDOM_PROMPT_LENGTH" : 1000,
  7. "TEMPERATURE" : 0.6,
  8. "TOP_P" : 0.9,
  9. "MODEL_ENDPOINTS" : "https://your-endpoint.inference.ai.azure.com/v1/completions",
  10. "API_KEY" : "your-auth-key",
  11. "SYS_PROMPT" : "You are a helpful assistant."
  12. }