---
# LLM client definitions: one list entry per backend, selected by `type`.
clients:
  # Ollama backend at the api_base below, with an explicit model list.
  # Each model declares its own input/output token limits.
  - type: ollama
    api_base: https://ollama.giugl.io
    models:
      - name: mistral:7b-instruct-v0.3-fp16
        max_input_tokens: 32000
        max_output_tokens: 8192
      - name: llama3:8b-instruct-fp16
        max_input_tokens: 8192
        max_output_tokens: 8192
      # NOTE(review): the tag says "4k" but max_input_tokens is 128000 —
      # confirm which context size this model actually supports.
      - name: phi3:14b-medium-4k-instruct-q8_0
        max_input_tokens: 128000
        max_output_tokens: 8192
      - name: pino-coder
        max_input_tokens: 8192
        max_output_tokens: 8192

  # OpenAI backend. api_key is explicitly null, so no key is stored in
  # this file.
  - type: openai
    api_key: null
    api_base: https://api.openai.com/v1