# litellm_config.yml - LiteLLM proxy configuration
# Models served by the LiteLLM proxy.
#   model_name      - alias that clients request from the proxy
#   litellm_params  - parameters forwarded to the upstream provider call
# Values written as `os.environ/<NAME>` are read from the environment variable
# <NAME>, so no secret is stored in this file.
# Entries sharing a model_name are treated by LiteLLM as one load-balanced
# group, so every alias is declared exactly once here.
model_list:
  - model_name: ollama/codellama
    litellm_params:
      model: "ollama/codellama:34b"
  - model_name: mistral/mistral-medium
    litellm_params:
      model: mistral/mistral-medium-latest
      api_key: os.environ/MISTRAL_API_KEY
      api_base: https://api.mistral.ai/v1
  - model_name: openai/gpt-4-turbo-2024-04-09
    litellm_params:
      model: openai/gpt-4-turbo-2024-04-09
      api_key: os.environ/OPENAI_API_KEY
      api_base: https://api.openai.com/v1
  - model_name: openai/o1-mini
    litellm_params:
      model: o1-mini
      api_key: os.environ/OPENAI_API_KEY
      api_base: https://api.openai.com/v1
  - model_name: openai/o1-preview
    litellm_params:
      model: o1-preview
      api_key: os.environ/OPENAI_API_KEY
      api_base: https://api.openai.com/v1
  - model_name: openai/gpt-4o
    litellm_params:
      model: openai/gpt-4o
      api_key: os.environ/OPENAI_API_KEY
      api_base: https://api.openai.com/v1
  # NOTE(review): unlike the other OpenAI entries this one sets no api_base,
  # so the provider default is used - confirm that is intended.
  - model_name: openai/gpt-4o-2024-11-20
    litellm_params:
      model: gpt-4o-2024-11-20
      api_key: os.environ/OPENAI_API_KEY
  - model_name: openai/gpt-4o-mini
    litellm_params:
      model: gpt-4o-mini
      api_key: os.environ/OPENAI_API_KEY
      api_base: https://api.openai.com/v1
  - model_name: openai/gpt-3.5-turbo-0125
    litellm_params:
      model: openai/gpt-3.5-turbo-0125
      api_key: os.environ/OPENAI_API_KEY
      api_base: https://api.openai.com/v1
  - model_name: openai/gpt-3.5-turbo
    litellm_params:
      model: openai/gpt-3.5-turbo
      api_key: os.environ/OPENAI_API_KEY
      api_base: https://api.openai.com/v1
  - model_name: openai/dall-e-3
    litellm_params:
      model: openai/dall-e-3
      api_key: os.environ/OPENAI_API_KEY
      api_base: https://api.openai.com/v1
  - model_name: mistral/mistral-large
    litellm_params:
      model: mistral/mistral-large-latest
      api_key: os.environ/MISTRAL_API_KEY
      api_base: https://api.mistral.ai/v1
  - model_name: anthropic/claude-3-opus
    litellm_params:
      model: claude-3-opus-20240229
      api_base: https://api.anthropic.com/v1/messages
      api_key: os.environ/ANTHROPIC_API_KEY
      # Explicit max_tokens is required; otherwise a default of 256 is applied.
      max_tokens: 4096
  - model_name: anthropic/claude-3.5-sonnet
    litellm_params:
      model: claude-3-5-sonnet-20241022
      api_base: https://api.anthropic.com/v1/messages
      api_key: os.environ/ANTHROPIC_API_KEY
      max_tokens: 4096
  - model_name: anthropic/claude-3.5-haiku
    litellm_params:
      model: claude-3-5-haiku-20241022
      api_base: https://api.anthropic.com/v1/messages
      api_key: os.environ/ANTHROPIC_API_KEY
      max_tokens: 4096
  - model_name: deepseek/deepseek-v3
    litellm_params:
      model: deepseek/deepseek-chat
      api_base: https://api.deepseek.com
      api_key: os.environ/DEEPSEEK_API_KEY
      max_tokens: 4096
  - model_name: deepseek/deepseek-r1
    litellm_params:
      model: deepseek/deepseek-reasoner
      api_base: https://api.deepseek.com
      api_key: os.environ/DEEPSEEK_API_KEY
      max_tokens: 4096
  - model_name: openrouter/llama-3.1-sonar-large-online
    litellm_params:
      model: openrouter/perplexity/llama-3.1-sonar-large-128k-online
      # api_base: https://openrouter.ai/api/v1/chat/completions
      api_key: os.environ/OPENROUTER_API_KEY
      max_tokens: 4096
  - model_name: openrouter/deepseek-v3
    litellm_params:
      model: openrouter/deepseek/deepseek-chat
      api_key: os.environ/OPENROUTER_API_KEY
      max_tokens: 4096
  - model_name: openrouter/deepseek-r1
    litellm_params:
      model: openrouter/deepseek/deepseek-r1
      api_key: os.environ/OPENROUTER_API_KEY
      max_tokens: 4096
# Library-level LiteLLM settings applied to every request.
litellm_settings:
  # Drop request parameters the target provider does not support instead of
  # failing the call (see the LiteLLM drop_params documentation).
  drop_params: true
  # NOTE(review): presumably disables streaming by default - confirm that
  # LiteLLM honours this key under litellm_settings.
  stream: false
# Proxy server settings. Both secrets are read from environment variables via
# the `os.environ/<NAME>` syntax and are never stored in this file.
general_settings:
  # Admin key for the proxy.
  master_key: os.environ/LITELLM_MASTER_KEY
  # Connection string for the proxy's database.
  database_url: os.environ/DATABASE_URL
  # NOTE(review): pool size limit and timeout (presumably seconds) for the
  # database connection - confirm units against the LiteLLM docs.
  database_connection_pool_limit: 100
  database_connection_timeout: 60