forked from julep-ai/julep
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathlitellm-config.yaml
151 lines (124 loc) · 3.53 KB
/
litellm-config.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
# Environment variables declared for the proxy process.
environment_variables:
  # Kept as a quoted string so it is not parsed as a YAML boolean.
  NO_DOCS: 'true'
model_list:
# -*= Paid models =*-
# -------------------

# Vertex AI models (Gemini, plus Claude served through Vertex AI).
# Both entries take their credentials from GOOGLE_APPLICATION_CREDENTIALS.
- model_name: gemini-1.5-pro
  litellm_params:
    model: vertex_ai_beta/gemini-1.5-pro
    vertex_credentials: os.environ/GOOGLE_APPLICATION_CREDENTIALS
    tags: ['paid']

# NOTE(review): the model_name `claude-3.5-sonnet` is declared a second time
# in the Anthropic section of this list. Presumably intentional (two
# deployments behind one public name) -- confirm.
- model_name: claude-3.5-sonnet
  litellm_params:
    model: vertex_ai/claude-3-5-sonnet@20240620
    vertex_credentials: os.environ/GOOGLE_APPLICATION_CREDENTIALS
    tags: ['paid']

# OpenAI chat models (authenticated with OPENAI_API_KEY).
- model_name: gpt-4-turbo
  litellm_params:
    model: openai/gpt-4-turbo
    api_key: os.environ/OPENAI_API_KEY
    tags: ['paid']

- model_name: gpt-4o
  litellm_params:
    model: openai/gpt-4o
    api_key: os.environ/OPENAI_API_KEY
    tags: ['paid']

# Anthropic chat models (authenticated with ANTHROPIC_API_KEY).
# NOTE(review): `claude-3.5-sonnet` is also declared earlier in this list
# against Vertex AI. Presumably intentional (two deployments behind one
# public name) -- confirm.
- model_name: claude-3.5-sonnet
  litellm_params:
    model: claude-3-5-sonnet-20240620
    api_key: os.environ/ANTHROPIC_API_KEY
    tags: ['paid']

- model_name: claude-3-opus
  litellm_params:
    model: claude-3-opus-20240229
    api_key: os.environ/ANTHROPIC_API_KEY
    tags: ['paid']

- model_name: claude-3-sonnet
  litellm_params:
    model: claude-3-sonnet-20240229
    api_key: os.environ/ANTHROPIC_API_KEY
    tags: ['paid']

- model_name: claude-3-haiku
  litellm_params:
    model: claude-3-haiku-20240307
    api_key: os.environ/ANTHROPIC_API_KEY
    tags: ['paid']

# Groq-hosted Llama 3.1 models (authenticated with GROQ_API_KEY).
- model_name: llama-3.1-70b
  litellm_params:
    model: groq/llama-3.1-70b-versatile
    api_key: os.environ/GROQ_API_KEY
    tags: ['paid']

- model_name: llama-3.1-8b
  litellm_params:
    model: groq/llama-3.1-8b-instant
    api_key: os.environ/GROQ_API_KEY
    tags: ['paid']

# -*= Embedding models =*-
# ------------------------

# Hosted embedding APIs (OpenAI, Voyage), tagged "paid".
- model_name: text-embedding-3-large
  litellm_params:
    model: openai/text-embedding-3-large
    api_key: os.environ/OPENAI_API_KEY
    tags: ['paid']

- model_name: voyage-multilingual-2
  litellm_params:
    model: voyage/voyage-multilingual-2
    api_key: os.environ/VOYAGE_API_KEY
    tags: ['paid']

- model_name: voyage-3
  litellm_params:
    model: voyage/voyage-3
    api_key: os.environ/VOYAGE_API_KEY
    tags: ['paid']

# Embedding models reached through the `text-embeddings-inference` host.
# They use the `openai/` model prefix with a custom api_base, have no
# api_key configured, and are tagged "free".
- model_name: Alibaba-NLP/gte-large-en-v1.5
  litellm_params:
    model: openai/Alibaba-NLP/gte-large-en-v1.5
    api_base: http://text-embeddings-inference
    tags: ['free']

- model_name: BAAI/bge-m3
  litellm_params:
    model: openai/BAAI/bge-m3
    api_base: http://text-embeddings-inference
    tags: ['free']

# NOTE(review): unlike every other entry in this list, this one has no `tags`,
# and unlike the other Vertex AI entries it sets no `vertex_credentials`.
# Confirm both omissions are intentional.
- model_name: vertex_ai/text-embedding-004
  litellm_params:
    model: vertex_ai/text-embedding-004
    # vertex_project: os.environ/GOOGLE_PROJECT_ID
    # vertex_location: os.environ/VERTEX_LOCATION

# -*= Free models =*-
# -------------------

# Served with the same OPENAI_API_KEY as the paid OpenAI models, but tagged
# "free".
- model_name: gpt-4o-mini
  litellm_params:
    model: openai/gpt-4o-mini
    api_key: os.environ/OPENAI_API_KEY
    tags: ['free']

# Reference for the settings below:
# https://github.com/BerriAI/litellm/blob/main/litellm/__init__.py
litellm_settings:
  # Retry, timeout and failure handling.
  retry: true
  num_retries: 3
  request_timeout: 180
  allowed_fails: 3
  cooldown_time: 30

  # Request parameter handling.
  drop_params: true
  modify_params: true
  add_function_to_prompt: true

  # Telemetry and logging verbosity.
  telemetry: false
  set_verbose: false

  # Response caching, backed by Redis. Connection details are supplied
  # through the LITELLM_REDIS_* environment variables.
  cache: true
  cache_params:
    type: redis
    namespace: litellm_caching
    host: os.environ/LITELLM_REDIS_HOST
    port: os.environ/LITELLM_REDIS_PORT
    password: os.environ/LITELLM_REDIS_PASSWORD

# Router configuration: deployment selection strategy and retry count.
router_settings:
  num_retries: 3
  routing_strategy: simple-shuffle

# Proxy-wide settings. Secrets are referenced through environment variables
# and never written into this file.
general_settings:
  database_url: os.environ/LITELLM_DATABASE_URL
  master_key: os.environ/LITELLM_MASTER_KEY
  # NOTE(review): presumably rejects requests without a `user` field -- confirm.
  enforce_user_param: true