/
supported_models.yaml
91 lines (88 loc) · 2.77 KB
/
supported_models.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
# Catalogue of supported models. Each list item carries a name, a type, the
# runtime it is served with, and an image tag; entries other than the Llama 2
# ones also carry a `version` that is a huggingface.co commit URL.
models:
  # Llama 2: completion and chat variants at 7b, 13b and 70b.
  # All six entries share runtime `llama-2` and the same tag; none of them
  # lists a `version` key.
  - name: llama-2-7b
    type: llama2-completion
    runtime: llama-2
    tag: '0.0.3'
  - name: llama-2-7b-chat
    type: llama2-chat
    runtime: llama-2
    tag: '0.0.3'
  - name: llama-2-13b
    type: llama2-completion
    runtime: llama-2
    tag: '0.0.3'
  - name: llama-2-13b-chat
    type: llama2-chat
    runtime: llama-2
    tag: '0.0.3'
  - name: llama-2-70b
    type: llama2-completion
    runtime: llama-2
    tag: '0.0.3'
  - name: llama-2-70b-chat
    type: llama2-chat
    runtime: llama-2
    tag: '0.0.3'
  # Tag history for Llama 2 models:
  #   0.0.3 - Inference API Cleanup (#233)
  #   0.0.2 - Eliminate Unnecessary Process Group Creation in Worker Initialization (#244)
  #   0.0.1 - Initial Release

  # Falcon: 7b and 40b, each in base and instruct form, all on runtime `tfs`.
  # The 7b and 40b pairs are tagged separately (see the two histories below).
  - name: falcon-7b
    type: text-generation
    version: https://huggingface.co/tiiuae/falcon-7b/commit/898df1396f35e447d5fe44e0a3ccaaaa69f30d36
    runtime: tfs
    tag: '0.0.4'
  - name: falcon-7b-instruct
    type: text-generation
    version: https://huggingface.co/tiiuae/falcon-7b-instruct/commit/cf4b3c42ce2fdfe24f753f0f0d179202fea59c99
    runtime: tfs
    tag: '0.0.4'
  # Tag history for 7b models:
  #   0.0.4 - Adjust default model params (#310)
  #   0.0.3 - Update Default Params (#294)
  #   0.0.2 - Inference API Cleanup (#233)
  #   0.0.1 - Initial Release
  - name: falcon-40b
    type: text-generation
    version: https://huggingface.co/tiiuae/falcon-40b/commit/4a70170c215b36a3cce4b4253f6d0612bb7d4146
    runtime: tfs
    tag: '0.0.5'
  - name: falcon-40b-instruct
    type: text-generation
    version: https://huggingface.co/tiiuae/falcon-40b-instruct/commit/ecb78d97ac356d098e79f0db222c9ce7c5d9ee5f
    runtime: tfs
    tag: '0.0.5'
  # Tag history for 40b models:
  #   0.0.5 - Adjust default model params (#310)
  #   0.0.4 - Skipped due to incomplete upload issue
  #   0.0.3 - Update Default Params (#294)
  #   0.0.2 - Inference API Cleanup (#233)
  #   0.0.1 - Initial Release

  # Mistral: 7b base and instruct, both on runtime `tfs`.
  # Note the two entries reference different upstream repositories
  # (Mistral-7B-v0.1 and Mistral-7B-Instruct-v0.2).
  - name: mistral-7b
    type: text-generation
    version: https://huggingface.co/mistralai/Mistral-7B-v0.1/commit/26bca36bde8333b5d7f72e9ed20ccda6a618af24
    runtime: tfs
    tag: '0.0.4'
  - name: mistral-7b-instruct
    type: text-generation
    version: https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2/commit/b70aa86578567ba3301b21c8a27bea4e8f6d6d61
    runtime: tfs
    tag: '0.0.4'
  # Tag history for Mistral models:
  #   0.0.4 - Adjust default model params (#310)
  #   0.0.3 - Update Default Params (#294)
  #   0.0.2 - Inference API Cleanup (#233)
  #   0.0.1 - Initial Release

  # Phi-2: a single entry on runtime `tfs`.
  - name: phi-2
    type: text-generation
    version: https://huggingface.co/microsoft/phi-2/commit/b10c3eba545ad279e7208ee3a5d644566f001670
    runtime: tfs
    tag: '0.0.3'
  # Tag history for phi-2:
  #   0.0.3 - Adjust default model params (#310)
  #   0.0.2 - Update Default Params (#294)
  #   0.0.1 - Initial Release