File size: 3,698 Bytes
85e37e1
 
 
 
 
 
 
 
 
7ef1ddb
 
85e37e1
7ef1ddb
85e37e1
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
9f104ef
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
85e37e1
7ef1ddb
 
85e37e1
7ef1ddb
85e37e1
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
# Provider choices as a list of (label, identifier) pairs, in the order written.
# NOTE(review): presumably the label is what users see and the identifier is
# what the rest of the app keys on — confirm against the caller.
# Spelled as a mapping for readability, so every label must stay unique.
PROVIDERS = list({
    "OpenAI": "openai",
    "Anthropic": "anthropic",
    "Cohere": "cohere",
    "Meta": "huggingface_hub/meta",
    "Mistral AI": "mistralai",
}.items())

# OpenAI models as a list of (label, model identifier) pairs, in the order
# written. Spelled as a mapping, so every label must stay unique.
OPENAI_MODELS = list({
    "GPT-4o": "gpt-4o",
    "GPT-4-Turbo": "gpt-4-turbo",
    "GPT-4": "gpt-4",
    "GPT-3.5-Turbo": "gpt-3.5-turbo",
}.items())

# Anthropic models as a list of (label, model identifier) pairs, in the order
# written. Spelled as a mapping, so every label must stay unique.
ANTHROPIC_MODELS = list({
    "Claude 3 Opus": "claude-3-opus-20240229",
    "Claude 3 Sonnet": "claude-3-sonnet-20240229",
    "Claude 3 Haiku": "claude-3-haiku-20240307",
    "Claude 2.1": "claude-2.1",
    "Claude 2.0": "claude-2.0",
    "Claude Instant 1.2": "claude-instant-1.2",
}.items())

# Cohere models as a list of (label, model identifier) pairs, in the order
# written. Spelled as a mapping, so every label must stay unique.
COHERE_MODELS = list({
    "Command Light": "command-light",
    "Command": "command",
    "Command R": "command-r",
    "Command R+": "command-r-plus",
}.items())

# Meta Llama models as a list of (label, model identifier) pairs, in the order
# written; each identifier has the form "meta-llama/<name>".
# Spelled as a mapping, so every label must stay unique.
META_MODELS = list({
    "Llama 3 8B": "meta-llama/Meta-Llama-3-8B",
    "Llama 3 70B": "meta-llama/Meta-Llama-3-70B",
    "Llama 2 7B": "meta-llama/Llama-2-7b-hf",
    "Llama 2 13B": "meta-llama/Llama-2-13b-hf",
    "Llama 2 70B": "meta-llama/Llama-2-70b-hf",
}.items())

# Mistral AI models as a list of (label, model identifier) pairs, in the order
# written. Spelled as a mapping, so every label must stay unique.
MISTRALAI_MODELS = list({
    "Mistral 7B": "open-mistral-7b",
    "Mixtral 8x7B": "open-mixtral-8x7b",
    "Mixtral 8x22B": "open-mixtral-8x22b",
    "Tiny": "mistral-tiny-2312",
    "Small": "mistral-small-2402",
    "Medium": "mistral-medium-2312",
    "Large": "mistral-large-2402",
}.items())

# Example tasks as a list of (label, token count) pairs. Each label is the task
# description followed by " (<count> output tokens)", built in one pass so the
# name is never bound to the unsuffixed list.
PROMPTS = [
    (f"{task} ({tokens} output tokens)", tokens)
    for task, tokens in (
        ("Write a Tweet", 50),
        ("Write an email", 170),
        ("Write an article summary", 250),
        ("Small conversation with a chatbot", 400),
        ("Write a report of 5 pages", 5000),
    )
]

# Set of "provider/model" identifier strings, grouped below by provider.
# Every entry also appears as an identifier in MODELS.
# NOTE(review): no Cohere, Meta or "open-*" Mistral identifiers are listed —
# confirm that this matches the intended closed-source classification.
CLOSED_SOURCE_MODELS = set().union(
    # OpenAI
    (
        "openai/gpt-4o",
        "openai/gpt-4-turbo",
        "openai/gpt-4",
        "openai/gpt-3.5-turbo",
    ),
    # Anthropic
    (
        "anthropic/claude-3-opus-20240229",
        "anthropic/claude-3-sonnet-20240229",
        "anthropic/claude-3-haiku-20240307",
        "anthropic/claude-2.1",
        "anthropic/claude-2.0",
        "anthropic/claude-instant-1.2",
    ),
    # Mistral AI
    (
        "mistralai/mistral-tiny-2312",
        "mistralai/mistral-small-2402",
        "mistralai/mistral-medium-2312",
        "mistralai/mistral-large-2402",
    ),
)

# Flat list of ("<Provider> / <Model>", "<provider>/<model>") pairs covering
# every provider. The list is assembled from one group per provider; the groups
# are concatenated in the order written, so element order is significant.
MODELS = (
    # OpenAI
    [
        ("OpenAI / GPT-4o", "openai/gpt-4o"),
        ("OpenAI / GPT-4-Turbo", "openai/gpt-4-turbo"),
        ("OpenAI / GPT-4", "openai/gpt-4"),
        ("OpenAI / GPT-3.5-Turbo", "openai/gpt-3.5-turbo"),
    ]
    # Anthropic
    + [
        ("Anthropic / Claude 3 Opus", "anthropic/claude-3-opus-20240229"),
        ("Anthropic / Claude 3 Sonnet", "anthropic/claude-3-sonnet-20240229"),
        ("Anthropic / Claude 3 Haiku", "anthropic/claude-3-haiku-20240307"),
        ("Anthropic / Claude 2.1", "anthropic/claude-2.1"),
        ("Anthropic / Claude 2.0", "anthropic/claude-2.0"),
        ("Anthropic / Claude Instant 1.2", "anthropic/claude-instant-1.2"),
    ]
    # Mistral AI
    + [
        ("Mistral AI / Mistral 7B", "mistralai/open-mistral-7b"),
        ("Mistral AI / Mixtral 8x7B", "mistralai/open-mixtral-8x7b"),
        ("Mistral AI / Mixtral 8x22B", "mistralai/open-mixtral-8x22b"),
        ("Mistral AI / Tiny", "mistralai/mistral-tiny-2312"),
        ("Mistral AI / Small", "mistralai/mistral-small-2402"),
        ("Mistral AI / Medium", "mistralai/mistral-medium-2312"),
        ("Mistral AI / Large", "mistralai/mistral-large-2402"),
    ]
    # Meta (identifiers carry a "huggingface_hub/" prefix)
    + [
        ("Meta / Llama 3 8B", "huggingface_hub/meta-llama/Meta-Llama-3-8B"),
        ("Meta / Llama 3 70B", "huggingface_hub/meta-llama/Meta-Llama-3-70B"),
        ("Meta / Llama 2 7B", "huggingface_hub/meta-llama/Llama-2-7b-hf"),
        ("Meta / Llama 2 13B", "huggingface_hub/meta-llama/Llama-2-13b-hf"),
        ("Meta / Llama 2 70B", "huggingface_hub/meta-llama/Llama-2-70b-hf"),
    ]
    # Cohere
    + [
        ("Cohere / Command Light", "cohere/command-light"),
        ("Cohere / Command", "cohere/command"),
        ("Cohere / Command R", "cohere/command-r"),
        ("Cohere / Command R+", "cohere/command-r-plus"),
    ]
)