File size: 8,935 Bytes
ecfb771
a016519
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
[
    {
        "name": "GPT-4",
        "description": "A large language model capable of understanding and generating human-like text.",
        "dateOfRelease": "2023-03-14",
        "developer": "OpenAI",
        "use_case": "Natural language understanding and generation.",
        "impact": "Enhanced capabilities in various applications, including chatbots and content creation."
    },
    {
        "name": "DALL·E 3",
        "description": "An AI system that can generate realistic images and art from textual descriptions.",
        "dateOfRelease": "2023-09-20",
        "developer": "OpenAI",
        "use_case": "Text-to-image generation for creative and design purposes.",
        "impact": "Enabled users to create detailed and diverse images from textual prompts."
    },
    {
        "name": "Midjourney",
        "description": "An AI program that creates images from textual descriptions.",
        "dateOfRelease": "2022-07-12",
        "developer": "Midjourney, Inc.",
        "use_case": "Artistic image generation based on user prompts.",
        "impact": "Empowered artists and creators to generate unique visuals through AI."
    },
    {
        "name": "Stable Diffusion",
        "description": "A deep learning model capable of generating detailed images from text prompts.",
        "dateOfRelease": "2022-08-22",
        "developer": "Stability AI",
        "use_case": "Open-source text-to-image generation.",
        "impact": "Provided an accessible tool for generating images, fostering innovation in AI art."
    },
    {
        "name": "Gemini 1.0 Ultra",
        "description": "A large multimodal model for complex tasks, including text and image understanding.",
        "dateOfRelease": "2024-02-08",
        "developer": "Google AI",
        "use_case": "Multimodal reasoning and content generation.",
        "impact": "Advanced AI capabilities in understanding and generating diverse content types."
    },
    {
        "name": "LLaMA",
        "description": "A collection of foundation language models ranging from 7B to 65B parameters.",
        "dateOfRelease": "2023-02-24",
        "developer": "Meta AI",
        "use_case": "Research in natural language processing.",
        "impact": "Contributed to the development of efficient and accessible language models."
    },
    {
        "name": "Gen-2",
        "description": "A text-to-video generative AI model that creates videos from textual descriptions.",
        "dateOfRelease": "2023-04-04",
        "developer": "Runway",
        "use_case": "Video content creation from text prompts.",
        "impact": "Enabled creators to produce videos without traditional filming equipment."
    },
    {
        "name": "Make-A-Video",
        "description": "An AI system that generates videos from textual input.",
        "dateOfRelease": "2022-09-29",
        "developer": "Meta Platforms",
        "use_case": "Text-to-video generation for creative applications.",
        "impact": "Pioneered AI-driven video generation, expanding creative possibilities."
    },
    {
        "name": "Imagen",
        "description": "A text-to-image diffusion model with high fidelity and deep language understanding.",
        "dateOfRelease": "2022-05-23",
        "developer": "Google Research",
        "use_case": "High-quality image generation from text.",
        "impact": "Set new benchmarks in photorealistic image generation from textual descriptions."
    },
    {
        "name": "Codey",
        "description": "An AI model designed for code generation and understanding.",
        "dateOfRelease": "2023-06-15",
        "developer": "Google AI",
        "use_case": "Assisting developers in writing and understanding code.",
        "impact": "Improved developer productivity by providing AI-driven coding assistance."
    },
    {
        "name": "Chirp",
        "description": "A speech-to-text model that transcribes audio into text.",
        "dateOfRelease": "2023-08-01",
        "developer": "Google AI",
        "use_case": "Transcription of spoken language into text.",
        "impact": "Enhanced accessibility and usability in applications requiring speech recognition."
    },
    {
        "name": "Veo",
        "description": "A generative AI model that creates high-definition video from text, image, and video prompts.",
        "dateOfRelease": "2024-05-14",
        "developer": "Google AI",
        "use_case": "Generating video content from text prompts.",
        "impact": "Expanded AI-driven video creation for filmmakers and other creators."
    },
    {
        "name": "MedLM",
        "description": "A language model specialized in medical knowledge and terminology.",
        "dateOfRelease": "2023-09-30",
        "developer": "Google Health",
        "use_case": "Assisting in medical documentation and information retrieval.",
        "impact": "Supported healthcare professionals with AI-driven medical language understanding."
    },
    {
        "name": "LearnLM",
        "description": "A language model tailored for educational content and applications.",
        "dateOfRelease": "2023-10-15",
        "developer": "Google Research",
        "use_case": "Enhancing educational tools with AI-driven language understanding.",
        "impact": "Facilitated the development of intelligent educational platforms and resources."
    },
    {
        "name": "SecLM",
        "description": "A language model focused on cybersecurity terminology and knowledge.",
        "dateOfRelease": "2023-12-01",
        "developer": "Google AI",
        "use_case": "Assisting in cybersecurity threat analysis and documentation.",
        "impact": "Enhanced cybersecurity efforts with AI-driven language understanding."
    },
    {
        "name": "Gemma",
        "description": "A family of lightweight open-weight language models built from the research and technology behind Gemini.",
        "dateOfRelease": "2024-02-21",
        "developer": "Google AI",
        "use_case": "Text generation applications that need to run on modest hardware or be fine-tuned locally.",
        "impact": "Made capable language models openly available to developers and researchers."
    },
    {
        "name": "CodeGemma",
        "description": "A code-specialized variant of Gemma designed for code completion and generation.",
        "dateOfRelease": "2024-04-09",
        "developer": "Google AI",
        "use_case": "Assisting developers with code completion, generation, and code-related chat.",
        "impact": "Improved coding efficiency through lightweight, openly available code models."
    },
    {
        "name": "DALL·E 2",
        "description": "An AI system that can create realistic images and art from textual descriptions.",
        "dateOfRelease": "2022-04-06",
        "developer": "OpenAI",
        "use_case": "Text-to-image generation.",
        "impact": "Enabled the creation of detailed images from textual prompts, bridging language and visual art."
    },
    {
        "name": "Gemini 1.0 Ultra",
        "description": "A multimodal AI model capable of handling text, images, audio, video, and code.",
        "dateOfRelease": "2024-02-08",
        "developer": "Google",
        "use_case": "Multimodal reasoning and complex coding.",
        "impact": "Enhanced AI's ability to process and reason across multiple types of data, improving versatility."
    },
    {
        "name": "PyramidFlow",
        "description": "An innovative text-to-video AI model that generates high-resolution videos from textual descriptions.",
        "dateOfRelease": "2023-11-15",
        "developer": "Research Community",
        "use_case": "Text-to-video generation.",
        "impact": "Advanced the field of video generation, enabling the creation of videos directly from text prompts."
    },
    {
        "name": "LLaMA 2",
        "description": "A large language model developed by Meta, designed to generate human-like text.",
        "dateOfRelease": "2023-07-18",
        "developer": "Meta",
        "use_case": "Natural language processing.",
        "impact": "Contributed to the diversity of available LLMs, promoting research and development in AI language models."
    },
    {
        "name": "Nova Pro",
        "description": "An AI foundation model optimized for multimodal capabilities, including text and image processing.",
        "dateOfRelease": "2024-12-03",
        "developer": "Amazon",
        "use_case": "Multimodal AI applications.",
        "impact": "Expanded AI capabilities in processing and integrating multiple data types, enhancing application versatility."
    },
    {
        "name": "o1",
        "description": "A large language model trained to reason through a problem step by step before producing its answer.",
        "dateOfRelease": "2024-12-01",
        "developer": "OpenAI",
        "use_case": "Advanced reasoning and problem-solving.",
        "impact": "Marked a shift towards AI systems with human-like thinking, enhancing problem-solving abilities."
    }
]