Spaces:
Running
Running
jadehardouin
committed on
Commit
•
847028b
1
Parent(s):
2db3504
Update models.py
Browse files
models.py
CHANGED
@@ -144,7 +144,11 @@ class OpenSourceLlama2Model(BaseTCOModel):
|
|
144 |
input_tokens_cost_per_token = 0.00052
|
145 |
r = maxed_out / 100
|
146 |
return input_tokens_cost_per_token * 0.65 / r, output_tokens_cost_per_token * 0.65/ r
|
147 |
-
|
|
|
|
|
|
|
|
|
148 |
self.vm = gr.Textbox(value="2x A100 80GB NVLINK",
|
149 |
visible=False,
|
150 |
label="Instance of VM with GPU",
|
@@ -171,11 +175,6 @@ class OpenSourceLlama2Model(BaseTCOModel):
|
|
171 |
interactive=False
|
172 |
)
|
173 |
self.maxed_out.change(on_maxed_out_change, inputs=[self.maxed_out, self.input_tokens_cost_per_token, self.output_tokens_cost_per_token], outputs=[self.input_tokens_cost_per_token, self.output_tokens_cost_per_token])
|
174 |
-
self.source = gr.Markdown("""<span style="font-size: 16px; font-weight: 600; color: #212529;">Source</span>""")
|
175 |
-
self.info = gr.Markdown("The cost per input and output tokens values above are from [these benchmark results](https://www.cursor.so/blog/llama-inference#user-content-fn-llama-paper)",
|
176 |
-
label="Source",
|
177 |
-
interactive=False,
|
178 |
-
visible=False)
|
179 |
|
180 |
self.labor = gr.Number(10000, visible=False,
|
181 |
label="($) Labor cost per month",
|
|
|
144 |
input_tokens_cost_per_token = 0.00052
|
145 |
r = maxed_out / 100
|
146 |
return input_tokens_cost_per_token * 0.65 / r, output_tokens_cost_per_token * 0.65/ r
|
147 |
+
|
148 |
+
self.source = gr.Markdown("""<span style="font-size: 16px; font-weight: 600; color: #212529;">Source</span>""")
|
149 |
+
self.info = gr.Markdown("The cost per input and output tokens values below are from [these benchmark results](https://www.cursor.so/blog/llama-inference#user-content-fn-llama-paper) that were obtained using the following initial configurations.",
|
150 |
+
interactive=False,
|
151 |
+
visible=False)
|
152 |
self.vm = gr.Textbox(value="2x A100 80GB NVLINK",
|
153 |
visible=False,
|
154 |
label="Instance of VM with GPU",
|
|
|
175 |
interactive=False
|
176 |
)
|
177 |
self.maxed_out.change(on_maxed_out_change, inputs=[self.maxed_out, self.input_tokens_cost_per_token, self.output_tokens_cost_per_token], outputs=[self.input_tokens_cost_per_token, self.output_tokens_cost_per_token])
|
|
|
|
|
|
|
|
|
|
|
178 |
|
179 |
self.labor = gr.Number(10000, visible=False,
|
180 |
label="($) Labor cost per month",
|