jadehardouin committed on
Commit
847028b
1 Parent(s): 2db3504

Update models.py

Browse files
Files changed (1) hide show
  1. models.py +5 -6
models.py CHANGED
@@ -144,7 +144,11 @@ class OpenSourceLlama2Model(BaseTCOModel):
144
  input_tokens_cost_per_token = 0.00052
145
  r = maxed_out / 100
146
  return input_tokens_cost_per_token * 0.65 / r, output_tokens_cost_per_token * 0.65/ r
147
-
 
 
 
 
148
  self.vm = gr.Textbox(value="2x A100 80GB NVLINK",
149
  visible=False,
150
  label="Instance of VM with GPU",
@@ -171,11 +175,6 @@ class OpenSourceLlama2Model(BaseTCOModel):
171
  interactive=False
172
  )
173
  self.maxed_out.change(on_maxed_out_change, inputs=[self.maxed_out, self.input_tokens_cost_per_token, self.output_tokens_cost_per_token], outputs=[self.input_tokens_cost_per_token, self.output_tokens_cost_per_token])
174
- self.source = gr.Markdown("""<span style="font-size: 16px; font-weight: 600; color: #212529;">Source</span>""")
175
- self.info = gr.Markdown("The cost per input and output tokens values above are from [these benchmark results](https://www.cursor.so/blog/llama-inference#user-content-fn-llama-paper)",
176
- label="Source",
177
- interactive=False,
178
- visible=False)
179
 
180
  self.labor = gr.Number(10000, visible=False,
181
  label="($) Labor cost per month",
 
144
  input_tokens_cost_per_token = 0.00052
145
  r = maxed_out / 100
146
  return input_tokens_cost_per_token * 0.65 / r, output_tokens_cost_per_token * 0.65/ r
147
+
148
+ self.source = gr.Markdown("""<span style="font-size: 16px; font-weight: 600; color: #212529;">Source</span>""")
149
+ self.info = gr.Markdown("The cost per input and output tokens values below are from [these benchmark results](https://www.cursor.so/blog/llama-inference#user-content-fn-llama-paper) that were obtained using the following initial configurations.",
150
+ interactive=False,
151
+ visible=False)
152
  self.vm = gr.Textbox(value="2x A100 80GB NVLINK",
153
  visible=False,
154
  label="Instance of VM with GPU",
 
175
  interactive=False
176
  )
177
  self.maxed_out.change(on_maxed_out_change, inputs=[self.maxed_out, self.input_tokens_cost_per_token, self.output_tokens_cost_per_token], outputs=[self.input_tokens_cost_per_token, self.output_tokens_cost_per_token])
 
 
 
 
 
178
 
179
  self.labor = gr.Number(10000, visible=False,
180
  label="($) Labor cost per month",