File size: 1,478 Bytes
bfaed46 6c097a6 dbd7ab9 bfaed46 51bd170 bfaed46 dbd7ab9 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 |
# fly.toml app configuration file generated for medical-transcription-cpu on 2024-01-22T15:15:29-06:00
#
# See https://fly.io/docs/reference/configuration/ for information about how to use this file.
#
# Name of the Fly app this configuration belongs to.
app = "medical-transcription-cpu"
# Region code of the app's primary region.
primary_region = "ord"
# Signal delivered to the app process when a machine is asked to stop.
kill_signal = "SIGTERM"
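# TODO: To run on a GPU, enable the `vm.size` line below and install the
# necessary CUDA packages in the Dockerfile. The volumes will also need to be
# recreated to match the GPU kind.
# NOTE: `vm.size` cannot coexist with the `[[vm]]` section later in this file
# (TOML rejects a name defined both as a table and as an array of tables), so
# remove that section, or set `size` inside it instead, when enabling this.
# See https://fly.io/docs/gpus/gpu-quickstart/
# and https://fly.io/docs/gpus/getting-started-gpus/
# vm.size = "a100-40gb"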
# No build options are set in this file; the table is left empty.
[build]
# Disabled: uncomment both lines below to run /app/bin/migrate as the
# release command on deploy.
# [deploy]
# release_command = "/app/bin/migrate"
# Volume "data" mounted at /data. The cache directories configured in [env]
# all live under this path.
[[mounts]]
source = "data"
destination = "/data"
# Size requested when the volume is first created.
initial_size = "40gb"
# Environment variables passed to the app. Every value must be a string.
[env]
# Erlang VM flags: run distribution over IPv6 TCP (`-proto_dist inet6_tcp`) and
# set the suggested stack size for dirty I/O scheduler threads to 128 kilowords
# (`+sssdio 128`).
ELIXIR_ERL_OPTIONS = "-proto_dist inet6_tcp +sssdio 128"
# Cache directories, all placed under the /data mount so they sit on the
# volume rather than in the image (presumably to survive redeploys; confirm).
AUDIO_TAGGER_CACHE_DIR = "/data/cache/audio_tagger"
BUMBLEBEE_CACHE_DIR = "/data/cache/bumblebee"
XLA_CACHE_DIR = "/data/cache/xla"
# GPU only: leave disabled for the CPU deployment.
# XLA_TARGET = "cuda120"
# Public hostname of the app (presumably read by the Phoenix endpoint config; confirm).
PHX_HOST = "medical-transcription-cpu.fly.dev"
# Same port as `internal_port` under [http_service]; keep the two in sync.
PORT = "8080"
# HTTP service routed to the app on internal port 8080 (the same value as
# PORT in [env]), with plain HTTP redirected to HTTPS.
[http_service]
internal_port = 8080
force_https = true
# Automatic stopping and starting of machines are both switched off.
auto_stop_machines = false
auto_start_machines = false
min_machines_running = 0
processes = ["app"]
# Load is measured in concurrent connections; the soft and hard limits are
# set to the same value.
[http_service.concurrency]
type = "connections"
hard_limit = 1000
soft_limit = 1000
# Machine size for this deployment: 1 shared CPU with 2048 MB of RAM.
[[vm]]
cpu_kind = "shared"
cpus = 1
memory_mb = 2048
# Generating the vector embeddings for the ICD-9 code list needs more RAM than
# configured above. Scale the machine up with, for example:
# fly scale vm shared-cpu-8x --memory 16384
|