timgremore
committed on
Commit
•
c872965
1
Parent(s):
d77a9fd
feat: Mix task to generate ICD10 code embeddings
Browse files- lib/mix/tasks/embedding.ex +21 -0
lib/mix/tasks/embedding.ex
ADDED
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
defmodule Mix.Tasks.Embedding do
  @moduledoc """
  Generate embeddings from ICD10 codes.

  The task starts the application and then passes the result of
  `AudioTagger.SampleData.icd10_codes/0` to
  `AudioTagger.Classifier.SemanticSearch.precalculate_label_vectors/2`,
  together with the path of `icd10_vector_tensors.bin` inside the system
  temporary directory.

  If a file already exists at that path, the task prints a notice and does
  nothing else, so delete the file to force regeneration.

  ## Usage

      mix embedding
  """

  use Mix.Task

  @shortdoc "Generates icd10_vector_tensors.bin in system tmp"

  @doc """
  Runs the task. Command-line arguments are ignored.

  Raises if no writable temporary directory can be found.
  """
  @impl Mix.Task
  def run(_) do
    # The application must be running before the classifier code is called.
    Mix.Task.run("app.start")

    # tmp_dir!/0 raises a descriptive error when no writable temp directory
    # exists; tmp_dir/0 would return nil and make Path.join/2 fail obscurely.
    tmpfile = Path.join(System.tmp_dir!(), "icd10_vector_tensors.bin")

    if File.exists?(tmpfile) do
      # NOTE(review): only existence is checked, not completeness — a file left
      # behind by an interrupted run would also be treated as valid. Confirm.
      IO.puts("Found pre-calculated ICD-10 vector embeddings. Skipping embedding.")
    else
      AudioTagger.SampleData.icd10_codes()
      |> AudioTagger.Classifier.SemanticSearch.precalculate_label_vectors(tmpfile)

      IO.inspect(tmpfile, label: "Wrote vector embeddings")
    end
  end
end
|