HeshamHaroon committed on
Commit
ab010ed
1 Parent(s): ca4c188

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -5
app.py CHANGED
@@ -14,20 +14,20 @@ def load_tokenizer(tokenizer_choice):
14
  "aranizer_sp64k": aranizer_sp64k.get_tokenizer(),
15
  "aranizer_sp86k": aranizer_sp86k.get_tokenizer(),
16
  }
17
-
18
  return tokenizer_map.get(tokenizer_choice, None)
19
 
20
  def tokenize_and_encode_and_embed(text, tokenizer_choice):
21
- tokenizer = get_tokenizer(tokenizer_choice)
22
  if tokenizer:
23
  # Example methods. Replace with actual methods from your tokenizer
24
  tokens = tokenizer.tokenize(text)
25
  encoded_output = tokenizer.encode(text, add_special_tokens=True)
26
  decoded_text = tokenizer.decode(encoded_output)
27
-
28
  # Example embedding (replace with actual embedding generation from your model)
29
  embeddings = [random() for _ in range(10)] # Example 10-dimensional embedding vector
30
-
31
  return " ".join(tokens), str(encoded_output), decoded_text, embeddings
32
  else:
33
  return "Tokenizer not loaded correctly", "", "", []
@@ -48,4 +48,4 @@ demo = gr.Interface(
48
  description="حدد نوع المحلل اللفظي وأدخل نصًا لرؤية النتائج ومتجه التضمين.",
49
  )
50
 
51
- demo.launch()
 
14
  "aranizer_sp64k": aranizer_sp64k.get_tokenizer(),
15
  "aranizer_sp86k": aranizer_sp86k.get_tokenizer(),
16
  }
17
+
18
  return tokenizer_map.get(tokenizer_choice, None)
19
 
20
  def tokenize_and_encode_and_embed(text, tokenizer_choice):
21
+ tokenizer = load_tokenizer(tokenizer_choice) # Use load_tokenizer here
22
  if tokenizer:
23
  # Example methods. Replace with actual methods from your tokenizer
24
  tokens = tokenizer.tokenize(text)
25
  encoded_output = tokenizer.encode(text, add_special_tokens=True)
26
  decoded_text = tokenizer.decode(encoded_output)
27
+
28
  # Example embedding (replace with actual embedding generation from your model)
29
  embeddings = [random() for _ in range(10)] # Example 10-dimensional embedding vector
30
+
31
  return " ".join(tokens), str(encoded_output), decoded_text, embeddings
32
  else:
33
  return "Tokenizer not loaded correctly", "", "", []
 
48
  description="حدد نوع المحلل اللفظي وأدخل نصًا لرؤية النتائج ومتجه التضمين.",
49
  )
50
 
51
+ demo.launch()