Commit
e5aaf6d
1 Parent(s): b6678bf

Update app: include decoded text in the tokenize_text output

Browse files
Files changed (1) hide show
  1. app.py +3 -1
app.py CHANGED
@@ -6,7 +6,9 @@ def tokenize_text(text, tokenizer_name):
6
  tokenizer = AutoTokenizer.from_pretrained(tokenizer_name)
7
  tokenized_text = tokenizer.tokenize(text)
8
  input_ids = tokenizer.convert_tokens_to_ids(tokenized_text)
9
- return f"Tokenized Text: {tokenized_text}\nInput IDs: {input_ids}"
 
 
10
 
11
  # Define available tokenizers
12
  tokenizer_names = [
 
6
  tokenizer = AutoTokenizer.from_pretrained(tokenizer_name)
7
  tokenized_text = tokenizer.tokenize(text)
8
  input_ids = tokenizer.convert_tokens_to_ids(tokenized_text)
9
+ decoded_text = tokenizer.decode(input_ids) # Decode the input IDs
10
+ return f"Tokenized Text: {tokenized_text}\nInput IDs: {input_ids}\nDecoded Text: {decoded_text}"
11
+
12
 
13
  # Define available tokenizers
14
  tokenizer_names = [