HeshamHaroon committed on
Commit
91eabe4
1 Parent(s): 778be61

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -1
app.py CHANGED
@@ -69,8 +69,11 @@ def compare_tokenizers(tokenizer_name, text):
69
  encoded_output = tokenizer.encode(text, add_special_tokens=True)
70
  decoded_text = tokenizer.decode(encoded_output, skip_special_tokens=True)
71
 
 
 
 
72
  # Prepare the results to be displayed in HTML format
73
- tokens_html = "".join([f"<span style='background-color:#D3D3D3; padding:2px; margin:2px; border-radius:5px;'>{token}</span>" for token in tokens])
74
  encoded_html = "".join([f"<span style='background-color:#ADD8E6; padding:2px; margin:2px; border-radius:5px;'>{token}</span>" for token in encoded_output])
75
  decoded_html = f"<div style='background-color:#90EE90; padding:10px; border-radius:5px;'>{decoded_text}</div>"
76
 
 
69
  encoded_output = tokenizer.encode(text, add_special_tokens=True)
70
  decoded_text = tokenizer.decode(encoded_output, skip_special_tokens=True)
71
 
72
+ # Ensure the tokens are properly decoded
73
+ tokens_display = [token for token in tokens]
74
+
75
  # Prepare the results to be displayed in HTML format
76
+ tokens_html = "".join([f"<span style='background-color:#D3D3D3; padding:2px; margin:2px; border-radius:5px;'>{token}</span>" for token in tokens_display])
77
  encoded_html = "".join([f"<span style='background-color:#ADD8E6; padding:2px; margin:2px; border-radius:5px;'>{token}</span>" for token in encoded_output])
78
  decoded_html = f"<div style='background-color:#90EE90; padding:10px; border-radius:5px;'>{decoded_text}</div>"
79