Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -1,6 +1,7 @@
|
|
1 |
import streamlit as st
|
2 |
import langcodes
|
3 |
|
|
|
4 |
# https://huggingface.co/blog/streamlit-spaces
|
5 |
langtext = st.text_input("language lookup using https://github.com/rspeer/langcodes, see also https://r12a.github.io/app-subtags/", "english")
|
6 |
|
@@ -36,6 +37,22 @@ if lang is None:
|
|
36 |
lang = None
|
37 |
|
38 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
39 |
|
40 |
|
41 |
#st.write(f"langcodes found the following tag: {type(found)}") # a Language object
|
@@ -53,6 +70,13 @@ if lang is not None:
|
|
53 |
st.write(f"If it exists, the ISO 639 Code Tables entry for the T variant would be at https://iso639-3.sil.org/code/{t_variant}")
|
54 |
st.write(f"If it exists, the ISO 639 Code Tables entry for the B variant would be at https://iso639-3.sil.org/code/{b_variant}")
|
55 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
56 |
|
57 |
broader_tags = lang.broader_tags()
|
58 |
st.write(f"Broader tags for this language, if any: {broader_tags}")
|
1 |
import streamlit as st
|
2 |
import langcodes
|
3 |
|
4 |
+
|
5 |
# https://huggingface.co/blog/streamlit-spaces
|
6 |
langtext = st.text_input("language lookup using https://github.com/rspeer/langcodes, see also https://r12a.github.io/app-subtags/", "english")
|
7 |
|
37 |
lang = None
|
38 |
|
39 |
|
40 |
+
def pull_obsolete_codes(iso_code):
    """Scrape the SIL ISO 639-3 code page for ``iso_code`` and collect its codes.

    Fetches ``https://iso639-3.sil.org/code/<iso_code>``, takes the text of the
    ``.views-field-nothing`` element, and for every text line that mentions one
    of the code-set names ("639-1", "639-2/B", "639-2/T", "639-3") records the
    last whitespace-separated token on that line as the code for that set.

    Args:
        iso_code: Code to look up; interpolated into the URL as-is.

    Returns:
        A dict mapping each code-set name found on the page to the token that
        ended the line mentioning it. Empty when the page has no
        ``.views-field-nothing`` element or none of its lines mention a
        code-set name.

    Raises:
        Whatever ``HTMLSession.get`` raises on network failure; nothing is
        caught here.
    """
    # Function-scope import, as in the original.
    from requests_html import HTMLSession

    code_set_names = ("639-1", "639-2/B", "639-2/T", "639-3")

    # The context manager closes the session once the text has been extracted.
    with HTMLSession() as session:
        response = session.get(f"https://iso639-3.sil.org/code/{iso_code}")
        matches = response.html.find(".views-field-nothing", clean=True)
        # NOTE(review): the original rebound `lines` on every match, so only the
        # last matching element was parsed; that is preserved here. Confirm the
        # page only ever has one such element. With no match the original left
        # `lines` unbound (NameError); an empty list yields an empty result.
        lines = matches[-1].text.splitlines() if matches else []

    obsolete_codes = {}
    for line in lines:
        for code_set_name in code_set_names:
            if code_set_name in line:
                # Debug trace to stdout, kept from the original.
                print(line)
                # The code is taken to be the last token on the line.
                code = line.split()[-1]
                print(code)
                obsolete_codes[code_set_name] = code
    return obsolete_codes
|
56 |
|
57 |
|
58 |
#st.write(f"langcodes found the following tag: {type(found)}") # a Language object
|
70 |
st.write(f"If it exists, the ISO 639 Code Tables entry for the T variant would be at https://iso639-3.sil.org/code/{t_variant}")
|
71 |
st.write(f"If it exists, the ISO 639 Code Tables entry for the B variant would be at https://iso639-3.sil.org/code/{b_variant}")
|
72 |
|
73 |
+
|
74 |
+
# Ethnologue prefers the T variant for both German (deu) and French
|
75 |
+
obsolete_codes = pull_obsolete_codes(t_variant)
|
76 |
+
|
77 |
+
|
78 |
+
|
79 |
+
|
80 |
|
81 |
broader_tags = lang.broader_tags()
|
82 |
st.write(f"Broader tags for this language, if any: {broader_tags}")
|