ginipick committed on
Commit
f5e28c7
·
verified ·
1 Parent(s): f562d6f

Update src/ASL_gloss_functions.py

Browse files
Files changed (1) hide show
  1. src/ASL_gloss_functions.py +6 -19
src/ASL_gloss_functions.py CHANGED
@@ -56,13 +56,11 @@ def question_type(doc):
56
  except IndexError:
57
  return None
58
 
59
- # add question id as a prefix
60
  def process_sentence(doc):
61
  nms = {
62
  "wh-question": "wh-q",
63
  "yes-no-question": "y/n-q"
64
  }
65
-
66
  classifiers = {
67
  "car": "CL:3",
68
  "person": "CL:1"
@@ -70,11 +68,12 @@ def process_sentence(doc):
70
 
71
  glossed_sentence = []
72
  for token in doc:
73
- ## utilize token.lemma_, not .text
74
- #word = token.text.lower()
75
  word = token.lemma_.lower()
76
 
77
- if word in ["i", "me"]:
 
 
 
78
  glossed_word = handle_indexing("I", 1)
79
  elif word in ["you"]:
80
  glossed_word = handle_indexing("YOU", 2)
@@ -82,18 +81,6 @@ def process_sentence(doc):
82
  glossed_word = classifiers[word]
83
  else:
84
  glossed_word = gloss_word(word)
 
85
  glossed_word = skip_stop_words(glossed_word)
86
-
87
- glossed_sentence.append(glossed_word)
88
-
89
- for gloss in glossed_sentence:
90
- if gloss.lower() in time_words:
91
- # move gloss at beginning
92
- glossed_sentence.insert(0, glossed_sentence.pop(glossed_sentence.index(gloss)))
93
- break
94
-
95
- type_doc = question_type(doc)
96
- if type_doc != None:
97
- glossed_sentence.insert(0, nms[type_doc])
98
-
99
- return " ".join(glossed_sentence)
 
56
  except IndexError:
57
  return None
58
 
 
59
  def process_sentence(doc):
60
  nms = {
61
  "wh-question": "wh-q",
62
  "yes-no-question": "y/n-q"
63
  }
 
64
  classifiers = {
65
  "car": "CL:3",
66
  "person": "CL:1"
 
68
 
69
  glossed_sentence = []
70
  for token in doc:
 
 
71
  word = token.lemma_.lower()
72
 
73
+ # Handle proper nouns (고유명사 처리)
74
+ if token.pos_ == "PROPN":
75
+ glossed_word = token.text.upper()
76
+ elif word in ["i", "me"]:
77
  glossed_word = handle_indexing("I", 1)
78
  elif word in ["you"]:
79
  glossed_word = handle_indexing("YOU", 2)
 
81
  glossed_word = classifiers[word]
82
  else:
83
  glossed_word = gloss_word(word)
84
+
85
  glossed_word = skip_stop_words(glossed_word)
86
+ glossed_sentence.append(glossed_word)