etchen committed on
Commit
5ee6809
·
verified ·
1 Parent(s): 0f4cad5

Update TaiwaneseHokkien.py

Browse files
Files changed (1) hide show
  1. TaiwaneseHokkien.py +7 -2
TaiwaneseHokkien.py CHANGED
@@ -4,6 +4,8 @@ from transformers import pipeline
4
  model_repo_id = "emlinking/wav2vec2-large-xls-r-300m-tsm-asr-v6"
5
  util = Converter()
6
  def get_initial_length(s):
 
 
7
  if len(s) >= 3 and s[2] == 'h':
8
  return 3
9
  elif len(s) >= 2 and s[1] in ['s', 'h']:
@@ -29,7 +31,10 @@ class TaiwaneseHokkien(Language):
29
  til = get_initial_length(target_syl)
30
  uil = get_initial_length(user_syl)
31
  if target_syl[:til] != user_syl[:uil]:
32
- result.append((user_syl[:uil], 'initial error'))
 
 
 
33
  else:
34
  result.append((user_syl[:uil], None))
35
  if target_syl[til:-1] != user_syl[uil:-1]:
@@ -60,4 +65,4 @@ class TaiwaneseHokkien(Language):
60
  return result
61
  @property
62
  def compare_colors(self):
63
- return {'tone error': 'red', 'initial error': 'blue', 'rime error': 'green', 'missing syllables': 'yellow', 'extra syllables': 'stone'}
 
4
  model_repo_id = "emlinking/wav2vec2-large-xls-r-300m-tsm-asr-v6"
5
  util = Converter()
6
  def get_initial_length(s):
7
+ if s[0] in ['a', 'e', 'i', 'o', 'u']: return 0
8
+ if (len(s) == 3 and s[:2] == 'ng') or (len(s) == 2 and s[:1] == 'm'): return 0
9
  if len(s) >= 3 and s[2] == 'h':
10
  return 3
11
  elif len(s) >= 2 and s[1] in ['s', 'h']:
 
31
  til = get_initial_length(target_syl)
32
  uil = get_initial_length(user_syl)
33
  if target_syl[:til] != user_syl[:uil]:
34
+ if uil == 0:
35
+ result.append((' ', 'initial error'))
36
+ else:
37
+ result.append((user_syl[:uil], 'initial error'))
38
  else:
39
  result.append((user_syl[:uil], None))
40
  if target_syl[til:-1] != user_syl[uil:-1]:
 
65
  return result
66
  @property
67
  def compare_colors(self):
68
+ return {'tone error': 'red', 'initial error': 'blue', 'rime error': 'green', 'missing syllables': 'yellow', 'extra syllables': 'gray'}