asmashayea committed on
Commit
d472db4
·
1 Parent(s): 4556147
Files changed (1) hide show
  1. inference.py +23 -4
inference.py CHANGED
@@ -122,10 +122,29 @@ def infer_araberta(text):
122
  "sentiment": sentiment_map.get(current_sentiment, current_sentiment)
123
  })
124
 
125
- token_predictions = [
126
- {"token": token, "label": label}
127
- for token, label in zip(clean_tokens, clean_labels)
128
- ]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
129
 
130
  return {
131
  "aspects": aspects,
 
122
  "sentiment": sentiment_map.get(current_sentiment, current_sentiment)
123
  })
124
 
125
+ token_predictions = []
126
+ merged_token = ""
127
+ merged_label = None
128
+
129
+ for token, label in zip(clean_tokens, clean_labels):
130
+ if token.startswith("##"):
131
+ merged_token += token[2:]
132
+ else:
133
+ if merged_token:
134
+ token_predictions.append({
135
+ "token": merged_token,
136
+ "label": merged_label
137
+ })
138
+ merged_token = token
139
+ merged_label = label
140
+
141
+ # Add last token
142
+ if merged_token:
143
+ token_predictions.append({
144
+ "token": merged_token,
145
+ "label": merged_label
146
+ })
147
+
148
 
149
  return {
150
  "aspects": aspects,