AIRider committed on
Commit
cc5f243
·
verified ·
1 Parent(s): 3991a94

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +29 -7
app.py CHANGED
@@ -146,12 +146,35 @@ def generate_blog_post(query, prompt_template):
146
  frequency_penalty = 0.5
147
  presence_penalty = 0
148
 
149
- # 불필요한 표현 패턴 정의 (하드코딩)
150
- unwanted_patterns = [
151
- re.compile(r'\b여러분[,.]?\s*', re.IGNORECASE),
152
- re.compile(r'\b(마지막으로|결론적으로|결국|종합적으로|따라서|마무리|요약)[,.]?\s*', re.IGNORECASE)
 
 
 
 
 
 
 
153
  ]
154
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
155
  # 초기 프롬프트 구성
156
  base_prompt = prompt_template + f"""
157
  주제: {query}
@@ -193,9 +216,8 @@ def generate_blog_post(query, prompt_template):
193
  # 모델이 생성한 답변 추출
194
  generated_post = response['choices'][0]['message']['content'].strip()
195
 
196
- # 불필요한 표현 제거 (코드에서 하드코딩으로 처리)
197
- for pattern in unwanted_patterns:
198
- generated_post = pattern.sub('', generated_post)
199
 
200
  # 생성된 글의 실제 문자 수 계산
201
  actual_char_length = len(generated_post)
 
146
  frequency_penalty = 0.5
147
  presence_penalty = 0
148
 
149
+ # 불필요한 표현 리스트
150
+ unwanted_phrases = [
151
+ '여러분',
152
+ '최근',
153
+ '마지막으로',
154
+ '결론적으로',
155
+ '결국',
156
+ '종합적으로',
157
+ '따라서',
158
+ '마무리',
159
+ '요약'
160
  ]
161
 
162
+ # 불필요한 표현 제거 함수
163
+ def remove_unwanted_phrases(text):
164
+ for phrase in unwanted_phrases:
165
+ # 불필요한 표현이 텍스트에 포함되어 있는 동안 반복
166
+ while phrase in text:
167
+ index = text.find(phrase)
168
+ # 불필요한 표현 이전의 마지막 공백 위치 찾기
169
+ prev_space = text.rfind(' ', 0, index)
170
+ # prev_space๊ฐ€ -1์ด๋ฉด ๋ฌธ์ž์—ด์˜ ์ฒ˜์Œ๋ถ€ํ„ฐ ์‹œ์ž‘
171
+ start = prev_space if prev_space != -1 else 0
172
+ # 불필요한 표현의 끝 위치
173
+ end = index + len(phrase)
174
+ # 해당 부분 문자열 제거
175
+ text = text[:start] + text[end:]
176
+ return text
177
+
178
  # 초기 프롬프트 구성
179
  base_prompt = prompt_template + f"""
180
  주제: {query}
 
216
  # 모델이 생성한 답변 추출
217
  generated_post = response['choices'][0]['message']['content'].strip()
218
 
219
+ # 불필요한 표현 제거 함수 적용
220
+ generated_post = remove_unwanted_phrases(generated_post)
 
221
 
222
  # 생성된 글의 실제 문자 수 계산
223
  actual_char_length = len(generated_post)