📦 Initialize Geulbeot structure and merge Prompts & test projects

This commit is contained in:
2026-03-05 11:32:29 +09:00
commit 555a954458
687 changed files with 205247 additions and 0 deletions

View File

@@ -0,0 +1,13 @@
def clean_text(text):
replacements = {
' ': ' ', '‘': "'", '’': "'", '“': '"', '”': '"',
'&amp;': '&', '&lt;': '<', '&gt;': '>', '&#39;': "'",
'&quot;' : "'", '&middot;': "'"
}
for entity, replacement in replacements.items():
text = text.replace(entity, replacement)
text = re.sub(r'<[^>]+>', '', text)
text = re.sub(r'\(엔지니어링데일리\).*?기자=', '', text) # (엔지니어링데일리) *** 기자= 패턴 삭제
text = re.sub(r'\[국토일보\s.*?