fix: qa regex (#1738)

This commit is contained in:
crazywoola 2023-12-11 15:53:37 +08:00 committed by GitHub
parent 8c451eb0e6
commit 994fceece3
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

View File

@@ -632,8 +632,8 @@ class IndexingRunner:
return text
def format_split_text(self, text):
-regex = r"Q\d+:\s*(.*?)\s*A\d+:\s*([\s\S]*?)(?=Q|$)"
-matches = re.findall(regex, text, re.MULTILINE)
+regex = r"Q\d+:\s*(.*?)\s*A\d+:\s*([\s\S]*?)(?=Q\d+:|$)"
+matches = re.findall(regex, text, re.UNICODE)
return [
{