fix: qa regex (#1738)

This commit is contained in:
crazywoola
2023-12-11 15:53:37 +08:00
committed by GitHub
parent 8c451eb0e6
commit 994fceece3

View File

@@ -632,8 +632,8 @@ class IndexingRunner:
return text
def format_split_text(self, text):
-regex = r"Q\d+:\s*(.*?)\s*A\d+:\s*([\s\S]*?)(?=Q|$)"
-matches = re.findall(regex, text, re.MULTILINE)
+regex = r"Q\d+:\s*(.*?)\s*A\d+:\s*([\s\S]*?)(?=Q\d+:|$)"
+matches = re.findall(regex, text, re.UNICODE)
return [
{