From fb7fc8006a11d951dc8de8c34e3ba1299fec8de6 Mon Sep 17 00:00:00 2001 From: Timofey Arkhangelskiy <timarkh@gmail.com> Date: Tue, 24 Jan 2023 13:01:44 +0100 Subject: [PATCH] Fix Tsakorpus advanced view offsets --- NOTE(review): in the first hunk the added line appends el.tail (the value already checked for None by the enclosing condition) to record.textNoHighlight, mirroring what is appended to record.text; the unchecked el.text could be None there. In the later hunks the append of el.text to record.textNoHighlight is moved from before the advancedHits segment handling to after it. common/tsakorpus_response_parser.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/common/tsakorpus_response_parser.py b/common/tsakorpus_response_parser.py index 7658d68..10d7e68 100644 --- a/common/tsakorpus_response_parser.py +++ b/common/tsakorpus_response_parser.py @@ -83,6 +83,7 @@ class TsakorpusResponseParser: # (title, author etc.) if el.tail is not None: record.text += el.tail.strip('\n\t ') + record.textNoHighlight += el.tail.strip('\n\t ') return if el.text is not None: @@ -90,7 +91,6 @@ class TsakorpusResponseParser: if 'class' in el.attrib and re.search('\\bword\\b', el.attrib['class']) is not None: if re.search('\\bwmatch\\b', el.attrib['class']) is not None: bMatch = True - record.textNoHighlight += el.text if advancedHits: segID = 's' + str(len(record.segments)) segment = { @@ -101,6 +101,7 @@ class TsakorpusResponseParser: record.segments.append(segment) if 'data-ana' in el.attrib: self.parse_annotation(el.attrib['data-ana'], segID, record) + record.textNoHighlight += el.text if bMatch: record.text += '<hits:Hit>' + el.text + '</hits:Hit>' else: -- GitLab