diff --git a/orangecontrib/text/import_documents.py b/orangecontrib/text/import_documents.py index 840a66366..e5feee97f 100644 --- a/orangecontrib/text/import_documents.py +++ b/orangecontrib/text/import_documents.py @@ -138,7 +138,7 @@ def read_file(self): for lt_obj in layout: if isinstance(lt_obj, LTTextBox) or isinstance(lt_obj, LTTextLine): extracted_text.append(lt_obj.get_text()) - self.content = ' '.join(extracted_text) + self.content = ' '.join(extracted_text).replace('\x00', '') class XmlReader(Reader):