From 0833d28fad68cbbfc1b6fba94e9f0d2042d676f9 Mon Sep 17 00:00:00 2001 From: Ajda Pretnar Date: Tue, 6 Jul 2021 15:29:26 +0200 Subject: [PATCH] Import Documents: Read metas as the right type --- orangecontrib/text/import_documents.py | 9 +++++---- 1 file changed, 5 insertions(+), 4 deletions(-) diff --git a/orangecontrib/text/import_documents.py b/orangecontrib/text/import_documents.py index 1c8684f65..c71107bb2 100644 --- a/orangecontrib/text/import_documents.py +++ b/orangecontrib/text/import_documents.py @@ -29,7 +29,8 @@ import serverfiles -from Orange.data import DiscreteVariable, Domain, StringVariable +from Orange.data import DiscreteVariable, Domain, StringVariable, \ + guess_data_type from Orange.data.io import detect_encoding, UrlReader as CoreUrlReader from Orange.data.util import get_unique_names from Orange.util import Registry @@ -346,12 +347,12 @@ def _add_metadata(self, corpus: Corpus) -> Corpus: df = df[~df.index.duplicated(keep='first')] filtered = df.reindex(path_column) for column in filtered.columns: + _, vals, var_type = guess_data_type(filtered[column]) corpus = corpus.add_column( - StringVariable(get_unique_names(corpus.domain, column)), - filtered[column].to_numpy(), + var_type(get_unique_names(corpus.domain, column)), + vals, to_metas=True ) - return corpus @staticmethod