Skip to content

Commit

Permalink
Import Documents: Read metas as the right type
Browse files Browse the repository at this point in the history
  • Loading branch information
ajdapretnar committed Jul 8, 2021
1 parent b9b9612 commit 0833d28
Showing 1 changed file with 5 additions and 4 deletions.
9 changes: 5 additions & 4 deletions orangecontrib/text/import_documents.py
Original file line number Diff line number Diff line change
Expand Up @@ -29,7 +29,8 @@

import serverfiles

- from Orange.data import DiscreteVariable, Domain, StringVariable
+ from Orange.data import DiscreteVariable, Domain, StringVariable, \
+     guess_data_type
from Orange.data.io import detect_encoding, UrlReader as CoreUrlReader
from Orange.data.util import get_unique_names
from Orange.util import Registry
Expand Down Expand Up @@ -346,12 +347,12 @@ def _add_metadata(self, corpus: Corpus) -> Corpus:
df = df[~df.index.duplicated(keep='first')]
filtered = df.reindex(path_column)
for column in filtered.columns:
+ _, vals, var_type = guess_data_type(filtered[column])
corpus = corpus.add_column(
- StringVariable(get_unique_names(corpus.domain, column)),
- filtered[column].to_numpy(),
+ var_type(get_unique_names(corpus.domain, column)),
+ vals,
to_metas=True
)

return corpus

@staticmethod
Expand Down

0 comments on commit 0833d28

Please sign in to comment.