Skip to content

Commit

Permalink
Merge pull request #1 from mpacer/subjectsDB
Browse files (browse the repository at this point in the history)
introduce iter_samples utility & utils.py, use ternaries to simplify makedb
  • Loading branch information
sbassi authored Mar 3, 2018
2 parents 14fd36c + 742b9ba commit 47244b1
Showing 1 changed file with 4 additions and 11 deletions.
15 changes: 4 additions & 11 deletions allofplos/makedb.py
Original file line number Diff line number Diff line change
Expand Up @@ -118,18 +118,11 @@ class CoAuthorPLOSArticle(BaseModel):
SubjectsPLOSArticle, Subjects])


if args.starter:
corpus = Corpus(starterdir)
allfiles = corpus.iter_files
else:
corpus = Corpus()
allfiles = corpus.iter_files

if args.random:
corpus = Corpus()
allfiles = random.sample(list(corpus.iter_files), args.random)
corpus_dir = starterdir if args.starter else None
allfiles = Corpus(corpus_dir).files
files = random.sample(allfiles, args.random) if args.random else allfiles

for file_ in tqdm(allfiles):
for file_ in tqdm(files):
doi = filename_to_doi(file_)
article = Article(doi)
journal_name = journal_title_dict[article.journal.upper()]
Expand Down

0 comments on commit 47244b1

Please sign in to comment.