Yijun-Yang committed on
Commit
b90b0df
1 Parent(s): 087385c

update findarticles

Browse files
huixiangdou/service/findarticles.py CHANGED
@@ -60,7 +60,7 @@ class ArticleRetrieval:
60
  if not os.path.exists(self.repo_dir):
61
  os.makedirs(self.repo_dir)
62
  print(f"Saving articles to {self.repo_dir}.")
63
-
64
  for id in tqdm(self.pmc_ids, desc="Fetching full texts", unit="article"):
65
  base_url = "https://eutils.ncbi.nlm.nih.gov/entrez/eutils/efetch.fcgi"
66
  params = {
@@ -76,13 +76,14 @@ class ArticleRetrieval:
76
  else:
77
  with open(os.path.join(self.repo_dir,f'PMC{id}.txt'), 'w') as f:
78
  f.write(full_text)
 
79
 
80
  def save_config(self):
81
  config = {
82
  'keywords': self.keywords,
83
  'repo_dir': self.repo_dir,
84
  'pmc_ids': self.pmc_ids,
85
- 'len': len(self.pmc_ids),
86
  'retmax': self.retmax
87
  }
88
  with open(os.path.join(self.repo_dir, 'config.json'), 'w') as f:
 
60
  if not os.path.exists(self.repo_dir):
61
  os.makedirs(self.repo_dir)
62
  print(f"Saving articles to {self.repo_dir}.")
63
+ success = 0
64
  for id in tqdm(self.pmc_ids, desc="Fetching full texts", unit="article"):
65
  base_url = "https://eutils.ncbi.nlm.nih.gov/entrez/eutils/efetch.fcgi"
66
  params = {
 
76
  else:
77
  with open(os.path.join(self.repo_dir,f'PMC{id}.txt'), 'w') as f:
78
  f.write(full_text)
79
+ success += 1
80
 
81
  def save_config(self):
82
  config = {
83
  'keywords': self.keywords,
84
  'repo_dir': self.repo_dir,
85
  'pmc_ids': self.pmc_ids,
86
+ 'len': success,
87
  'retmax': self.retmax
88
  }
89
  with open(os.path.join(self.repo_dir, 'config.json'), 'w') as f: