aboutsummaryrefslogtreecommitdiff
path: root/ncbi
diff options
context:
space:
mode:
author: Jonathan DeMasi <jonathan.demasi@colorado.edu> 2019-06-17 19:09:18 -0600
committer: Jonathan DeMasi <jonathan.demasi@colorado.edu> 2019-06-17 19:09:18 -0600
commit: 0cae42c6a6fccfdb591f2a1855c82776a669d4a8 (patch)
tree: b0f9757524adbc467c37ad1eead49a0c16f8c640 /ncbi
parent: 6c3881da5854550adce6911d960cd62ebe356b50 (diff)
downloadsnippets-0cae42c6a6fccfdb591f2a1855c82776a669d4a8.tar
snippets-0cae42c6a6fccfdb591f2a1855c82776a669d4a8.tar.gz
snippets-0cae42c6a6fccfdb591f2a1855c82776a669d4a8.tar.bz2
snippets-0cae42c6a6fccfdb591f2a1855c82776a669d4a8.tar.lz
snippets-0cae42c6a6fccfdb591f2a1855c82776a669d4a8.tar.xz
snippets-0cae42c6a6fccfdb591f2a1855c82776a669d4a8.tar.zst
snippets-0cae42c6a6fccfdb591f2a1855c82776a669d4a8.zip
fetching results
Diffstat (limited to 'ncbi')
-rwxr-xr-x [-rw-r--r--] ncbi/dbsnp/dbsnp.py 37
1 files changed, 37 insertions, 0 deletions
diff --git a/ncbi/dbsnp/dbsnp.py b/ncbi/dbsnp/dbsnp.py
index e5a0d9b..fbad492 100644..100755
--- a/ncbi/dbsnp/dbsnp.py
+++ b/ncbi/dbsnp/dbsnp.py
@@ -1 +1,38 @@
#!/usr/bin/env python3
+
+import sys
+import time
+from Bio import Entrez
+
+
+# Contact email configured on the Bio.Entrez module for this script.
+Entrez.email = "jonathan.demasi@colorado.edu"
+# No API key is set yet (None).
+# TODO: apply for an API key so we get more queries/sec.
+Entrez.api_key = None
+
+def _esearch_page(term, retstart, retmax):
+    """Run one esearch request against the "snp" database and parse it.
+
+    Args:
+        term: Entrez search string.
+        retstart: Zero-based offset of the first result to return.
+        retmax: Maximum number of IDs to return in this request.
+
+    Returns:
+        The parsed result of ``Entrez.read`` for this page.
+    """
+    handle = Entrez.esearch(db="snp", term=term, retmax=retmax,
+                            retstart=retstart, usehistory="y")
+    try:
+        return Entrez.read(handle)
+    finally:
+        # Close the handle even when parsing fails.
+        handle.close()
+
+
+def get_complete_rsids(search_string="snp_pubmed_cited[sb]", page_size=100000):
+    """Collect every ID that esearch reports for ``search_string``.
+
+    The first request supplies both the total hit count and the first page
+    of IDs; further pages are requested until ``retstart`` reaches the
+    reported count. Prints the total number of hits once.
+
+    Args:
+        search_string: Entrez search term; defaults to the term this script
+            was written for.
+        page_size: Number of IDs requested per call; defaults to 100000.
+
+    Returns:
+        A list with the ``IdList`` entries of all pages, in request order.
+
+    Raises:
+        ValueError: If ``page_size`` is not positive (the paging loop could
+            never advance).
+    """
+    if page_size <= 0:
+        raise ValueError("page_size must be a positive integer")
+
+    first_page = _esearch_page(search_string, 0, page_size)
+    count = first_page["Count"]
+    print(f"Found a total of {count} results using search string '{search_string}'")
+    total = int(count)
+    rsidlist = list(first_page["IdList"])
+
+    # Compare the offset with the total instead of pre-computing a number of
+    # extra queries: a count that is an exact multiple of page_size then no
+    # longer triggers one trailing, empty request.
+    retstart = page_size
+    while retstart < total:
+        page = _esearch_page(search_string, retstart, page_size)
+        # extend() appends in place rather than copying the list every page.
+        rsidlist.extend(page["IdList"])
+        retstart += page_size
+    return rsidlist
+
+def main():
+    """Script entry point: download the complete ID list.
+
+    The result is not used further yet, so it is not bound to a name.
+    Returns None (the former ``return()`` returned an empty tuple).
+    """
+    get_complete_rsids()
+
+# Run main() only when this file is executed as a script, not when imported.
+if __name__ == '__main__':
+ main()
+