docs: fix examples (#182)

biocommons · Jun 26, 2024 · dd9caa7 · dd9caa7
1 parent 3ef65fd
commit dd9caa7
Show file tree

Hide file tree

Showing 2 changed files with 35 additions and 23 deletions.
diff --git a/README.rst b/README.rst
@@ -47,7 +47,8 @@ respectively).
   $ pip install biocommons.eutils
   $ ipython
 
-  >>> from biocmmons.eutils import Client
+  >>> import os
+  >>> from biocommons.eutils import Client
 
   # Initialize a client. This client handles all caching and query
   # throttling.  For example:
@@ -57,7 +58,11 @@ respectively).
   # any valid NCBI query may be used
   >>> esr = ec.esearch(db='gene',term='tumor necrosis factor')
 
-  # fetch one of those (gene id 7157 is human TNF)
+  # esearch returns a list of entity IDs associated with your search. preview some of them:
+  >>> esr.ids[:5]
+  [136114222, 136113226, 136112112, 136111930, 136111620]
+
+  # fetch data for an ID (gene id 7157 is human TNF)
   >>> egs = ec.efetch(db='gene', id=7157)
 
   # One may fetch multiple genes at a time. These are returned as an
@@ -76,16 +81,15 @@ respectively).
    ('NG_017013.2', 'RefSeqGene')]
 
   # Get the first three products defined on GRCh38
-  #>>> [p.acv for p in eg.references[0].products][:3]
-  #['NM_001126112.2', 'NM_001276761.1', 'NM_000546.5']
+  >>> [p.acv for p in eg.references[0].products][:3]
+  ['NM_001126112.2', 'NM_001276761.1', 'NM_000546.5']
 
   # As a sample, grab the first product defined on this reference (order is arbitrary)
-  >>> mrna = eg.references[0].products[0]
+  >>> mrna = [i for i in eg.references[0].products if i.type == "mRNA"][0]
   >>> str(mrna)
   'GeneCommentary(acv=NM_001126112.2,type=mRNA,heading=Reference,label=transcript variant 2)'
 
   # mrna.genomic_coords provides access to the exon definitions on this reference
-
   >>> mrna.genomic_coords.gi, mrna.genomic_coords.strand
   ('568815581', -1)
 
@@ -95,7 +99,7 @@ respectively).
   (7674180, 7674289), (7673700, 7673836), (7673534, 7673607),
   (7670608, 7670714), (7668401, 7669689)]
 
-  # and the mrna has a product, the resulting protein:
+  # and if the mrna has a product, the resulting protein:
   >>> str(mrna.products[0])
   'GeneCommentary(acv=NP_001119584.1,type=peptide,heading=Reference,label=isoform a)'
 

diff --git a/docs/using.rst b/docs/using.rst
@@ -42,10 +42,16 @@ Instantiating an eutils :class:`biocommons.eutils.Client` is this easy::
 
     >>> import biocommons.eutils as eutils
 
-    # Initialize a client. This client handles all caching and query
-    # throttling
+    # Initialize a client. This client handles all caching and query throttling
     >>> ec = eutils.Client()
 
+.. note::
+
+   E-Utilities APIs aren't guaranteed to return data in a consistent order, so it is
+   expected that responses shown in the demonstrations below may not be consistent
+   with your own console sessions. These examples are intended to demonstrate library
+   API functions, not to show exhaustive or consistent results.
+
 
 Fetching gene information
 $$$$$$$$$$$$$$$$$$$$$$$$$
@@ -56,8 +62,12 @@ $$$$$$$$$$$$$$$$$$$$$$$$$
     # any valid NCBI query may be used
     >>> esr = ec.esearch(db='gene',term='tumor necrosis factor')
 
-    # fetch one of those (gene id 7157 is human TNF)
-    >>> egs = ec.efetch(db='gene',id=7157)
+    # esearch returns a list of entity IDs associated with your search. preview some of them:
+    >>> esr.ids[:5]
+    [136114222, 136113226, 136112112, 136111930, 136111620]
+
+    # fetch data for an ID (gene id 7157 is human TNF)
+    >>> egs = ec.efetch(db='gene', id=7157)
 
     # One may fetch multiple genes at a time. These are returned as an
     # EntrezgeneSet. We'll grab the first (and only) child, which returns
@@ -76,20 +86,18 @@ $$$$$$$$$$$$$$$$$$$$$$$$$
 
     # Get all products defined on GRCh38
     >>> [p.acv for p in eg.references[0].products]
-    [u'NM_001126112.2', u'NM_001276761.1', u'NM_000546.5',
-    u'NM_001276760.1', u'NM_001126113.2', u'NM_001276695.1',
-    u'NM_001126114.2', u'NM_001276696.1', u'NM_001126118.1',
-    u'NM_001126115.1', u'NM_001276697.1', u'NM_001126117.1',
-    u'NM_001276699.1', u'NM_001126116.1', u'NM_001276698.1']
+    ['NM_001126112.2', 'NM_001276761.1', 'NM_000546.5',
+    'NM_001276760.1', 'NM_001126113.2', 'NM_001276695.1',
+    'NM_001126114.2', 'NM_001276696.1', 'NM_001126118.1',
+    'NM_001126115.1', 'NM_001276697.1', 'NM_001126117.1',
+    'NM_001276699.1', 'NM_001126116.1', 'NM_001276698.1']
 
     # As a sample, grab the first product defined on this reference (order is arbitrary)
-    >>> mrna = eg.references[0].products[0]
+    >>> mrna = [i for i in eg.references[0].products if i.type == "mRNA"][0]
     >>> str(mrna)
     'GeneCommentary(acv=NM_001126112.2,type=mRNA,heading=Reference,label=transcript variant 2)'
 
-    # mrna.genomic_coords provides access to the exon definitions on this
-    reference
-
+    # mrna.genomic_coords provides access to the exon definitions on this reference
     >>> mrna.genomic_coords.gi, mrna.genomic_coords.strand
     ('568815581', -1)
 
@@ -110,16 +118,16 @@ $$$$$$$$$$$$$$$$$$$$$$$$
 ::
 
    # search pubmed by author
-   >>> esr = c.esearch(db='pubmed', term='Nussbaum RL')
+   >>> esr = ec.esearch(db='pubmed', term='Nussbaum RL')
 
    # fetch all of them
-   >>> paset = c.efetch(db='pubmed', id=esr.ids)
+   >>> paset = ec.efetch(db='pubmed', id=esr.ids)
 
    # paset represents PubmedArticleSet, a collection of
    PubmedArticles. The major interface component is to iterate over
    PubmedArticles with constructs like `for pa in paset: ...`. We
    fetch the first PubmedArticle like this:
-   >>> pa = iter(paset).next()
+   >>> pa = next(iter(paset))
 
    PubmedArticle provides acccessors to essential data:
    >>> pa.title