dhimmel · dhimmel · Sep 27, 2020 · Sep 25, 2020 · Sep 26, 2020 · Sep 26, 2020
diff --git a/obonet/read.py b/obonet/read.py
@@ -6,7 +6,7 @@
 from .io import open_read_file
 
 
-def read_obo(path_or_file):
+def read_obo(path_or_file, ignore_obsolete=True):
     """
     Return a networkx.MultiDiGraph of the ontology serialized by the
     specified path or file.
@@ -19,6 +19,9 @@ def read_obo(path_or_file):
     path_or_file : str or file
         Path, URL, or open file object. If path or URL, compression is
         inferred from the file extension.
+    ignore_obsolete : bool
+        If True (default), terms tagged 'is_obsolete: true' are
+        skipped and not added to the graph.
     """
     obo_file = open_read_file(path_or_file)
     typedefs, terms, instances, header = get_sections(obo_file)
@@ -32,7 +35,7 @@ def read_obo(path_or_file):
     edge_tuples = list()
 
     for term in terms:
-        is_obsolete = term.get('is_obsolete', 'false') == 'true'
+        is_obsolete = ignore_obsolete and term.get('is_obsolete', 'false') == 'true'
         if is_obsolete:
             continue
         term_id = term.pop('id')

diff --git a/tests/test_obo_reading.py b/tests/test_obo_reading.py
@@ -17,8 +17,9 @@ def test_read_taxrank_file():
     with open(path, 'rt') as read_file:
         taxrank = obonet.read_obo(read_file)
     assert len(taxrank) == 61
-    assert taxrank.node['TAXRANK:0000001']['name'] == 'phylum'
-    assert 'NCBITaxon:kingdom' in taxrank.node['TAXRANK:0000017']['xref']
+    # networkx 2.4 removed the deprecated `Graph.node` attribute; use `Graph.nodes` instead -- EST 2020-09-25
+    assert taxrank.nodes['TAXRANK:0000001']['name'] == 'phylum'
+    assert 'NCBITaxon:kingdom' in taxrank.nodes['TAXRANK:0000017']['xref']
 
 
 @pytest.mark.parametrize('extension', ['', '.gz', '.bz2', '.xz'])
@@ -118,3 +119,15 @@ def test_parse_tag_line_backslashed_exclamation():
     tag, value, trailing_modifier, comment = parse_tag_line(line)
     assert tag == 'synonym'
     assert value == r'not a real example \!'
+
+def test_ignore_obsolete_nodes():  # default ignore_obsolete=True must drop obsolete terms
+    hpo = obonet.read_obo("http://purl.obolibrary.org/obo/hp.obo")  # NOTE(review): fetches a live URL, so this test needs network access
+    nodes = hpo.nodes(data=True)
+    assert "HP:0005549" not in nodes  # the sibling test expects this term to carry is_obsolete == 'true'
+
+def test_presence_of_obsolete_nodes():  # ignore_obsolete=False must keep obsolete terms in the graph
+    hpo = obonet.read_obo("http://purl.obolibrary.org/obo/hp.obo", ignore_obsolete=False)  # NOTE(review): fetches a live URL, so this test needs network access
+    nodes = hpo.nodes(data=True)
+    assert "HP:0005549" in nodes  # term is retained because obsolete filtering is disabled
+    node = nodes['HP:0005549']
+    assert node['is_obsolete'] == 'true'  # compared against the string 'true', not a bool