else:
limit = args
+ if opts.reload_libraries:
+ reload_libraries(model, args)
+ return
+
if opts.update:
opts.update_submission = True
opts.update_libraries = True
commands.add_option('--update-libraries', action="store_true",
default=False,
help="download library info from htsw")
+ commands.add_option('--reload-libraries', action="store_true",
+ default=False,
+ help="Delete and redownload library information. "\
+ "Optionally list specific library IDs.")
parser.add_option_group(commands)
queries = OptionGroup(parser, "Queries")
query = RDF.SPARQLQuery(unscanned_libraries)
return query.execute(model)
+def find_all_libraries(model):
+    """Scan model for every subject whose rdf:type marks it as a library.
+
+    Returns the result of executing a SPARQL query against ``model``;
+    each result row binds ``library_urn``.
+    """
+    # NOTE(review): the filter in the original query was truncated
+    # ("FILTER(regex(?libray") and could not parse.  This version matches
+    # any rdf:type whose text ends in "library"; confirm that this is the
+    # intended set of types.
+    libraries = """
+PREFIX rdf:<http://www.w3.org/1999/02/22-rdf-syntax-ns#>
+PREFIX libraryOntology:<{libraryOntology}>
+
+SELECT distinct ?library_urn
+WHERE {{
+  ?library_urn rdf:type ?library_type .
+  FILTER(regex(str(?library_type), "library$", "i"))
+}}""".format(libraryOntology=libraryOntology[''].uri)
+    query = RDF.SPARQLQuery(libraries)
+    return query.execute(model)
+
def add_submission_creation_date(model, subUrn, cookie):
# in theory the submission page might have more information on it.
LOGGER.warn("Unassigned, submitted library: {0}".format(library_urn))
load_library_detail(model, library_urn)
+def reload_libraries(model, library_list):
+    """Delete and re-download library information.
+
+    :param model: RDF model to update in place.
+    :param library_list: library IDs or URLs to reload; when empty,
+        every library returned by find_all_libraries() is reloaded.
+    """
+    if len(library_list) == 0:
+        # reload everything.
+        queryset = find_all_libraries(model)
+        # Keep the query's nodes as-is (delete_library rejects anything
+        # that is not an RDF.Node) and collect them up front, because the
+        # loop below removes statements from the model being queried.
+        libraries = [s['library_urn'] for s in queryset]
+    else:
+        libraries = [user_library_id_to_library_urn(l) for l in library_list]
+
+    for library_urn in libraries:
+        if not isinstance(library_urn, RDF.Node):
+            # A full URL supplied by the user may arrive as a plain string.
+            library_urn = RDF.Node(RDF.Uri(str(library_urn)))
+        delete_library(model, library_urn)
+        load_library_detail(model, library_urn)
+
+def user_library_id_to_library_urn(library_id):
+    """Convert a user-supplied library identifier into a library URN node.
+
+    An identifier without a URL scheme is looked up in LIBRARY_NS; one
+    that already has a scheme is used as the URN unchanged.  Either way
+    the result is an RDF.Node, which is what delete_library() requires.
+    """
+    split_url = urlparse.urlsplit(library_id)
+    if not split_url.scheme:
+        library_urn = LIBRARY_NS[library_id]
+    else:
+        library_urn = library_id
+
+    if not isinstance(library_urn, RDF.Node):
+        library_urn = RDF.Node(RDF.Uri(str(library_urn)))
+    return library_urn
+
+def delete_library(model, library_urn):
+    """Remove a library and everything hanging off its lanes from model.
+
+    Each object of a ``has_lane`` statement is passed to delete_lane(),
+    then every statement whose subject is ``library_urn`` is deleted.
+
+    :raises ValueError: if ``library_urn`` is not an RDF.Node.
+    """
+    if not isinstance(library_urn, RDF.Node):
+        raise ValueError("library urn must be a RDF.Node")
+
+    LOGGER.info("Deleting {0}".format(str(library_urn.uri)))
+    lane_query = RDF.Statement(library_urn, libraryOntology['has_lane'], None)
+    # Snapshot the matches before deleting: statements are removed from
+    # the model while we walk the results.
+    for lane in list(model.find_statements(lane_query)):
+        delete_lane(model, lane.object)
+    library_attrib_query = RDF.Statement(library_urn, None, None)
+    for library_attrib in list(model.find_statements(library_attrib_query)):
+        LOGGER.debug("Deleting {0}".format(str(library_attrib)))
+        del model[library_attrib]
+
+
+def delete_lane(model, lane_urn):
+    """Remove a lane and its mapping details from model.
+
+    Mapping attributes are removed first via delete_lane_mapping(), then
+    every statement whose subject is ``lane_urn`` is deleted.
+
+    :raises ValueError: if ``lane_urn`` is not an RDF.Node.
+    """
+    if not isinstance(lane_urn, RDF.Node):
+        raise ValueError("lane urn must be a RDF.Node")
+
+    delete_lane_mapping(model, lane_urn)
+    lane_attrib_query = RDF.Statement(lane_urn, None, None)
+    # Snapshot the matches before deleting from the model being searched.
+    for lane_attrib in list(model.find_statements(lane_attrib_query)):
+        LOGGER.debug("Deleting {0}".format(str(lane_attrib)))
+        del model[lane_attrib]
+
+
+def delete_lane_mapping(model, lane_urn):
+    """Remove the attributes of every mapping attached to a lane.
+
+    For each ``has_mappings`` statement on ``lane_urn``, all statements
+    whose subject is the mapping node are deleted.  The ``has_mappings``
+    statement itself is left in place; delete_lane() removes it along
+    with the lane's other attributes.
+
+    :raises ValueError: if ``lane_urn`` is not an RDF.Node.
+    """
+    if not isinstance(lane_urn, RDF.Node):
+        raise ValueError("lane urn must be a RDF.Node")
+
+    lane_mapping_query = RDF.Statement(lane_urn,
+                                       libraryOntology['has_mappings'],
+                                       None)
+    # Snapshot both result sets before deleting from the same model.
+    for lane_mapping in list(model.find_statements(lane_mapping_query)):
+        mapping_attrib_query = RDF.Statement(lane_mapping.object,
+                                             None,
+                                             None)
+        mapping_attribs = list(model.find_statements(mapping_attrib_query))
+        for mapping_attrib in mapping_attribs:
+            LOGGER.debug("Deleting {0}".format(str(mapping_attrib)))
+            del model[mapping_attrib]
+
def load_encodedcc_files(model, genome, composite):
file_index = ucsc.get_encodedcc_file_index(genome, composite)
object_date = fromTypedNode(dates[0].object)
self.assertEqual(object_date, datetime(2011,12,7,15,23,0))
+    def test_delete_simple_lane(self):
+        """Deleting a lane with no mappings empties the model."""
+        model = get_model()
+        parser = RDF.Parser(name='turtle')
+        parser.parse_string_into_model(model, '''@prefix rdf: <http://www.w3.org/1999/02/22-rdf-syntax-ns#> .
+@prefix : <http://www.w3.org/1999/xhtml> .
+@prefix rdfs: <http://www.w3.org/2000/01/rdf-schema#> .
+@prefix xsd: <http://www.w3.org/2001/XMLSchema#> .
+@prefix libns: <http://jumpgate.caltech.edu/wiki/LibraryOntology#> .
+
+<http://jumpgate.caltech.edu/lane/1232>
+ libns:flowcell <http://jumpgate.caltech.edu/flowcell/42JV5AAXX/> ;
+ libns:total_unique_locations 5789938 .
+
+''', 'http://jumpgate.caltech.edu/library/')
+        # Guard against a vacuous pass: the two lane statements must have
+        # loaded before we check that deletion removes them.
+        self.assertEqual(len(model), 2)
+        urn = RDF.Node(RDF.Uri('http://jumpgate.caltech.edu/lane/1232'))
+        encode_find.delete_lane(model, urn)
+        self.assertEqual(len(model), 0)
+
+    def test_delete_lane_with_mapping(self):
+        """Deleting a lane also removes the attributes of its mapping."""
+        model = get_model()
+        parser = RDF.Parser(name='turtle')
+        parser.parse_string_into_model(model, '''@prefix rdf: <http://www.w3.org/1999/02/22-rdf-syntax-ns#> .
+@prefix : <http://www.w3.org/1999/xhtml> .
+@prefix rdfs: <http://www.w3.org/2000/01/rdf-schema#> .
+@prefix xsd: <http://www.w3.org/2001/XMLSchema#> .
+@prefix libns: <http://jumpgate.caltech.edu/wiki/LibraryOntology#> .
+
+<http://jumpgate.caltech.edu/lane/1232>
+ libns:flowcell <http://jumpgate.caltech.edu/flowcell/42JV5AAXX/> ;
+ libns:has_mappings _:bnode110110 ;
+ libns:total_unique_locations 5789938 .
+
+_:bnode110110
+ libns:mapped_to "newcontam_UK.fa"@en ;
+ libns:reads 42473 .
+''', 'http://jumpgate.caltech.edu/library/')
+        # Three lane statements plus two mapping statements.
+        self.assertEqual(len(model), 5)
+        urn = RDF.Node(RDF.Uri('http://jumpgate.caltech.edu/lane/1232'))
+        encode_find.delete_lane(model, urn)
+        self.assertEqual(len(model), 0)
+
+    def test_delete_library(self):
+        """Deleting one library leaves the other library's data intact."""
+        model = get_model()
+        parser = RDF.Parser(name='turtle')
+        parser.parse_string_into_model(model, '''@prefix rdf: <http://www.w3.org/1999/02/22-rdf-syntax-ns#> .
+@prefix : <http://www.w3.org/1999/xhtml> .
+@prefix rdfs: <http://www.w3.org/2000/01/rdf-schema#> .
+@prefix xsd: <http://www.w3.org/2001/XMLSchema#> .
+@prefix libns: <http://jumpgate.caltech.edu/wiki/LibraryOntology#> .
+
+<http://jumpgate.caltech.edu/lane/1232>
+ libns:flowcell <http://jumpgate.caltech.edu/flowcell/42JV5AAXX/> ;
+ libns:has_mappings _:bnode110110 ;
+ libns:total_unique_locations 5789938 .
+
+<http://jumpgate.caltech.edu/library/11011/>
+ libns:affiliation "ENCODE"@en, "ENCODE_Tier1"@en, "Georgi Marinov"@en ;
+ libns:has_lane <http://jumpgate.caltech.edu/lane/1232> ;
+ libns:library_id "11011"@en ;
+ libns:library_type "None"@en ;
+ a "libns:library"@en ;
+ <http://www.w3.org/1999/xhtml/vocab#stylesheet> <http://jumpgate.caltech.edu/static/css/app.css>, <http://jumpgate.caltech.edu/static/css/data-browse-index.css> .
+
+_:bnode110110
+ libns:mapped_to "newcontam_UK.fa"@en ;
+ libns:reads 42473 .
+
+<http://jumpgate.caltech.edu/lane/1903>
+ libns:flowcell <http://jumpgate.caltech.edu/flowcell/62WCKAAXX/> ;
+ libns:has_mappings _:bnode120970 ;
+ libns:total_unique_locations 39172114 .
+
+<http://jumpgate.caltech.edu/library/12097/>
+ libns:has_lane <http://jumpgate.caltech.edu/lane/1903> ;
+ libns:library_id "12097"@en ;
+ libns:library_type "Paired End (non-multiplexed)"@en ;
+ a "libns:library"@en .
+
+_:bnode120970
+ libns:mapped_to "newcontam_UK.fa"@en ;
+ libns:reads 64 .
+''', 'http://jumpgate.caltech.edu/library')
+        urn = RDF.Node(RDF.Uri('http://jumpgate.caltech.edu/library/11011/'))
+        encode_find.delete_library(model, urn)
+
+        # Only the mapping that belongs to library 12097 should survive.
+        q = RDF.Statement(None, encode_find.libraryOntology['reads'], None)
+        stmts = list(model.find_statements(q))
+        self.assertEqual(len(stmts), 1)
+        self.assertEqual(fromTypedNode(stmts[0].object),
+                         64)
+
+        # Likewise only library 12097's own attributes should remain.
+        q = RDF.Statement(None, encode_find.libraryOntology['library_id'], None)
+        stmts = list(model.find_statements(q))
+        self.assertEqual(len(stmts), 1)
+        self.assertEqual(fromTypedNode(stmts[0].object),
+                         '12097')
def suite():
return unittest.makeSuite(TestEncodeFind, "test")