mark the example submission rule files as being raw, so the escapes dont get confused

[htsworkflow.git] / encode_submission / encode_find.py
diff --git a/encode_submission/encode_find.py b/encode_submission/encode_find.py

index eebc3bcc481c5597c121f5a461da4199249e6811..7589f5487aef5ef85a6c4ec65072aa3d025ef5bc 100644 (file)
--- a/encode_submission/encode_find.py
+++ b/encode_submission/encode_find.py
@@ -20,21 +20,20 @@ import sys
  import urllib
  import urlparse
  
+if not 'DJANGO_SETTINGS_MODULE' in os.environ:
+    os.environ['DJANGO_SETTINGS_MODULE'] = 'htsworkflow.settings'
+
  from htsworkflow.submission import daf, ucsc
  
  from htsworkflow.util import api
+from htsworkflow.util.rdfns import *
  from htsworkflow.util.rdfhelp import \
-     dafTermOntology, \
-     dublinCoreNS, \
       get_model, \
       get_serializer, \
       sparql_query, \
       submissionOntology, \
       libraryOntology, \
-     load_into_model, \
-     rdfNS, \
-     rdfsNS, \
-     xsdNS
+     load_into_model
  TYPE_N = rdfNS['type']
  CREATION_DATE = libraryOntology['date']
  
@@ -124,7 +123,7 @@ def main(cmdline=None):
              load_encodedcc_files(model, **track_info )
  
      if opts.sparql is not None:
-        sparql_query(model, opts.sparql)
+        sparql_query(model, opts.sparql, 'html')
  
      if opts.find_submission_with_no_library:
          report_submissions_with_no_library(model)
@@ -183,7 +182,7 @@ def make_parser():
  
  
  def load_my_submissions(model, limit=None, cookie=None):
-    """Parse all the submissions from UCSC into model
+    """Parse all of my submissions from encodesubmit into model
      It will look at the global USER_URL to figure out who to scrape
      cookie contains the session cookie, if none, will attempt to login
      """
@@ -535,12 +534,23 @@ def load_encodedcc_files(model, genome, composite):
      if file_index is None:
          return
  
+    lib_term = submissionOntology['library_urn']
+    sub_term = submissionOntology['submission_urn']
      for filename, attributes in file_index.items():
          s = RDF.Node(RDF.Uri(filename))
+        model.add_statement(
+            RDF.Statement(s, TYPE_N, submissionOntology['ucsc_track']))
          for name, value in attributes.items():
              p = RDF.Node(DCC_NS[name])
              o = RDF.Node(value)
              model.add_statement(RDF.Statement(s,p,o))
+            if name.lower() == 'labexpid':
+                model.add_statement(
+                    RDF.Statement(s, lib_term, LIBRARY_NS[value+'/']))
+            elif name.lower() == 'subid':
+                sub_url = RDF.Uri(submission_view_url(value))
+                model.add_statement(
+                    RDF.Statement(s, sub_term, sub_url))
  
  
  def load_library_detail(model, libraryUrn):