# Version banner. This is Python 2 print-statement syntax (no parentheses).
6 print "combineRPKMs: version 1.1"
16 from commoncode import getConfigParser, getConfigBoolOption
# Command-line driver fragment: builds the option parser, parses the arguments
# and hands the file names to combineRPKMs().
# NOTE(review): this listing is excerpted. The enclosing definition and the
# assignments of firstfile, finalfile and outfile are not visible here.
23 usage = "usage: python %prog firstRPKM expandedRPKM finalRPKM combinedOutfile [--withmultifraction]"
24 parser = makeParser(usage)
# Only argv[1:] is parsed, i.e. the first element of argv is skipped.
25 (options, args) = parser.parse_args(argv[1:])
# Second positional argument; per the usage string this is the expandedRPKM file.
32 expandedfile = args[1]
# options.doFraction is set by --withmultifraction or by the parser default.
36 combineRPKMs(firstfile, expandedfile, finalfile, outfile, options.doFraction)
# Build the optparse.OptionParser used by this script.
#   usage: usage string passed straight through to optparse.OptionParser.
# NOTE(review): the return statement is not visible in this excerpt. The caller
# calls parse_args() on the result, so it presumably returns `parser` -- confirm.
39 def makeParser(usage=""):
40 parser = optparse.OptionParser(usage=usage)
# Flag option: when given on the command line it stores True in options.doFraction.
41 parser.add_option("--withmultifraction", action="store_true", dest="doFraction")
# Look up the default for doFraction under the "combineRPKMs" section of the
# object returned by getConfigParser(). False is passed as the last argument,
# presumably the fallback when the option is not configured -- verify against
# commoncode.getConfigBoolOption.
43 configParser = getConfigParser()
44 section = "combineRPKMs"
45 doFraction = getConfigBoolOption(configParser, section, "doFraction", False)
# Install the looked-up value as the default used when the flag is absent.
47 parser.set_defaults(doFraction=doFraction)
# Combine values from the first, expanded and final RPKM files into a single
# tab-separated output file.
#   firstfileName, expandedfileName: files loaded through getRPKMDict().
#   finalfileName: file read line by line to drive the output rows.
#   outfileName: path opened for writing ("w").
#   doFraction: defaults to False. NOTE(review): the code that consults it is
#     not visible in this excerpt; presumably it selects the header with the
#     extra "fractionMulti" column and the append of `fraction` -- confirm.
# NOTE(review): no close() calls for outfile or finalfile are visible in this
# excerpt -- check whether the handles are closed in the omitted lines.
52 def combineRPKMs(firstfileName, expandedfileName, finalfileName, outfileName, doFraction=False):
# Single-value return form of getRPKMDict (getGIDDict left at its default).
54 firstDict = getRPKMDict(firstfileName)
# With getGIDDict=True the helper's result is unpacked as (gidDict, expandedDict).
55 gidDict, expandedDict = getRPKMDict(expandedfileName, getGIDDict=True)
# Two alternative header lines: the first carries a trailing fractionMulti
# column, the second does not. The branch choosing between them is not shown.
58 header = "gid\tRNAkb\tgene\tfirstRPKM\texpandedRPKM\tfinalRPKM\tfractionMulti\n"
60 header = "gid\tRNAkb\tgene\tfirstRPKM\texpandedRPKM\tfinalRPKM\n"
62 outfile = open(outfileName, "w")
65 finalfile = open(finalfileName)
66 for line in finalfile:
# split() with no argument splits on any run of whitespace.
67 fields = line.strip().split()
# Genes missing from the first file get an empty string in the firstRPKM column.
71 firstRPKM = firstDict.get(gene, "")
# gidDict[gene] and expandedDict[gene] use plain indexing, so a gene that is
# absent from the expanded file raises KeyError here.
72 outputFields = [gidDict[gene], rnakb, gene, firstRPKM, expandedDict[gene], finalRPKM]
76 outputFields.append(fraction)
# string.join is the Python 2 string-module function; fields are tab-joined
# and terminated with a newline.
78 outline = "%s\n" % string.join(outputFields, "\t")
79 outfile.write(outline)
# Load an RPKM file into dictionaries keyed by the second whitespace-separated
# field of each line.
#   rpkmFileName: path of the file to read.
#   getGIDDict: defaults to False; combineRPKMs passes True when it also needs
#     the first-column mapping.
# NOTE(review): the loop header, the dictionary initialisation and any close()
# of rpkmFile are not visible in this excerpt.
85 def getRPKMDict(rpkmFileName, getGIDDict=False):
88 rpkmFile = open(rpkmFileName)
90 fields = line.strip().split()
# Key: second field. Value: last field on the line, kept as a string.
91 rpkmDict[fields[1]] = fields[-1]
# Same key mapped to the first field (bound to the name gidDict).
93 gidDict[fields[1]] = fields[0]
# Two-element return (gidDict, rpkmDict). NOTE(review): one caller binds the
# result to a single name, so there is presumably another return path for
# getGIDDict=False in the omitted lines -- confirm.
98 return gidDict, rpkmDict
103 if __name__ == "__main__":