jbrowse: blastxml_to_gapped_gff3.py comparison

comparison blastxml_to_gapped_gff3.py @ 3:7342f467507b draft

Uploaded v0.4 of JBrowse

author	iuc
date	Thu, 31 Dec 2015 13:58:43 -0500
parents	497c6bb3b717
children	ad4b9d7eae6a

comparison

Legend: equal, deleted, inserted, replaced

-:b6a0e126dbee
+:7342f467507b
 from Bio.SeqFeature import SeqFeature, FeatureLocation
 blast_records = NCBIXML.parse(blastxml)
 records = []
 for record in blast_records:
+# http://www.sequenceontology.org/browser/release_2.4/term/SO:0000343
+match_type = {  # Currently we can only handle BLASTN, BLASTP
+'BLASTN': 'nucleotide_match',
+'BLASTP': 'protein_match',
+}.get(record.application, 'match')
 rec = SeqRecord(Seq("ACTG"), id=record.query)
 for hit in record.alignments:
 for hsp in hit.hsps:
 qualifiers = {
 "source": "blast",
 if trim or trim_end:
 if parent_match_end > hsp.query_end:
 parent_match_end = hsp.query_end + 1
-# The ``protein_match`` feature will hold one or more ``match_part``s
+# The ``match`` feature will hold one or more ``match_part``s
 top_feature = SeqFeature(
 FeatureLocation(parent_match_start, parent_match_end),
-type="protein_match", strand=0,
+type=match_type, strand=0,
 qualifiers=qualifiers
 )
 # Unlike the parent feature, ``match_part``s have sources.
 part_qualifiers = {
 part_qualifiers['Gap'] = cigar
 part_qualifiers['ID'] = hit.hit_id
 if trim:
 # If trimming, then we start relative to the
-# protein_match's start
+# match's start
 match_part_start = parent_match_start + start
 else:
 # Otherwise, we have to account for the subject start's location
 match_part_start = parent_match_start + hsp.sbjct_start + start - 1
 type="match_part", strand=0,
 qualifiers=copy.deepcopy(part_qualifiers))
 )
 rec.features.append(top_feature)
+rec.annotations = {}
 records.append(rec)
 return records
 def __remove_query_gaps(query, match, subject):
 parser.add_argument('--trim', action='store_true', help='Trim blast hits to be only as long as the parent feature')
 parser.add_argument('--trim_end', action='store_true', help='Cut blast results off at end of gene')
 args = parser.parse_args()
 result = blastxml2gff3(**vars(args))
 GFF.write(result, sys.stdout)

Mercurial > repos > iuc > jbrowse

comparison blastxml_to_gapped_gff3.py @ 3:7342f467507b draft