comparison lrn_risk.py @ 4:8fe04662585c draft

Uploaded
author greg
date Tue, 29 Aug 2023 01:23:22 +0000
parents 5a27ac020c9e
children 5aa8560d9d91
comparison
equal deleted inserted replaced
3:5a27ac020c9e 4:8fe04662585c
80 80
81 81
82 def gene_dist(f, blast, gtdb): 82 def gene_dist(f, blast, gtdb):
83 # get within-species prevalence of genes 83 # get within-species prevalence of genes
84 # for virulence factors (VFs): uses VFDB VFs detected via ABRicate's VFDB db 84 # for virulence factors (VFs): uses VFDB VFs detected via ABRicate's VFDB db
85 # for AMR genes: uses AMR genes detected via ABRicate's ResFinder db 85 # for AMR genes: uses AMR genes detected via ABRicate + PIMA db
86 # for VFs and AMR genes: genes were detected via ABRicate XXX 86 # for VFs and AMR genes: genes were detected via ABRicate XXX
87 # minimum nucleotide identity and coverage values >=80% 87 # minimum nucleotide identity and coverage values >=80%
88 # total of 61,161 genomes queried 88 # total of 61,161 genomes queried
89 # takes VFDB or AMR gene distribution file as input (f) 89 # takes VFDB or AMR gene distribution file as input (f)
90 # BLAST file of VFDB or AMR genes (blast) 90 # BLAST file of VFDB or AMR genes (blast)
130 perc = items[4] 130 perc = items[4]
131 perc = str(round(float(perc), 2)) 131 perc = str(round(float(perc), 2))
132 ann = items[-1] 132 ann = items[-1]
133 freetext = '{0}/{1} ({2}%)'.format(pres, denom, perc) 133 freetext = '{0}/{1} ({2}%)'.format(pres, denom, perc)
134 elif gtdb != '(Unknown Species)': 134 elif gtdb != '(Unknown Species)':
135 ann = annd[key] 135 ann = 'NA'
136 denom = gtdbd[gtdb] 136 denom = gtdbd[gtdb]
137 freetext = "*WARNING" 137 freetext = "*WARNING"
138 warnings.append("*WARNING: This gene has never been detected in this species! Interpret with caution!") 138 warnings.append("*WARNING: This gene has never been detected in this species! Interpret with caution!")
139 else: 139 else:
140 ann = annd[key] 140 ann = 'NA'
141 freetext = "**WARNING" 141 freetext = "**WARNING"
142 warnings.append("**WARNING: This genome belongs to an undescribed species. Interpret with caution!") 142 warnings.append("**WARNING: This genome belongs to an undescribed species. Interpret with caution!")
143 finallines.append('%s\t%s\t%s' % (bv, ann, freetext)) 143 finallines.append('%s\t%s\t%s' % (bv, ann, freetext))
144 return [finallines, warnings] 144 return [finallines, warnings]
145 145