# HG changeset patch # User brinkmanlab # Date 1592326027 14400 # Node ID f2656e644641f548c87dcf4051d6df80be74e386 # Parent a2258ce2d58c3cf6478c488b25ad0e03acf9b813 "planemo upload for repository https://github.com/brinkmanlab/galaxy-tools/tree/master/make_unique_id commit e3bef6bd24b0d0bf5645a5d1083c1fa886c19e4a" diff -r a2258ce2d58c -r f2656e644641 make_unique_id.py --- a/make_unique_id.py Mon Jun 15 19:32:32 2020 -0400 +++ b/make_unique_id.py Tue Jun 16 12:47:07 2020 -0400 @@ -29,22 +29,15 @@ ids = defaultdict(int) def makeUnique(seq): - seqlenlen = len(str(len(seq))) - newid = seq.id[:26 - seqlenlen] # Genbank has a max length for the id and sequence length number, truncate the sequence id if too long - count = ids[newid] - ids[newid] += 1 + count = ids[seq.id] + ids[seq.id] += 1 if count: + oldid = seq.id suffix = "_" + str(count) - if len(newid) + len(suffix) + 1 + seqlenlen > 26: - newid = newid[:25 - seqlenlen - len(suffix)] - - newid += suffix + seq.id += suffix seq.name += suffix + print(f"{oldid}\t{seq.id}") - if seq.id != newid: - print(f"{seq.id}\t{newid}") - - seq.id = newid return seq diff -r a2258ce2d58c -r f2656e644641 make_unique_id.xml --- a/make_unique_id.xml Mon Jun 15 19:32:32 2020 -0400 +++ b/make_unique_id.xml Tue Jun 16 12:47:07 2020 -0400 @@ -10,7 +10,7 @@ python - biopython + biopython