Mercurial > repos > bebatut > extract_min_max_lines
view extract_min_max_lines.py @ 0:90fc00b34716 draft default tip
planemo upload for repository https://github.com/asaim/galaxytools/tree/master/tools/extract_min_max_lines commit 718c006213709b631862b8d6d655fafc92e79ef7-dirty
author | bebatut |
---|---|
date | Fri, 15 Apr 2016 07:59:28 -0400 |
parents | |
children |
line wrap: on
line source
#!/usr/bin/env python
# -*- coding: utf-8 -*-
"""Extract the lines of a tab-separated file holding the N smallest or
largest values of a given column."""

import sys
import os
import argparse
import re
import time


def extract_lines(input_content, column_id, extraction_type, extraction_nb):
    """Return the ``extraction_nb`` best lines of ``input_content``.

    Parameters:
        input_content: iterable of text lines; fields are tab-separated and
            a trailing newline, if present, is ignored.
        column_id: 0-based index of the field that is converted with
            ``float`` and used to rank the lines.
        extraction_type: two-argument selector, ``max`` to keep the largest
            values or ``min`` to keep the smallest ones.
        extraction_nb: maximum number of lines to keep.

    Returns:
        A list of at most ``extraction_nb`` lines, each one as its list of
        fields, ordered from best to worst. When values are equal, the line
        seen last is ranked first.

    Raises:
        ValueError: if the ranked field is not a valid float.
        IndexError: if a line has no field at ``column_id``.
    """
    if extraction_nb <= 0:
        return []

    conserved_lines = []
    # Parsed values, kept parallel to conserved_lines so that each field is
    # converted to float only once.
    conserved_values = []

    for line in input_content:
        # Only drop the line terminator: the last line of a file may not
        # have one, so blindly removing the last character would eat data.
        stripped_line = line.rstrip('\n')
        if not stripped_line:
            # Blank lines (e.g. at the end of the file) carry no value.
            continue

        split_line = stripped_line.split('\t')
        value = float(split_line[column_id])

        # The kept lines are always ordered best first. Walk back from the
        # worst one while the new value wins (or ties) to find its rank.
        insert_pos = len(conserved_values)
        while insert_pos > 0:
            compared_value = conserved_values[insert_pos - 1]
            if extraction_type(value, compared_value) != value:
                break
            insert_pos -= 1

        if insert_pos == extraction_nb:
            # The list is full and the new line does not beat the worst one.
            continue

        conserved_lines.insert(insert_pos, split_line)
        conserved_values.insert(insert_pos, value)
        if len(conserved_lines) > extraction_nb:
            # Evict the worst line to stay within the requested size.
            conserved_lines.pop()
            conserved_values.pop()

    return conserved_lines


def extract_min_max_lines(args):
    """Read the input file, keep the best lines and write them out.

    ``args`` must provide ``input_file``, ``output_file``, ``column_id``
    (1-based), ``extraction_type`` (``'min'`` or ``'max'``) and
    ``extraction_nb``.

    Raises:
        ValueError: if ``extraction_type`` is neither ``'min'`` nor
            ``'max'``, or if ``column_id`` is lower than 1.
    """
    selectors = {'max': max, 'min': min}
    if args.extraction_type not in selectors:
        raise ValueError(
            "extraction_type must be 'min' or 'max', got %r"
            % (args.extraction_type,))
    extraction_type = selectors[args.extraction_type]

    # A column id below 1 would become a negative index and silently pick
    # a column counted from the end of the line.
    if args.column_id < 1:
        raise ValueError(
            "column_id is 1-based and must be >= 1, got %r"
            % (args.column_id,))

    # Stream the file: only the kept lines need to stay in memory.
    with open(args.input_file, 'r') as input_file:
        conserved_lines = extract_lines(
            input_file,
            args.column_id - 1,
            extraction_type,
            args.extraction_nb)

    with open(args.output_file, 'w') as output_file:
        for line in conserved_lines:
            output_file.write('\t'.join(line) + "\n")


if __name__ == '__main__':
    parser = argparse.ArgumentParser()
    parser.add_argument('--input_file', required=True,
                        help='tab-separated input file')
    parser.add_argument('--output_file', required=True,
                        help='file receiving the extracted lines')
    parser.add_argument('--column_id', required=True, type=int,
                        help='1-based index of the column to rank on')
    parser.add_argument('--extraction_type', required=True,
                        choices=['min', 'max'],
                        help='keep the smallest or the largest values')
    parser.add_argument('--extraction_nb', required=True, type=int,
                        help='number of lines to extract')
    args = parser.parse_args()

    extract_min_max_lines(args)