Skip to content
Snippets Groups Projects
Select Git revision
  • da94c9ce1c200ea42893ec804206a291d8165401
  • master default protected
2 results

parse_fastqc.py

Blame
  • user avatar
    Blaise Li authored
    da94c9ce
    History
    parse_fastqc.py 666 B
    #!/usr/bin/env python3
    
    import sys
    
    def _iter_overrepresented(lines):
        """Yield ``(sequence, percentage)`` pairs from a FastQC data report.

        Only the ``>>Overrepresented sequences`` module is read.  Both values
        are returned as the strings found in the first and third tab-separated
        columns of each row.

        Args:
            lines: Iterable of text lines (for example an open file).

        Yields:
            Tuples ``(sequence, percentage)`` in file order.

        Raises:
            ValueError: If the first line does not start with ``##FastQC``,
                the module is absent, its column header is unexpected, a row
                has fewer than three columns, or ``>>END_MODULE`` is missing.
        """
        lines = iter(lines)
        if not next(lines, "").startswith("##FastQC"):
            raise ValueError("not a FastQC data file (missing '##FastQC' header)")
        # Scanning with for/else stops at end of file; a readline() loop would
        # spin forever there because readline() keeps returning "".
        for line in lines:
            if line.startswith(">>Overrepresented sequences"):
                break
        else:
            raise ValueError("no '>>Overrepresented sequences' module found")
        header = next(lines, "")
        # The module may close immediately, without a column header: there is
        # then nothing to report.
        if header.startswith(">>END_MODULE"):
            return
        if header.strip().split("\t")[0] != "#Sequence":
            raise ValueError(
                "unexpected header in overrepresented sequences module: %r"
                % header)
        for line in lines:
            if line.startswith(">>END_MODULE"):
                return
            fields = line.strip().split("\t")
            # strip() drops a trailing tab when the last column is empty, so
            # only the columns actually used are required.
            if len(fields) < 3:
                raise ValueError(
                    "malformed overrepresented sequence row: %r" % line)
            yield fields[0], fields[2]
        raise ValueError("'>>END_MODULE' not found after overrepresented sequences")


    def main(argv=None):
        """Print the overrepresented sequences of a FastQC report as fasta.

        Each record is written to standard output as
        ``>Over_represented_<rank> (<percentage>)`` followed by the sequence,
        with ranks starting at 1 in file order.

        Args:
            argv: Command-line arguments including the program name; defaults
                to ``sys.argv``.  ``argv[1]`` is the path of the report.

        Returns:
            Exit status: 0 on success, 1 if the report cannot be parsed,
            2 if the path argument is missing.
        """
        argv = sys.argv if argv is None else argv
        if len(argv) < 2:
            prog = argv[0] if argv else "parse_fastqc.py"
            print("usage: %s <fastqc_data.txt>" % prog, file=sys.stderr)
            return 2
        path = argv[1]
        try:
            with open(path, "r") as fqc:
                records = enumerate(_iter_overrepresented(fqc), start=1)
                for order, (seq, percent) in records:
                    print(">Over_represented_%d (%s)\n%s" % (order, percent, seq))
        except ValueError as err:
            print("%s: %s" % (path, err), file=sys.stderr)
            return 1
        return 0


    if __name__ == "__main__":
        sys.exit(main(sys.argv))