Skip to content
Snippets Groups Projects
Commit fa07acf1 authored by Julien  GUGLIELMINI's avatar Julien GUGLIELMINI
Browse files

Removed evalue filtering because some self hits might have higher e-values and...

Removed evalue filtering because some self hits might have higher e-values and the other filters seem to be enough.
parent 629bcefa
No related branches found
No related tags found
No related merge requests found
...@@ -7,7 +7,7 @@ trap 'rm -rf "$tmp"' EXIT ...@@ -7,7 +7,7 @@ trap 'rm -rf "$tmp"' EXIT
export LC_ALL=C export LC_ALL=C
SECONDS=0 SECONDS=0
readonly VERSION=0.7 readonly VERSION=0.8
bold=$(tput bold) bold=$(tput bold)
normal=$(tput sgr0) normal=$(tput sgr0)
...@@ -21,8 +21,9 @@ display_usage() { ...@@ -21,8 +21,9 @@ display_usage() {
echo "${bold}MANDATORY PARAMETERS:${normal}" echo "${bold}MANDATORY PARAMETERS:${normal}"
echo " -i <string> fasta file with all proteins of all the compared genetic elements." echo " -i <string> fasta file with all proteins of all the compared genetic elements."
echo " All identifiers must be formatted as:" echo " All identifiers must be formatted as:"
echo " >element_identifier_XXX" echo " >elementId_XXX"
echo " where XXX is a serie of numbers unique for each protein of each element." echo " where elementID is a string unique for each genetic element"
echo " and XXX is a serie of characters unique for each protein of each element."
echo "${bold}OPTIONS:${normal}" echo "${bold}OPTIONS:${normal}"
echo " -p <string> Path to the mmseqs executable." echo " -p <string> Path to the mmseqs executable."
echo " e.g. /usr/local/bin" echo " e.g. /usr/local/bin"
......
...@@ -66,7 +66,7 @@ FILENAME==ARGV[3] { ...@@ -66,7 +66,7 @@ FILENAME==ARGV[3] {
cov1=$3 cov1=$3
cov2=$4 cov2=$4
fid=$5 fid=$5
evalue=$6 # evalue=$6
bits=$7 bits=$7
# Fix for some evalues below awk precision # Fix for some evalues below awk precision
...@@ -77,7 +77,8 @@ FILENAME==ARGV[3] { ...@@ -77,7 +77,8 @@ FILENAME==ARGV[3] {
} }
} }
if(cov1<=COV || cov2<=COV || fid<=ID || evalue>=EVAL){ # if(cov1<=COV || cov2<=COV || fid<=ID || evalue>=EVAL){
if(cov1<=COV || cov2<=COV || fid<=ID){
next next
} }
...@@ -265,6 +266,16 @@ END { ...@@ -265,6 +266,16 @@ END {
lcj=lj_singleton+length(cluster) lcj=lj_singleton+length(cluster)
lci<lcj ? lc=lci : lc=lcj lci<lcj ? lc=lci : lc=lcj
if(mp==0){
print "bad mp for genomes "gi" "gj
}
if(minprot==0){
print "bad minprot for genomes"gi" "gj
}
if(lc==0){
print "bad lc for genomes "gi" "gj
}
if(gi==gj){ if(gi==gj){
lc = length(cluster) lc = length(cluster)
if(!MEM){ if(!MEM){
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment