# NOTE(review): this excerpt appears to be in diff form -- lines prefixed with
# '+' look like additions and lines prefixed with '-' look like removals.
# Input and output paths are taken from the first two command-line arguments.
my $in_file = $ARGV[0];
my $out_file = $ARGV[1];
# Threshold used by the filter further down: a line is not written when any
# of its tab-separated fields is numerically >= this value.
+my $max_genes = 100;
+
# Get list of species to check
# NOTE(review): @species_list is declared empty here; the code that fills it
# is not visible in this excerpt.
my @species_list;
# Start the header row with its first two column titles.
print OUTFILE "Description\tID";
# Print species list to output file, one tab-separated column per species.
# The added lines print a copy of each name with an underscore removed.
# s/_// has no /g modifier, so only the FIRST underscore is stripped --
# NOTE(review): confirm whether names can contain more than one underscore.
for my $species (@species_list) {
- print OUTFILE "\t$species";
+ my $species_sub = $species;
+ $species_sub =~ s/_//;
+ print OUTFILE "\t$species_sub";
}
# Terminate the header row.
print OUTFILE "\n";
# Drop any lines (clusters) in which exactly one tab-separated field is
# non-zero, and (with the added lines) any line in which a field is
# numerically >= $max_genes. Note that a line with NO non-zero fields is
# not dropped by the "!= 1" test.
# NOTE(review): $mid_line and $super_id are set outside this excerpt.
my @line_array = split("\t", $mid_line);
# Collects the fields of this line that are numerically non-zero.
my @match_array;
# Flag: stays 1 while no field has reached $max_genes and is cleared to 0
# once one does. Despite the name, a true value means "NOT over the max".
+ my $max_over = 1;
foreach my $elem (@line_array) {
# Numeric comparison: a non-numeric field numifies to 0 in Perl and is
# therefore treated as zero here.
if($elem != 0) {
push(@match_array, $elem);
}
+ if($elem >= $max_genes) {
+ $max_over = 0;
+ }
}
# Array in scalar context: the number of non-zero fields.
my $match_count = @match_array;
# Write the line only when the non-zero count is not exactly one and
# (added condition) no field reached $max_genes. $super_id is written
# into both of the first two columns, followed by the original line.
- if ($match_count != 1) {
+ if ($match_count != 1 && $max_over) {
print OUTFILE "$super_id\t$super_id\t$mid_line\n";
}
}