Skip to content

Commit 3cbaed6

Browse files
committed
updating taxon_id_scripts with modified versions
1 parent 3e58aa0 commit 3cbaed6

23 files changed

+732
-1670
lines changed

taxon_id_scripts/LCA_table_to_kraken_output_format.pl

Lines changed: 18 additions & 10 deletions
Original file line number | Diff line number | Diff line change
@@ -33,7 +33,7 @@
3333
# perl LCA_table_to_kraken_output_format.pl
3434
# [output of retrieve_top_blast_hits_LCA_for_each_sequence.pl for one blast search]
3535
# [fasta file that was input to blast search (to retrieve sequence lengths and names of unclassified sequences)]
36-
# [output kraken format table]
36+
# > [output kraken format table]
3737

3838

3939
use strict;
@@ -56,14 +56,15 @@
5656
my $LCA_taxon_species_column = 3;
5757
my $LCA_taxon_genus_column = 4;
5858
my $LCA_taxon_family_column = 5;
59-
my $evalue_of_top_hits_column = 6;
60-
my $lowest_pident_of_top_hits_column = 7;
61-
my $mean_pident_of_top_hits_column = 8;
62-
my $highest_pident_of_top_hits_column = 9;
63-
my $lowest_qcovs_of_top_hits_column = 10;
64-
my $mean_qcovs_of_top_hits_column = 11;
65-
my $highest_qcovs_of_top_hits_column = 12;
66-
my $number_top_hits_column = 13;
59+
my $LCA_taxon_superkingdom_column = 6;
60+
my $evalue_of_top_hits_column = 7;
61+
my $lowest_pident_of_top_hits_column = 8;
62+
my $mean_pident_of_top_hits_column = 9;
63+
my $highest_pident_of_top_hits_column = 10;
64+
my $lowest_qcovs_of_top_hits_column = 11;
65+
my $mean_qcovs_of_top_hits_column = 12;
66+
my $highest_qcovs_of_top_hits_column = 13;
67+
my $number_top_hits_column = 14;
6768

6869

6970
# reads in sequence names and lengths from fasta file
@@ -126,7 +127,14 @@
126127
# prints kraken format row for unclassified sequence
127128
# "C"/"U": a one letter code indicating that the sequence was either classified
128129
# or unclassified.
129-
print "C".$DELIMITER;
130+
if($assigned_taxon_id == 0)
131+
{
132+
print "U".$DELIMITER;
133+
}
134+
else
135+
{
136+
print "C".$DELIMITER;
137+
}
130138

131139
# The sequence ID, obtained from the FASTA/FASTQ header.
132140
print $sequence_name.$DELIMITER;

taxon_id_scripts/add_column_with_superkingdom_of_taxon_id.pl

Lines changed: 0 additions & 158 deletions
This file was deleted.

taxon_id_scripts/add_one_value_column.pl

100755 → 100644
File mode changed.

0 commit comments

Comments
 (0)