forked from Axolotl233/Simple_Script
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Blast.GrepNameFormOut.pl
53 lines (49 loc) · 1.06 KB
/
Blast.GrepNameFormOut.pl
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
#! perl
use warnings;
use strict;
use PerlIO::gzip;
use Cwd;
# Summarise the subjects of a BLAST tabular report by taxon.
#
# Positional arguments (read from @ARGV):
#   1. BLAST tabular output; column 2 of each line is used as the subject id.
#   2. gzip-compressed, tab-separated accession table; column 2 is matched
#      against the BLAST subject ids and column 3 is taken as the taxid.
#   3. '|'-separated names file; only lines containing "scientific name"
#      are considered (field 1 = taxid, field 2 = name).
#   4. Output file name.
#
# Output: one line per matched taxid, tab-separated:
#   taxid, name (with ALL whitespace removed), number of matching table rows.
#
# Side effect: "subject-id<TAB>taxid" pairs are written to
# GrepNameFormBlastOut.tmp in the current working directory.
my $h_dir = getcwd();
print STDERR "perl $0 blast.out(tab split) /data/01/user112/database/nr/prot.accession2taxid.gz /data/01/user112/database/nr/names.dmp out.file.name\n";

# Fail early instead of silently running with undefined file names.
die "Expected 4 arguments, got " . scalar(@ARGV) . "\n" if @ARGV < 4;
my ($blast_file, $acc2taxid_file, $names_file, $out_file) = @ARGV;

# Step 1: collect the set of subject ids seen in the BLAST report.
my %wanted;
open my $blast_fh, '<', $blast_file
    or die "Cannot open BLAST file '$blast_file': $!\n";
while (my $row = <$blast_fh>) {
    # chomp first so a two-column line does not yield a key ending in "\n".
    chomp $row;
    my $subject = (split /\t/, $row)[1];
    next unless defined $subject && length $subject;
    $wanted{$subject} = 1;
}
close $blast_fh;

# Step 2: scan the accession table once, recording the pairs that match a
# BLAST subject and counting rows per taxid as we go (no need to re-read the
# temporary file afterwards).
my $tmp_file = "$h_dir/GrepNameFormBlastOut.tmp";
open my $tax_fh, '<:gzip', $acc2taxid_file
    or die "Cannot open accession table '$acc2taxid_file': $!\n";
open my $tmp_fh, '>', $tmp_file
    or die "Cannot write '$tmp_file': $!\n";
my %hits_for;
while (my $row = <$tax_fh>) {
    chomp $row;
    my (undef, $accession, $taxid) = split /\t/, $row;
    next unless defined $taxid && exists $wanted{$accession};
    print {$tmp_fh} "$accession\t$taxid\n";

    # The original test was written `! $num =~ /\d/`, which Perl parses as
    # `(!$num) =~ /\d/`; the intended check is "taxid contains a digit".
    next unless $taxid =~ /\d/;
    $hits_for{$taxid}++;
}
close $tax_fh;
close $tmp_fh or die "Error closing '$tmp_file': $!\n";

# Step 3: attach the scientific name to every taxid that was counted.
open my $names_fh, '<', $names_file
    or die "Cannot open names file '$names_file': $!\n";
open my $out_fh, '>', $out_file
    or die "Cannot write output file '$out_file': $!\n";
while (my $row = <$names_fh>) {
    chomp $row;
    next unless $row =~ /scientific name/;
    my ($taxid, $name) = split /\|/, $row;
    next unless defined $name;

    # Existing output format: every whitespace character is stripped from
    # both fields, so multi-word names are written without spaces.
    s/\s+//g for $taxid, $name;
    next unless exists $hits_for{$taxid};
    print {$out_fh} join("\t", $taxid, $name, $hits_for{$taxid}), "\n";
}
close $names_fh;
close $out_fh or die "Error closing '$out_file': $!\n";