-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathscan_strand_gene.pl
67 lines (57 loc) · 1.24 KB
/
scan_strand_gene.pl
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
#!/usr/bin/perl
use strict;
use warnings;
use Tie::File;
use Getopt::Std;
# scan_strand_gene: split a separator-delimited annotation file into
#   * <outfile>                        - header lines plus every record that is
#                                        NOT flagged as lying on both strands
#   * Filter_id_with_+-strand_on.txt   - one id per flagged record, followed by
#                                        a summary line with the flagged count
#
# Options (parsed by Getopt::Std into %para):
#   -i <infile>     input file (required)
#   -o <outfile>    output file (required)
#   -s <separator>  record separator, defaults to "###"
# The remaining single-letter options are accepted for backward compatibility
# but are not used anywhere in this script.
my %para;
getopts('a:i:o:b:c:d:e:f:h:j:k:l:m:n:s:',\%para);
if (!defined $para{i} || !defined $para{o}) {
    my $usage=qq'
Usage:
Contact:honghh\@honghh.com.cn
perl $0 -i <infile> -o <outfile> -s <seperator> :default="###"
';
    print $usage;
    exit;
}
# An empty (or "0") separator falls back to the default; Tie::File cannot
# work with an empty record separator anyway.
$para{s} ||= "###";

my $filtered_ids_file = 'Filter_id_with_+-strand_on.txt';
my $temp_file         = '.Temp.list';    # hidden temp file in the current directory

# Three-argument open with lexical handles: the file names can never be
# interpreted as a mode or a pipe, and every failure is reported with the
# offending path.
open(my $in_fh, '<', $para{i})
    or die "Cannot open input file '$para{i}': $!";
open(my $out_fh, '>', $para{o})
    or die "Cannot open output file '$para{o}': $!";
open(my $ids_fh, '>', $filtered_ids_file)
    or die "Cannot open '$filtered_ids_file': $!";
open(my $temp_fh, '>', $temp_file)
    or die "Cannot open temp file '$temp_file': $!";

# Pass 1: separate header lines from the record body.
# A header line starts with "##" and ends with a digit; everything else is
# copied to the temp file so it can be re-read record by record.
my @header;
while (my $row = <$in_fh>) {
    chomp $row;
    if ($row =~ /^##.*\d+$/) {
        push @header, $row;
    }
    else {
        print {$temp_fh} $row, "\n";
    }
}
close($in_fh);
close($temp_fh) or die "Cannot finish writing '$temp_file': $!";

# Header description goes first in the output file.
print {$out_fh} "$_\n" for @header;

# Pass 2: view the temp file as an array of records delimited by the
# separator. autochomp => 0 keeps the separator at the end of each record, so
# records copied to the output stay delimited.
open(my $records_fh, '<', $temp_file)
    or die "Cannot reopen temp file '$temp_file': $!";
my @file;
tie(@file, 'Tie::File', $records_fh, recsep => $para{s}, autochomp => 0)
    or die "Cannot tie '$temp_file' as a record array: $!";

my $count     = 0;
my $record_no = 0;
for my $line (@file) {
    $record_no++;

    # Work on a copy: $line is an alias into the tied array, and modifying it
    # (as chomp may do) would try to write back to the read-only temp handle.
    my $record = $line;
    chomp $record;

    # NOTE(review): this flags a record as soon as a '+' and a '-' both occur
    # anywhere in it (either order), not only in a strand column. Hyphens or
    # plus signs inside ids/attributes would also trigger it - confirm that
    # the intermediate file cannot contain them.
    if ($record =~ /\+.*-/s || $record =~ /-.*\+/s) {
        # The id is the first ';'-separated piece of the 9th whitespace
        # separated field of the text that follows the first run of newlines.
        # NOTE(review): this presumably relies on each record starting with a
        # line break (left over from the preceding separator line); for a
        # record without one the first line is skipped - verify against the
        # real input.
        my (undef, $body) = split /\n+/, $record, 2;
        my $attributes = defined $body       ? (split /\s+/, $body)[8]     : undef;
        my $gene_id    = defined $attributes ? (split /;/, $attributes)[0] : undef;

        if (!defined $gene_id) {
            # Malformed/short record: keep counting it and keep the output
            # line (as before), but say why the id is empty instead of
            # emitting "uninitialized value" warnings.
            warn "Record $record_no: cannot extract an id (fewer than 9 fields?)\n";
            $gene_id = '';
        }

        $count++;
        print {$ids_fh} $gene_id, "\n";
    }
    else {
        print {$out_fh} $record;
    }
}
print {$ids_fh} "Number of gene on both positive strand and negative strand:",$count,"\n";

# Release the tie before closing the handle it uses.
untie @file;
close($records_fh);
close($out_fh) or die "Cannot finish writing '$para{o}': $!";
close($ids_fh) or die "Cannot finish writing '$filtered_ids_file': $!";

# Remove the temp file without spawning a shell.
if (-e $temp_file) {
    unlink($temp_file) or warn "Cannot remove temp file '$temp_file': $!";
}