forked from LangilleLab/microbiome_helper
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathcount_fastq.pl
executable file
·62 lines (52 loc) · 1.31 KB
/
count_fastq.pl
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
#!/usr/bin/perl
use warnings;
use strict;
use File::Basename;
use Getopt::Long;
use Pod::Usage;
use Parallel::ForkManager;
use List::Util 'sum';
# Command-line options:
#   --parallel[=N]  run up to N child processes at once; given without a
#                   value (or with 0) the CPU count reported by Sys::CPU is used
#   --help          show the documentation via pod2usage and exit
my ($parallel, $help);
my $res = GetOptions(
    "parallel:i" => \$parallel,
    "help"       => \$help,
) or pod2usage(2);
pod2usage(-verbose => 2) if $help;

# Maximum number of worker processes handed to Parallel::ForkManager.
# It stays 0 when --parallel is not given at all.
my $cpu_count = 0;

# if the option is set
if (defined $parallel) {
    if ($parallel == 0) {
        # Option is set but with no value: use the max number of processors.
        # Sys::CPU is only needed on this path, so it is loaded at run time;
        # a failed load is reported here instead of surfacing later as an
        # "Undefined subroutine" error.
        eval { require Sys::CPU; 1 }
            or die "--parallel without a value needs the Sys::CPU module: $@";
        $cpu_count = Sys::CPU::cpu_count();
    }
    else {
        $cpu_count = $parallel;
    }
}

my $pm = Parallel::ForkManager->new($cpu_count);
# Every remaining command-line argument is treated as a FASTQ file, either
# plain text or gzip-compressed (recognised by a ".gz" extension).
# For each file one tab-separated line is printed:
#   <file name without its last extension> <number of reads> <mean read length>
# NOTE(review): when files are processed in parallel the output lines appear
# in whatever order the children finish — confirm callers do not rely on order.
my @files = @ARGV;

foreach my $input_file (@files) {
    # start() returns a true value (the child's PID) in the parent, which then
    # moves on to the next file; the code below runs in the worker.
    $pm->start and next;

    # The pattern strips only the last extension, so "x.fastq.gz" gives the
    # name "x.fastq" and the suffix ".gz".
    my ($file, $dir, $suffix) = fileparse($input_file, qr/\.[^.]*/);

    my $IN;
    if ($suffix eq '.gz') {
        # List-form pipe open: the file name reaches gunzip as a single
        # argument and is never interpreted by a shell, so names containing
        # spaces or shell metacharacters are safe.
        open($IN, '-|', 'gunzip', '-c', '--', $input_file)
            or die "can't open pipe to $input_file: $!";
    }
    else {
        open($IN, '<', $input_file) or die "can't read $input_file: $!";
    }

    my $line_no      = 0;
    my $seq_count    = 0;
    my $total_length = 0;
    while (my $line = <$IN>) {
        # Assumes 4-line FASTQ records (no wrapped sequences): the sequence is
        # the 2nd line of each record, i.e. lines 2, 6, 10, ...
        next unless ++$line_no % 4 == 2;

        # Drop the line terminator so it is not counted as a base.
        $line =~ s/\r?\n\z//;

        $seq_count++;
        $total_length += length $line;
    }

    # For a piped handle close() also reports a non-zero gunzip exit status;
    # in that case $! is 0 and the status is in $?.
    unless (close $IN) {
        warn "problem closing $input_file: ",
            ($! ? $! : "gunzip exit status " . ($? >> 8)), "\n";
    }

    # Mean length truncated to an integer; a file without reads reports 0
    # instead of dying on a division by zero.
    my $mean_length = $seq_count ? sprintf('%d', $total_length / $seq_count) : 0;

    print join("\t", $file, $seq_count, $mean_length), "\n";
    $pm->finish;
}

#Wait for all samples to be processed
$pm->wait_all_children;