- 论坛徽章:
- 0
|
- [symphony@archlinux p]$ cat sumab.pl
#!/usr/bin/perl
# sumab.pl - tally the "a" and "b" states of the PredSS lines per record.
#
# Input is read from the files named on the command line, or from STDIN
# when none are given.  A line starting with ">sp" opens a new record and
# is used verbatim as the record name.  On every line, the text following
# "PredSS" and whitespace is appended to the current record.  For each
# record that collected any PredSS text, the script prints the record name
# followed by the number of "a" and "b" characters in that text.
use strict;
use warnings;

# Read all lines from the filehandle $fh and return a hash reference that
# maps each record name (the ">sp..." header line, chomped) to the
# concatenation of its PredSS payloads.  Records without any PredSS line
# do not appear in the result.
sub read_predss {
    my ($fh) = @_;

    my %predss_of;
    my $name;
    while ( my $line = <$fh> ) {
        chomp $line;

        # The header line itself is the record name.  (The forum software
        # had replaced this expression with a placeholder token.)
        $name = $line if $line =~ /^>sp/;

        # A PredSS line seen before any header has no record to belong to;
        # skip it rather than filing it under an undefined key.
        next if !defined $name;

        $predss_of{$name} .= $1 if $line =~ /PredSS\s+(.*)$/;
    }
    return \%predss_of;
}

# Return the list (number of "a", number of "b") found in $predss.
sub count_states {
    my ($predss) = @_;

    # tr/// with an empty replacement list counts without modifying.
    my $count_a = ( $predss =~ tr/a// );
    my $count_b = ( $predss =~ tr/b// );
    return ( $count_a, $count_b );
}

# Entry point: process ARGV/STDIN and print one three-line report per record.
sub main {
    my $predss_of = read_predss( \*ARGV );

    # Hash order is unspecified, so records may be reported in any order.
    for my $name ( keys %{$predss_of} ) {
        my ( $count_a, $count_b ) = count_states( $predss_of->{$name} );
        print $name, "\nhas a:", $count_a, "\nhas b:", $count_b, "\n";
    }
    return;
}

# Run only when executed as a script, not when loaded by a test.
main() unless caller;
复制代码
- [symphony@archlinux p]$ cat data
- >sp|P35354|PGH2_HUMAN Prostaglandin G/H synthase 2 OS=Homo sapiens GN=PTGS2 PE=
- Length=604
- 10 20 30 40 50
- PredSS aaaaaaaaaaaa bbbbbb bbbbb
- AA seq MLARALLLCAVLALSHTANPCCSHPCQNRGVCMSVGFDQYKCDCTRTGFY
- ProbA
- ProbB
- 60 70 80 90 100
- PredSS aaaaaaaaaa bbbbbb aaaa aaaaaaaaa
- AA seq GENCSTPEFLTRIKLFLKPTPNTVHYILTHFKGFWNVVNNIPFLRNAIMS
- ProbA
- ProbB
- 110 120 130 140 150
- PredSS aaaaa aaaaaaa
- AA seq YVLTSRSHLIDSPPTYNADYGYKSWEAFSNLSYYTRALPPVPDDCPTPLG
- ProbA
- ProbB
- >sp|Q02127|PYRD_HUMAN Dihydroorotate dehydrogenase, mitochondrial OS=Homo sapie
- Length=395
- 10 20 30 40 50
- PredSS aaaaaaa bbbbb aaaaaaaaaaa aaaaaaaaaaaa
- AA seq MAWRHLKKRAQDAVIILGGGGLLFASYLMATGDERFYAEHLMPTLQGLLD
- ProbA
- ProbB
- 60 70 80 90 100
- PredSS aaaaaaaaaaaaaa bbbbbb bbbbbbb
- AA seq PESAHRLAVRFTSLGLLPRARFQDSDMLEVRVLGHKFRNPVGIAAGFDKH
- ProbA
- ProbB
- 110 120 130 140 150
- PredSS aaaaaaaaaa bbbbb bbbbbaaa bbbb
- AA seq GEAVDGLYKMGFGFVEIGSVTPKPQEGNPRPRVFRLPEDQAVINRYGFNS
- ProbA
- ProbB
复制代码
- [symphony@archlinux p]$ ./sumab.pl data
- >sp|Q02127|PYRD_HUMAN Dihydroorotate dehydrogenase, mitochondrial OS=Homo sapie
- has a:57
- has b:32
- >sp|P35354|PGH2_HUMAN Prostaglandin G/H synthase 2 OS=Homo sapiens GN=PTGS2 PE=
- has a:47
- has b:17
复制代码 |
|