- 论坛徽章:
- 0
|
use strict;
use warnings;

# Reads the FASTA-like text that follows __DATA__ and, for every NM_
# identifier, prints only the record(s) whose "len:" value is the largest
# seen for that identifier.  Records are printed in input order, joined by
# newlines, with no trailing newline.

# select_longest_records($text)
#
# Scans $text for two-line records (a header line containing "Gene",
# followed by one more line) and keeps the ones with the maximum "len:"
# value among the records that share the same NM_<digits> identifier.
#
# Parameters:
#   $text - the whole input as a single string; undef or '' yields no records.
#
# Returns:
#   A list of record strings in input order.  Each string starts at "Gene"
#   (any character before it on the header line, such as '>', is not part
#   of the match) and ends at the end of the line after the header.  If
#   several records of one identifier tie for the maximum, all are returned.
sub select_longest_records {
    my ($text) = @_;
    return unless defined $text;

    my @records;        # one [ record text, NM_ identifier, length ] per record
    my %max_len_for;    # NM_ identifier => largest length seen so far

    while ($text =~ /(Gene.+\n.+)/g) {
        my $record = $1;

        # Capture BOTH the identifier and the number after "len:"; the length
        # needs its own capture group or nothing can be compared below.
        # '.' does not match "\n", so this only looks at the header line.
        # Headers lacking either field are skipped rather than stored under
        # an undefined key.
        my ($id, $len) = $record =~ /(NM_\d+).+len:(\d+)/
            or next;

        push @records, [ $record, $id, $len ];

        $max_len_for{$id} = $len
            if !defined $max_len_for{$id} || $max_len_for{$id} < $len;
    }

    # Second pass: keep the records whose length equals their group's maximum.
    return map  { $_->[0] }
           grep { $max_len_for{ $_->[1] } == $_->[2] } @records;
}

# Slurp the DATA section; localizing $/ keeps the slurp mode from leaking
# into any other read in the program.
my $content = do { local $/; <DATA> };

print join "\n", select_longest_records($content);
__DATA__
>Gene.1::NM_198493::g.1::m.1 type:5prime_partial len:287 gc:universal NM_198493:2-862(+)
LRRCYGNRGGRGPGVVFLELMESEGPPESESSEFFSQQEEENEEEEAQEPEETGPKNPLLQPALTGDVEGLQKIFEDPEN
>Gene.2::NM_198493::g.2::m.2 type:complete len:153 gc:universal NM_198493:1865-2323(+)
MYEQFSFNFLKQKNTAITFSHLFGRPSGCLWSSTKKTCVCSFFFFTLL
>Gene.3::NM_198493::g.4::m.4 type:complete len:118 gc:universal NM_198493:1954-2307(+)
MEQYKEDLCLLLFFFYPPSPFSLFPSLPLLLPLPSSPFPSLPLPSPPFLSLPLPSPPFLSPPLPSSPLPSPSSSLSSSSSLSNSFFFLSYLSLSLHPRNLLDRVCLSCPGWNAVE
>Gene.4::NM_173852::g.6::m.6 type:complete len:163 gc:universal NM_173852:27-515(+)
MRIANRTRFSSPFLARGAGWTHGRGMMVVGTGTSLALSSLLSLLLFAGMQMYSRQLASTEWLTIQGGLLGSGLFVFSLTAFNNLENLVFGKGFQAKIFPEILLCLA
>Gene.9::NM_013945::g.9::m.9 type:complete len:519 gc:universal NM_013945:599-2155(+)
MAALPGTVPRMMRPAPGQNYPRTGFPLEVSTPLGQGRVNQLGGVFINGRP
>Gene.13::NM_013945::g.13::m.13 type:complete len:102 gc:universal NM_013945:1821-2126(+)
MAAWTRPPPSQPAAASGPTPSSQETACPPPRPTAHPPTAPPATAWTPWPAISTASTARVSAWCPGRPPSPFLLPPPGPPACLWRATRWCQGGECPFHRWKN |
|