Hello,

J'aimerais pour chaque gène récuperer le accession number (Acc )et la séquence traduite (translation)
Mon problème est que j'obtiens des lignes vides!!!(correspondant aux lignes non selectionnés

>Acc:20773
MREIVLTQIGQCGNQIGAKFWEVISDEHAINSAGTYHGDSHLQLE
RINVYYNEASGGR
>Acc:H2Q1I7
MSRVHGMHPKETTRQLSLAVKDGLIVETLTVGCKGSKAGIEQEGY WLPGDEIDWETENHDWYCFECHLPGEVLICDLCFRVYHSKCLSDEFRLRDSSSPWQCPVCRSIKKKNTNKQEMGTYLRFIVSRMKERAIDLNKKGK

[CODE]
...
FT gene complement(98074..100357)
FT /gene=ENSPTRG00000002168
FT /locus_tag="TUBB8"
FT /note="tubulin, beta 8 class VIII [Source:HGNC
FT Symbol;Acc:20773]"
FT mRNA join(complement(100232..100357),complement(99852..99960),
FT complement(99663..99773),complement(98074..99162))
FT /gene="ENSPTRG00000002168"
FT /note="transcript_id=ENSPTRT00000003967"
FT CDS join(complement(100232..100288),complement(99852..99960),
FT complement(99663..99773),complement(98105..99162))
FT /gene="ENSPTRG00000002168"
FT /translation="MREIVLTQIGQCGNQIGAKFWEVISDEHAINSAGTYHGDSHLQLE
FT RINVYYNEASGGR"
FT gene 189072..315637
FT /gene=ENSPTRG00000002229
FT /locus_tag="ZMYND11"
FT /note="Uncharacterized protein
FT [Source:UniProtKB/TrEMBL;Acc:H2Q1I7]"
FT mRNA join(189072..189393,235063..235197,271057..271216,
FT 282201..282362,297879..297956,298626..298718,
FT 300469..300556,301102..301157,301939..302016,
FT 303068..303186,307802..308009,308433..308501,
FT 309351..309623,309917..310102,313361..315637)
FT /gene="ENSPTRG00000002229"
FT /note="transcript_id=ENSPTRT00000004081"
FT CDS join(271061..271216,282201..282362,297879..297956,
FT 298626..298718,300469..300556,301102..301157,
FT 301939..302016,303068..303186,307802..308009,
FT 308433..308501,309351..309623,309917..310102,
FT 313361..313483)
FT /gene="ENSPTRG00000002229"
FT /protein_id="ENSPTRP00000003768"
FT /note="transcript_id=ENSPTRT00000004081"
FT /db_xref="RefSeq_mRNA_predicted:XM_001135863.3"
FT /db_xref="Ens_Hs_transcript:ENST00000309776"
FT /db_xref="Uniprot/SPTREMBL:H2Q1I7_PANTR"
FT /db_xref="Uniprot/SPTREMBL:K7CUR4_PANTR"
FT /db_xref="EMBL:AACZ03076941"
FT /db_xref="EMBL:GABD01004750"
FT /db_xref="EMBL:GABF01002657"
FT /db_xref="Ens_Hs_translation:ENSP00000309992"
FT /db_xref="GO:GO:0005515"
FT /db_xref="GO:GO:0005515"
FT /db_xref="Uniprot_gn_trans_name:ZMYND11-201"
FT /db_xref="goslim_goa:GO:0003674"
FT /db_xref="goslim_goa:GO:0005622"
FT /db_xref="protein_id:JAA10128.1"
FT /db_xref="UniParc:UPI000002E25A"
FT /translation="MSRVHGMHPKETTRQLSLAVKDGLIVETLTVGCKGSKAGIEQEGY
FT WLPGDEIDWETENHDWYCFECHLPGEVLICDLCFRVYHSKCLSDEFRLRDSSSPWQCPV
FT CRSIKKKNTNKQEMGTYLRFIVSRMKERAIDLNKKGK"

Code : Sélectionner tout - Visualiser dans une fenêtre à part
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
 
my $seq = 0;
my $sequence;
 
open FILE, "test" or die $!;
 
while (my $line =<FILE>) {
        if ($line =~ /Acc:(.*)\]\"/){
		print ">accession number :$1 \n";
	}
        elsif ($line =~ /^FT                   \/translation=\"(.*)/) {
		$seq = 1;
		my $all=$1;
		print "$all \n";
       }
       elsif ( ($seq) && ($line =~ /FT                   ([A-Z]*)/)){                  
                 print "$1 \n";
      }
}   
close FILE;