From 252da6c6b4502420e6dcfe843dc33b9d2b01f42b Mon Sep 17 00:00:00 2001 From: Abel Ureta-Vidal <abel@sanger.ac.uk> Date: Tue, 12 Feb 2002 12:13:29 +0000 Subject: [PATCH] Adding database source and accession number in gene description field --- scripts/gene-descriptions.pl | 12 ++++++------ 1 file changed, 6 insertions(+), 6 deletions(-) diff --git a/scripts/gene-descriptions.pl b/scripts/gene-descriptions.pl index 2caf8057a3..3e1fed1bd8 100755 --- a/scripts/gene-descriptions.pl +++ b/scripts/gene-descriptions.pl @@ -40,7 +40,7 @@ undef %gene_desc; LINE: while (<MAP>) { chomp; - ($ensp, $ensg, $db, $acc)=split(/\t/); + my ($ensp, $ensg, $db, $acc)=split(/\t/); if ( defined($gene_desc{$ensg}) ) { ($prevdb, $prev_desc) = @{$gene_desc{$ensg}}; @@ -49,7 +49,7 @@ while (<MAP>) { } if ($db eq 'SWISS-PROT') { $desc = $sp_desc{"$db:$acc"}; - $gene_desc{$ensg} = [ $db, $desc]; # kick out the SPTREMBL desc. + $gene_desc{$ensg} = [ $db, $desc, $acc ]; # kick out the SPTREMBL desc. next LINE; } @@ -58,7 +58,7 @@ while (<MAP>) { if ( &compare_desc($prev_desc, $desc) < 0 ) { # new desc is better # warn "new better: $desc (old was: $prev_desc)\n"; - $gene_desc{$ensg} = [ $db, $desc]; + $gene_desc{$ensg} = [ $db, $desc, $acc ]; next LINE; } else { # warn "old better: $prev_desc (new is: $desc)\n"; @@ -68,13 +68,13 @@ while (<MAP>) { } } else { $desc = $sp_desc{"$db:$acc"}; - $gene_desc{$ensg} = [ $db, $desc]; + $gene_desc{$ensg} = [ $db, $desc, $acc ]; } } # while <MAP> # now dump the stuff to stdout. foreach $ensg ( keys %gene_desc ) { - ($db, $desc) = @{$gene_desc{$ensg}}; + my ($db,$desc,$acc) = @{$gene_desc{$ensg}}; ### final cleanup ### get rid of the Rik mess: @@ -86,7 +86,7 @@ foreach $ensg ( keys %gene_desc ) { s/^\s*\(\s*\)\s*$//g; ### add more as appropriate - print STDOUT "$ensg\t$_\n" if $_; # =~ /[a-z]/;??? + print STDOUT "$ensg\t $_ [Source:$db;Acc:$acc]\n" if $_; # =~ /[a-z]/;??? } #### following taken from ensembl-external/scripts/family-input.pl -- GitLab