Newer
Older
#
# Ensembl module for Registry
#
# Copyright EMBL/EBI
##
# You may distribute this module under the same terms as perl itself
# POD documentation - main docs before the code
=head1 NAME
Bio::EnsEMBL::Registry
=head1 SYNOPSIS
$gene_adaptor = Bio::EnsEMBL::Registry->get_adaptor("Homo Sapiens","core","Gene"))
=head1 DESCRIPTION
All Adaptors are stored/registered using this module. This module should then
be used to get the adaptors needed.
The registry can be loaded from a configuration file using the method load_all.
If a file is passed to load_all then this is used.
Else if the enviroment variable ENSEMBL_REGISTRY is set then this is used
Else if the file .ensembl_init in your home directory exist it is used.
For the Web server ENSEMBL_REGISTRY should be set in SiteDefs.pm, which will
pass this on to load_all.
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
The four types of registrys are for db adaptors, dba adaptors, dna adaptors
and the standard type.
=head2 db
These are registrys for backwards compatibillity and enable the subroutines
to add other adaptors to connections.
e.g. get_all_db_adaptors, get_db_adaptor, add_db_adaptor, remove_db_adaptor
are the old DBAdaptor subroutines which are now redirected to the Registry.
So if before we had
my $sfa = $self->adaptor()->db()->get_db_adaptor('blast');
We now want to change this to
my $sfa = Bio::EnsEMBL::Registry->get_db($self->adaptor->db,'blast');
OR preferably if the blast adaptor was set up in configure
my $sfa = Bio::EnsEMBL::Registry->get_adaptor("Human","core","blast");
=head2 DBA
These are the stores for the DBAdaptors
The Registry will create all the DBConnections needed now if you set up the
configuration correctly. So instead of the old commands like
my $db = Bio::EnsEMBL::DBSQL::DBAdaptor->new(....)
my $exon_adaptor = $db->get_ExonAdaptor;
we should now have just
my $exon_adaptor = Bio::EnsEMBL::Registry->get_adaptor("Human","core","Exon");
=head2 DNA
This is an internal Registry and allows the configuration of a dnadb.
An example here is to set the est database to get its dna data from the core database.
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
## set the est db to use the core for getting dna data.
#Bio::EnsEMBL::Utils::ConfigRegistry->
# dnadb_add("Homo Sapiens","core","Homo Sapiens","est");
=head2 adaptors
This is the registry for all the general types of adaptors like GeneAdaptor, ExonAdaptor,
Slice Adaptor etc.
These are accessed by the get_adaptor subroutine i.e.
my $exon_adaptor = Bio::EnsEMBL::Registry->get_adaptor("Human","core","Exon");
=head1 CONTACT
Post questions to the Ensembl developer list: <ensembl-dev@ebi.ac.uk>
=head1 METHODS
=cut
package Bio::EnsEMBL::Registry;
use strict;
use Bio::EnsEMBL::DBSQL::MergedAdaptor;
use Bio::EnsEMBL::Utils::Exception qw( deprecate throw warning );
use Bio::EnsEMBL::Utils::Argument qw(rearrange);
use vars qw(%registry_register);
$registry_register{'_WARN'} = 0;
=head2 load_all
Will load the registry with the configuration file which is obtained from
the first in the following and in that order.
1) if an argument is passed to this method this is used as the conf file.
2) If the enviroment variable ENSEMBL_REGISTRY is set this is used.
3) If the file .ensembl_init exist in the home directory it is used
Arg [1] : (optional) string $arg file to load the registry from
Example : Bio::EnsEMBL::Registry->load_all();
Returntype : none
Exceptions : none
=cut
sub load_all{
my $class = shift;
my $web_reg = shift;
#$registry_register{'_WARN'} = 0; # default report overwriting
if(!defined($registry_register{'seen'})){
$registry_register{'seen'}=1;
if(defined($web_reg)){
print STDERR "Loading conf from site defs file ".$web_reg."\n";
if(-e $web_reg){
unless (my $return = do $web_reg ){
throw "Error in Configuration\n $!\n";
}
# other wise it gets done again by the web initialisation stuff
delete $INC{$web_reg};
}
elsif(defined($ENV{ENSEMBL_REGISTRY}) and -e $ENV{ENSEMBL_REGISTRY}){
print STDERR "Loading conf from ".$ENV{ENSEMBL_REGISTRY}."\n";
unless (my $return = do $ENV{ENSEMBL_REGISTRY}){
throw "Error in Configuration\n $!\n";
}
}
elsif(-e $ENV{HOME}."/.ensembl_init"){
do($ENV{HOME}."/.ensembl_init");
}
else{
print STDERR "NO default configuration to load\n";
}
}
else{
print STDERR "Already configured???\n";
}
}
#
# add ons.
#
=head2 add_db
Arg [1] : db to add adaptor to.
Arg [2] : name of the name to add the adaptor to in the registry.
Arg [3] : The adaptor to be added to the registry.
Example : Bio::EnsEMBL::Registry->add_db($db, "lite", $dba);
Returntype : none
Exceptions : none
=cut
sub add_db{
my ($class, $db, $name, $adap) = @_;
if($db->species() ne $adap->species){
$registry_register{$db->species()}{$db->group()}{'_special'}{$name} = $adap;
}
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
}
=head2 remove_db
Arg [1] : db to remove adaptor from.
Arg [2] : name to remove the adaptor from in the registry.
Example : my $db = Bio::EnsEMBL::Registry->remove_db($db, "lite");
Returntype : adaptor
Exceptions : none
=cut
sub remove_db{
my ($class, $db, $name) = @_;
my $ret = $registry_register{$db->species()}{$db->group()}{'_special'}{$name};
$registry_register{$db->species()}{$db->group()}{'_special'}{$name} = undef;
return $ret;
}
=head2 get_db
Arg [1] : db to get adaptor from.
Arg [2] : name to get the adaptor for in the registry.
Example : my $db = Bio::EnsEMBL::Registry->get_db("Human", "core", "lite");
Returntype : adaptor
Exceptions : none
=cut
sub get_db{
my ($class, $db, $name) = @_;
my $ret = Bio::EnsEMBL::Registry->get_DBAdaptor($db->species,$name);
if(defined($ret)){
return $ret;
}
return $registry_register{$db->species()}{$db->group()}{'_special'}{$name};
}
=head2 get_all_db_adaptors
Arg [1] : db to get all the adaptor from.
Example : my $db = Bio::EnsEMBL::Registry->get_all_db_adaptors($db);
Returntype : adaptor
Exceptions : none
=cut
sub get_all_db_adaptors{
my ($class,$db) = @_;
my %ret=();
# we now also want to add all the DBAdaptors for the same species.
# as add_db_adaptor does not add if it is from the same species.
foreach my $dba (@{$registry_register{'_DBA'}}){
if($dba->species() eq $db->species()){
$ret{$dba->group()} = $dba;
}
}
foreach my $key (keys %{$registry_register{$class->get_alias($db->species())}{$db->group()}{'_special'}}){
$ret{$key} = $registry_register{$class->get_alias($db->species())}{$db->group()}{'_special'}{$key};
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
}
return \%ret;
}
#
# DBAdaptors
#
=head2 add_DBAdaptor
Arg [1] : name of the species to add the adaptor to in the registry.
Arg [2] : name of the group to add the adaptor to in the registry.
Arg [3] : The DBAaptor to be added to the registry.
Example : Bio::EnsEMBL::Registry->add_DBAdaptor("Human", "core", $dba);
Returntype : none
Exceptions : none
=cut
sub add_DBAdaptor{
my ($class, $species, $group, $adap) = @_;
$species = $class->get_alias($species);
$registry_register{$species}{$group}{'_DB'} = $adap;
if(!defined($registry_register{'_DBA'})){
my @list =();
push(@list,$adap);
$registry_register{'_DBA'}= \@list;
}
else{
push(@{$registry_register{'_DBA'}},$adap);
}
}
=head2 get_DBAdaptor
Arg [1] : name of the species to get the adaptor for in the registry.
Arg [2] : name of the group to get the adaptor for in the registry.
Example : $dba = Bio::EnsEMBL::Registry->get_DBAdaptor("Human", "core");
Returntype : DBAdaptor
Exceptions : none
=cut
sub get_DBAdaptor{
my ($class, $species, $group) = @_;
$species = $class->get_alias($species);
if(defined($group)){ # group defined so return standard DB Adaptor
return $registry_register{$species}{$group}{'_DB'};
}
else{ #return a merged db adaptor
return new_merged Bio::EnsEMBL::DBSQL::DBAdaptor($species);
}
}
=head2 get_all_DBAdaptors
Example : @dba = @{Bio::EnsEMBL::Registry->get_all_DBAdaptors();
Returntype : list of DBAdaptors
Exceptions : none
=cut
sub get_all_DBAdaptors{
my ($class)=@_;
return @{$registry_register{'_DBA'}};
}
#
# DNA Adaptors
#
=head2 add_DNAAdaptor
Arg [1] : name of the species to add the adaptor to in the registry.
Arg [2] : name of the group to add the adaptor to in the registry.
Arg [3] : The adaptor to be added to the registry as a DNA adaptor.
Example : Bio::EnsEMBL::Registry->add_DNAAdaptor("Human", "core", $dnaAdap);
Returntype : none
Exceptions : none
=cut
sub add_DNAAdaptor{
my ($class, $species, $group, $dnadb_species, $dnadb_group) = @_;
$dnadb_species = $class->get_alias($dnadb_species);
Ian Longden
committed
if($dnadb_group->isa('Bio::EnsEMBL::DBSQL::DBAdaptor')){
Ian Longden
committed
}
else{
$registry_register{$species}{$group}{'_DNA'} = $dnadb_group;
$registry_register{$species}{$group}{'_DNA2'} = $dnadb_species;
Ian Longden
committed
}
}
=head2 get_DNAAdaptor
Arg [1] : name of the species to get the adaptor for in the registry.
Arg [2] : name of the group to get the adaptor for in the registry.
Example : $dnaAdap = Bio::EnsEMBL::Registry->get_DNAAdaptor("Human", "core");
Returntype : adaptor
Exceptions : none
=cut
sub get_DNAAdaptor{
my ($class, $species, $group) = @_;
$species = $class->get_alias($species);
Ian Longden
committed
my $new_group = $registry_register{$species}{$group}{'_DNA'};
my $new_species = $registry_register{$species}{$group}{'_DNA2'};
Ian Longden
committed
if( defined $new_group ) {
return $class->get_DBAdaptor($new_species,$new_group);
Ian Longden
committed
} else {
return undef;
}
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
}
#
# General Adaptors
#
=head2 add_adaptor
Arg [1] : name of the species to add the adaptor to in the registry.
Arg [2] : name of the group to add the adaptor to in the registry.
Arg [3] : name of the type to add the adaptor to in the registry.
Arg [4] : The DBAaptor to be added to the registry.
Arg [5] : (optional) if set okay to overwrite.
Example : Bio::EnsEMBL::Registry->add_adaptor("Human", "core", "Gene", $adap);
Returntype : none
Exceptions : none
=cut
sub add_adaptor{
my ($class,$species,$group,$type,$adap, $reset)= @_;
$species = $class->get_alias($species);
#
# Becouse the adaptors are not stored initially only there class paths when
# the adaptors are obtained we need to store these instead.
# It is not necessarily an error if the registry is overwritten without
# the reset set but it is an indication that we are overwriting a database
# which should be a warning for now
#
if(defined($reset)){ # JUST REST THE HASH VLAUE NO MORE PROCESSING NEEDED
$registry_register{$species}{$group}{$type} = $adap;
return;
}
if(defined($registry_register{$species}{$group}{$type})){
print STDERR ("Overwriting Adaptor in Registry for $species $group $type\n");
$registry_register{$species}{$group}{$type} = $adap;
return;
}
$registry_register{$species}{$group}{$type} = $adap;
if(!defined ($registry_register{$species}{'list'})){
my @list =();
push(@list,$adap);
$registry_register{$species}{'list'}= \@list;
}
else{
push(@{$registry_register{$species}{'list'}},$adap);
}
# print STDERR "REGADD $species \t $group \t $type\t to the registry\n";
if(!defined ($registry_register{$type}{$species})){
my @list =();
push(@list,$adap);
$registry_register{$type}{$species}= \@list;
}
else{
push(@{$registry_register{$type}{$species}},$adap);
}
}
=head2 set_get_via_dnadb_if_set
set the flag so that for this type of adaptor the data is obtained
from the dna source and not centrally i.e. estgenes where the sequence
data is held in the core.
Arg [1] : name of the species to set flag for.
Arg [2] : name of the type to set flag for. (i.e. Sequence)
Example : Bio::EnsEMBL::Registry->set_get_via_dnadb_if_set("Human","Sequence");
Returntype : none
Exceptions : none
=cut
Ian Longden
committed
#sub set_get_via_dnadb_if_set{
# my ($class,$species,$type) = @_;
#
# $registry_register{$class->get_alias($species)}{$type}{'DNADB'} = 1;
#}
=head2 get_adaptor
Arg [1] : name of the species to add the adaptor to in the registry.
Arg [2] : name of the group to add the adaptor to in the registry.
Arg [3] : name of the type to add the adaptor to in the registry.
Example : $adap = Bio::EnsEMBL::Registry->get_adaptor("Human", "core", "Gene");
Returntype : adaptor
Exceptions : none
=cut
sub get_adaptor{
my ($class,$species,$group,$type)= @_;
Ian Longden
committed
$species = $class->get_alias($species);
my %dnadb_adaptors = qw(Sequence 1 AssemblyMapper 1 KaryotypeBand 1 RepeatFeature 1 CoordSystem 1 AssemblyExceptionFeature 1 );
my $dnadb_group = $registry_register{$species}{$group}{_DNA};
if( defined($dnadb_group) && defined($dnadb_adaptors{$type}) ) {
$species = $registry_register{$species}{$group}{'_DNA2'};
Ian Longden
committed
$group = $dnadb_group;
}
my $ret = $registry_register{$species}{$group}{$type};
if(!defined($ret)){
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
}
if(!ref($ret)){ # not instantiated yet
my $dba = $registry_register{$species}{$group}{'_DB'};
my $module = $ret;
eval "require $module";
if($@) {
warning("$module cannot be found.\nException $@\n");
return undef;
}
my $adap = "$module"->new($dba);
Bio::EnsEMBL::Registry->add_adaptor($species, $group, $type, $adap, "reset");
$ret = $adap;
}
return $ret;
}
=head2 get_all_adaptors
Arg [1] : name of the species to get the adaptors for.
Example : @adaps = @{Bio::EnsEMBL::Registry->get_all_adaptors()};
Returntype : list of adaptors
Exceptions : none
=cut
sub get_all_adaptors{
my ($class,$species)= @_;
$species = get_alias($species);
return $registry_register{$species}{'list'};
}
=head2 get_MergedAdaptor
Arg [1] : name of the species to get the adaptors for in the registry.
Arg [2] : name of the type to get the adaptors for in the registry.
Example : $merged = Bio::EnsEMBL::Registry->get_MergedAdaptor("Mouse","Gene");
Returntype : Bio::EnsEMBL::DBSQL::MergedAdaptor
Exceptions : none
=cut
sub get_MergedAdaptor{
my ($class,$species,$type)=@_;
$species = $class->get_alias($species);
my $ret = new Bio::EnsEMBL::DBSQL::MergedAdaptor();
$ret->add_list(@{$registry_register{$type}{$species}});
return $ret;
}
=head2 add_alias
Arg [1] : name of the species to add alias for
Arg [2] : name of the alias
Example : Bio::EnsEMBL::Registry->add_alias("Homo Sapiens","Human");
Description: add alternative name for the species.
Returntype : none
Exceptions : none
=cut
sub add_alias{
my ($class, $species,$key) = @_;
$registry_register{'_ALIAS'}{$key} = $species;
}
=head2 get_alias
Arg [1] : name of the possible alias to get species for
Example : Bio::EnsEMBL::Registry->get_alias("Human");
Description: get proper species name.
Returntype : species name
if(!defined($registry_register{'_ALIAS'}{$key})){
}
return $registry_register{'_ALIAS'}{$key};
}
=head2 alias_exists
Arg [1] : name of the possible alias to get species for
Arg [2] : if set will not throw if not found.
Description: does the species name exist.
Returntype : 1 if exists else 0
Exceptions : none
=cut
sub alias_exists{
my ($class, $key) = @_;
if(defined($registry_register{'_ALIAS'}{$key})){
return 1;
}
return 0;
}
sub set_disconnect_when_inactive{
foreach my $dba ( @{get_all_DBAdaptors()}){
my $dbc = $dba->dbc;
#disconnect if connected
$dbc->disconnect_if_idle() if $dbc->connected();
$dbc->disconnect_when_inactive(1);
}
}
sub disconnect_all {
foreach my $dba ( get_all_DBAdaptors() ){
my $dbc = $dba->dbc;
#disconnect if connected
$dbc->disconnect_if_idle() if $dbc->connected();
}
}
=head2 change_access
Will change the username and password for a set of databases.
if host,user or database names are missing then these are not checked.
So for example if you do not specify a database then ALL databases on
the specified host and port will be changed.
Arg [1] : name of the host to change access on
Arg [2] : port number to change access on
Arg [3] : name of the user to change access on
Arg [4] : name of the database to change access on
Arg [5] : name of the new user
Arg [6] : new password
Example : Bio::EnsEMBL::Registry->get_alias("Human");
Description: change username and password on one or more databases
Returntype : none
Exceptions : none
=cut
sub change_access{
my $self = shift;
my ($host,$port,$user,$dbname,$new_user,$new_pass) = @_;
foreach my $dba ( @{$registry_register{'_DBA'}}){
my $dbc = $dba->dbc;
if((!defined($host) or $host eq $dbc->host) and
(!defined($port) or $port eq $dbc->port) and
(!defined($user) or $user eq $dbc->username) and
(!defined($dbname) or $dbname eq $dbc->dbname)){
if($dbc->connected()){
$dbc->db_handle->disconnect();
$dbc->connected(undef);
}
# over write the username and password
$dbc->username($new_user);
$dbc->password($new_pass);
}
sub get_all_DBAdaptors_by_connection{
my ($self, $dbc_orig) = @_;
my @return;
foreach my $dba ( @{$registry_register{'_DBA'}}){
my $dbc = $dba->dbc;
if($dbc->equals($dbc_orig)){
push @return, $dba;
}
}
return \@return;
}
#
# Web specific routines
#
=head2 load_registry_with_web_adaptors
Will load the registry with all the Adaptors used in the Web server.
Providing Sitedefs and SpeciesDefs can be found on PERL5LIB path.
Example : Bio::EnsEMBL::Registry->load_registry_with_web_adaptors();
Returntype : none
Exceptions : Will die if Sitedefs or SpeciesDefs is not found on the
PERL5LIB path.
=cut
sub load_registry_with_web_adaptors{
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
my $class = shift;
eval{ require SiteDefs };
if ($@){ die "Can't use SiteDefs.pm - $@\n"; }
SiteDefs->import(qw(:ALL));
eval{ require SpeciesDefs };
if ($@){ die "Can't use SpeciesDefs.pm - $@\n"; }
my $conf = new SpeciesDefs();
}
=head2 set_default_track
Sets a flag to say that that this species/group are a default track and do not
need to be added as another web track.
Arg [1] : name of the species to get the adaptors for in the registry.
Arg [2] : name of the type to get the adaptors for in the registry.
Example : $merged = Bio::EnsEMBL::Registry->set_default_track("Human","core");
Returntype : none
Exceptions : none
=cut
sub set_default_track{
my ($class, $species, $group) = @_;
$registry_register{'def_track'}{$species}{$group} = 1;
}
=head2 default_track
Check flag to see if this is a default track
Arg [1] : name of the species to get the adaptors for in the registry.
Arg [2] : name of the type to get the adaptors for in the registry.
Example : $merged = Bio::EnsEMBL::Registry->set_default_track("Human","core");
Returntype : int
Exceptions : none
=cut
sub default_track{
my ($class, $species, $group) = @_;
if(defined($registry_register{'def_track'}{$species}{$group})){
return 1;
}
return 0;
}
=head2 add_new_tracks
Will add new gene tracks to the configuration of the WEB server if they are
not of the type default and the configuration already has genes in the display.
Arg [1] : hash of the default configuration of the web page
Returntype : none
Exceptions : none
Called by : UserConfig.pm
=cut
sub add_new_tracks{
my $start = 0;
my $reg = $class;
my $species_reg = $reg->get_alias($conf->{'species'},"nothrow");
# print STDERR "Species $species_reg check for default tracks\n";
if(defined($species_reg)){
foreach my $dba ($reg->get_all_DBAdaptors()){
if(!$reg->default_track($dba->species,$dba->group)){
$pars{'available'} = "species ".$reg->get_alias($dba->species());
$pars{'db_alias'} = $dba->group();
# print STDERR "Adding new track for ".$dba->species."\t".$dba->group."\n";
$conf->add_new_track_generictranscript('',$dba->group(), "black",$pos,%pars);