Show
Ignore:
Timestamp:
05/15/10 21:10:07 (2 years ago)
Author:
AlexanderPico
Message:

further adapted to work with plato, plus mods to handling of GO when go_adaptor is undefined

Files:
1 modified

Legend:

Unmodified
Added
Removed
  • trunk/dbbuilder/src/org/bridgedb/extract/Ensembl_ETL_Device_v18_local.pl

    r352 r353  
    4141use HashSpeciesList; 
    4242use lib '/home/socr/c/users2/apico/src/ensembl/modules'; 
    43 use lib '/home/socr/c/users2/apico/src/ensembl-compara/modules'; 
    44 use lib '/home/socr/c/users2/apico/src/ensembl-variation/modules'; 
     43#use lib '/home/socr/c/users2/apico/src/ensembl-compara/modules'; 
     44#use lib '/home/socr/c/users2/apico/src/ensembl-variation/modules'; 
    4545use lib '/home/socr/c/users2/apico/src/ensembl-functgenomics/modules'; 
    4646use lib '/home/socr/c/users2/apico/bioperl-live';  
    4747use Bio::EnsEMBL::Registry; 
    4848use Bio::EnsEMBL::DBSQL::DBConnection; 
    49 use Bio::EnsEMBL::Compara::DBSQL::DBAdaptor; 
     49#use Bio::EnsEMBL::Compara::DBSQL::DBAdaptor; 
    5050use Bio::EnsEMBL::DBSQL::GOTermAdaptor; 
    5151use Bio::EnsEMBL::OntologyTerm; 
     
    390390 
    391391$registry->load_registry_from_db( 
    392         -host => 'localhost', 
     392        -host => 'mysql-dev.cgl.ucsf.edu', 
     393        -port => '13308', 
    393394        -user => 'genmapp', 
    394395        -pass => 'fun4genmapp', 
     
    421422my $dbname = $dbas[0]->dbc->dbname();        # e.g., core_mus_musculus_42_36c 
    422423my @split_dbname = split(/_/, $dbname); 
    423 if ($split_dbname[1] == "collection"){       # shift array elements for "collections" 
     424if ($split_dbname[2] == "collection"){       # shift array elements for "collections" 
    424425        splice(@split_dbname,1,1); 
    425426} 
    426 my $build = $split_dbname[3];                # e.g., 42 
    427 my $build_nums = $build.$split_dbname[4];    # e.g., 42_36c 
     427my $build = $split_dbname[4];                # e.g., 42 
     428my $build_nums = $build.$split_dbname[5];    # e.g., 42_36c 
    428429 
    429430############################################################################ 
     
    11741175            my $sqlUser = "genmapp";                    # username 
    11751176            my $sqlPass = "fun4genmapp";                # password 
    1176             my $sqlDBLog = "ensembl_etl_device_log";    # permanent log table 
    1177             my $sqlDB = "current_".$genus_species;      # name of species database, based on user-selected species 
    1178             my $sqlCSDB = "current_CS_".$genus_species; # name of species database, based on user-selected species 
    1179             my $sqlConnection ="dbi:mysql:$sqlDBLog";   # connection statement used in DBI->connect() 
     1177            my $sqlDBLog = "genmapp_ensembl_etl_device_log";    # permanent log table 
     1178            my $sqlHost = "mysql-dev.cgl.ucsf.edu";     # plato host 
     1179            my $sqlPort = "13308";                      # plato port 
     1180            my $sqlDB = "genmapp_current_".$genus_species;      # name of species database, based on user-selected species 
     1181            my $sqlCSDB = "genmapp_current_CS_".$genus_species; # name of species database, based on user-selected species 
     1182            my $sqlConnection ="dbi:mysql:$sqlDBLog:$sqlHost:$sqlPort";   # connection statement used in DBI->connect() 
    11801183 
    11811184            $dbh = DBI->connect($sqlConnection, $sqlUser, $sqlPass) 
     
    14451448        $dateArg = $year.$mon.$mday; 
    14461449} 
    1447 my $current_std = "current_".$genus_species; 
    1448 my $new_std = $twoLetterSpecies."_Std_".$dateArg; 
    1449 my $current_cs = "current_CS_".$genus_species; 
    1450 my $new_cs = $twoLetterSpecies."_CS_".$dateArg; 
     1450my $current_std = "genmapp_current_".$genus_species; 
     1451my $new_std = "genmapp_".$twoLetterSpecies."_Std_".$dateArg; 
     1452my $current_cs = "genmapp_current_CS_".$genus_species; 
     1453my $new_cs = "genmapp_".$twoLetterSpecies."_CS_".$dateArg; 
    14511454my $sqlPass = "fun4genmapp"; 
    14521455my $bkupDir = "/home/socr/c/users2/apico/EnsemblAPI/DB_Copies/"; 
    1453 my $mysqldump_cmd = "mysqldump -u genmapp --password=".$sqlPass; 
    1454 my $mysql_cmd = "mysql -u genmapp --password=".$sqlPass; 
     1456my $mysqldump_cmd = "mysqldump --host=mysql-dev.cgl.ucsf.edu --port=13308 -u genmapp --password=".$sqlPass; 
     1457my $mysql_cmd = "mysql --host=mysql-dev.cgl.ucsf.edu --port=13308 -u genmapp --password=".$sqlPass; 
    14551458 
    14561459## BACKUP and COPY STD TABLES? 
     
    17031706            if (!${$seen{GeneOntology}{$dbe_primary_id}}++){ 
    17041707                # Get GO term annotations using $go_adaptor 
    1705                 my $acc = $dbe_primary_id; 
    1706                 $acc =~ s/\'//g; # strip single quotes to use as variable 
    1707                 my $term = $go_adaptor->fetch_by_accession($acc); 
    1708                 my $name = mysql_quotes($term->name()); #e.g., plasma membrane 
    1709                 my $namespace = mysql_quotes($term->namespace()); # e.g., cellular component 
     1708                my $name = ""; 
     1709                my $namespace = ""; 
     1710                if ($go_adaptor){ 
     1711                        my $acc = $dbe_primary_id; 
     1712                        $acc =~ s/\'//g; # strip single quotes to use as variable 
     1713                        my $term = $go_adaptor->fetch_by_accession($acc); 
     1714                        my $name = mysql_quotes($term->name()); #e.g., plasma membrane 
     1715                        my $namespace = mysql_quotes($term->namespace()); # e.g., cellular component 
     1716                }        
    17101717                $$GeneTables{GeneOntology}{$count.$dot.$subcount{GeneOntology}} = [$dbe_primary_id, $name, $namespace]; 
    17111718                $$Ensembl_GeneTables{GeneOntology}{$count.$dot.$subcount{GeneOntology}} = [$gene_stable_id, $dbe_primary_id]; 
     
    17151722        elsif ($dbe_dbname =~ /^\'goslim/){ 
    17161723            $ADMIN_Xrefs{$dbe_dbname}[10] = "\'Y\'"; # collected 
    1717                 # Get GO term annotations using $go_adaptor 
    17181724                my $acc = $dbe_primary_id; 
    17191725                $acc =~ s/\'//g; # strip single quotes to use as variable 
    1720                 my $term = $go_adaptor->fetch_by_accession($acc); 
    1721                 my $name = mysql_quotes($term->name()); #e.g., plasma membrane 
    1722                 my $namespace = mysql_quotes($term->namespace()); # e.g., cellular component 
    1723                 if ($namespace =~ /\'biological_process\'/){ 
     1726                # Get GO term annotations using $go_adaptor 
     1727                if ($go_adaptor){ 
     1728                  my $term = $go_adaptor->fetch_by_accession($acc); 
     1729                  my $name = mysql_quotes($term->name()); #e.g., plasma membrane 
     1730                  my $namespace = mysql_quotes($term->namespace()); # e.g., cellular component 
     1731                  if ($namespace =~ /\'biological_process\'/){ 
    17241732                        $$GeneTables{GOslimBP}{$count.$dot.$subcount{GOslimBP}} = [$dbe_primary_id, $name]; 
    17251733                        $$Ensembl_GeneTables{GOslimBP}{$count.$dot.$subcount{GOslimBP}} = [$gene_stable_id, $dbe_primary_id]; 
    17261734                        ++$subcount{GOslimBP}; 
    1727                 } elsif ($namespace =~ /\'cellular_component\'/){ 
     1735                  } elsif ($namespace =~ /\'cellular_component\'/){ 
    17281736                        $$GeneTables{GOslimCC}{$count.$dot.$subcount{GOslimCC}} = [$dbe_primary_id, $name]; 
    17291737                        $$Ensembl_GeneTables{GOslimCC}{$count.$dot.$subcount{GOslimCC}} = [$gene_stable_id, $dbe_primary_id]; 
    17301738                        ++$subcount{GOslimCC}; 
    1731                 } elsif ($namespace =~ /\'molecular_function\'/){ 
     1739                  } elsif ($namespace =~ /\'molecular_function\'/){ 
    17321740                        $$GeneTables{GOslimMF}{$count.$dot.$subcount{GOslimMF}} = [$dbe_primary_id, $name]; 
    17331741                        $$Ensembl_GeneTables{GOslimMF}{$count.$dot.$subcount{GOslimMF}} = [$gene_stable_id, $dbe_primary_id]; 
    17341742                        ++$subcount{GOslimMF}; 
     1743                  } else { 
     1744                        #garbage? 
     1745                  } 
    17351746                } else { 
    1736                         #garbage? 
     1747                        # no go 
    17371748                } 
    17381749        } 
     
    20922103  ## Solution #2 only works after API method has been added 
    20932104  ## See NathJohnson_API_patch.txt 
     2105print $gene_stable_id; 
     2106print $gene; 
    20942107    my $probe_features = $probe_adaptor->fetch_all_by_linked_transcript_Gene($gene); 
    20952108