Changeset 517

Show
Ignore:
Timestamp:
05/26/11 04:28:12 (12 months ago)
Author:
AlexanderPico
Message:

adapted to collect probes and probesets, skipping problematic probe_features and Ex- (all exon) arrays

Files:
1 modified

Legend:

Unmodified
Added
Removed
  • trunk/dbbuilder/src/org/bridgedb/extract/Ensembl_ETL_Device_v18_local.pl

    r468 r517  
    427 427 my $slice_adaptor = $registry->get_adaptor($species, "core", "slice");
    428 428 my $go_adaptor = $registry->get_adaptor("Multi", "Ontology", "GOTerm");
    429     my $probe_adaptor = $registry->get_adaptor($species, "funcgen", "ProbeFeature");
        429 my $probe_feature_adaptor = $registry->get_adaptor($species, "funcgen", "ProbeFeature");
        430 my $probe_adaptor = $registry->get_adaptor($species, "funcgen", "Probe");
        431 my $probe_set_adaptor = $registry->get_adaptor($species, "funcgen", "Probeset");
    430 432 my @dbas = @{Bio::EnsEMBL::Registry->get_all_DBAdaptors(-species => $species)};
    431 433 my $dbname = $dbas[0]->dbc->dbname();        # e.g., core_mus_musculus_42_36c
     
    2178 2180   ## Solution #2 only works after API method has been added
    2179 2181   ## See NathJohnson_API_patch.txt
    2180          my $probe_features = $probe_adaptor->fetch_all_by_linked_transcript_Gene($gene);
    2181
    2182          foreach my $pf (@$probe_features) {
    2183            my $probe = $pf->probe();
         2182     #my @probe_features = @{$probe_feature_adaptor->fetch_all_by_linked_transcript_Gene($gene)};
         2183     my @probes = @{$probe_adaptor->fetch_all_by_linked_transcript_Gene($gene)};
         2184     my @probe_sets = @{$probe_set_adaptor->fetch_all_by_linked_transcript_Gene($gene)};
         2185     my @all_probes = (@probes, @probe_sets);
         2186
         2187     foreach my $probe (@all_probes) {
         2188       #my $probe = $pf->probe();
    2184 2189       my $array_list = $probe->get_all_Arrays();
    2185 2190
     
    2189 2194         }
    2190 2195         my $pf_dbname = mysql_quotes($array->vendor());
    2191              my $pf_display_id = mysql_quotes($probe->get_probename($array->name()));
         2196         my $pf_display_id = 'null';
    2192 2197         if ($pf_dbname =~ /^\'AFFY/i) { # Affy uses probesets
    2193                      $pf_display_id = mysql_quotes($probe->probeset()->name());
    2194              }
         2198                 $pf_display_id = mysql_quotes($probe->name()); ##probeset()->name());
         2199         } else {
         2200                 $pf_display_id = mysql_quotes($probe->get_probename($array->name()));
         2201         }
         2202
    2195 2203         my $pf_primary_id = $pf_display_id;
    2196 2204         my $pf_description = mysql_quotes($array->description());
     
    2200 2208         my $pf_info_text = mysql_quotes($array->type());
    2201 2209         my $pf_info_type = mysql_quotes("SEQUENCE_MATCH"); #enum
    2202              my $pf_synonyms = $probe->get_all_probenames();
    2203              my $pf_syns = join("|", @$pf_synonyms);
         2210         #my $pf_synonyms = $probe->get_all_probenames();
         2211         my $pf_syns = ''; ##join("|", @$pf_synonyms);
    2204 2212         $pf_syns = mysql_quotes($pf_syns);
    2205 2213
     
    2209 2217                              $pf_release, $pf_status, $pf_version, $pf_info_text, $pf_info_type];
    2210 2218
    2211              if ($pf_dbname =~ /^\'AFFY/i){  #catch all types
         2219         if ($pf_dbname =~ /^\'AFFY/i && $pf_release !~ /Ex-/){  #catch all types #skip all exon arrays
    2212 2220             $ADMIN_Xrefs{$pf_dbname}[10] = "\'Y\'"; # collected
    2213 2221             if (!${$seen{Affy}{$pf_primary_id}}++){