Changeset 354
- Timestamp:
- 05/16/10 00:28:39 (21 months ago)
- Location:
- trunk/dbbuilder/src/org/bridgedb/build/scripts
- Files:
-
- 3 modified
-
PathVisioMySQL_BEEF.sql (modified) (2 diffs)
-
PathVisioMySQL_BUILD.sql.template (modified) (5 diffs)
-
buildPathVisio.sh (modified) (5 diffs)
Legend:
- Unmodified
- Added
- Removed
-
trunk/dbbuilder/src/org/bridgedb/build/scripts/PathVisioMySQL_BEEF.sql
r301 r354 5 5 ## Use 'Name' for GO-Slim additions 6 6 INSERT INTO datanode 7 SELECT XXXXXX_CS_YYYYYY.gene.Name,XXXXXX_CS_YYYYYY.gene.Code8 FROM XXXXXX_CS_YYYYYY.gene9 WHERE XXXXXX_CS_YYYYYY.gene.Name != ''10 AND XXXXXX_CS_YYYYYY.gene.Code IN ("Tb", "Tc", "Tm");7 SELECT genmapp_XXXXXX_CS_YYYYYY.gene.Name, genmapp_XXXXXX_CS_YYYYYY.gene.Code 8 FROM genmapp_XXXXXX_CS_YYYYYY.gene 9 WHERE genmapp_XXXXXX_CS_YYYYYY.gene.Name != '' 10 AND genmapp_XXXXXX_CS_YYYYYY.gene.Code IN ("Tb", "Tc", "Tm"); 11 11 12 12 ## Beef up 'link' … … 14 14 INSERT INTO link 15 15 SELECT DISTINCT id_left, code_left, Name, code_right 16 FROM XXXXXX_CS_YYYYYY.link left join XXXXXX_CS_YYYYYY.gene on XXXXXX_CS_YYYYYY.link.id_right =XXXXXX_CS_YYYYYY.gene.id17 WHERE XXXXXX_CS_YYYYYY.link.Code_Right IN ("Tb", "Tc", "Tm");16 FROM genmapp_XXXXXX_CS_YYYYYY.link left join genmapp_XXXXXX_CS_YYYYYY.gene on genmapp_XXXXXX_CS_YYYYYY.link.id_right = genmapp_XXXXXX_CS_YYYYYY.gene.id 17 WHERE genmapp_XXXXXX_CS_YYYYYY.link.Code_Right IN ("Tb", "Tc", "Tm"); 18 18 19 19 -
trunk/dbbuilder/src/org/bridgedb/build/scripts/PathVisioMySQL_BUILD.sql.template
r284 r354 4 4 5 5 ##Copy Ensembl annotations (Description, Chr) to EntrezGene 6 USE XXXXXX_CS_YYYYYY;6 USE genmapp_XXXXXX_CS_YYYYYY; 7 7 #drop index index_id_right on link; 8 8 create index index_id_right on link (ID_Right); … … 33 33 34 34 ##Create database 35 DROP DATABASE IF EXISTS XXXXXX_Derby_YYYYYY;36 CREATE DATABASE XXXXXX_Derby_YYYYYY;37 USE XXXXXX_Derby_YYYYYY;35 DROP DATABASE IF EXISTS genmapp_XXXXXX_Derby_YYYYYY; 36 CREATE DATABASE genmapp_XXXXXX_Derby_YYYYYY; 37 USE genmapp_XXXXXX_Derby_YYYYYY; 38 38 39 39 ## Create 'datanode' … … 74 74 ## Fill 'info' 75 75 INSERT INTO info 76 SELECT XXXXXX_CS_YYYYYY.Info.Version, '3', 'Ensembl', XXXXXX_CS_YYYYYY.Info.Notes,XXXXXX_CS_YYYYYY.Info.Species, 'GeneProduct'77 FROM XXXXXX_CS_YYYYYY.Info;76 SELECT genmapp_XXXXXX_CS_YYYYYY.Info.Version, '3', 'Ensembl', genmapp_XXXXXX_CS_YYYYYY.Info.Notes, genmapp_XXXXXX_CS_YYYYYY.Info.Species, 'GeneProduct' 77 FROM genmapp_XXXXXX_CS_YYYYYY.Info; 78 78 79 79 ## Fill 'attribute' … … 81 81 #symbol 82 82 INSERT INTO attribute 83 SELECT DISTINCT XXXXXX_CS_YYYYYY.attr.ID,XXXXXX_CS_YYYYYY.attr.Code,84 XXXXXX_CS_YYYYYY.attr.Name,XXXXXX_CS_YYYYYY.attr.Value85 FROM XXXXXX_CS_YYYYYY.attr86 WHERE XXXXXX_CS_YYYYYY.attr.Value != '';83 SELECT DISTINCT genmapp_XXXXXX_CS_YYYYYY.attr.ID, genmapp_XXXXXX_CS_YYYYYY.attr.Code, 84 genmapp_XXXXXX_CS_YYYYYY.attr.Name, genmapp_XXXXXX_CS_YYYYYY.attr.Value 85 FROM genmapp_XXXXXX_CS_YYYYYY.attr 86 WHERE genmapp_XXXXXX_CS_YYYYYY.attr.Value != ''; 87 87 88 88 ## Fill 'datanode' 89 89 ## From CS Database 90 90 INSERT INTO datanode 91 SELECT XXXXXX_CS_YYYYYY.gene.ID,XXXXXX_CS_YYYYYY.gene.Code92 FROM XXXXXX_CS_YYYYYY.gene93 WHERE XXXXXX_CS_YYYYYY.gene.ID != ''94 AND XXXXXX_CS_YYYYYY.gene.Code IN ("EnXXXXXX","Mb","L","X","Il","Ag","Q","Om","U","Rf","S","Ip","T","Pd","H","M","R","D","Z","F","W","Gg","A","Ti","Ir","N","Uc","Pl","Gm","Bg","Ec","Wg");91 SELECT genmapp_XXXXXX_CS_YYYYYY.gene.ID, genmapp_XXXXXX_CS_YYYYYY.gene.Code 92 FROM genmapp_XXXXXX_CS_YYYYYY.gene 93 WHERE genmapp_XXXXXX_CS_YYYYYY.gene.ID != '' 94 AND genmapp_XXXXXX_CS_YYYYYY.gene.Code IN ("EnXXXXXX","Mb","L","X","Il","Ag","Q","Om","U","Rf","S","Ip","T","Pd","H","M","R","D","Z","F","W","Gg","A","Ti","Ir","N","Uc","Pl","Gm","Bg","Ec","Wg"); 95 95 96 96 ## Fill 'link' … … 98 98 INSERT INTO link 99 99 SELECT DISTINCT * 100 FROM XXXXXX_CS_YYYYYY.link101 WHERE XXXXXX_CS_YYYYYY.link.Code_Right IN ("EnXXXXXX","Mb","L","X","Il","Ag","Q","Om","U","Rf","S","Ip","T","Pd","H","M","R","D","Z","F","W","Gg","A","Ti","Ir","N","Uc","Pl","Gm","Bg","Ec","Wg");100 FROM genmapp_XXXXXX_CS_YYYYYY.link 101 WHERE genmapp_XXXXXX_CS_YYYYYY.link.Code_Right IN ("EnXXXXXX","Mb","L","X","Il","Ag","Q","Om","U","Rf","S","Ip","T","Pd","H","M","R","D","Z","F","W","Gg","A","Ti","Ir","N","Uc","Pl","Gm","Bg","Ec","Wg"); 102 102 103 ##Add En XXXXXXsembl IDs to right side of 'link' table103 ##Add Ensembl IDs to right side of 'link' table 104 104 INSERT INTO link 105 105 SELECT datanode.id, "EnXXXXXX", datanode.id, "EnXXXXXX" -
trunk/dbbuilder/src/org/bridgedb/build/scripts/buildPathVisio.sh
r301 r354 4 4 DatabaseSpecies=$1 5 5 DatabaseDate=$2 6 Database=$1_Derby_$2 7 DatabaseCS=$1_CS_$2 8 6 Database=genmapp_$1_Derby_$2 #everything in mysql on plato needs "genmapp_" prefix 7 DatabaseDb=$1_Derby_$2 8 DatabaseCS=genmapp_$1_CS_$2 9 mysql='mysql --host=mysql-dev.cgl.ucsf.edu --port=13308 -u genmapp -pfun4genmapp' 10 mysqldump='mysqldump --host=mysql-dev.cgl.ucsf.edu --port=13308 -u genmapp -pfun4genmapp' 9 11 ScriptsDir=/home/apico/Derby/scripts 10 12 … … 14 16 wget http://downloads.yeastgenome.org/gene_registry/registry.genenames.tab 15 17 mv registry.genenames.tab ${ScriptsDir}/. 16 mysql -u genmapp -pfun4genmapp-e "create table ${DatabaseCS}.sgd (a varchar(31), b varchar(31), c varchar(31), d varchar(31), e varchar(31), f varchar(31), g varchar(31))";17 mysql -u genmapp -pfun4genmapp-e "load data local infile '${ScriptsDir}/registry.genenames.tab' into table ${DatabaseCS}.sgd fields terminated by '\t' lines terminated by '\n'";18 mysql -u genmapp -pfun4genmapp-e "create index i_a on ${DatabaseCS}.sgd (a)";19 mysql -u genmapp -pfun4genmapp-e "update ${DatabaseCS}.gene, ${DatabaseCS}.sgd set ${DatabaseCS}.gene.ID = ${DatabaseCS}.sgd.g where ${DatabaseCS}.gene.Symbol = ${DatabaseCS}.sgd.a and ${DatabaseCS}.gene.Code = 'D'";20 mysql -u genmapp -pfun4genmapp-e "update ${DatabaseCS}.attr, ${DatabaseCS}.sgd set ${DatabaseCS}.attr.ID = ${DatabaseCS}.sgd.g where ${DatabaseCS}.attr.Value = ${DatabaseCS}.sgd.a and ${DatabaseCS}.attr.Code = 'D'";21 mysql -u genmapp -pfun4genmapp-e "alter table ${DatabaseCS}.link add column (ID_Right2 varchar(31))";22 mysql -u genmapp -pfun4genmapp-e "update ${DatabaseCS}.link set ID_Right2 = ID_Right where Code_Right = 'D'";23 mysql -u genmapp -pfun4genmapp-e "update ${DatabaseCS}.link, ${DatabaseCS}.sgd set ${DatabaseCS}.link.ID_Right = ${DatabaseCS}.sgd.g where ${DatabaseCS}.link.ID_Right2 = ${DatabaseCS}.sgd.a and ${DatabaseCS}.link.Code_Right = 'D'";24 mysql -u genmapp -pfun4genmapp-e "alter table ${DatabaseCS}.link drop column ID_Right2";18 ${mysql} -e "create table ${DatabaseCS}.sgd (a varchar(31), b varchar(31), c varchar(31), d varchar(31), e varchar(31), f varchar(31), g varchar(31))"; 19 ${mysql} -e "load data local infile '${ScriptsDir}/registry.genenames.tab' into table ${DatabaseCS}.sgd fields terminated by '\t' lines terminated by '\n'"; 20 ${mysql} -e "create index i_a on ${DatabaseCS}.sgd (a)"; 21 ${mysql} -e "update ${DatabaseCS}.gene, ${DatabaseCS}.sgd set ${DatabaseCS}.gene.ID = ${DatabaseCS}.sgd.g where ${DatabaseCS}.gene.Symbol = ${DatabaseCS}.sgd.a and ${DatabaseCS}.gene.Code = 'D'"; 22 ${mysql} -e "update ${DatabaseCS}.attr, ${DatabaseCS}.sgd set ${DatabaseCS}.attr.ID = ${DatabaseCS}.sgd.g where ${DatabaseCS}.attr.Value = ${DatabaseCS}.sgd.a and ${DatabaseCS}.attr.Code = 'D'"; 23 ${mysql} -e "alter table ${DatabaseCS}.link add column (ID_Right2 varchar(31))"; 24 ${mysql} -e "update ${DatabaseCS}.link set ID_Right2 = ID_Right where Code_Right = 'D'"; 25 ${mysql} -e "update ${DatabaseCS}.link, ${DatabaseCS}.sgd set ${DatabaseCS}.link.ID_Right = ${DatabaseCS}.sgd.g where ${DatabaseCS}.link.ID_Right2 = ${DatabaseCS}.sgd.a and ${DatabaseCS}.link.Code_Right = 'D'"; 26 ${mysql} -e "alter table ${DatabaseCS}.link drop column ID_Right2"; 25 27 fi 26 28 … … 29 31 30 32 ## Build a MySQL Database for PathVisio: 31 mysql -u genmapp -pfun4genmapp< PathVisioMySQL_BUILD.sql33 ${mysql} < PathVisioMySQL_BUILD.sql 32 34 33 35 … … 36 38 # Otherwise, derby build will crash when semicolons 37 39 # happen to precede key words (e.g., "negative") 38 # mysql -u genmapp -pfun4genmapp-e "update ${Database}.datanode set backpageText =replace(backpageText, \";\", \".\")";40 #${mysql} -e "update ${Database}.datanode set backpageText =replace(backpageText, \";\", \".\")"; 39 41 40 42 # remove pipes from around species name in Info table 41 mysql -u genmapp -pfun4genmapp-e "update ${Database}.info set species =replace(species, \"|\", \"\")";43 ${mysql} -e "update ${Database}.info set species =replace(species, \"|\", \"\")"; 42 44 43 45 ## Dump MySQL-PathVisio Database to .sql 44 46 # --net_buffer_length=30K (used to limit size of extended-inserts) 45 47 # --skip-extended-insert (used to force line-by-line inserts) 46 mysqldump --compatible=db2 --no-create-info --skip-add-locks --skip-disable-keys --skip-quote-names --net_buffer_length=30K -u genmapp -pfun4genmapp ${Database} > ${Database}.db2.sql.temp 48 ${mysqldump} --compatible=db2 --no-create-info --skip-add-locks --skip-disable-keys --skip-quote-names --net_buffer_length=30K ${Database} > ${DatabaseDb}.db2.sql.temp 49 ## Dump table creation statements separately for 2-step recontruction later (e.g., for bridgedb rest server) 50 ${mysqldump} --no-data ${Database} > ${DatabaseDb}.db2.sql.tables 47 51 48 52 ## Clean up dump file 49 53 # Replace in emacs using esc-% (! = all occurances) 50 54 # Replace in vi using :%s/old/new/g (use vi if file is too large for emacs) 51 cat ${Database }.db2.sql.temp | sed "s/\/\*/--/g" | sed "s/\\\'/\'\'/g" > ${Database}.db2.sql55 cat ${DatabaseDb}.db2.sql.temp | sed "s/\/\*/--/g" | sed "s/\\\'/\'\'/g" > ${DatabaseDb}.db2.sql 52 56 53 57 ## Create & Fill Derby via ij tool … … 56 60 export CLASSPATH=$DERBY_INSTALL/lib/derby.jar:$DERBY_INSTALL/lib/derbytools.jar:. 57 61 # Run ij Tool 58 cat ${ScriptsDir}/PathVisioDerby_BUILD.ij.template | sed "s/XXXXXX/${Database }/g" | perl ${ScriptsDir}/replacePath.pl ${ScriptsDir} > PathVisioDerby_BUILD.ij62 cat ${ScriptsDir}/PathVisioDerby_BUILD.ij.template | sed "s/XXXXXX/${DatabaseDb}/g" | perl ${ScriptsDir}/replacePath.pl ${ScriptsDir} > PathVisioDerby_BUILD.ij 59 63 60 64 java -XX:MaxPermSize=128m -Xmx1024m org.apache.derby.tools.ij PathVisioDerby_BUILD.ij 61 65 62 66 # Package it up 63 mv ${Database } database64 zip -r -0 ${Database }.bridge database/65 mv database ${Database }67 mv ${DatabaseDb} database 68 zip -r -0 ${DatabaseDb}.bridge database/ 69 mv database ${DatabaseDb} 66 70 67 71 ## Beef up MySQL version of Derby databases for web service deployment 68 mysql -u genmapp -pfun4genmapp< PathVisioMySQL_BEEF.sql69 mysqldump --skip-add-locks --skip-disable-keys --skip-quote-names --net_buffer_length=30K -u genmapp -pfun4genmapp ${Database} > ${Database}.sql.dump72 ${mysql} < PathVisioMySQL_BEEF.sql 73 ${mysqldump} --skip-add-locks --skip-disable-keys --skip-quote-names --net_buffer_length=30K ${Database} > ${DatabaseDb}.sql.dump 70 74 71 75 # report on products (check size > 1.9M) 72 ls -lh ${Database }.bridge | echo76 ls -lh ${DatabaseDb}.bridge | echo 73 77 74 78 # BELOW: Not yet automated 75 79 # - ssh-key authentication not working 76 #scp ${Database }.bridge genmappftp@conklinwolf.ucsf.edu: (password=genmappftp)77 #scp ${Database }.bridge jeff@conklinwolf.ucsf.edu:/home2/GenMAPP2_DataTreeRoot/Derby/ (1357jeff)80 #scp ${DatabaseDb}.bridge genmappftp@conklinwolf.ucsf.edu: (password=genmappftp) 81 #scp ${DatabaseDb}.bridge jeff@conklinwolf.ucsf.edu:/home2/GenMAPP2_DataTreeRoot/Derby/ (1357jeff) 78 82 79 83 # Install at WikiPathways
