-
Notifications
You must be signed in to change notification settings - Fork 0
/
get_xref.pl
116 lines (90 loc) · 2.98 KB
/
get_xref.pl
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
#! /usr/bin/perl -w
# Guglielmo Roma
$|=1;
use strict;
BEGIN {
require "/home/roma/src/scripts/unitrap2/unitrap_conf.pl";
};
use strict;
use DBI;
use Getopt::Long;
use Bio::EnsEMBL::Registry;
# Command-line synopsis, shown for -h/-help and when option parsing fails.
my $USAGE = "get_xref.pl [-debug] [-h help]";

my ( $debug, $help );
GetOptions(
    'debug'  => \$debug,
    'help|h' => \$help,
) or die "Usage: $USAGE\n";

if ($help) {
    print "Usage: $USAGE\n";
    exit 0;
}

#### Configuration options
# %::conf is presumably populated by the unitrap_conf.pl file required in the
# BEGIN block at the top of this script -- TODO confirm.
my %conf = %::conf;

my ( $traphost, $trapuser, $trappass, $trapdbname )
    = @conf{qw(traphost trapuser trappass trapdbname)};
my ( $enshost, $ensuser, $enspass, $ensdbname )
    = @conf{qw(enshost ensuser enspass ensdbname)};

my $registry = 'Bio::EnsEMBL::Registry';
$registry->load_registry_from_db(
    -host     => $enshost,
    -user     => $ensuser,
    -pass     => $enspass,
    -database => $ensdbname,
);

#### Connecting to unitrap_db
my $trapdb = DBI->connect(
    "DBI:mysql:database=$trapdbname;host=$traphost;port=3306",
    $trapuser, $trappass
) or die "Can't connect: $DBI::errstr";

# NOTE(review): this handle is not used anywhere else in the script; it is
# kept so that a bad Ensembl connection still aborts the run as before.
my $ensdb = DBI->connect(
    "DBI:mysql:database=$ensdbname;host=$enshost;port=3306",
    $ensuser, $enspass
) or die "Can't connect: $DBI::errstr";

# From here on, any DBI error on the trap database raises an exception.
$trapdb->{RaiseError} = 1;

my $st1 = "select distinct ensembl_id from trapens where (source = 'ENSMUSG' || source = 'REFSEQ')";
if ($debug) { print "SQL CODE: $st1\n"; }

my $sth = $trapdb->prepare($st1);
$sth->execute();

# Loop-invariant lookups: the gene adaptor and the list of external databases
# whose cross-references are copied into the xref table.
my $gene_adaptor = $registry->get_adaptor( 'Mouse', 'Core', 'Gene' )
    or die "Can't get the Mouse/Core/Gene adaptor from the registry\n";
my @db_names = qw(RefSeq_dna RefSeq_peptide UniGene MGI miRBase MIM_MORBID GO Uniprot/SWISSPROT Uniprot/SPTREMBL);

ENSID:
while ( my ($ensid) = $sth->fetchrow_array ) {
    next ENSID unless defined $ensid;    # NULL ensembl_id: nothing to look up
    $debug && print "---> $ensid\n";

    my $gene = $gene_adaptor->fetch_by_stable_id($ensid);
    if ( !$gene ) {
        # Without this guard an unknown id would abort the whole run with
        # "Can't call method ... on an undefined value".
        warn "No Ensembl gene found for $ensid, skipping\n";
        next ENSID;
    }

    for my $db (@db_names) {
        print "DB $db\n";

        for my $dblink ( @{ $gene->get_all_DBLinks($db) } ) {
            # get_all_DBLinks returns DBEntry objects; the accession is the
            # object's primary_id, not the stringified reference.
            my $accession = ref $dblink ? $dblink->primary_id : $dblink;
            next unless defined $accession;

            print "Accession $accession\n";
            # Strip a "<dbname>:" prefix; \Q..\E keeps characters of the
            # database name from being read as regex syntax.
            $accession =~ s/\Q$db\E://;
            print "new Accession $accession\n";

            my %toinsert = (
                accession  => $accession,
                ensembl_id => $ensid,
                dbname     => $db,
            );
            my $st = prepare_stmt( $trapdb, \%toinsert );
            insert_set( $trapdb, $st, 'xref' );
        }
    }
}

# Close both connections explicitly instead of relying on global destruction.
$trapdb->disconnect;
$ensdb->disconnect;
############################ sub
# Build the "col = value , col = value" list used after "INSERT ... SET".
#
# Arguments:
#   $dbh - database handle; its quote() method escapes and quotes each value.
#          If no handle is passed, values are escaped by hand and wrapped in
#          double quotes (the format this sub used historically).
#   $par - reference to a hash of column name => value.
#
# Returns the assignment list as one string, columns in sorted order so the
# generated SQL is reproducible; an empty string when the hash is empty.
# An undefined value is emitted as NULL.
#
# Column names are interpolated verbatim and must come from trusted code.
sub prepare_stmt {
    my ( $dbh, $par ) = @_;
    my %params = %{ $par || {} };

    # Choose the value-quoting strategy once, outside the per-column loop.
    my $quote_value = $dbh
        ? sub { return $dbh->quote( $_[0] ) }
        : sub {
            my ($value) = @_;
            return 'NULL' if !defined $value;
            $value =~ s/(["\\])/\\$1/g;    # escape embedded quotes and backslashes
            return qq{"$value"};
        };

    return join ' , ',
        map { "$_ = " . $quote_value->( $params{$_} ) } sort keys %params;
}
# Run "INSERT INTO <table> SET <assignments>" and return the new row's id.
#
# Arguments:
#   $dbh        - database handle used to prepare the statement.
#   $stmt       - assignment list, e.g. the string built by prepare_stmt.
#   $table_name - target table; interpolated verbatim, so it must be trusted.
#
# Returns the statement handle's 'mysql_insertid' attribute on success.
# If prepare or execute reports failure by returning false, a warning is
# issued and nothing (undef in scalar context) is returned. When the handle
# has RaiseError set, DBI throws before these checks are reached and the
# exception propagates to the caller.
sub insert_set {
    my ( $dbh, $stmt, $table_name ) = @_;

    my $sql = "INSERT INTO $table_name SET $stmt";
    print STDERR "### doing insert $sql ###\n";

    my $sth = $dbh->prepare($sql);
    if ( !$sth ) {
        my $err = $dbh->errstr;
        $err = 'unknown error' unless defined $err;
        warn "insert failed : $err";
        return;
    }

    # execute returns a true value ("0E0") even when zero rows are affected,
    # so a false result always means failure.
    if ( !$sth->execute() ) {
        my $err = $sth->errstr;
        $err = 'unknown error' unless defined $err;
        warn "insert failed : $err";
        return;
    }

    return $sth->{'mysql_insertid'};
}