-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathDatasetPresenterTTUtils.pm
More file actions
188 lines (142 loc) · 5.76 KB
/
DatasetPresenterTTUtils.pm
File metadata and controls
188 lines (142 loc) · 5.76 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
package EbrcModelCommon::Model::DatasetPresenterTTUtils;
use strict;
use warnings;
require Exporter;
our @ISA = qw(Exporter);
our @EXPORT_OK = qw(
getProjectListFromDb
getModelProjectBase
getPresenterFilePaths
);
=head1 NAME
DatasetPresenterTTUtils - Shared utilities for DatasetPresenter tuning table scripts
=head1 SYNOPSIS
use DatasetPresenterTTUtils qw(getProjectListFromDb getPresenterFilePaths);
my @projects = getProjectListFromDb($dbh, $instance, $PROJECT_HOME);
my @filePaths = getPresenterFilePaths($PROJECT_HOME, \@projects);
=head1 DESCRIPTION
This module provides shared functionality for scripts that work with DatasetPresenter
tuning tables. It encapsulates the logic for discovering projects from the database,
determining which model projects to use, and locating all required resource files.
=head1 FUNCTIONS
=head2 getProjectListFromDb($dbh, $instance, $PROJECT_HOME)
Queries the database to determine which projects are available.
Returns an array of hashrefs, each containing:
- project_id: The project ID (e.g., "PlasmoDB")
- lower_project_id: Lowercase version (e.g., "plasmodb")
- model_project_base: Which model project to use (ApiCommonModel, MicrobiomeModel, ClinEpiModel)
Arguments:
$dbh - Database handle
$instance - Database instance string
$PROJECT_HOME - PROJECT_HOME environment variable
=cut
sub getProjectListFromDb {
my ($dbh, $instance, $PROJECT_HOME) = @_;
my $sql;
if ($instance =~ /\/eda/i) {
$sql = <<SQL;
select 'EDA' as project_id, lower('EDA') as lower_project_id
SQL
} elsif ($PROJECT_HOME =~ /\/eupa/i) {
$sql = <<SQL;
SELECT project_id, lower(project_id) as lower_project_id
FROM (SELECT DISTINCT project_id FROM GenomicSeqAttributes) t1
SQL
} elsif ($PROJECT_HOME =~ /\/uni/i || $instance =~ /genomics/) {
$sql = <<SQL;
SELECT project_id, lower(project_id) as lower_project_id
FROM (SELECT DISTINCT project_id from webready.GenomicSeqAttributes_p) t1
UNION
SELECT 'UniDB' AS project_id, 'unidb' as lower_project_id
SQL
} else {
$sql = <<SQL;
SELECT project_id, lower(project_id) as lower_project_id
FROM (
SELECT DISTINCT pi.name as project_id from Core.ProjectInfo pi, SRes.ExternalDatabase ed
WHERE ed.row_project_id = pi.project_id
) t1
SQL
}
my $projectQuery = $dbh->prepare($sql);
$projectQuery->execute() or die "Error getting list of project IDs";
my @projects;
while (my ($project_id, $lower_project_id) = $projectQuery->fetchrow_array()) {
my $model_project_base = getModelProjectBase($lower_project_id);
push @projects, {
project_id => $project_id,
lower_project_id => $lower_project_id,
model_project_base => $model_project_base,
};
}
$projectQuery->finish();
return @projects;
}
=head2 getModelProjectBase($lower_project_id)
Determines which model project base to use for a given project.
Arguments:
$lower_project_id - Lowercase project ID
Returns:
String: "MicrobiomeModel", "ClinEpiModel", or "ApiCommonModel"
=cut
sub getModelProjectBase {
my ($lower_project_id) = @_;
if ($lower_project_id =~ /eda/ || $lower_project_id =~ /microbiome/) {
return "MicrobiomeModel";
} elsif ($lower_project_id =~ /clinepidb/) {
return "ClinEpiModel";
} else {
return "ApiCommonModel";
}
}
=head2 getPresenterFilePaths($PROJECT_HOME, \@projects)
Returns an array of all resource file paths that would be read by the
buildDatasetPresentersTT script.
Arguments:
$PROJECT_HOME - PROJECT_HOME environment variable
\@projects - Array reference of project hashrefs from getProjectListFromDb()
Returns:
Array of file paths in the order they would be accessed
=cut
sub getPresenterFilePaths {
my ($PROJECT_HOME, $projects_ref) = @_;
my @filePaths;
my $primary_model_base;
# Add project-specific XML files
# Uses "last one wins" logic from original script for determining model base
foreach my $project (@$projects_ref) {
my $project_id = $project->{project_id};
my $lower_project_id = $project->{lower_project_id};
my $model_project_base = $project->{model_project_base};
if ($lower_project_id =~ /eda/) {
# EDA databases include all three project types
push @filePaths, "$PROJECT_HOME/MicrobiomePresenters/Model/lib/xml/datasetPresenters/MicrobiomeDB.xml";
push @filePaths, "$PROJECT_HOME/ClinEpiPresenters/Model/lib/xml/datasetPresenters/ClinEpiDB.xml";
push @filePaths, "$PROJECT_HOME/ApiCommonPresenters/Model/lib/xml/datasetPresenters/VectorBase.xml";
$primary_model_base = $model_project_base;
} elsif ($lower_project_id =~ /microbiome/) {
push @filePaths, "$PROJECT_HOME/MicrobiomePresenters/Model/lib/xml/datasetPresenters/${project_id}.xml";
$primary_model_base = $model_project_base;
} elsif ($lower_project_id =~ /clinepidb/) {
push @filePaths, "$PROJECT_HOME/ClinEpiPresenters/Model/lib/xml/datasetPresenters/${project_id}.xml";
$primary_model_base = $model_project_base;
} else {
push @filePaths, "$PROJECT_HOME/ApiCommonPresenters/Model/lib/xml/datasetPresenters/${project_id}.xml";
$primary_model_base = $model_project_base;
}
}
# Add shared resource files
push @filePaths, "$PROJECT_HOME/EbrcModelCommon/Model/lib/xml/datasetPresenters/global.xml";
push @filePaths, "$PROJECT_HOME/EbrcModelCommon/DatasetPresenter/lib/xml/datasetPresenters/datasetPresenters.dtd";
push @filePaths, "$PROJECT_HOME/$primary_model_base/Model/config/datasetReferences.tab";
push @filePaths, "$PROJECT_HOME/$primary_model_base/Model/config/datasetLinks.xml";
push @filePaths, "$PROJECT_HOME/EbrcModelCommon/Model/lib/xml/datasetPresenters/contacts/allContacts.xml";
return @filePaths;
}
1;
__END__
=head1 AUTHOR
VEuPathDB
=head1 SEE ALSO
buildDatasetPresentersTT, needsUpdateDatasetPresentersTT
=cut