|
8 | 8 | """Inspirehep initial revision of migrations, |
9 | 9 | which makes the db identical to the one in inspire-next.""" |
10 | 10 |
|
11 | | -import sqlalchemy as sa |
12 | | -from alembic import op |
13 | | -from sqlalchemy.dialects import postgresql |
14 | 11 |
|
15 | 12 | # revision identifiers, used by Alembic. |
16 | 13 | revision = "7be4c8b5c5e8" |
|
19 | 16 |
|
20 | 17 | """Migrations that inspirehep requires and depends on: |
21 | 18 | 07fb52561c5c - invenio-records, |
22 | | - 1ba76da94103 - invenio-records-files |
23 | | - f741aa746a7d - invenio-files-rest |
24 | 19 | e12419831262 - invenio-accounts |
25 | 20 | """ |
26 | | -depends_on = "07fb52561c5c", "1ba76da94103", "f741aa746a7d", "e12419831262" |
| 21 | +depends_on = "07fb52561c5c", "e12419831262" |
27 | 22 |
|
28 | 23 |
|
29 | 24 | def upgrade(): |
30 | 25 | # """Upgrade database.""" |
31 | | - op.create_table( |
32 | | - "workflows_workflow", |
33 | | - sa.Column("uuid", postgresql.UUID(), autoincrement=False, nullable=False), |
34 | | - sa.Column("name", sa.VARCHAR(length=255), autoincrement=False, nullable=False), |
35 | | - sa.Column( |
36 | | - "created", postgresql.TIMESTAMP(), autoincrement=False, nullable=False |
37 | | - ), |
38 | | - sa.Column( |
39 | | - "modified", postgresql.TIMESTAMP(), autoincrement=False, nullable=False |
40 | | - ), |
41 | | - sa.Column("id_user", sa.INTEGER(), autoincrement=False, nullable=False), |
42 | | - sa.Column( |
43 | | - "extra_data", |
44 | | - postgresql.JSON(astext_type=sa.Text()), |
45 | | - autoincrement=False, |
46 | | - nullable=False, |
47 | | - ), |
48 | | - sa.Column("status", sa.INTEGER(), autoincrement=False, nullable=False), |
49 | | - sa.PrimaryKeyConstraint("uuid", name="pk_workflows_workflow"), |
50 | | - ) |
51 | | - op.create_table( |
52 | | - "workflows_object", |
53 | | - sa.Column( |
54 | | - "id", |
55 | | - sa.INTEGER(), |
56 | | - server_default=sa.text("nextval('workflows_object_id_seq'::regclass)"), |
57 | | - autoincrement=True, |
58 | | - nullable=False, |
59 | | - ), |
60 | | - sa.Column( |
61 | | - "data", |
62 | | - postgresql.JSON(astext_type=sa.Text()), |
63 | | - autoincrement=False, |
64 | | - nullable=False, |
65 | | - ), |
66 | | - sa.Column( |
67 | | - "extra_data", |
68 | | - postgresql.JSON(astext_type=sa.Text()), |
69 | | - autoincrement=False, |
70 | | - nullable=False, |
71 | | - ), |
72 | | - sa.Column("id_workflow", postgresql.UUID(), autoincrement=False, nullable=True), |
73 | | - sa.Column("status", sa.INTEGER(), autoincrement=False, nullable=False), |
74 | | - sa.Column("id_parent", sa.INTEGER(), autoincrement=False, nullable=True), |
75 | | - sa.Column("id_user", sa.INTEGER(), autoincrement=False, nullable=False), |
76 | | - sa.Column( |
77 | | - "created", postgresql.TIMESTAMP(), autoincrement=False, nullable=False |
78 | | - ), |
79 | | - sa.Column( |
80 | | - "modified", postgresql.TIMESTAMP(), autoincrement=False, nullable=False |
81 | | - ), |
82 | | - sa.Column( |
83 | | - "data_type", sa.VARCHAR(length=150), autoincrement=False, nullable=True |
84 | | - ), |
85 | | - sa.Column( |
86 | | - "callback_pos", |
87 | | - postgresql.JSON(astext_type=sa.Text()), |
88 | | - autoincrement=False, |
89 | | - nullable=True, |
90 | | - ), |
91 | | - sa.ForeignKeyConstraint( |
92 | | - ["id_parent"], |
93 | | - ["workflows_object.id"], |
94 | | - name="fk_workflows_object_id_parent_workflows_object", |
95 | | - ondelete="CASCADE", |
96 | | - ), |
97 | | - sa.ForeignKeyConstraint( |
98 | | - ["id_workflow"], |
99 | | - ["workflows_workflow.uuid"], |
100 | | - name="fk_workflows_object_id_workflow_workflows_workflow", |
101 | | - ondelete="CASCADE", |
102 | | - ), |
103 | | - sa.PrimaryKeyConstraint("id", name="pk_workflows_object"), |
104 | | - postgresql_ignore_search_path=False, |
105 | | - ) |
106 | | - op.create_index( |
107 | | - "ix_workflows_object_status", "workflows_object", ["status"], unique=False |
108 | | - ) |
109 | | - op.create_index( |
110 | | - "ix_workflows_object_id_workflow", |
111 | | - "workflows_object", |
112 | | - ["id_workflow"], |
113 | | - unique=False, |
114 | | - ) |
115 | | - op.create_index( |
116 | | - "ix_workflows_object_id_parent", "workflows_object", ["id_parent"], unique=False |
117 | | - ) |
118 | | - op.create_index( |
119 | | - "ix_workflows_object_data_type", "workflows_object", ["data_type"], unique=False |
120 | | - ) |
121 | | - op.create_table( |
122 | | - "workflows_buckets", |
123 | | - sa.Column( |
124 | | - "workflow_object_id", sa.INTEGER(), autoincrement=False, nullable=False |
125 | | - ), |
126 | | - sa.Column("bucket_id", postgresql.UUID(), autoincrement=False, nullable=False), |
127 | | - sa.ForeignKeyConstraint( |
128 | | - ["bucket_id"], |
129 | | - ["files_bucket.id"], |
130 | | - name="fk_workflows_buckets_bucket_id_files_bucket", |
131 | | - onupdate="CASCADE", |
132 | | - ondelete="CASCADE", |
133 | | - ), |
134 | | - sa.ForeignKeyConstraint( |
135 | | - ["workflow_object_id"], |
136 | | - ["workflows_object.id"], |
137 | | - name="fk_workflows_buckets_workflow_object_id_workflows_object", |
138 | | - onupdate="CASCADE", |
139 | | - ondelete="CASCADE", |
140 | | - ), |
141 | | - sa.PrimaryKeyConstraint( |
142 | | - "workflow_object_id", "bucket_id", name="pk_workflows_buckets" |
143 | | - ), |
144 | | - ) |
145 | | - op.create_table( |
146 | | - "workflows_audit_logging", |
147 | | - sa.Column("id", sa.INTEGER(), autoincrement=True, nullable=False), |
148 | | - sa.Column("user_id", sa.INTEGER(), autoincrement=False, nullable=True), |
149 | | - sa.Column( |
150 | | - "score", |
151 | | - postgresql.DOUBLE_PRECISION(precision=53), |
152 | | - autoincrement=False, |
153 | | - nullable=False, |
154 | | - ), |
155 | | - sa.Column("user_action", sa.TEXT(), autoincrement=False, nullable=False), |
156 | | - sa.Column("decision", sa.TEXT(), autoincrement=False, nullable=False), |
157 | | - sa.Column("source", sa.TEXT(), autoincrement=False, nullable=False), |
158 | | - sa.Column("action", sa.TEXT(), autoincrement=False, nullable=False), |
159 | | - sa.Column( |
160 | | - "created", postgresql.TIMESTAMP(), autoincrement=False, nullable=False |
161 | | - ), |
162 | | - sa.Column("object_id", sa.INTEGER(), autoincrement=False, nullable=False), |
163 | | - sa.ForeignKeyConstraint( |
164 | | - ["object_id"], |
165 | | - ["workflows_object.id"], |
166 | | - name="fk_workflows_audit_logging_object_id_workflows_object", |
167 | | - ondelete="CASCADE", |
168 | | - ), |
169 | | - sa.ForeignKeyConstraint( |
170 | | - ["user_id"], |
171 | | - ["accounts_user.id"], |
172 | | - name="fk_workflows_audit_logging_user_id_accounts_user", |
173 | | - ondelete="CASCADE", |
174 | | - ), |
175 | | - sa.PrimaryKeyConstraint("id", name="pk_workflows_audit_logging"), |
176 | | - ) |
177 | | - op.create_index( |
178 | | - "ix_workflows_audit_logging_user_id", |
179 | | - "workflows_audit_logging", |
180 | | - ["user_id"], |
181 | | - unique=False, |
182 | | - ) |
183 | | - op.create_index( |
184 | | - "ix_workflows_audit_logging_object_id", |
185 | | - "workflows_audit_logging", |
186 | | - ["object_id"], |
187 | | - unique=False, |
188 | | - ) |
189 | | - op.create_table( |
190 | | - "crawler_job", |
191 | | - sa.Column("id", sa.INTEGER(), autoincrement=True, nullable=False), |
192 | | - sa.Column("job_id", postgresql.UUID(), autoincrement=False, nullable=True), |
193 | | - sa.Column("spider", sa.VARCHAR(length=255), autoincrement=False, nullable=True), |
194 | | - sa.Column( |
195 | | - "workflow", sa.VARCHAR(length=255), autoincrement=False, nullable=True |
196 | | - ), |
197 | | - sa.Column("results", sa.TEXT(), autoincrement=False, nullable=True), |
198 | | - sa.Column("status", sa.VARCHAR(length=10), autoincrement=False, nullable=False), |
199 | | - sa.Column("logs", sa.TEXT(), autoincrement=False, nullable=True), |
200 | | - sa.Column( |
201 | | - "scheduled", postgresql.TIMESTAMP(), autoincrement=False, nullable=False |
202 | | - ), |
203 | | - sa.PrimaryKeyConstraint("id", name="pk_crawler_job"), |
204 | | - ) |
205 | | - op.create_index( |
206 | | - "ix_crawler_job_workflow", "crawler_job", ["workflow"], unique=False |
207 | | - ) |
208 | | - op.create_index("ix_crawler_job_spider", "crawler_job", ["spider"], unique=False) |
209 | | - op.create_index( |
210 | | - "ix_crawler_job_scheduled", "crawler_job", ["scheduled"], unique=False |
211 | | - ) |
212 | | - op.create_index("ix_crawler_job_job_id", "crawler_job", ["job_id"], unique=False) |
213 | | - op.create_table( |
214 | | - "crawler_workflows_object", |
215 | | - sa.Column("job_id", postgresql.UUID(), autoincrement=False, nullable=False), |
216 | | - sa.Column("object_id", sa.INTEGER(), autoincrement=False, nullable=False), |
217 | | - sa.ForeignKeyConstraint( |
218 | | - ["object_id"], |
219 | | - ["workflows_object.id"], |
220 | | - name="fk_crawler_workflows_object_object_id_workflows_object", |
221 | | - onupdate="CASCADE", |
222 | | - ondelete="CASCADE", |
223 | | - ), |
224 | | - sa.PrimaryKeyConstraint( |
225 | | - "job_id", "object_id", name="pk_crawler_workflows_object" |
226 | | - ), |
227 | | - ) |
228 | | - op.create_table( |
229 | | - "workflows_pending_record", |
230 | | - sa.Column("workflow_id", sa.INTEGER(), autoincrement=False, nullable=False), |
231 | | - sa.Column("record_id", sa.INTEGER(), autoincrement=False, nullable=False), |
232 | | - sa.ForeignKeyConstraint( |
233 | | - ["workflow_id"], |
234 | | - ["workflows_object.id"], |
235 | | - name="fk_workflows_pending_record_workflow_id_workflows_object", |
236 | | - ondelete="CASCADE", |
237 | | - ), |
238 | | - sa.PrimaryKeyConstraint("workflow_id", name="pk_workflows_pending_record"), |
239 | | - ) |
240 | | - op.create_table( |
241 | | - "workflows_record_sources", |
242 | | - sa.Column( |
243 | | - "source", |
244 | | - postgresql.ENUM("arxiv", "submitter", "publisher", name="source_enum"), |
245 | | - autoincrement=False, |
246 | | - nullable=False, |
247 | | - ), |
248 | | - sa.Column( |
249 | | - "record_uuid", postgresql.UUID(), autoincrement=False, nullable=False |
250 | | - ), |
251 | | - sa.Column( |
252 | | - "json", |
253 | | - postgresql.JSONB(astext_type=sa.Text()), |
254 | | - autoincrement=False, |
255 | | - nullable=True, |
256 | | - ), |
257 | | - sa.Column( |
258 | | - "created", postgresql.TIMESTAMP(), autoincrement=False, nullable=True |
259 | | - ), |
260 | | - sa.Column( |
261 | | - "updated", postgresql.TIMESTAMP(), autoincrement=False, nullable=True |
262 | | - ), |
263 | | - sa.ForeignKeyConstraint( |
264 | | - ["record_uuid"], |
265 | | - ["records_metadata.id"], |
266 | | - name="fk_workflows_record_sources_record_uuid_records_metadata", |
267 | | - ondelete="CASCADE", |
268 | | - ), |
269 | | - sa.PrimaryKeyConstraint( |
270 | | - "record_uuid", "source", name="pk_workflows_record_sources" |
271 | | - ), |
272 | | - ) |
273 | | - op.execute( |
274 | | - """ |
275 | | - CREATE OR REPLACE FUNCTION referenced_records(json jsonb) RETURNS TEXT[] AS $$ |
276 | | - DECLARE |
277 | | - reference_arr jsonb; |
278 | | - text_val text; |
279 | | - text_arr_val text[]; |
280 | | - ret_val text[]; |
281 | | - BEGIN |
282 | | - FOR reference_arr IN (SELECT jsonb_array_elements(json->'references')) LOOP |
283 | | - text_val := split_part(reference_arr->'record'->>'$ref',E'api/',2); |
284 | | - IF text_val != '' THEN |
285 | | - text_arr_val := regexp_split_to_array(text_val, E'/'); |
286 | | - ret_val:=array_append(ret_val, text_arr_val[2]||substring(text_arr_val[1] for 3)); |
287 | | - END IF; |
288 | | - END LOOP; |
289 | | - RETURN ret_val; |
290 | | - END; |
291 | | - $$ LANGUAGE plpgsql IMMUTABLE; |
292 | | - """ |
293 | | - ) |
294 | | - |
295 | | - op.execute( |
296 | | - """ |
297 | | - CREATE INDEX ix_records_metadata_json_referenced_records_2_0 |
298 | | - ON records_metadata |
299 | | - USING gin(referenced_records(json)) |
300 | | - """ |
301 | | - ) |
| 26 | + pass |
302 | 27 |
|
303 | 28 |
|
304 | 29 | def downgrade(): |
305 | 30 | # """Downgrade database.""" |
306 | | - op.execute("drop index if exists ix_records_metadata_json_referenced_records_2_0") |
307 | | - op.execute("drop function if exists referenced_records(json jsonb)") |
308 | | - op.drop_table("workflows_record_sources") |
309 | | - op.drop_table("workflows_pending_record") |
310 | | - op.drop_table("crawler_workflows_object") |
311 | | - op.drop_index("ix_crawler_job_job_id", table_name="crawler_job") |
312 | | - op.drop_index("ix_crawler_job_scheduled", table_name="crawler_job") |
313 | | - op.drop_index("ix_crawler_job_spider", table_name="crawler_job") |
314 | | - op.drop_index("ix_crawler_job_workflow", table_name="crawler_job") |
315 | | - op.drop_table("crawler_job") |
316 | | - op.drop_index( |
317 | | - "ix_workflows_audit_logging_object_id", table_name="workflows_audit_logging" |
318 | | - ) |
319 | | - op.drop_index( |
320 | | - "ix_workflows_audit_logging_user_id", table_name="workflows_audit_logging" |
321 | | - ) |
322 | | - op.drop_table("workflows_audit_logging") |
323 | | - op.drop_table("workflows_buckets") |
324 | | - op.drop_index("ix_workflows_object_data_type", table_name="workflows_object") |
325 | | - op.drop_index("ix_workflows_object_id_parent", table_name="workflows_object") |
326 | | - op.drop_index("ix_workflows_object_id_workflow", table_name="workflows_object") |
327 | | - op.drop_index("ix_workflows_object_status", table_name="workflows_object") |
328 | | - op.drop_table("workflows_object") |
329 | | - op.drop_table("workflows_workflow") |
330 | | - op.execute("DROP TYPE IF EXISTS source_enum") |
| 31 | + pass |
0 commit comments