-
Notifications
You must be signed in to change notification settings - Fork 46
Expand file tree
/
Copy pathsample_data.sql
More file actions
589 lines (504 loc) · 124 KB
/
sample_data.sql
File metadata and controls
589 lines (504 loc) · 124 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
do $$
declare
-- DOMAINS
hr_domain_id uuid;
operations_and_logistics_domain_id uuid;
financial_domain_id uuid;
product_development_domain_id uuid;
risk_and_compliance_domain_id uuid;
commercial_and_customer_relationship_mgt_domain_id uuid;
-- DATA PRODUCT TYPES
processing_type_id uuid;
reporting_type_id uuid;
exploration_type_id uuid;
ingestion_type_id uuid;
machine_learning_type_id uuid;
analytics_type_id uuid;
-- USERS
alice_id uuid;
bob_id uuid;
jane_id uuid;
john_id uuid;
-- DATA PRODUCTS
data_product_lifecycle_id uuid;
customer_segmentation_id uuid;
customer_churn_prediction uuid;
marketing_campaign_analysis uuid;
customer_lifetime_value uuid;
customer_feedback_analysis uuid;
inventory_management uuid;
supply_chain_optimization uuid;
warehouse_automation_metrics uuid;
order_fulfillment_analysis uuid;
production_planning_insights uuid;
revenue_dashboard uuid;
expense_forecasting uuid;
release_impact_analysis uuid;
user_feedback_analysis uuid;
data_privacy_compliance uuid;
sales_performance_model uuid;
cash_flow_monitoring uuid;
fraud_detection uuid;
financial_risk_assessment uuid;
feature_usage_metrics uuid;
profitability_analysis uuid;
-- DATASETS
production_planning_insights_forecast uuid;
sales_performance_model_output_port uuid;
order_fulfillment_analysis_output_port uuid;
inventory_management_output_port uuid;
user_feedback_insights_report uuid;
release_impact_summary uuid;
release_engagement_by_segment uuid;
customer_segmentation_weekly_output_port_id uuid;
margin_trends_by_product uuid;
feature_usage_metrics_daily uuid;
feature_usage_metrics_weekly uuid;
-- PLATFORMS
returned_platform_id uuid;
s3_service_id uuid;
glue_service_id uuid;
returned_environment_id_dev uuid;
returned_environment_id_prd uuid;
databricks_id uuid;
databricks_service_id uuid;
snowflake_id uuid;
snowflake_service_id uuid;
redshift_service_id uuid;
-- DATA OUTPUTS
glue_configuration_id uuid;
databricks_configuration_id uuid;
customer_segmentation_weekly_technical_asset_id uuid;
product_owner_id uuid;
admin_role_id uuid;
product_member_id uuid;
dataset_owner_id uuid;
-- tags
tag_pii_id uuid;
tag_sensitive_id uuid;
tag_public_id uuid;
begin
TRUNCATE TABLE public.data_products_datasets CASCADE;
TRUNCATE TABLE public.datasets CASCADE;
TRUNCATE TABLE public.data_products CASCADE;
TRUNCATE TABLE public.data_product_types CASCADE;
TRUNCATE TABLE public.domains CASCADE;
TRUNCATE TABLE public.tags CASCADE;
TRUNCATE TABLE public.roles CASCADE;
TRUNCATE TABLE public.role_assignments_global CASCADE;
TRUNCATE TABLE public.role_assignments_data_product CASCADE;
TRUNCATE TABLE public.role_assignments_dataset CASCADE;
TRUNCATE TABLE public.dataset_curated_queries CASCADE;
-- INSERT TAGS
INSERT INTO public.tags (id, value, created_on, updated_on, deleted_at) VALUES (gen_random_uuid(), 'PII', '2025-10-28 16:32:14.563446', NULL, NULL) returning id into tag_pii_id;
INSERT INTO public.tags (id, value, created_on, updated_on, deleted_at) VALUES (gen_random_uuid(), 'Sensitive', '2025-10-28 16:32:27.884892', NULL, NULL) returning id into tag_sensitive_id;
INSERT INTO public.tags (id, value, created_on, updated_on, deleted_at) VALUES (gen_random_uuid(), 'Public', '2025-10-28 16:32:27.884892', NULL, NULL) returning id into tag_public_id;
-- PLATFORMS
INSERT INTO public.platforms (id, "name") SELECT gen_random_uuid(), 'AWS' WHERE NOT EXISTS (SELECT 1 FROM public.platforms WHERE "name" = 'AWS') returning id into returned_platform_id;
SELECT id FROM public.platforms WHERE name = 'AWS' INTO returned_platform_id;
INSERT INTO public.platform_services (id, "name", platform_id, result_string_template, technical_info_template) SELECT gen_random_uuid(), 'S3', returned_platform_id, '{database}.{schema}.{table}', '{database}.{schema}.{table}' WHERE NOT EXISTS (SELECT 1 FROM public.platform_services WHERE "name" = 'S3' AND "platform_id" = returned_platform_id);
SELECT id FROM public.platform_services WHERE platform_id = returned_platform_id AND name = 'S3' INTO s3_service_id;
INSERT INTO public.platform_services (id, "name", platform_id, result_string_template, technical_info_template) SELECT gen_random_uuid(), 'Glue', returned_platform_id, '{database}.{schema}.{table}', '{database}.{schema}.{table}' WHERE NOT EXISTS (SELECT 1 FROM public.platform_services WHERE "name" = 'Glue' AND "platform_id" = returned_platform_id);
SELECT id FROM public.platform_services WHERE platform_id = returned_platform_id AND name = 'Glue' INTO glue_service_id;
-- ...existing platform configuration code...
INSERT INTO public.platforms (id, "name") VALUES ('9be7613c-42fb-4b93-952d-1874ed1ddf77', 'Snowflake') returning id INTO snowflake_id;
INSERT INTO public.platforms (id, "name") VALUES ('6be7613c-42fb-4b93-952d-1874ed1ddf76', 'Conveyor');
INSERT INTO public.platform_services (id, "name", platform_id, result_string_template, technical_info_template) VALUES ('a75189c1-fa42-4980-9497-4bea4c968a5c', 'Conveyor', (SELECT id FROM public.platforms WHERE name = 'Conveyor'), '{database}.{schema}.{table}', '{database}.{schema}.{table}');
INSERT INTO public.platform_services (id, "name", platform_id, result_string_template, technical_info_template) VALUES ('a75189c1-fa42-4980-9497-4bea4c968a5b', 'Snowflake', snowflake_id, '{database}.{schema}.{table}', '{database}.{schema}.{table}') returning id INTO snowflake_service_id;
INSERT INTO public.platform_services (id, "name", platform_id, result_string_template, technical_info_template) VALUES ('de328223-fd90-4170-a7a1-376e4ebe0594', 'Redshift', returned_platform_id,'{database}__{schema}.{table}', '{database}__{schema}.{table}') returning id INTO redshift_service_id;
INSERT INTO public.platforms (id, "name") VALUES ('baa5c47b-805a-4cbb-ad8b-038c66e81b7e', 'Databricks') returning id INTO databricks_id;
INSERT INTO public.platform_services (id, "name", platform_id, result_string_template, technical_info_template) VALUES ('ce208413-b629-44d2-9f98-e5b47a315a56', 'Databricks', databricks_id, '{catalog}.{schema}.{table}', '{catalog}.{schema}.{table}') returning id INTO databricks_service_id;
INSERT INTO public.platform_service_configs (id, platform_id, service_id, "config", created_on, updated_on, deleted_at) VALUES('f4d3e8b1-5c6e-4f4a-0893-8f4e2c3d5b6a', (SELECT id FROM public.platforms WHERE name = 'Conveyor'), 'a75189c1-fa42-4980-9497-4bea4c968a5c', '["clean","master"]', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.platform_service_configs (id, platform_id, service_id, "config", created_on, updated_on, deleted_at) VALUES('6bd82fd6-9a23-4517-a07c-9110d83ab38f', returned_platform_id, s3_service_id, '["datalake","ingress","egress"]', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.platform_service_configs (id, platform_id, service_id, "config", created_on, updated_on, deleted_at) VALUES('fa026b3a-7a17-4c32-b279-995af021f6c2', returned_platform_id, glue_service_id, '["clean","master"]', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.platform_service_configs (id, platform_id, service_id, "config", created_on, updated_on, deleted_at) VALUES('0b9a0e7f-8fee-4fd3-97e0-830e1612b77a', databricks_id, databricks_service_id, '["clean","master"]', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.data_product_types (id, "name", description, icon_key, created_on, updated_on, deleted_at) VALUES ('90ab1128-329f-47dd-9420-c9681bfc68c4', 'Processing', 'Data products that transform, clean, or enrich data to make it usable for other systems or analysis.', 'PROCESSING', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id INTO processing_type_id;
INSERT INTO public.data_product_types (id, "name", description, icon_key, created_on, updated_on, deleted_at) VALUES ('1b4a64b3-96fb-404c-a73c-294802dc9852', 'Reporting', 'Data products that provide structured reports and dashboards for decision-making.', 'REPORTING', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id INTO reporting_type_id;
INSERT INTO public.data_product_types (id, "name", description, icon_key, created_on, updated_on, deleted_at) VALUES ('74b13338-aa85-4552-8ccb-7d51550c67de', 'Exploration', 'Data products that allow users to interactively explore data for insights or discovery.', 'EXPLORATION', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id INTO exploration_type_id;
INSERT INTO public.data_product_types (id, "name", description, icon_key, created_on, updated_on, deleted_at) VALUES ('c25cf2c2-418a-4d1d-a975-c6af61161546', 'Ingestion', 'Data products responsible for collecting, importing, or integrating data from various sources.', 'INGESTION', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id INTO ingestion_type_id;
INSERT INTO public.data_product_types (id, "name", description, icon_key, created_on, updated_on, deleted_at) VALUES ('f1672c38-ad1a-401a-8dd3-e0b026ab1416', 'Machine Learning', 'Data products that leverage predictive models or algorithms to generate insights or predictions.', 'MACHINE_LEARNING', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id INTO machine_learning_type_id;
INSERT INTO public.data_product_types (id, "name", description, icon_key, created_on, updated_on, deleted_at) VALUES ('3c289333-2d55-4aed-8bd5-85015a1567fe', 'Analytics', 'Data products that provide analysis, metrics, or aggregated insights to support business decisions.', 'ANALYTICS', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id INTO analytics_type_id;
-- ...existing platform service configs...
INSERT INTO public.roles (id, name, scope, prototype, description, permissions, created_on, updated_on, deleted_at) VALUES ('f80c101c-345c-4d5b-9524-57c55bd12d2d', 'Everyone', 'global', 1, 'This is the role that is used as fallback for users that don''t have another role', ARRAY [102, 103, 104, 105], timezone('utc'::text, CURRENT_TIMESTAMP + INTERVAL '1 seconds'), NULL, NULL);
INSERT INTO public.roles (id, name, scope, prototype, description, permissions, created_on, updated_on, deleted_at) VALUES ('e43b6f7a-e776-49b2-9b51-117d8644d971', 'Owner', 'data_product', 2, 'The owner of a Data Product', ARRAY [301, 302, 304, 305, 306, 307, 308, 309, 310, 311, 312, 313, 314, 315], timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into product_owner_id;
INSERT INTO public.roles (id, name, scope, prototype, description, permissions, created_on, updated_on, deleted_at) VALUES ('18e67286-92aa-449a-ba46-ac26eb0de21d', 'Solution Architect', 'data_product', 0, 'The Solution Architect for a Data Product', ARRAY [303, 309, 310, 311, 312, 313, 314], timezone('utc'::text, CURRENT_TIMESTAMP + INTERVAL '1 seconds'), NULL, NULL);
INSERT INTO public.roles (id, name, scope, prototype, description, permissions, created_on, updated_on, deleted_at) VALUES ('9ca3bfdd-2919-4190-a8bb-55e9ee7d70dd', 'Member', 'data_product', 0, 'A regular team member of a Data Product', ARRAY [313, 314, 315], timezone('utc'::text, CURRENT_TIMESTAMP + INTERVAL '2 seconds'), NULL, NULL) returning id into product_member_id;
INSERT INTO public.roles (id, name, scope, prototype, description, permissions, created_on, updated_on, deleted_at) VALUES ('9a9d7deb-14d9-4257-a986-7900aa70ef8f', 'Owner', 'dataset', 2, 'The owner of a Dataset', ARRAY [401, 402, 404, 405, 406, 407, 408, 411, 412, 413, 414], timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into dataset_owner_id;
INSERT INTO public.roles (id, name, scope, prototype, description, permissions, created_on, updated_on, deleted_at) VALUES ('2ae1b4e3-5b13-491a-912b-984e2e90b858', 'Solution Architect', 'dataset', 0, 'The Solution Architect for a Dataset', ARRAY [403, 409, 410], timezone('utc'::text, CURRENT_TIMESTAMP + INTERVAL '1 seconds'), NULL, NULL);
INSERT INTO public.roles (id, name, scope, prototype, description, permissions, created_on, updated_on, deleted_at) VALUES ('db8d7a76-c50b-4e95-8549-8da86f48e7c2', 'Member', 'dataset', 0, 'A regular team member of a Dataset', ARRAY [413], timezone('utc'::text, CURRENT_TIMESTAMP + INTERVAL '2 seconds'), NULL, NULL);
INSERT INTO public.roles (id, name, scope, prototype, description, permissions, created_on, updated_on, deleted_at)
VALUES
('00000000-0000-0000-0000-000000000000', 'Admin', 'global', 3, 'Global admin role', ARRAY[]::integer[], timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL)
RETURNING id INTO admin_role_id;
-- ENVIRONMENTS
INSERT INTO public.environments ("name", context, acronym, is_default, created_on, updated_on, deleted_at) VALUES ('development', 'arn:aws:iam::{{ AWS_ACCOUNT_ID }}:role/{{ AWS_ROLE_WITH_CONTEXT_TEMPLATE_DEV }}', 'dev', true, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id INTO returned_environment_id_dev;
INSERT INTO public.environments ("name", context, acronym, is_default, created_on, updated_on, deleted_at) VALUES ('production', 'arn:aws:iam::{{ AWS_ACCOUNT_ID }}:role/{{ AWS_ROLE_WITH_CONTEXT_TEMPLATE_PRD }}', 'prd', false, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id INTO returned_environment_id_prd;
INSERT INTO public.env_platform_configs (id, environment_id, platform_id, "config", created_on, updated_on, deleted_at) VALUES ('daa8e3e8-1485-4eb2-8b4b-575e8d10a570', returned_environment_id_dev, returned_platform_id, '{"account_id": "{{ AWS_ACCOUNT_ID }}", "region": "{{ AWS_REGION }}", "can_read_from": ["production"]}', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.env_platform_configs (id, environment_id, platform_id, "config", created_on, updated_on, deleted_at) VALUES ('e2aa2f6d-585f-4b43-8ea4-982b7bab0142', returned_environment_id_prd, returned_platform_id, '{"account_id": "{{ AWS_ACCOUNT_ID }}", "region": "{{ AWS_REGION }}", "can_read_from": []}', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.env_platform_service_configs (id, environment_id, platform_id, service_id, "config", created_on, updated_on, deleted_at) VALUES('93f4b677-5ae8-450d-91a6-e15196b2e774', returned_environment_id_dev, returned_platform_id, s3_service_id, '[{"identifier":"datalake","bucket_name":"{{ DATALAKE_BUCKET_NAME_DEV }}","bucket_arn":"{{ DATALAKE_BUCKET_ARN_DEV }}","kms_key_arn":"{{ DATALAKE_BUCKET_KMS_ARN_DEV }}","is_default":true},{"identifier":"ingress","bucket_name":"{{ INGRESS_BUCKET_NAME_DEV }}","bucket_arn":"{{ INGRESS_BUCKET_ARN_DEV }}","kms_key_arn":"{{ INGRESS_BUCKET_KMS_ARN_DEV }}","is_default":false},{"identifier":"egress","bucket_name":"{{ EGRESS_BUCKET_NAME_DEV }}","bucket_arn":"{{ EGRESS_BUCKET_ARN_DEV }}","kms_key_arn":"{{ EGRESS_BUCKET_KMS_ARN_DEV }}","is_default":false}]', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.env_platform_service_configs (id, environment_id, platform_id, service_id, "config", created_on, updated_on, deleted_at) VALUES('9c1d025c-f342-4665-8461-ba8b9f4035ff', returned_environment_id_prd, returned_platform_id, s3_service_id, '[{"identifier":"datalake","bucket_name":"{{ DATALAKE_BUCKET_NAME_PRD }}","bucket_arn":"{{ DATALAKE_BUCKET_ARN_PRD }}","kms_key_arn":"{{ DATALAKE_BUCKET_KMS_ARN_PRD }}","is_default":true},{"identifier":"ingress","bucket_name":"{{ INGRESS_BUCKET_NAME_PRD }}","bucket_arn":"{{ INGRESS_BUCKET_ARN_PRD }}","kms_key_arn":"{{ INGRESS_BUCKET_KMS_ARN_PRD }}","is_default":false},{"identifier":"egress","bucket_name":"{{ EGRESS_BUCKET_NAME_PRD }}","bucket_arn":"{{ EGRESS_BUCKET_ARN_PRD }}","kms_key_arn":"{{ EGRESS_BUCKET_KMS_ARN_PRD }}","is_default":false}]', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.env_platform_service_configs (id, environment_id, platform_id, service_id, "config", created_on, updated_on, deleted_at) VALUES('1c52b0e5-961f-412a-995e-0c1efae19f41', returned_environment_id_dev, returned_platform_id, glue_service_id, '[{"identifier":"clean_test","database_name":"clean_test_dev","bucket_identifier":"datalake","s3_path":"clean/test"},{"identifier":"master_test","database_name":"master_test_dev","bucket_identifier":"datalake","s3_path":"master/test"}]', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.env_platform_service_configs (id, environment_id, platform_id, service_id, "config", created_on, updated_on, deleted_at) VALUES('ba42ca59-ab5d-498e-8cd0-cdd680f80bb0', returned_environment_id_prd, returned_platform_id, glue_service_id, '[{"identifier":"clean_test","database_name":"clean_test_prd","bucket_identifier":"datalake","s3_path":"clean/test"},{"identifier":"master_test","database_name":"master_test_prd","bucket_identifier":"datalake","s3_path":"master/test"}]', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
-- DOMAINS
INSERT INTO public.domains (id, name, description, created_on, updated_on, deleted_at) VALUES ('672debaf-31f9-4233-820b-ad2165af044e', 'Customer Insights', 'Contains data products that provide information about customer behavior, demographics and satisfaction.', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id INTO hr_domain_id;
INSERT INTO public.domains (id, name, description, created_on, updated_on, deleted_at) VALUES ('bd09093e-14ff-41c1-b74d-7c2ce9821d1c', 'Operations & Logistics', 'Data products that track internal operations, supply chain efficiency and resource utilization.', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id INTO operations_and_logistics_domain_id;
INSERT INTO public.domains (id, name, description, created_on, updated_on, deleted_at) VALUES ('8798B58A-9119-43D1-9365-DC83E07B8D87', 'Financial Performance', 'Data products focused on revenue, expenses, profitability and other financial metrics.', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id INTO financial_domain_id;
INSERT INTO public.domains (id, name, description, created_on, updated_on, deleted_at) VALUES ('623e6fbf-3a06-434e-995c-b0336e71806e', 'Product Development', 'Data products that capture product usage, feature adoption and performance metrics.', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id INTO product_development_domain_id;
INSERT INTO public.domains (id, name, description, created_on, updated_on, deleted_at) VALUES ('bec196cb-81df-4cfc-959f-b142c312861e', 'Risk & Compliance', 'Data products designed to monitor regulatory compliance, security and operational risks', '2025-10-28 16:30:24.123498', NULL, NULL) returning id INTO risk_and_compliance_domain_id;
INSERT INTO public.domains (id, name, description, created_on, updated_on, deleted_at) VALUES ('acaaaafe-cde9-4746-9835-f1e0c3c85b6c', 'Commercial and Customer Relationship Management', 'Commercial and CRM', '2025-10-28 16:30:41.743083', NULL, NULL) returning id into commercial_and_customer_relationship_mgt_domain_id;
-- DATA PRODUCT TYPES
-- ...existing data product types code...
-- USERS
INSERT INTO public.users (email, id, external_id, first_name, last_name, created_on, updated_on, deleted_at) VALUES ('alice.baker@pharma.com', 'a02d3714-97e3-40d8-92b7-3b018fd1229f', 'alice.baker@pharma.com', 'Alice', 'Baker', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id INTO alice_id;
INSERT INTO public.users (email, id, external_id, first_name, last_name, created_on, updated_on, deleted_at) VALUES ('bob.johnson@pharma.com', '35f2dd11-3119-4eb3-8f19-01b323131221', 'bob.johnson@pharma.com', 'Bob', 'Johnson', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id INTO bob_id;
INSERT INTO public.users (email, id, external_id, can_become_admin, first_name, last_name, created_on, updated_on, deleted_at) VALUES ('jane.researcher@pharma.com', 'd9f3aae2-391e-46c1-aec6-a7ae1114a7da', 'jane.researcher@pharma.com', true, 'Jane', 'Researcher', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id INTO jane_id;
INSERT INTO public.users (email, id, external_id, can_become_admin, first_name, last_name, created_on, updated_on, deleted_at) VALUES ('john.scientist@pharma.com', 'b72fca38-17ff-4259-a075-5aaa5973343c', 'john.scientist@pharma.com', true, 'John', 'Scientist', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id INTO john_id;
-- ROLES
-- ...existing roles code...
SELECT '00000000-0000-0000-0000-000000000001' INTO data_product_lifecycle_id;
INSERT INTO data_product_lifecycles (id, name, value, color, is_default) SELECT data_product_lifecycle_id, 'Draft', 0, 'grey', true WHERE NOT EXISTS (SELECT 1 FROM public.data_product_lifecycles WHERE id = data_product_lifecycle_id);
-- Customer segmentation id
INSERT INTO public.data_products (id, "name", namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at) VALUES (gen_random_uuid(), 'Customer Segmentation', 'customer_segmentation', 'Groups customers based on demographics, behavior, and purchase patterns.', '<h2>Customer Segmentation</h2><p></p><p>This data product aims to provide a centralized view of customer segments across demographics and behavior.</p><p></p><p><strong>Key objectives include:</strong></p><ul><li>Enable targeted marketing and product strategies</li><li>Identify high-value customer groups</li><li>Support personalized engagement campaigns</li></ul>', 'ACTIVE', '3c289333-2d55-4aed-8bd5-85015a1567fe', hr_domain_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into customer_segmentation_id;
INSERT INTO public.tags_data_products (data_product_id, tag_id) VALUES (customer_segmentation_id, tag_sensitive_id);
-- Customer segementation id -- Customer segments weekly
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES (gen_random_uuid(), 'customer_segments_weekly', customer_segmentation_id, 'Customer Segments Weekly', 'Weekly segmentation of customers by demographics and purchase behavior', 'Provides the latest segmentation of customers to guide marketing and targeting. Key objectives: - Identify high-value segments - Support campaign personalization - Update targeting weekly', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into customer_segmentation_weekly_output_port_id;
INSERT INTO public.data_outputs (id, namespace, name, description, status, platform_id, service_id, owner_id, configuration, configuration_id, created_on, updated_on, deleted_at, "technical_mapping") VALUES (gen_random_uuid(), 'customer-segments-weekly-table', 'Customer segments weekly s3 table', 'Weekly segmentation of customers by demographics and purchase behavior', 'ACTIVE', returned_platform_id, glue_service_id, customer_segmentation_id, NULL, '12346cc6-f58d-4217-88d3-6443b01d5d0f', '2025-10-28 16:34:02.355842', NULL, NULL, 'default') returning id into customer_segmentation_weekly_technical_asset_id;
INSERT INTO public.tags_data_outputs (data_output_id, tag_id, created_on, updated_on) VALUES (customer_segmentation_weekly_technical_asset_id, tag_pii_id, '2025-10-28 17:56:57.829806', NULL);
INSERT INTO public.data_outputs_datasets (id, data_output_id, dataset_id, status, requested_by_id, requested_on, approved_by_id, approved_on, denied_by_id, denied_on, created_on, updated_on, deleted_at) VALUES (gen_random_uuid(), customer_segmentation_weekly_technical_asset_id, customer_segmentation_weekly_output_port_id, 'APPROVED', john_id, '2025-10-28 16:36:36.784134', john_id, '2025-10-28 16:36:36.936773', NULL, NULL, '2025-10-28 16:36:36.677803', '2025-10-28 16:36:36.838041', NULL);
INSERT INTO public.tags_datasets (dataset_id, tag_id) VALUES (customer_segmentation_weekly_output_port_id, tag_sensitive_id);
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('eb8bb332-b05e-4529-af43-90f69a6a90bb', 'customer_segments_monthly', customer_segmentation_id, 'Customer Segments Monthly', 'Monthly aggregated customer segments', 'Provides monthly view of customer groups for strategic planning. Key objectives: - Track segment evolution - Support executive reporting - Feed into predictive models', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
-- Customer churn prediction
INSERT INTO public.data_products (id, "name", namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at) VALUES ('0a883317-d6c0-44e1-93b2-ba531fa9eeab', 'Customer Churn Prediction', 'customer_churn_prediction', 'Predicts which customers are likely to leave using historical data.', '<h2>Customer Churn Prediction</h2><p></p><p>This data product aims to anticipate customer attrition using predictive modeling.</p><p></p><p><strong>Key objectives include:</strong></p><ul><li>Proactively engage at-risk customers</li><li>Reduce churn rates</li><li>Optimize retention strategies</li></ul>', 'ACTIVE', 'f1672c38-ad1a-401a-8dd3-e0b026ab1416', hr_domain_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into customer_churn_prediction;
INSERT INTO public.tags_data_products (data_product_id, tag_id) VALUES (customer_churn_prediction, tag_public_id);
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('208cc524-5df2-47dd-b8b7-489ad2c5553a', 'weekly_churn_probabilities', customer_churn_prediction, 'Weekly Churn Probabilities', 'Predicted churn probability per customer, updated weekly', 'Provides actionable insights for retention campaigns. Key objectives: - Enable timely interventions - Support sales and marketing - Reduce churn', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('f3aa47cf-81cc-4bc8-9876-1960b8ddcd6c', 'monthly_churn_targets', customer_churn_prediction, 'Monthly Churn Targets', 'Aggregated churn targets for marketing campaigns', 'Provides monthly churn-focused marketing guidance. Key objectives: - Plan anti-churn campaigns - Measure campaign effectiveness - Prioritize high-risk customers', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
-- Marketing campaign analysis
INSERT INTO public.data_products (id, "name", namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at) VALUES ('403d19c9-2056-4fb7-b820-d163df800e8f', 'Marketing Campaign Analysis', 'marketing_campaign_analysis', 'Evaluates the performance of marketing campaigns across channels.', '<h2>Marketing Campaign Analysis</h2><p></p><p>This data product provides insights into marketing campaign effectiveness.</p><p></p><p><strong>Key objectives include:</strong></p><ul><li>Measure ROI of campaigns</li><li>Identify best-performing channels</li><li>Support marketing optimization</li></ul>', 'ACTIVE', '1b4a64b3-96fb-404c-a73c-294802dc9852', hr_domain_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into marketing_campaign_analysis;
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('0deeb253-7b8c-4ece-8a9c-29524bbc5c00', 'campaign_performance_summary', marketing_campaign_analysis, 'Campaign Performance Summary', 'KPIs for each marketing campaign', 'Provides campaign results to optimize channel strategy and improve customer retention. Key objectives: - Track ROI - Identify best-performing campaigns - Inform budget allocation', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('7372d7e7-aee3-4644-8ee2-237af4d0899e', 'ad_spend_vs_roi', marketing_campaign_analysis, 'Ad Spend Vs Roi', 'Comparison of spend vs campaign results', 'Measures effectiveness of marketing investments. Key objectives: - Optimize marketing spend - Support executive reporting - Improve ROI', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('b68f13d1-b9e8-4e27-96fa-9d6f029614c6', 'top_engaged_segments', marketing_campaign_analysis, 'Top Engaged Segments', 'Identifies most engaged customer segments per campaign', 'Combines marketing and customer segmentation data to target communications. Key objectives: - Focus campaigns on high-engagement segments - Improve conversions - Optimize messaging', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
-- Customer lifetime value
INSERT INTO public.data_products (id, "name", namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at) VALUES ('9a78d3cc-0c0d-4d0b-a314-aeb99c8cecf3', 'Customer Lifetime Value', 'customer_lifetime_value', 'Calculates expected revenue per customer over their relationship.', '<h2>Customer Lifetime Value</h2><p></p><p>This data product estimates customer lifetime value to guide business decisions.</p><p></p><p><strong>Key objectives include:</strong></p><ul><li>Prioritize high-value customers</li><li>Optimize marketing spend</li><li>Inform loyalty programs</li></ul>', 'ACTIVE', '3c289333-2d55-4aed-8bd5-85015a1567fe', hr_domain_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into customer_lifetime_value;
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('22b583ce-d052-49b3-98c9-92483282f303', 'customer_lifetime_value_scores', customer_lifetime_value, 'Customer Lifetime Value Scores', 'Predicted lifetime value per customer', 'Provides metrics to prioritize high-value customers. Key objectives: - Guide marketing spend - Support sales strategy - Inform loyalty programs', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
-- Customer feedback analysis
INSERT INTO public.data_products (id, "name", namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at) VALUES ('66563731-1be2-493c-b692-aef4cc29e493', 'Customer Feedback Analysis', 'customer_feedback_analysis', 'Analyzes surveys and reviews to understand satisfaction and needs.', '<h2>Customer Feedback Analysis</h2><p></p><p>This data product centralizes customer feedback analysis for actionable insights.</p><p></p><p><strong>Key objectives include:</strong></p><ul><li>Understand customer satisfaction</li><li>Identify improvement areas</li><li>Support product and service enhancements</li></ul>', 'ACTIVE', '74b13338-aa85-4552-8ccb-7d51550c67de', hr_domain_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into customer_feedback_analysis;
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('67ae0fa8-5e88-4712-b5a1-5a9fc423131f', 'customer_feedback_summary', customer_feedback_analysis, 'Customer Feedback Summary', 'Summary of feedback trends from surveys and reviews', 'Provides insights into customer sentiment and satisfaction. Key objectives: - Identify pain points - Prioritize product improvements - Track satisfaction over time', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('e2a641fc-c9ef-40a2-98be-76a7585db5d6', 'feature_feedback_ranking', customer_feedback_analysis, 'Feature Feedback Ranking', 'Ranked insights about product features from user feedback', 'Combines usage metrics with feedback to understand feature impact. Key objectives: - Highlight areas for product improvement - Guide roadmap prioritization - Support UX decisions', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
-- Inventory management
INSERT INTO public.data_products (id, "name", namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at) VALUES ('65254a60-6f97-4b6c-812c-84dcf7c316e3', 'Inventory Management', 'inventory_management', 'Tracks stock levels, turnover, and replenishment schedules.', '<h2>Inventory Management</h2><p></p><p>This data product provides a centralized platform for managing inventory efficiently.</p><p></p><p><strong>Key objectives include:</strong></p><ul><li>Monitor stock levels in real-time</li><li>Reduce stockouts and overstock</li><li>Improve warehouse operations</li></ul>', 'ACTIVE', '1b4a64b3-96fb-404c-a73c-294802dc9852', operations_and_logistics_domain_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into inventory_management;
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('aa84c8a8-9ca3-47be-9389-c75458e326a2', 'inventory_status', '65254a60-6f97-4b6c-812c-84dcf7c316e3', 'Inventory Status', 'Current stock levels per warehouse', 'Provides visibility into inventory to prevent stockouts or overstock. Key objectives: - Monitor stock levels - Support replenishment planning - Reduce costs', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into inventory_management_output_port;
-- Supply chain optimization
INSERT INTO public.data_products (id, "name", namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at) VALUES ('429f80cf-bce9-4ac5-bafc-0c153df466fc', 'Supply Chain Optimization', 'supply_chain_optimization', 'Analyzes supplier performance, delivery times, and transportation costs.', '<h2>Supply Chain Optimization</h2><p></p><p>This data product aims to optimize supply chain efficiency across operations.</p><p></p><p><strong>Key objectives include:</strong></p><ul><li>Track supplier performance</li><li>Reduce delivery delays</li><li>Minimize transportation costs</li></ul>', 'ACTIVE', '3c289333-2d55-4aed-8bd5-85015a1567fe', operations_and_logistics_domain_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into supply_chain_optimization;
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('5891bb7a-ed88-4ba1-8826-7c143243f91f', 'supplier_performance_report', supply_chain_optimization, 'Supplier Performance Report', 'Supplier KPIs including delivery times and reliability', 'Provides insights to optimize supply chain efficiency. Key objectives: - Track supplier reliability - Identify delays - Improve procurement', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
-- Warehouse automation metrics
INSERT INTO public.data_products (id, "name", namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at) VALUES ('867e3ad0-7a11-4687-bd39-3e41ad9f2ed0', 'Warehouse Automation Metrics', 'warehouse_automation_metrics', 'Monitors efficiency of warehouse processes using sensor and IoT data.', '<h2>Warehouse Automation Metrics</h2><p></p><p>This data product centralizes warehouse automation metrics for operational improvement.</p><p></p><p><strong>Key objectives include:</strong></p><ul><li>Track process efficiency</li><li>Identify bottlenecks</li><li>Support automation initiatives</li></ul>', 'ACTIVE', 'f1672c38-ad1a-401a-8dd3-e0b026ab1416', operations_and_logistics_domain_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into warehouse_automation_metrics;
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('05ae0792-f70a-422c-abc1-16fd8c9348bb', 'warehouse_efficiency_metrics', warehouse_automation_metrics, 'Warehouse Efficiency Metrics', 'KPIs from automated warehouse operations', 'Provides data to improve operational efficiency. Key objectives: - Identify bottlenecks - Measure automation impact - Support resource allocation', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('4c4ff241-9885-48eb-8b2a-b1a1d66092a3', 'automated_pick_pack_rates', warehouse_automation_metrics, 'Automated Pick Pack Rates', 'Metrics for automated picking and packing', 'Provides detailed operational data for efficiency optimization. Key objectives: - Track speed and accuracy - Support automation planning - Reduce operational costs', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
--Order fulfillment analysis
INSERT INTO public.data_products (id, "name", namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at) VALUES ('c9940b6c-b0be-48d4-a546-cab8afa6cf4b', 'Order Fulfillment Analysis', 'order_fulfillment_analysis', 'Tracks order processing time and delivery success rates.', '<h2>Order Fulfillment Analysis</h2><p></p><p>This data product provides visibility into order fulfillment performance.</p><p></p><p><strong>Key objectives include:</strong></p><ul><li>Monitor processing times</li><li>Improve delivery success rates</li><li>Enhance customer satisfaction</li></ul>', 'ACTIVE', '3c289333-2d55-4aed-8bd5-85015a1567fe', operations_and_logistics_domain_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into order_fulfillment_analysis;
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('b928519b-21f9-4877-975b-686c2b336522', 'order_fulfillment_stats', order_fulfillment_analysis, 'Order Fulfillment Stats', 'Metrics on order processing and delivery success', 'Provides visibility into fulfillment performance. Key objectives: - Track delivery efficiency - Improve customer satisfaction - Reduce delays', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into order_fulfillment_analysis_output_port;
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('5d99a121-826d-4426-be8a-bc820b5be365', 'delayed_orders_report', order_fulfillment_analysis, 'Delayed Orders Report', 'Orders delayed beyond SLA', 'Identifies bottlenecks in fulfillment. Key objectives: - Highlight issues - Support logistics improvements - Inform customer communication', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
-- Production planning insights
INSERT INTO public.data_products (id, "name", namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at) VALUES ('c550880e-fcc8-4048-a6ce-fec8903b5521', 'Production Planning Insights', 'production_planning_insights', 'Predicts production needs and schedules resources effectively.', '<h2>Production Planning Insights</h2><p></p><p>This data product centralizes production planning insights to optimize operations.</p><p></p><p><strong>Key objectives include:</strong></p><ul><li>Forecast production requirements</li><li>Allocate resources efficiently</li><li>Reduce downtime</li></ul>', 'ACTIVE', '3c289333-2d55-4aed-8bd5-85015a1567fe', operations_and_logistics_domain_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into production_planning_insights;
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('821b84ce-a702-44f7-8521-971954c0a208', 'production_planning_forecast', production_planning_insights, 'Production Planning Forecast', 'Forecast of production requirements', 'Provides projections to optimize scheduling and capacity. Key objectives: - Reduce downtime - Optimize resource allocation - Support operational planning', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into production_planning_insights_forecast;
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('bc7b3d51-1941-4312-ba83-4594c331cf05', 'production_variance_report', production_planning_insights, 'Production Variance Report', 'Difference between planned and actual production', 'Provides insights into production deviations. Key objectives: - Identify inefficiencies - Improve planning accuracy - Support operations', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
-- Sales performance model
INSERT INTO public.data_products (id, name, namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at, lifecycle_id, usage) VALUES ('86b74246-734f-4cea-a984-3dd0d27fc565', 'Sales performance model', 'sales-performance-model', 'Evaluates sales productivity and regional performance.
It enables resource re-allocation and forecasting improvements.', NULL, 'ACTIVE', '90ab1128-329f-47dd-9420-c9681bfc68c4', commercial_and_customer_relationship_mgt_domain_id, '2025-10-28 18:19:20.450469', NULL, NULL, data_product_lifecycle_id, NULL) returning id into sales_performance_model;
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES (gen_random_uuid(), 'sales_performance', sales_performance_model, 'Sales performance', 'Sales performance data', 'Provides an overview of sales performance data', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into sales_performance_model_output_port;
INSERT INTO public.data_outputs (id, namespace, name, description, status, platform_id, service_id, owner_id, configuration, configuration_id, created_on, updated_on, deleted_at, "technical_mapping") VALUES ('93556532-e5e5-4c8a-b0f6-e269a9e290cd', 'sales-transactions', 'Sales Transactions', 'Stores product-level revenue and quantity sold per region', 'ACTIVE', returned_platform_id, glue_service_id, sales_performance_model, NULL, 'ff632a7d-4ddd-4fd1-800a-ba8098c26c18', '2025-10-28 18:19:44.674412', NULL, NULL, 'default');
INSERT INTO public.data_outputs (id, namespace, name, description, status, platform_id, service_id, owner_id, configuration, configuration_id, created_on, updated_on, deleted_at, "technical_mapping") VALUES ('2845c506-a944-484e-a9b5-3f93d9f1532c', 'territory-assignments', 'Territory Assignments', 'Defines which representatives cover which areas or accounts.', 'ACTIVE', returned_platform_id, glue_service_id, sales_performance_model, NULL, 'e8129149-bdb5-4c15-8211-4b6b83fcb64a', '2025-10-28 18:20:01.401722', NULL, NULL, 'default');
INSERT INTO public.data_outputs_datasets (id, data_output_id, dataset_id, status, requested_by_id, requested_on, approved_by_id, approved_on, denied_by_id, denied_on, created_on, updated_on, deleted_at) VALUES (gen_random_uuid(), '93556532-e5e5-4c8a-b0f6-e269a9e290cd', sales_performance_model_output_port, 'APPROVED', john_id, '2025-10-28 16:36:36.784134', john_id, '2025-10-28 16:36:36.936773', NULL, NULL, '2025-10-28 16:36:36.677803', '2025-10-28 16:36:36.838041', NULL);
INSERT INTO public.data_outputs_datasets (id, data_output_id, dataset_id, status, requested_by_id, requested_on, approved_by_id, approved_on, denied_by_id, denied_on, created_on, updated_on, deleted_at) VALUES (gen_random_uuid(), '2845c506-a944-484e-a9b5-3f93d9f1532c', sales_performance_model_output_port, 'APPROVED', john_id, '2025-10-28 16:36:36.784134', john_id, '2025-10-28 16:36:36.936773', NULL, NULL, '2025-10-28 16:36:36.677803', '2025-10-28 16:36:36.838041', NULL);
-- Revenue dashboard
INSERT INTO public.data_products (id, "name", namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at) VALUES ('b976c1af-2199-420b-8e70-76b7ea4119ad', 'Revenue Dashboard', 'revenue_dashboard', 'Tracks revenue by product line, region, and period.', '<h2>Revenue Dashboard</h2><p></p><p>This data product provides a consolidated view of company revenue.</p><p></p><p><strong>Key objectives include:</strong></p><ul><li>Monitor revenue trends</li><li>Identify growth opportunities</li><li>Support strategic decision-making</li></ul>', 'ACTIVE', '1b4a64b3-96fb-404c-a73c-294802dc9852', financial_domain_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into revenue_dashboard;
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('b076bf53-463a-47bb-84a9-596d45b425d7', 'revenue_dashboard_summary', revenue_dashboard, 'Revenue Dashboard Summary', 'Consolidated revenue metrics', 'Provides a single view of revenue trends. Key objectives: - Track revenue by product and region - Identify growth opportunities - Support executive reporting', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('393cf08a-d05c-442a-8982-d7d2cced4ad2', 'revenue_by_segment', revenue_dashboard, 'Revenue By Segment', 'Revenue broken down by customer segments', 'Enables analysis of profitability per segment. Key objectives: - Inform marketing targeting - Support strategic planning - Monitor high-value customers', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
-- Revenue dashboard - input ports
INSERT INTO public.data_products_datasets (id, justification, data_product_id, dataset_id, status, requested_by_id, requested_on, approved_by_id, approved_on, denied_by_id, denied_on, created_on, updated_on, deleted_at)
VALUES (gen_random_uuid(),'Needed to predict our revenue', revenue_dashboard, production_planning_insights_forecast, 'APPROVED', john_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL, NULL, NULL, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.data_products_datasets (id, justification, data_product_id, dataset_id, status, requested_by_id, requested_on, approved_by_id, approved_on, denied_by_id, denied_on, created_on, updated_on, deleted_at)
VALUES (gen_random_uuid(),'Needed to predict our revenue', revenue_dashboard, sales_performance_model_output_port, 'APPROVED', john_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL, NULL, NULL, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.data_products_datasets (id, justification, data_product_id, dataset_id, status, requested_by_id, requested_on, approved_by_id, approved_on, denied_by_id, denied_on, created_on, updated_on, deleted_at)
VALUES (gen_random_uuid(),'Needed to predict our revenue', revenue_dashboard, order_fulfillment_analysis_output_port, 'APPROVED', john_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL, NULL, NULL, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.data_products_datasets (id, justification, data_product_id, dataset_id, status, requested_by_id, requested_on, approved_by_id, approved_on, denied_by_id, denied_on, created_on, updated_on, deleted_at)
VALUES (gen_random_uuid(),'Needed to predict our revenue', revenue_dashboard, inventory_management_output_port, 'APPROVED', john_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL, NULL, NULL, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
-- Expense forecasting
INSERT INTO public.data_products (id, "name", namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at)VALUES (gen_random_uuid(), 'Expense Forecasting', 'expense_forecasting', 'Predicts future expenses using historical financial data.', '<h2>Expense Forecasting</h2><p></p><p>This data product enables proactive expense management through forecasting.</p><p></p><p><strong>Key objectives include:</strong></p><ul><li>Anticipate future costs</li><li>Support budgeting and planning</li><li>Reduce financial risk</li></ul>', 'ACTIVE', 'f1672c38-ad1a-401a-8dd3-e0b026ab1416', financial_domain_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into expense_forecasting;
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('d4e7792b-fb93-4541-beb9-b3c2b2474c77', 'expense_forecast', expense_forecasting, 'Expense Forecast', 'Predicted expenses by category', 'Provides insight into expected costs to support budgeting. Key objectives: - Forecast future expenses - Support planning - Reduce financial risk', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
-- Expense forecasting input ports
INSERT INTO public.data_products_datasets (id, justification, data_product_id, dataset_id, status, requested_by_id, requested_on, approved_by_id, approved_on, denied_by_id, denied_on, created_on, updated_on, deleted_at)
VALUES ('0658e52e-b69e-4787-b7b1-df215d75329c','Needed to predict our expenses, production planning is an important dataset', expense_forecasting, production_planning_insights_forecast, 'APPROVED', john_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL, NULL, NULL, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
-- User feedback analysis
INSERT INTO public.data_products (id, "name", namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at) VALUES (gen_random_uuid(), 'User Feedback Analysis', 'user_feedback_analysis', 'Uses text mining to extract insights from user reviews and surveys.', '<h2>User Feedback Analysis</h2><p></p><p>This data product enables centralized analysis of user feedback for product improvement.</p><p></p><p><strong>Key objectives include:</strong></p><ul><li>Extract insights from reviews and surveys</li><li>Identify pain points</li><li>Inform UX and feature decisions</li></ul>', 'ACTIVE', 'f1672c38-ad1a-401a-8dd3-e0b026ab1416', product_development_domain_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into user_feedback_analysis;
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('9cfcdd85-8049-42fc-8984-6a6fc7bfeba9', 'feedback_insights_report', user_feedback_analysis, 'Feedback Insights Report', 'Summarized insights from user feedback', 'Provides actionable insights for product improvements. Key objectives: - Identify pain points - Prioritize changes - Improve satisfaction', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into user_feedback_insights_report;
-- Release impact analysis
INSERT INTO public.data_products (id, "name", namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at) VALUES (gen_random_uuid(), 'Release Impact Analysis', 'release_impact_analysis', 'Measures effect of new releases on usage and performance.', '<h2>Release Impact Analysis</h2><p></p><p>This data product centralizes insights on release impact for better planning.</p><p></p><p><strong>Key objectives include:</strong></p><ul><li>Assess adoption of new features</li><li>Measure performance impact</li><li>Guide future release planning</li></ul>', 'ACTIVE', '3c289333-2d55-4aed-8bd5-85015a1567fe', product_development_domain_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into release_impact_analysis;
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('e3dfeb4e-e7ee-4db2-84ce-7f4f36840c96', 'release_engagement_by_segment', release_impact_analysis, 'Release Engagement By Segment', 'Feature adoption per customer segment', 'Helps measure differential impact of releases across user groups. Key objectives: - Understand segment behavior - Inform targeted communications - Optimize rollout', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into release_engagement_by_segment;
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('56acafd4-5bb8-45b1-81fa-acfab84ec3fc', 'release_impact_summary', release_impact_analysis, 'Release Impact Summary', 'Metrics on usage changes after new releases', 'Provides insight into feature release performance. Key objectives: - Measure adoption - Detect regressions - Inform next releases', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into release_impact_summary;
-- Data privacy compliance
INSERT INTO public.data_products (id, "name", namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at) VALUES (gen_random_uuid(), 'Data Privacy Compliance', 'data_privacy_compliance', 'Monitors adherence to GDPR and other privacy regulations.', '<h2>Data Privacy Compliance</h2><p></p><p>This data product ensures compliance with data privacy regulations.</p><p></p><p><strong>Key objectives include:</strong></p><ul><li>Monitor GDPR compliance</li><li>Identify gaps in privacy practices</li><li>Support regulatory reporting</li></ul>', 'ACTIVE', '1b4a64b3-96fb-404c-a73c-294802dc9852', risk_and_compliance_domain_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into data_privacy_compliance;
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('e94890c6-0da8-4a1e-b696-e53e5312f743', 'privacy_compliance_report', data_privacy_compliance, 'Privacy Compliance Report', 'GDPR and privacy compliance metrics', 'Provides compliance tracking for regulatory adherence. Key objectives: - Identify gaps - Support audits - Ensure legal compliance', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
-- Data privacy compliance - input ports
INSERT INTO public.data_products_datasets (id, justification, data_product_id, dataset_id, status, requested_by_id, requested_on, approved_by_id, approved_on, denied_by_id, denied_on, created_on, updated_on, deleted_at)
VALUES (gen_random_uuid(),'Needed to check for GDPR compliance', data_privacy_compliance, user_feedback_insights_report, 'APPROVED', john_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL, NULL, NULL, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.data_products_datasets (id, justification, data_product_id, dataset_id, status, requested_by_id, requested_on, approved_by_id, approved_on, denied_by_id, denied_on, created_on, updated_on, deleted_at)
VALUES (gen_random_uuid(),'Needed to check for GDPR compliance', data_privacy_compliance, release_engagement_by_segment, 'APPROVED', john_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL, NULL, NULL, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.data_products_datasets (id, justification, data_product_id, dataset_id, status, requested_by_id, requested_on, approved_by_id, approved_on, denied_by_id, denied_on, created_on, updated_on, deleted_at)
VALUES (gen_random_uuid(),'Needed to check for GDPR compliance', data_privacy_compliance, release_impact_summary, 'APPROVED', john_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL, NULL, NULL, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.data_products_datasets (id, justification, data_product_id, dataset_id, status, requested_by_id, requested_on, approved_by_id, approved_on, denied_by_id, denied_on, created_on, updated_on, deleted_at)
VALUES (gen_random_uuid(),'Needed to check for GDPR compliance', data_privacy_compliance, customer_segmentation_weekly_output_port_id, 'APPROVED', john_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL, NULL, NULL, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
-- Cash flow monitoring
INSERT INTO public.data_products (id, "name", namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at) VALUES (gen_random_uuid(), 'Cash Flow Monitoring', 'cash_flow_monitoring', 'Monitors inflows and outflows of funds in real-time.', '<h2>Cash Flow Monitoring</h2><p></p><p>This data product provides real-time cash flow monitoring for financial stability.</p><p></p><p><strong>Key objectives include:</strong></p><ul><li>Track daily cash movements</li><li>Ensure liquidity and solvency</li><li>Support financial decision-making</li></ul>', 'ACTIVE', '1b4a64b3-96fb-404c-a73c-294802dc9852', financial_domain_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into cash_flow_monitoring;
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('dcb24163-bfec-44d8-b025-1d656d0fff36', 'cash_flow_overview', cash_flow_monitoring, 'Cash Flow Overview', 'Daily inflows and outflows', 'Provides real-time view of cash position. Key objectives: - Ensure liquidity - Identify gaps - Support financial planning', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
-- Cash flow monitoring - input ports
INSERT INTO public.data_products_datasets (id, justification, data_product_id, dataset_id, status, requested_by_id, requested_on, approved_by_id, approved_on, denied_by_id, denied_on, created_on, updated_on, deleted_at)
VALUES (gen_random_uuid(),'Needed for cash flow monitoring', cash_flow_monitoring, sales_performance_model_output_port, 'APPROVED', john_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL, NULL, NULL, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.data_products_datasets (id, justification, data_product_id, dataset_id, status, requested_by_id, requested_on, approved_by_id, approved_on, denied_by_id, denied_on, created_on, updated_on, deleted_at)
VALUES (gen_random_uuid(),'Needed for cash flow monitoring', cash_flow_monitoring, inventory_management_output_port, 'APPROVED', john_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL, NULL, NULL, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
-- Fraud detection
INSERT INTO public.data_products (id, "name", namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at) VALUES (gen_random_uuid(), 'Fraud Detection', 'fraud_detection', 'Detects suspicious activities in transactions using historical patterns.', '<h2>Fraud Detection</h2><p></p><p>This data product centralizes fraud detection insights for risk mitigation.</p><p></p><p><strong>Key objectives include:</strong></p><ul><li>Identify suspicious transactions</li><li>Prevent financial losses</li><li>Support security investigations</li></ul>', 'ACTIVE', 'f1672c38-ad1a-401a-8dd3-e0b026ab1416', risk_and_compliance_domain_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into fraud_detection;
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES (gen_random_uuid(), 'fraud_detection_alerts', fraud_detection, 'Fraud Detection Alerts', 'Transactions flagged for potential fraud', 'Provides actionable fraud detection results. Key objectives: - Prevent losses - Investigate suspicious activity - Improve security', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
-- Fraud detection - input ports
INSERT INTO public.data_products_datasets (id, justification, data_product_id, dataset_id, status, requested_by_id, requested_on, approved_by_id, approved_on, denied_by_id, denied_on, created_on, updated_on, deleted_at)
VALUES (gen_random_uuid(),'Needed for fraud detection', fraud_detection, sales_performance_model_output_port, 'APPROVED', john_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL, NULL, NULL, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.data_products_datasets (id, justification, data_product_id, dataset_id, status, requested_by_id, requested_on, approved_by_id, approved_on, denied_by_id, denied_on, created_on, updated_on, deleted_at)
VALUES (gen_random_uuid(),'Needed for fraud detection', fraud_detection, inventory_management_output_port, 'APPROVED', john_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL, NULL, NULL, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
-- Profitability analysis
INSERT INTO public.data_products (id, "name", namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at) VALUES (gen_random_uuid(), 'Profitability Analysis', 'profitability_analysis', 'Identifies which products or services contribute most to profit.', '<h2>Profitability Analysis</h2><p></p><p>This data product centralizes profitability insights to guide business strategy.</p><p></p><p><strong>Key objectives include:</strong></p><ul><li>Identify high-margin products</li><li>Optimize product portfolio</li><li>Inform investment decisions</li></ul>', 'ACTIVE', '3c289333-2d55-4aed-8bd5-85015a1567fe', financial_domain_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into profitability_analysis;
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES (gen_random_uuid(), 'profitability_analysis_report', profitability_analysis, 'Profitability Analysis Report', 'Product and service profit contribution', 'Provides insight into profitability for portfolio decisions. Key objectives: - Identify high-margin offerings - Guide investment strategy - Support executive decisions', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES (gen_random_uuid(), 'margin_trends_by_product', profitability_analysis, 'Margin Trends By Product', 'Historical margin trends per product', 'Provides deeper understanding of profitability over time. Key objectives: - Detect declining margins - Inform pricing strategies - Support product decisions', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into margin_trends_by_product;
-- Financial risk assessment
INSERT INTO public.data_products (id, "name", namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at) VALUES (gen_random_uuid(), 'Financial Risk Assessment', 'financial_risk_assessment', 'Evaluates potential financial risks and exposure.', '<h2>Financial Risk Assessment</h2><p></p><p>This data product centralizes financial risk evaluation for proactive management.</p><p></p><p><strong>Key objectives include:</strong></p><ul><li>Identify financial risks</li><li>Support compliance and regulatory requirements</li><li>Guide investment decisions</li></ul>', 'ACTIVE', '3c289333-2d55-4aed-8bd5-85015a1567fe', financial_domain_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into financial_risk_assessment;
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES (gen_random_uuid(), 'financial_risk_dashboard', financial_risk_assessment, 'Financial Risk Dashboard', 'Metrics highlighting financial exposure', 'Provides risk analysis to prevent losses. Key objectives: - Track financial risks - Support mitigation strategies - Enable compliance', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
-- Financial risk - input ports
INSERT INTO public.data_products_datasets (id, justification, data_product_id, dataset_id, status, requested_by_id, requested_on, approved_by_id, approved_on, denied_by_id, denied_on, created_on, updated_on, deleted_at)
VALUES (gen_random_uuid(),'Needed for detecting financial risks', financial_risk_assessment, sales_performance_model_output_port, 'APPROVED', john_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL, NULL, NULL, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.data_products_datasets (id, justification, data_product_id, dataset_id, status, requested_by_id, requested_on, approved_by_id, approved_on, denied_by_id, denied_on, created_on, updated_on, deleted_at)
VALUES (gen_random_uuid(),'Needed for detecting financial risks', financial_risk_assessment, inventory_management_output_port, 'APPROVED', john_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL, NULL, NULL, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.data_products_datasets (id, justification, data_product_id, dataset_id, status, requested_by_id, requested_on, approved_by_id, approved_on, denied_by_id, denied_on, created_on, updated_on, deleted_at)
VALUES (gen_random_uuid(),'Needed for detecting financial risks', financial_risk_assessment, margin_trends_by_product, 'APPROVED', john_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL, NULL, NULL, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.data_products (id, "name", namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at) VALUES (gen_random_uuid(), 'Feature Usage Metrics', 'feature_usage_metrics', 'Tracks how often users engage with product features.', '<h2>Feature Usage Metrics</h2><p></p><p>This data product provides a centralized view of feature adoption and usage.</p><p></p><p><strong>Key objectives include:</strong></p><ul><li>Monitor user engagement</li><li>Identify popular features</li><li>Inform product development priorities</li></ul>', 'ACTIVE', '1b4a64b3-96fb-404c-a73c-294802dc9852', product_development_domain_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into feature_usage_metrics;
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('b8f56c2f-da55-4be5-9625-ba2a4e4a42c2', 'daily_feature_engagement', feature_usage_metrics, 'Daily Feature Engagement', 'Daily usage metrics per feature', 'Provides insights into feature adoption. Key objectives: - Monitor engagement - Guide product improvements - Track trends', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into feature_usage_metrics_daily;
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('f3a95935-5a3e-4427-be75-a01a40a53f55', 'weekly_feature_summary', feature_usage_metrics, 'Weekly Feature Summary', 'Aggregated weekly feature usage', 'Provides weekly trends for product teams. Key objectives: - Identify adoption patterns - Support roadmap planning - Enable executive reporting', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL)returning id into feature_usage_metrics_weekly;
INSERT INTO public.data_products_datasets (id, justification, data_product_id, dataset_id, status, requested_by_id, requested_on, approved_by_id, approved_on, denied_by_id, denied_on, created_on, updated_on, deleted_at)
VALUES (gen_random_uuid(),'Needed for predicinting product featuree engagement', financial_risk_assessment, feature_usage_metrics_daily, 'PENDING', jane_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL, NULL, NULL, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.role_assignments_data_product (id, data_product_id, user_id, role_id, decision, requested_by_id, requested_on, decided_by_id, decided_on, created_on, updated_on, deleted_at) VALUES (gen_random_uuid(),
feature_usage_metrics, john_id, product_owner_id, 'APPROVED', john_id, '2025-10-28 16:32:57.902449', john_id, '2025-10-28 16:32:57.910346', '2025-10-28 16:32:57.89898', '2025-10-28 16:32:57.908607', NULL);
INSERT INTO public.role_assignments_dataset (id, dataset_id, user_id, role_id, decision, requested_by_id, requested_on, decided_by_id, decided_on, created_on, updated_on, deleted_at) VALUES (gen_random_uuid(),
feature_usage_metrics_daily, john_id, dataset_owner_id, 'APPROVED', john_id, '2025-10-28 16:32:57.902449', john_id, '2025-10-28 16:32:57.910346', '2025-10-28 16:32:57.89898', '2025-10-28 16:32:57.908607', NULL);
-- extra products
INSERT INTO public.data_products (id, "name", namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at) VALUES ('a8afca59-78ce-4808-adaa-8bbab998ac6d', 'A/B Test Results', 'a_b_test_results', 'Stores and analyzes experiments to optimize product decisions.', '<h2>A/B Test Results</h2><p></p><p>This data product centralizes A/B testing results for actionable insights.</p><p></p><p><strong>Key objectives include:</strong></p><ul><li>Compare feature variations</li><li>Measure impact on user behavior</li><li>Support data-driven product decisions</li></ul>', 'ACTIVE', '3c289333-2d55-4aed-8bd5-85015a1567fe', product_development_domain_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.data_products (id, "name", namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at) VALUES ('16f9cdac-f0ab-45f9-84e1-fb28bf7eda2c', 'Product Performance Dashboard', 'product_performance_dashboard', 'Monitors KPIs like uptime, error rates, and adoption.', '<h2>Product Performance Dashboard</h2><p></p><p>This data product provides a consolidated view of product performance metrics.</p><p></p><p><strong>Key objectives include:</strong></p><ul><li>Track uptime and reliability</li><li>Monitor feature adoption</li><li>Support operational and strategic decisions</li></ul>', 'ACTIVE', '1b4a64b3-96fb-404c-a73c-294802dc9852', product_development_domain_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.data_products (id, "name", namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at) VALUES ('4bba2a03-b51c-4525-b094-1f85a3dba31b', 'Operational Risk Metrics', 'operational_risk_metrics', 'Evaluates risks in business processes to prevent disruptions.', '<h2>Operational Risk Metrics</h2><p></p><p>This data product provides centralized operational risk insights for mitigation.</p><p></p><p><strong>Key objectives include:</strong></p><ul><li>Monitor business process risks</li><li>Identify vulnerabilities</li><li>Support operational continuity</li></ul>', 'ACTIVE', '3c289333-2d55-4aed-8bd5-85015a1567fe', risk_and_compliance_domain_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.data_products (id, "name", namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at) VALUES ('92eb574f-10ec-42dc-af72-05aa06cc8ade', 'Security Incident Reporting', 'security_incident_reporting', 'Tracks and analyzes security breaches and attempted attacks.', '<h2>Security Incident Reporting</h2><p></p><p>This data product centralizes reporting of security incidents for response.</p><p></p><p><strong>Key objectives include:</strong></p><ul><li>Track security events</li><li>Analyze incident patterns</li><li>Support rapid mitigation actions</li></ul>', 'ACTIVE', '1b4a64b3-96fb-404c-a73c-294802dc9852', risk_and_compliance_domain_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.data_products (id, "name", namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at) VALUES ('3a3dc97d-2278-42e8-8e72-dd923192a4df', 'Regulatory Audit Tracker', 'regulatory_audit_tracker', 'Monitors audit readiness and compliance with industry standards.', '<h2>Regulatory Audit Tracker</h2><p></p><p>This data product provides a platform for tracking regulatory audit compliance.</p><p></p><p><strong>Key objectives include:</strong></p><ul><li>Monitor audit readiness</li><li>Ensure regulatory adherence</li><li>Support compliance reporting</li></ul>', 'ACTIVE', '1b4a64b3-96fb-404c-a73c-294802dc9852', risk_and_compliance_domain_id, timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.data_products (id, name, namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at, lifecycle_id, usage) VALUES ('81815c4c-f323-4cf1-b25b-f43f231f510f', 'Biomarker discovery', 'biomarker-discovery', 'Helps researchers identify molecular signatures linked to disease progression or drug response.
It accelerates translational research by combining omics data with clinical outcomes for biomarker validation.', NULL, 'ACTIVE', '74b13338-aa85-4552-8ccb-7d51550c67de', financial_domain_id, '2025-10-28 16:32:57.885052', NULL, NULL, data_product_lifecycle_id, NULL);
INSERT INTO public.data_products (id, name, namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at, lifecycle_id, usage) VALUES ('6e580d91-14ea-495e-a6d7-5db236a5c1d5', 'Clinical trial performance', 'clinical-trial-performance', 'Monitors progress, enrollment, and site efficiency for ongoing studies.
It provides near–real-time visibility for clinical operations teams.', NULL, 'ACTIVE', '1b4a64b3-96fb-404c-a73c-294802dc9852', operations_and_logistics_domain_id, '2025-10-28 16:37:39.892932', NULL, NULL, data_product_lifecycle_id, NULL);
INSERT INTO public.data_products (id, name, namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at, lifecycle_id, usage) VALUES ('9fa5e299-fcc4-45e0-b48d-cc3deb68eefe', 'Clinical data quality monitor', 'clinical-data-quality-monitor', 'Automates validation and consistency checks for clinical data.
It ensures data integrity for regulatory submissions.', NULL, 'ACTIVE', '3c289333-2d55-4aed-8bd5-85015a1567fe', operations_and_logistics_domain_id, '2025-10-28 17:56:19.863257', NULL, NULL, data_product_lifecycle_id, NULL);
INSERT INTO public.data_products (id, name, namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at, lifecycle_id, usage) VALUES ('fbcd7899-2763-4659-bd28-2a278910ef85', 'Regulatory submission tracker', 'regulatory-submission-tracker', 'Centralizes documentation and timelines for regulatory filings.
It helps teams maintain compliance and track submission readiness.', NULL, 'ACTIVE', '1b4a64b3-96fb-404c-a73c-294802dc9852', operations_and_logistics_domain_id, '2025-10-28 17:59:19.849564', NULL, NULL, data_product_lifecycle_id, NULL);
INSERT INTO public.data_products (id, name, namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at, lifecycle_id, usage) VALUES ('08039e5d-50a7-447a-b691-f5dc6b420dea', 'Safety Signal Detection System', 'safety-signal-detection-system', 'Detects early signs of drug-related adverse effects from trial and post-market data.
It supports pharmacovigilance and regulatory risk management.', NULL, 'ACTIVE', '90ab1128-329f-47dd-9420-c9681bfc68c4', risk_and_compliance_domain_id, '2025-10-28 18:01:54.329016', NULL, NULL, data_product_lifecycle_id, NULL);
INSERT INTO public.data_products (id, name, namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at, lifecycle_id, usage) VALUES ('625b65b6-13d9-4c8c-a669-865e36fc3dfc', 'Drug Supply Chain Optimization', 'drug-supply-chain-optimization', 'Forecasts and manages inventory to avoid clinical supply shortages.
It balances manufacturing throughput with site-level demand.', NULL, 'ACTIVE', 'f1672c38-ad1a-401a-8dd3-e0b026ab1416', product_development_domain_id, '2025-10-28 18:05:44.182871', NULL, NULL, data_product_lifecycle_id, NULL);
INSERT INTO public.data_products (id, name, namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at, lifecycle_id, usage) VALUES ('22488fe0-c30a-4447-972e-3eb22a1bd266', 'Customer intelligence platform', 'customer-intelligence-platform', 'Unifies healthcare professional and institutional engagement data.
It supports more targeted and compliant outreach strategies.', NULL, 'ACTIVE', '1b4a64b3-96fb-404c-a73c-294802dc9852', commercial_and_customer_relationship_mgt_domain_id, '2025-10-28 18:09:11.673609', NULL, NULL, data_product_lifecycle_id, NULL);
INSERT INTO public.data_products (id, name, namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at, lifecycle_id, usage) VALUES ('90e65438-a942-43e0-a4a9-ee406b92df65', 'Enterprise knowledge graph', 'enterprise-knowledge-graph', 'Connects data entities (people, trials, compounds, documents) across all domains.
It enables semantic search and contextual discovery within the organization.', NULL, 'ACTIVE', 'f1672c38-ad1a-401a-8dd3-e0b026ab1416', operations_and_logistics_domain_id, '2025-10-28 18:11:47.494295', NULL, NULL, data_product_lifecycle_id, NULL);
INSERT INTO public.data_products (id, name, namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at, lifecycle_id, usage) VALUES ('68b28e38-3faa-45ca-9d00-3830d0a7b108', 'Employee productivity', 'employee-productivity', 'Measures how teams collaborate and deliver projects.
It identifies factors influencing productivity and engagement.', NULL, 'ACTIVE', '1b4a64b3-96fb-404c-a73c-294802dc9852', hr_domain_id, '2025-10-28 18:14:07.371512', NULL, NULL, data_product_lifecycle_id, NULL);
INSERT INTO public.data_products (id, name, namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at, lifecycle_id, usage) VALUES ('97af957a-70c4-465d-95f2-f70c11af8da0', 'DEI Insights Dashboard', 'dei-insights-dashboard', 'Monitors diversity, equity, and inclusion metrics across the organization.
It ensures transparency and compliance with internal and external reporting standards.', NULL, 'ACTIVE', '1b4a64b3-96fb-404c-a73c-294802dc9852', hr_domain_id, '2025-10-28 18:16:50.70893', NULL, NULL, data_product_lifecycle_id, NULL);
INSERT INTO public.data_products (id, name, namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at, lifecycle_id, usage) VALUES ('58b837a5-33d0-41cf-bf95-eb9af846f4d0', 'Patient Stratification Engine', 'patient-stratification-engine', 'Identifies patient subgroups most likely to respond to therapies.
It improves trial design and treatment personalization.', NULL, 'ACTIVE', '90ab1128-329f-47dd-9420-c9681bfc68c4', operations_and_logistics_domain_id, '2025-10-28 18:29:24.833167', NULL, NULL, data_product_lifecycle_id, NULL);
INSERT INTO public.data_products (id, name, namespace, description, about, status, type_id, domain_id, created_on, updated_on, deleted_at, lifecycle_id, usage) VALUES ('ccdc13fa-4a1a-4dde-ad1c-efa0d58eafb7', 'R&D Portfolio Prioritization Model', 'rd-portfolio-prioritization-model', 'Ranks R&D projects based on scientific potential, ROI, and strategic fit.
It provides leadership with an objective decision framework for resource allocation.', NULL, 'ACTIVE', 'f1672c38-ad1a-401a-8dd3-e0b026ab1416', operations_and_logistics_domain_id, '2025-10-28 18:34:32.308251', NULL, NULL, data_product_lifecycle_id, NULL);
-- DATASETS
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('bab58ea1-0ccd-44f1-8d75-634822b6b95b', 'ab_test_outcomes', 'a8afca59-78ce-4808-adaa-8bbab998ac6d', 'Ab Test Outcomes', 'Results of A/B experiments per cohort', 'Provides experiment insights to inform product decisions. Key objectives: - Measure feature impact - Optimize UX - Support iteration', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('910a6eb4-fc3e-413b-bafa-b6b2666ca6e3', 'experiment_variants_comparison', 'a8afca59-78ce-4808-adaa-8bbab998ac6d', 'Experiment Variants Comparison', 'Comparison of different experiment variants', 'Enables detailed analysis of experimental results. Key objectives: - Identify best-performing variant - Support hypothesis validation - Guide feature rollout', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('03ff0760-1bed-4805-ad77-644d281f1f22', 'product_kpi_dashboard', '16f9cdac-f0ab-45f9-84e1-fb28bf7eda2c', 'Product KPI Dashboard', 'Uptime, error rates, adoption metrics', 'Provides high-level performance metrics for products. Key objectives: - Track health and reliability - Support operations - Enable strategic decisions', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('fcd61536-b8db-4f83-bd62-ee8ed7c3031a', 'operational_risk_report', '4bba2a03-b51c-4525-b094-1f85a3dba31b', 'Operational Risk Report', 'KPIs for process and operational risks', 'Provides insight into operational vulnerabilities. Key objectives: - Monitor risks - Mitigate disruptions - Support continuity planning', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('8a4f5df8-4b5c-4290-a8e2-c8ec42713b7c', 'security_incident_summary', '92eb574f-10ec-42dc-af72-05aa06cc8ade', 'Security Incident Summary', 'Report on security events and breaches', 'Provides consolidated view of security incidents. Key objectives: - Track threats - Analyze patterns - Support mitigation', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
INSERT INTO public.datasets (id, namespace, data_product_id, "name", description, about, status, access_type, created_on, updated_on, deleted_at) VALUES ('f1659a4f-95d5-40bb-a7b5-121cf7e74ea8', 'regulatory_audit_report', '3a3dc97d-2278-42e8-8e72-dd923192a4df', 'Regulatory Audit Report', 'Audit compliance metrics and findings', 'Provides regulatory audit insights. Key objectives: - Monitor compliance - Prepare for audits - Support executive reporting', 'ACTIVE', 'RESTRICTED', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL);
-- Data output configurations
INSERT INTO public.data_output_configurations (id, configuration_type) VALUES ('b6bc5710-8706-45fb-bf85-6ed90d8a7428', 'GlueTechnicalAssetConfiguration') ;
INSERT INTO public.glue_technical_asset_configurations(id, bucket_identifier, "database", database_suffix, "table", table_path, access_granularity, database_path, created_on, updated_on, deleted_at) VALUES ('b6bc5710-8706-45fb-bf85-6ed90d8a7428', 'datalake', 'pharma_research', 'glue_output', '*', '*', 'schema', 'pharma_research', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into glue_configuration_id;
INSERT INTO public.data_output_configurations (id, configuration_type) VALUES ('cdd627e5-08b2-4dc8-add6-32ff569f543b', 'DatabricksTechnicalAssetConfiguration');
INSERT INTO public.databricks_technical_asset_configurations (id, bucket_identifier, "catalog", schema, catalog_path, table_path, "table", access_granularity, created_on, updated_on, deleted_at) VALUES ('cdd627e5-08b2-4dc8-add6-32ff569f543b', 'datalake', 'pharma_research', 'databricks_output', '', '', 'pharma_research', 'table', timezone('utc'::text, CURRENT_TIMESTAMP), NULL, NULL) returning id into databricks_configuration_id;
-- Data product settings
INSERT INTO public.data_product_settings (id, namespace, name, "default", "order", type, tooltip, category, scope) VALUES ('e12ec335-d7a4-4e27-8225-b66da70f3158', 'iam_role', 'IAM service accounts', 'false', '100', 'CHECKBOX', 'Generate IAM access credentials for this data product', 'AWS', 'DATAPRODUCT');
-- DATA OUTPUTS
INSERT INTO public.data_outputs (id, namespace, name, description, status, platform_id, service_id, owner_id, configuration, configuration_id, created_on, updated_on, deleted_at, "technical_mapping") VALUES ('b4caa471-99a2-40e3-9d43-67b85e466c5b', 'omics-data', 'Omics data', 'Captures genomic, proteomic, and transcriptomic measurements from lab experiments to provide a unified dataset for biomarker exploration.', 'ACTIVE', returned_platform_id, glue_service_id, '81815c4c-f323-4cf1-b25b-f43f231f510f', NULL, '12346cc6-f58d-4217-88d3-6443b01d5d0f', '2025-10-28 16:34:02.355842', NULL, NULL, 'default');
INSERT INTO public.data_outputs (id, namespace, name, description, status, platform_id, service_id, owner_id, configuration, configuration_id, created_on, updated_on, deleted_at, "technical_mapping") VALUES ('86d75ebd-8c3a-4c71-b5a5-33146b28b410', 'clinical-outcome-correlation', 'Clinical outcome correlation', 'Links omics samples to anonymized patient outcomes, enabling downstream hypothesis testing.', 'ACTIVE', 'baa5c47b-805a-4cbb-ad8b-038c66e81b7e', 'ce208413-b629-44d2-9f98-e5b47a315a56', '81815c4c-f323-4cf1-b25b-f43f231f510f', NULL, 'db8e84e9-e942-4ebb-ac78-ee0fa600db5d', '2025-10-28 16:34:31.5612', NULL, NULL, 'default');
INSERT INTO public.data_outputs (id, namespace, name, description, status, platform_id, service_id, owner_id, configuration, configuration_id, created_on, updated_on, deleted_at, "technical_mapping") VALUES ('904ccfd4-c5e5-4a0d-af0b-3a3c38b34696', 'trial-master-summary', 'Trial master summary', 'Central repository for study metadata and milestones.', 'ACTIVE', returned_platform_id, glue_service_id, '6e580d91-14ea-495e-a6d7-5db236a5c1d5', NULL, '17798a65-12e2-4a5e-84c0-9948041849e0', '2025-10-28 16:38:29.452913', NULL, NULL, 'default');
INSERT INTO public.data_outputs (id, namespace, name, description, status, platform_id, service_id, owner_id, configuration, configuration_id, created_on, updated_on, deleted_at, "technical_mapping") VALUES ('77951289-2f2c-46f3-a3e4-b4ba17fab169', 'enrollment-and-retention-metrics', 'Enrollment and retention metrics', 'Tracks patient recruitment and retention trends per site.', 'ACTIVE', returned_platform_id, glue_service_id, '6e580d91-14ea-495e-a6d7-5db236a5c1d5', NULL, '08877d52-a5c1-4fd4-8e8d-ca3c108f2363', '2025-10-28 16:39:02.184116', NULL, NULL, 'default');
INSERT INTO public.data_outputs (id, namespace, name, description, status, platform_id, service_id, owner_id, configuration, configuration_id, created_on, updated_on, deleted_at, "technical_mapping") VALUES ('c006b4a3-6840-4aa9-966d-21acc8d18366', 'ecrf-data-logs', 'ECRF data logs', 'Capture all clinical entries and edits in electronic forms.', 'ACTIVE', returned_platform_id, glue_service_id, '9fa5e299-fcc4-45e0-b48d-cc3deb68eefe', NULL, '43a09ac9-9576-4436-94f7-79339510c887', '2025-10-28 17:56:57.829806', NULL, NULL, 'default');
INSERT INTO public.data_outputs (id, namespace, name, description, status, platform_id, service_id, owner_id, configuration, configuration_id, created_on, updated_on, deleted_at, "technical_mapping") VALUES ('fbd3dbdf-76f1-4c0a-b732-66f1be456860', 'data-validation-results', 'Data validation results', 'Stores outcomes of automated QC rules and anomalies.', 'ACTIVE', returned_platform_id, glue_service_id, '9fa5e299-fcc4-45e0-b48d-cc3deb68eefe', NULL, '3871765b-881b-4654-a0ec-7e1db6a2de2f', '2025-10-28 17:57:32.996449', NULL, NULL, 'default');
INSERT INTO public.data_outputs (id, namespace, name, description, status, platform_id, service_id, owner_id, configuration, configuration_id, created_on, updated_on, deleted_at, "technical_mapping") VALUES ('d3f02123-b777-40b9-8c52-0ec66be68241', 'submission-package-metadata', 'Submission Package Metadata', 'Contains submission components and status per agency.', 'ACTIVE', returned_platform_id, glue_service_id, 'fbcd7899-2763-4659-bd28-2a278910ef85', NULL, '3f9ba1f0-84fb-4a5c-858d-11b1bca33b6b', '2025-10-28 17:59:45.865277', NULL, NULL, 'default');
INSERT INTO public.data_outputs (id, namespace, name, description, status, platform_id, service_id, owner_id, configuration, configuration_id, created_on, updated_on, deleted_at, "technical_mapping") VALUES ('361d6347-afd8-4927-af8b-ce5dc54cca96', 'compliance-audit-trail', 'Compliance Audit Trail', 'Logs document revisions and quality issues.', 'ACTIVE', returned_platform_id, s3_service_id, 'fbcd7899-2763-4659-bd28-2a278910ef85', NULL, 'b1a77a22-5dac-4631-9e22-b6129c67d037', '2025-10-28 18:00:21.273949', NULL, NULL, 'default');
INSERT INTO public.data_outputs (id, namespace, name, description, status, platform_id, service_id, owner_id, configuration, configuration_id, created_on, updated_on, deleted_at, "technical_mapping") VALUES ('561d2ab6-b9dc-405a-9190-8f2d3d443b28', 'adverse-event-database', 'Adverse event database', 'Collects standardized AE reports from multiple data sources.
Output: Consolidated case-level dataset for signal analysis.', 'ACTIVE', returned_platform_id, s3_service_id, '08039e5d-50a7-447a-b691-f5dc6b420dea', NULL, '10889f18-7156-4617-84f7-89aac3370027', '2025-10-28 18:02:28.302038', NULL, NULL, 'default');
INSERT INTO public.data_outputs (id, namespace, name, description, status, platform_id, service_id, owner_id, configuration, configuration_id, created_on, updated_on, deleted_at, "technical_mapping") VALUES ('9db5db83-a92b-4111-a0b6-dfe43fdc9454', 'signal-analytics-output', 'Signal analytics output', 'Aggregates statistical disproportionality metrics for safety signals.', 'ACTIVE', returned_platform_id, s3_service_id, '08039e5d-50a7-447a-b691-f5dc6b420dea', NULL, '2cd814a6-20fe-430e-ba62-ace42b10897e', '2025-10-28 18:03:02.685892', NULL, NULL, 'default');
INSERT INTO public.data_outputs (id, namespace, name, description, status, platform_id, service_id, owner_id, configuration, configuration_id, created_on, updated_on, deleted_at, "technical_mapping") VALUES ('fcbc3477-62cd-43ff-843f-bb18e24d31be', 'manufacturing-batch-data', 'Manufacturing Batch Data', 'Tracks production and quality of drug lots', 'ACTIVE', returned_platform_id, s3_service_id, '625b65b6-13d9-4c8c-a669-865e36fc3dfc', NULL, '83e1a9e2-19ec-4b31-aeb5-40ac81e3e27c', '2025-10-28 18:06:26.226197', NULL, NULL, 'default');
INSERT INTO public.data_outputs (id, namespace, name, description, status, platform_id, service_id, owner_id, configuration, configuration_id, created_on, updated_on, deleted_at, "technical_mapping") VALUES ('2aa6122b-833f-4386-894d-4a5af3af10c4', 'shipment-logs', 'Shipment logs', 'Records product shipments', 'ACTIVE', returned_platform_id, s3_service_id, '625b65b6-13d9-4c8c-a669-865e36fc3dfc', NULL, 'f8df446d-0211-4ee8-81e1-5410b6419e6e', '2025-10-28 18:07:05.924953', NULL, NULL, 'default');
INSERT INTO public.data_outputs (id, namespace, name, description, status, platform_id, service_id, owner_id, configuration, configuration_id, created_on, updated_on, deleted_at, "technical_mapping") VALUES ('c15caa28-c063-4e41-8dd3-c5cccccfa88c', 'site-inventory', 'Site inventory', 'Shows the stock levels at trial sites.', 'ACTIVE', returned_platform_id, s3_service_id, '625b65b6-13d9-4c8c-a669-865e36fc3dfc', NULL, '7bb075e0-70c3-44c2-811e-cd7bba757927', '2025-10-28 18:07:33.673309', NULL, NULL, 'default');
INSERT INTO public.data_outputs (id, namespace, name, description, status, platform_id, service_id, owner_id, configuration, configuration_id, created_on, updated_on, deleted_at, "technical_mapping") VALUES ('d1092134-aac6-4501-88ba-464a9f0cedc8', 'customer-master-data', 'Customer master data', 'Maintains a golden record of HCPs and organizations.', 'ACTIVE', 'baa5c47b-805a-4cbb-ad8b-038c66e81b7e', 'ce208413-b629-44d2-9f98-e5b47a315a56', '22488fe0-c30a-4447-972e-3eb22a1bd266', NULL, 'dc1cc43b-698e-424c-af5b-27f68f0c0781', '2025-10-28 18:09:39.615998', NULL, NULL, 'default');
INSERT INTO public.data_outputs (id, namespace, name, description, status, platform_id, service_id, owner_id, configuration, configuration_id, created_on, updated_on, deleted_at, "technical_mapping") VALUES ('1e9030f0-6e6e-485e-8bd9-0ff76bfc371f', 'engagement-activity-log', 'Engagement Activity Log', 'Tracks calls, emails, and events with customers.', 'ACTIVE', 'baa5c47b-805a-4cbb-ad8b-038c66e81b7e', 'ce208413-b629-44d2-9f98-e5b47a315a56', '22488fe0-c30a-4447-972e-3eb22a1bd266', NULL, '8d18f556-ccd2-425e-8e48-f24c185a053e', '2025-10-28 18:10:04.633488', NULL, NULL, 'default');
INSERT INTO public.data_outputs (id, namespace, name, description, status, platform_id, service_id, owner_id, configuration, configuration_id, created_on, updated_on, deleted_at, "technical_mapping") VALUES ('07fe77b2-f06f-4692-a76b-acdd2c412db3', 'entity-registry', 'Entity Registry', 'Stores canonical identifiers and metadata for all business entities.', 'ACTIVE', 'baa5c47b-805a-4cbb-ad8b-038c66e81b7e', 'ce208413-b629-44d2-9f98-e5b47a315a56', '90e65438-a942-43e0-a4a9-ee406b92df65', NULL, 'da19237f-eaf6-4a0a-8090-a2b724189978', '2025-10-28 18:12:07.053708', NULL, NULL, 'default');
INSERT INTO public.data_outputs (id, namespace, name, description, status, platform_id, service_id, owner_id, configuration, configuration_id, created_on, updated_on, deleted_at, "technical_mapping") VALUES ('967ca866-d868-49b8-9a31-3d2e97ed63f3', 'relationship-graph', 'Relationship Graph', 'Maps inter-entity relationships across domains.', 'ACTIVE', 'baa5c47b-805a-4cbb-ad8b-038c66e81b7e', 'ce208413-b629-44d2-9f98-e5b47a315a56', '90e65438-a942-43e0-a4a9-ee406b92df65', NULL, '502d4484-e332-4854-a2d8-7c387906f459', '2025-10-28 18:12:22.129267', NULL, NULL, 'default');
INSERT INTO public.data_outputs (id, namespace, name, description, status, platform_id, service_id, owner_id, configuration, configuration_id, created_on, updated_on, deleted_at, "technical_mapping") VALUES ('e1024306-a524-4142-8673-b0219dfad76b', 'project-delivery-metrics', 'Project Delivery Metrics', 'Tracks timelines, milestones, and outcomes of internal projects.', 'ACTIVE', returned_platform_id, glue_service_id, '68b28e38-3faa-45ca-9d00-3830d0a7b108', NULL, 'af1e8de6-3dc8-43e5-9c74-597c5676c137', '2025-10-28 18:14:25.794897', NULL, NULL, 'default');
INSERT INTO public.data_outputs (id, namespace, name, description, status, platform_id, service_id, owner_id, configuration, configuration_id, created_on, updated_on, deleted_at, "technical_mapping") VALUES ('dcf5270d-562b-4cd1-a0a3-c0835003698b', 'employee-kpi-log', 'Employee KPI log', 'Tracks how well each employee is performing with respect to their set KPIs', 'ACTIVE', returned_platform_id, glue_service_id, '68b28e38-3faa-45ca-9d00-3830d0a7b108', NULL, '677a9352-a968-44be-a5df-6e5e4094ebe7', '2025-10-28 18:15:10.920954', NULL, NULL, 'default');
INSERT INTO public.data_outputs (id, namespace, name, description, status, platform_id, service_id, owner_id, configuration, configuration_id, created_on, updated_on, deleted_at, "technical_mapping") VALUES ('cce652d7-b6a6-4000-a248-4cc9d9066fab', 'workforce-demographics', 'Workforce Demographics', 'Records representation by gender, age, and level.', 'ACTIVE', 'baa5c47b-805a-4cbb-ad8b-038c66e81b7e', 'ce208413-b629-44d2-9f98-e5b47a315a56', '97af957a-70c4-465d-95f2-f70c11af8da0', NULL, '44daa0b4-a027-4e5b-b233-b8342da71c38', '2025-10-28 18:17:04.80167', NULL, NULL, 'default');
INSERT INTO public.data_outputs (id, namespace, name, description, status, platform_id, service_id, owner_id, configuration, configuration_id, created_on, updated_on, deleted_at, "technical_mapping") VALUES ('a686ff78-3039-4006-9dd1-e8d5cf293ec7', 'compensation-equity-data', 'Compensation Equity Data', 'Captures pay and benefits information across roles.', 'ACTIVE', 'baa5c47b-805a-4cbb-ad8b-038c66e81b7e', 'ce208413-b629-44d2-9f98-e5b47a315a56', '97af957a-70c4-465d-95f2-f70c11af8da0', NULL, 'e0875fbb-f2ff-4804-a9ba-c9c3b006fca3', '2025-10-28 18:17:20.241114', NULL, NULL, 'default');
INSERT INTO public.data_outputs (id, namespace, name, description, status, platform_id, service_id, owner_id, configuration, configuration_id, created_on, updated_on, deleted_at, "technical_mapping") VALUES ('0473d934-3993-45d5-9d25-151162f673da', 'patient-demographic', 'Patient demographic', 'Stores baseline info about trial participants', 'ACTIVE', returned_platform_id, glue_service_id, '58b837a5-33d0-41cf-bf95-eb9af846f4d0', NULL, '74db2ed9-b28a-4875-8eb5-17b9fe445c8d', '2025-10-28 18:30:00.415068', NULL, NULL, 'default');
INSERT INTO public.data_outputs (id, namespace, name, description, status, platform_id, service_id, owner_id, configuration, configuration_id, created_on, updated_on, deleted_at, "technical_mapping") VALUES ('975b129b-d9c4-4a8a-8430-9be3be621c37', 'patient-clinical-profile', 'Patient clinical profile', 'Stores basic clinical information about the patients', 'ACTIVE', returned_platform_id, glue_service_id, '58b837a5-33d0-41cf-bf95-eb9af846f4d0', NULL, '22e9a60d-e8f8-4bf5-9efd-500f407dbb47', '2025-10-28 18:30:28.256785', NULL, NULL, 'default');
INSERT INTO public.data_outputs (id, namespace, name, description, status, platform_id, service_id, owner_id, configuration, configuration_id, created_on, updated_on, deleted_at, "technical_mapping") VALUES ('b4b4ba5e-1c1a-42f8-9017-25fed591f30b', 'response-to-treatment', 'Response to treatment', 'Records treatment outcomes and biomarkers linked to each patient.', 'ACTIVE', returned_platform_id, glue_service_id, '58b837a5-33d0-41cf-bf95-eb9af846f4d0', NULL, '2ea14ab5-a45b-4799-86fc-d6285377a4d6', '2025-10-28 18:30:57.415321', NULL, NULL, 'default');
INSERT INTO public.data_outputs (id, namespace, name, description, status, platform_id, service_id, owner_id, configuration, configuration_id, created_on, updated_on, deleted_at, "technical_mapping") VALUES ('2458ead6-6361-4542-a5aa-5ce45cba4aa3', 'competitive-intelligence', 'Competitive Intelligence ', 'Aggregates competitor activity, publications, and pipeline updates.', 'ACTIVE', returned_platform_id, glue_service_id, 'ccdc13fa-4a1a-4dde-ad1c-efa0d58eafb7', NULL, 'bbed68d4-8bda-420a-a6cf-37cb32ba9d45', '2025-10-28 18:35:42.552188', NULL, NULL, 'default');
INSERT INTO public.data_outputs (id, namespace, name, description, status, platform_id, service_id, owner_id, configuration, configuration_id, created_on, updated_on, deleted_at, "technical_mapping") VALUES ('eb93308b-a5bb-4f19-90e3-cf56b0855a07', 'rd-program-ranking', 'R&D program ranking', 'Ranking of the different R&D programs within our organisation', 'ACTIVE', returned_platform_id, glue_service_id, 'ccdc13fa-4a1a-4dde-ad1c-efa0d58eafb7', NULL, '8b6b6b35-c155-4f13-a847-c7598b08cea9', '2025-10-28 18:36:26.66997', NULL, NULL, 'default');
-- extra data output configurations
INSERT INTO public.data_output_configurations (id, configuration_type) VALUES ('12346cc6-f58d-4217-88d3-6443b01d5d0f', 'GlueTechnicalAssetConfiguration');
INSERT INTO public.glue_technical_asset_configurations (id, bucket_identifier, "database", database_suffix, "table", database_path, table_path, access_granularity, created_on, updated_on, deleted_at) VALUES ('12346cc6-f58d-4217-88d3-6443b01d5d0f', '', 'biomarker-discovery', '', 'omics_prod', 'biomarker-discovery', 'omics_prod', 'table', '2025-10-28 16:34:02.355842', NULL, NULL);
INSERT INTO public.data_output_configurations (id, configuration_type) VALUES ('db8e84e9-e942-4ebb-ac78-ee0fa600db5d', 'DatabricksTechnicalAssetConfiguration');
INSERT INTO public.databricks_technical_asset_configurations (id, bucket_identifier, "catalog", schema, catalog_path, table_path, "table", access_granularity, created_on, updated_on, deleted_at) VALUES ('db8e84e9-e942-4ebb-ac78-ee0fa600db5d', '', 'biomarker-discovery', '', 'biomarker-discovery', 'clinical_correlation', 'clinical_correlation', 'table', '2025-10-28 16:34:31.5612', NULL, NULL);
INSERT INTO public.data_output_configurations (id, configuration_type) VALUES ('17798a65-12e2-4a5e-84c0-9948041849e0', 'GlueTechnicalAssetConfiguration');
INSERT INTO public.glue_technical_asset_configurations (id, bucket_identifier, "database", database_suffix, "table", database_path, table_path, access_granularity, created_on, updated_on, deleted_at) VALUES ('17798a65-12e2-4a5e-84c0-9948041849e0', '', 'clinical-trial-performance', '', 'trial_master', 'clinical-trial-performance', 'trial_master', 'table', '2025-10-28 16:38:29.452913', NULL, NULL);
INSERT INTO public.data_output_configurations (id, configuration_type) VALUES ('08877d52-a5c1-4fd4-8e8d-ca3c108f2363', 'GlueTechnicalAssetConfiguration');
INSERT INTO public.glue_technical_asset_configurations (id, bucket_identifier, "database", database_suffix, "table", database_path, table_path, access_granularity, created_on, updated_on, deleted_at) VALUES ('08877d52-a5c1-4fd4-8e8d-ca3c108f2363', '', 'clinical-trial-performance', '', 'retention_metrics', 'clinical-trial-performance', 'retention_metrics', 'table', '2025-10-28 16:39:02.184116', NULL, NULL);
INSERT INTO public.data_output_configurations (id, configuration_type) VALUES ('43a09ac9-9576-4436-94f7-79339510c887', 'GlueTechnicalAssetConfiguration');
INSERT INTO public.glue_technical_asset_configurations (id, bucket_identifier, "database", database_suffix, "table", database_path, table_path, access_granularity, created_on, updated_on, deleted_at) VALUES ('43a09ac9-9576-4436-94f7-79339510c887', '', 'clinical-data-quality-monitor', '', '*', 'clinical-data-quality-monitor', '*', 'table', '2025-10-28 17:56:57.829806', NULL, NULL);
INSERT INTO public.data_output_configurations (id, configuration_type) VALUES ('3871765b-881b-4654-a0ec-7e1db6a2de2f', 'GlueTechnicalAssetConfiguration');
INSERT INTO public.glue_technical_asset_configurations (id, bucket_identifier, "database", database_suffix, "table", database_path, table_path, access_granularity, created_on, updated_on, deleted_at) VALUES ('3871765b-881b-4654-a0ec-7e1db6a2de2f', '', 'clinical-data-quality-monitor', '', 'clinical_data_quality', 'clinical-data-quality-monitor', 'clinical_data_quality', 'table', '2025-10-28 17:57:32.996449', NULL, NULL);
INSERT INTO public.data_output_configurations (id, configuration_type) VALUES ('3f9ba1f0-84fb-4a5c-858d-11b1bca33b6b', 'GlueTechnicalAssetConfiguration');
INSERT INTO public.glue_technical_asset_configurations (id, bucket_identifier, "database", database_suffix, "table", database_path, table_path, access_granularity, created_on, updated_on, deleted_at) VALUES ('3f9ba1f0-84fb-4a5c-858d-11b1bca33b6b', '', 'regulatory-submission-tracker', '', '*', 'regulatory-submission-tracker', '*', 'table', '2025-10-28 17:59:45.865277', NULL, NULL);
INSERT INTO public.data_output_configurations (id, configuration_type) VALUES ('b1a77a22-5dac-4631-9e22-b6129c67d037', 'S3TechnicalAssetConfiguration');
INSERT INTO public.s3_technical_asset_configurations (id, bucket, suffix, path, created_on, updated_on, deleted_at) VALUES ('b1a77a22-5dac-4631-9e22-b6129c67d037', 'datalake', 'regulatory-submission-tracker', 'compliance-audit-trail', '2025-10-28 18:00:21.273949', NULL, NULL);
INSERT INTO public.data_output_configurations (id, configuration_type) VALUES ('10889f18-7156-4617-84f7-89aac3370027', 'S3TechnicalAssetConfiguration');
INSERT INTO public.s3_technical_asset_configurations (id, bucket, suffix, path, created_on, updated_on, deleted_at) VALUES ('10889f18-7156-4617-84f7-89aac3370027', 'datalake', 'safety-signal-detection-system', 'adverse-event-db', '2025-10-28 18:02:28.302038', NULL, NULL);
INSERT INTO public.data_output_configurations (id, configuration_type) VALUES ('2cd814a6-20fe-430e-ba62-ace42b10897e', 'S3TechnicalAssetConfiguration');
INSERT INTO public.s3_technical_asset_configurations (id, bucket, suffix, path, created_on, updated_on, deleted_at) VALUES ('2cd814a6-20fe-430e-ba62-ace42b10897e', 'datalake', 'safety-signal-detection-system', 'signal-analytics', '2025-10-28 18:03:02.685892', NULL, NULL);
INSERT INTO public.data_output_configurations (id, configuration_type) VALUES ('83e1a9e2-19ec-4b31-aeb5-40ac81e3e27c', 'S3TechnicalAssetConfiguration');
INSERT INTO public.s3_technical_asset_configurations (id, bucket, suffix, path, created_on, updated_on, deleted_at) VALUES ('83e1a9e2-19ec-4b31-aeb5-40ac81e3e27c', 'datalake', 'drug-supply-chain-optimization', 'manufactoring', '2025-10-28 18:06:26.226197', NULL, NULL);
INSERT INTO public.data_output_configurations (id, configuration_type) VALUES ('f8df446d-0211-4ee8-81e1-5410b6419e6e', 'S3TechnicalAssetConfiguration');
INSERT INTO public.s3_technical_asset_configurations (id, bucket, suffix, path, created_on, updated_on, deleted_at) VALUES ('f8df446d-0211-4ee8-81e1-5410b6419e6e', 'datalake', 'drug-supply-chain-optimization', 'shipment-logs', '2025-10-28 18:07:05.924953', NULL, NULL);
INSERT INTO public.data_output_configurations (id, configuration_type) VALUES ('7bb075e0-70c3-44c2-811e-cd7bba757927', 'S3TechnicalAssetConfiguration');
INSERT INTO public.s3_technical_asset_configurations (id, bucket, suffix, path, created_on, updated_on, deleted_at) VALUES ('7bb075e0-70c3-44c2-811e-cd7bba757927', 'datalake', 'drug-supply-chain-optimization', 'site-inventory', '2025-10-28 18:07:33.673309', NULL, NULL);
INSERT INTO public.data_output_configurations (id, configuration_type) VALUES ('dc1cc43b-698e-424c-af5b-27f68f0c0781', 'DatabricksTechnicalAssetConfiguration');
INSERT INTO public.databricks_technical_asset_configurations (id, bucket_identifier, "catalog", schema, catalog_path, table_path, "table", access_granularity, created_on, updated_on, deleted_at) VALUES ('dc1cc43b-698e-424c-af5b-27f68f0c0781', '', 'customer-intelligence-platform', '', 'customer-intelligence-platform', 'custmer-master-data', 'custmer-master-data', 'table', '2025-10-28 18:09:39.615998', NULL, NULL);
INSERT INTO public.data_output_configurations (id, configuration_type) VALUES ('8d18f556-ccd2-425e-8e48-f24c185a053e', 'DatabricksTechnicalAssetConfiguration');
INSERT INTO public.databricks_technical_asset_configurations (id, bucket_identifier, "catalog", schema, catalog_path, table_path, "table", access_granularity, created_on, updated_on, deleted_at) VALUES ('8d18f556-ccd2-425e-8e48-f24c185a053e', '', 'customer-intelligence-platform', '', 'customer-intelligence-platform', 'engagement-activity', 'engagement-activity', 'table', '2025-10-28 18:10:04.633488', NULL, NULL);
INSERT INTO public.data_output_configurations (id, configuration_type) VALUES ('da19237f-eaf6-4a0a-8090-a2b724189978', 'DatabricksTechnicalAssetConfiguration');
INSERT INTO public.databricks_technical_asset_configurations (id, bucket_identifier, "catalog", schema, catalog_path, table_path, "table", access_granularity, created_on, updated_on, deleted_at) VALUES ('da19237f-eaf6-4a0a-8090-a2b724189978', '', 'enterprise-knowledge-graph', '', 'enterprise-knowledge-graph', '*', '*', 'table', '2025-10-28 18:12:07.053708', NULL, NULL);
INSERT INTO public.data_output_configurations (id, configuration_type) VALUES ('502d4484-e332-4854-a2d8-7c387906f459', 'DatabricksTechnicalAssetConfiguration');
INSERT INTO public.databricks_technical_asset_configurations (id, bucket_identifier, "catalog", schema, catalog_path, table_path, "table", access_granularity, created_on, updated_on, deleted_at) VALUES ('502d4484-e332-4854-a2d8-7c387906f459', '', 'enterprise-knowledge-graph', '', 'enterprise-knowledge-graph', '*', '*', 'table', '2025-10-28 18:12:22.129267', NULL, NULL);
INSERT INTO public.data_output_configurations (id, configuration_type) VALUES ('af1e8de6-3dc8-43e5-9c74-597c5676c137', 'GlueTechnicalAssetConfiguration');
INSERT INTO public.glue_technical_asset_configurations (id, bucket_identifier, "database", database_suffix, "table", database_path, table_path, access_granularity, created_on, updated_on, deleted_at) VALUES ('af1e8de6-3dc8-43e5-9c74-597c5676c137', '', 'employee-productivity', '', '*', 'employee-productivity', '*', 'table', '2025-10-28 18:14:25.794897', NULL, NULL);
INSERT INTO public.data_output_configurations (id, configuration_type) VALUES ('677a9352-a968-44be-a5df-6e5e4094ebe7', 'GlueTechnicalAssetConfiguration');
INSERT INTO public.glue_technical_asset_configurations (id, bucket_identifier, "database", database_suffix, "table", database_path, table_path, access_granularity, created_on, updated_on, deleted_at) VALUES ('677a9352-a968-44be-a5df-6e5e4094ebe7', '', 'employee-productivity', '', '*', 'employee-productivity', '*', 'table', '2025-10-28 18:15:10.920954', NULL, NULL);
INSERT INTO public.data_output_configurations (id, configuration_type) VALUES ('44daa0b4-a027-4e5b-b233-b8342da71c38', 'DatabricksTechnicalAssetConfiguration');
INSERT INTO public.databricks_technical_asset_configurations (id, bucket_identifier, "catalog", schema, catalog_path, table_path, "table", access_granularity, created_on, updated_on, deleted_at) VALUES ('44daa0b4-a027-4e5b-b233-b8342da71c38', '', 'dei-insights-dashboard', '', 'dei-insights-dashboard', '*', '*', 'table', '2025-10-28 18:17:04.80167', NULL, NULL);
INSERT INTO public.data_output_configurations (id, configuration_type) VALUES ('e0875fbb-f2ff-4804-a9ba-c9c3b006fca3', 'DatabricksTechnicalAssetConfiguration');
INSERT INTO public.databricks_technical_asset_configurations (id, bucket_identifier, "catalog", schema, catalog_path, table_path, "table", access_granularity, created_on, updated_on, deleted_at) VALUES ('e0875fbb-f2ff-4804-a9ba-c9c3b006fca3', '', 'dei-insights-dashboard', '', 'dei-insights-dashboard', '*', '*', 'table', '2025-10-28 18:17:20.241114', NULL, NULL);
INSERT INTO public.data_output_configurations (id, configuration_type) VALUES ('ff632a7d-4ddd-4fd1-800a-ba8098c26c18', 'GlueTechnicalAssetConfiguration');
INSERT INTO public.glue_technical_asset_configurations (id, bucket_identifier, "database", database_suffix, "table", database_path, table_path, access_granularity, created_on, updated_on, deleted_at) VALUES ('ff632a7d-4ddd-4fd1-800a-ba8098c26c18', '', 'sales-performance-model', '', '*', 'sales-performance-model', '*', 'table', '2025-10-28 18:19:44.674412', NULL, NULL);
INSERT INTO public.data_output_configurations (id, configuration_type) VALUES ('e8129149-bdb5-4c15-8211-4b6b83fcb64a', 'GlueTechnicalAssetConfiguration');
INSERT INTO public.glue_technical_asset_configurations (id, bucket_identifier, "database", database_suffix, "table", database_path, table_path, access_granularity, created_on, updated_on, deleted_at) VALUES ('e8129149-bdb5-4c15-8211-4b6b83fcb64a', '', 'sales-performance-model', '', '*', 'sales-performance-model', '*', 'table', '2025-10-28 18:20:01.401722', NULL, NULL);
INSERT INTO public.data_output_configurations (id, configuration_type) VALUES ('74db2ed9-b28a-4875-8eb5-17b9fe445c8d', 'GlueTechnicalAssetConfiguration');
INSERT INTO public.glue_technical_asset_configurations (id, bucket_identifier, "database", database_suffix, "table", database_path, table_path, access_granularity, created_on, updated_on, deleted_at) VALUES ('74db2ed9-b28a-4875-8eb5-17b9fe445c8d', '', 'patient-stratification-engine', '', '*', 'patient-stratification-engine', '*', 'table', '2025-10-28 18:30:00.415068', NULL, NULL);
INSERT INTO public.data_output_configurations (id, configuration_type) VALUES ('22e9a60d-e8f8-4bf5-9efd-500f407dbb47', 'GlueTechnicalAssetConfiguration');
INSERT INTO public.glue_technical_asset_configurations (id, bucket_identifier, "database", database_suffix, "table", database_path, table_path, access_granularity, created_on, updated_on, deleted_at) VALUES ('22e9a60d-e8f8-4bf5-9efd-500f407dbb47', '', 'patient-stratification-engine', '', '*', 'patient-stratification-engine', '*', 'table', '2025-10-28 18:30:28.256785', NULL, NULL);
INSERT INTO public.data_output_configurations (id, configuration_type) VALUES ('2ea14ab5-a45b-4799-86fc-d6285377a4d6', 'GlueTechnicalAssetConfiguration');
INSERT INTO public.glue_technical_asset_configurations (id, bucket_identifier, "database", database_suffix, "table", database_path, table_path, access_granularity, created_on, updated_on, deleted_at) VALUES ('2ea14ab5-a45b-4799-86fc-d6285377a4d6', '', 'patient-stratification-engine', '', '*', 'patient-stratification-engine', '*', 'table', '2025-10-28 18:30:57.415321', NULL, NULL);
INSERT INTO public.data_output_configurations (id, configuration_type) VALUES ('bbed68d4-8bda-420a-a6cf-37cb32ba9d45', 'GlueTechnicalAssetConfiguration');
INSERT INTO public.glue_technical_asset_configurations (id, bucket_identifier, "database", database_suffix, "table", database_path, table_path, access_granularity, created_on, updated_on, deleted_at) VALUES ('bbed68d4-8bda-420a-a6cf-37cb32ba9d45', '', 'rd-portfolio-prioritization-model', '', '*', 'rd-portfolio-prioritization-model', '*', 'table', '2025-10-28 18:35:42.552188', NULL, NULL);
INSERT INTO public.data_output_configurations (id, configuration_type) VALUES ('8b6b6b35-c155-4f13-a847-c7598b08cea9', 'GlueTechnicalAssetConfiguration');
INSERT INTO public.glue_technical_asset_configurations (id, bucket_identifier, "database", database_suffix, "table", database_path, table_path, access_granularity, created_on, updated_on, deleted_at) VALUES ('8b6b6b35-c155-4f13-a847-c7598b08cea9', '', 'rd-portfolio-prioritization-model', '', '*', 'rd-portfolio-prioritization-model', '*', 'table', '2025-10-28 18:36:26.66997', NULL, NULL);
-- INSERT ROLE ASSIGNMENTS FOR DATA PRODUCTS
INSERT INTO public.role_assignments_data_product (id, data_product_id, user_id, role_id, decision, requested_by_id, requested_on, decided_by_id, decided_on, created_on, updated_on, deleted_at) VALUES ('3502276b-b9b3-47f2-901b-3c4502fb7d1e', '81815c4c-f323-4cf1-b25b-f43f231f510f', john_id, 'e43b6f7a-e776-49b2-9b51-117d8644d971', 'APPROVED', john_id, '2025-10-28 16:32:57.902449', john_id, '2025-10-28 16:32:57.910346', '2025-10-28 16:32:57.89898', '2025-10-28 16:32:57.908607', NULL);
INSERT INTO public.role_assignments_data_product (id, data_product_id, user_id, role_id, decision, requested_by_id, requested_on, decided_by_id, decided_on, created_on, updated_on, deleted_at) VALUES ('5a1f650c-a4cf-4a59-825c-08fa699617ca', '6e580d91-14ea-495e-a6d7-5db236a5c1d5', jane_id, 'e43b6f7a-e776-49b2-9b51-117d8644d971', 'APPROVED', john_id, '2025-10-28 16:37:39.90644', john_id, '2025-10-28 16:37:39.917665', '2025-10-28 16:37:39.901065', '2025-10-28 16:37:39.914117', NULL);
INSERT INTO public.role_assignments_data_product (id, data_product_id, user_id, role_id, decision, requested_by_id, requested_on, decided_by_id, decided_on, created_on, updated_on, deleted_at) VALUES ('4c94a3f1-1fd3-44ea-aef2-c220773eb969', '6e580d91-14ea-495e-a6d7-5db236a5c1d5', john_id, 'e43b6f7a-e776-49b2-9b51-117d8644d971', 'APPROVED', john_id, '2025-10-28 16:41:33.829482', john_id, '2025-10-28 16:41:33.839374', '2025-10-28 16:41:33.822617', '2025-10-28 16:41:33.836909', NULL);
INSERT INTO public.role_assignments_data_product (id, data_product_id, user_id, role_id, decision, requested_by_id, requested_on, decided_by_id, decided_on, created_on, updated_on, deleted_at) VALUES ('da86ebb4-5e20-4be8-88ed-3d33a890c7a9', '9fa5e299-fcc4-45e0-b48d-cc3deb68eefe', john_id, 'e43b6f7a-e776-49b2-9b51-117d8644d971', 'APPROVED', john_id, '2025-10-28 17:56:19.876226', john_id, '2025-10-28 17:56:19.881112', '2025-10-28 17:56:19.873821', '2025-10-28 17:56:19.880351', NULL);
INSERT INTO public.role_assignments_data_product (id, data_product_id, user_id, role_id, decision, requested_by_id, requested_on, decided_by_id, decided_on, created_on, updated_on, deleted_at) VALUES ('d3695c76-2163-41f7-bff7-bd1dedcc8096', 'fbcd7899-2763-4659-bd28-2a278910ef85', john_id, 'e43b6f7a-e776-49b2-9b51-117d8644d971', 'APPROVED', john_id, '2025-10-28 17:59:19.862559', john_id, '2025-10-28 17:59:19.8694', '2025-10-28 17:59:19.858731', '2025-10-28 17:59:19.867782', NULL);
INSERT INTO public.role_assignments_data_product (id, data_product_id, user_id, role_id, decision, requested_by_id, requested_on, decided_by_id, decided_on, created_on, updated_on, deleted_at) VALUES ('bfac90c4-9290-472b-9123-0b2f4ae45d2e', 'fbcd7899-2763-4659-bd28-2a278910ef85', jane_id, 'e43b6f7a-e776-49b2-9b51-117d8644d971', 'APPROVED', john_id, '2025-10-28 17:59:19.88175', john_id, '2025-10-28 17:59:19.887169', '2025-10-28 17:59:19.874011', '2025-10-28 17:59:19.885869', NULL);
INSERT INTO public.role_assignments_data_product (id, data_product_id, user_id, role_id, decision, requested_by_id, requested_on, decided_by_id, decided_on, created_on, updated_on, deleted_at) VALUES ('5c6f6c98-1401-4ca1-a577-0a9e8db701a9', '08039e5d-50a7-447a-b691-f5dc6b420dea', jane_id, 'e43b6f7a-e776-49b2-9b51-117d8644d971', 'APPROVED', john_id, '2025-10-28 18:01:54.338886', john_id, '2025-10-28 18:01:54.343617', '2025-10-28 18:01:54.336493', '2025-10-28 18:01:54.342708', NULL);
INSERT INTO public.role_assignments_data_product (id, data_product_id, user_id, role_id, decision, requested_by_id, requested_on, decided_by_id, decided_on, created_on, updated_on, deleted_at) VALUES ('54b4577d-f571-4d53-99e5-e83380c47438', '08039e5d-50a7-447a-b691-f5dc6b420dea', john_id, 'e43b6f7a-e776-49b2-9b51-117d8644d971', 'APPROVED', john_id, '2025-10-28 18:01:54.352817', john_id, '2025-10-28 18:01:54.356766', '2025-10-28 18:01:54.347504', '2025-10-28 18:01:54.356012', NULL);
INSERT INTO public.role_assignments_data_product (id, data_product_id, user_id, role_id, decision, requested_by_id, requested_on, decided_by_id, decided_on, created_on, updated_on, deleted_at) VALUES ('7c5123ac-0e60-43a1-bdfd-54ff59d4164c', '625b65b6-13d9-4c8c-a669-865e36fc3dfc', john_id, 'e43b6f7a-e776-49b2-9b51-117d8644d971', 'APPROVED', john_id, '2025-10-28 18:05:44.192946', john_id, '2025-10-28 18:05:44.198121', '2025-10-28 18:05:44.190775', '2025-10-28 18:05:44.197289', NULL);
INSERT INTO public.role_assignments_data_product (id, data_product_id, user_id, role_id, decision, requested_by_id, requested_on, decided_by_id, decided_on, created_on, updated_on, deleted_at) VALUES ('44cec659-3489-447d-850f-c8ea65ec6f5a', '22488fe0-c30a-4447-972e-3eb22a1bd266', john_id, 'e43b6f7a-e776-49b2-9b51-117d8644d971', 'APPROVED', john_id, '2025-10-28 18:09:11.683137', john_id, '2025-10-28 18:09:11.688498', '2025-10-28 18:09:11.679884', '2025-10-28 18:09:11.6877', NULL);
INSERT INTO public.role_assignments_data_product (id, data_product_id, user_id, role_id, decision, requested_by_id, requested_on, decided_by_id, decided_on, created_on, updated_on, deleted_at) VALUES ('7676860f-32be-49b2-adbf-85087ce9da9d', '90e65438-a942-43e0-a4a9-ee406b92df65', john_id, 'e43b6f7a-e776-49b2-9b51-117d8644d971', 'APPROVED', john_id, '2025-10-28 18:11:47.504193', john_id, '2025-10-28 18:11:47.508956', '2025-10-28 18:11:47.502037', '2025-10-28 18:11:47.508201', NULL);
INSERT INTO public.role_assignments_data_product (id, data_product_id, user_id, role_id, decision, requested_by_id, requested_on, decided_by_id, decided_on, created_on, updated_on, deleted_at) VALUES ('8591f923-2696-4aa6-98ed-e396c7cb2ded', '68b28e38-3faa-45ca-9d00-3830d0a7b108', john_id, 'e43b6f7a-e776-49b2-9b51-117d8644d971', 'APPROVED', john_id, '2025-10-28 18:14:07.388736', john_id, '2025-10-28 18:14:07.394139', '2025-10-28 18:14:07.385202', '2025-10-28 18:14:07.393015', NULL);
INSERT INTO public.role_assignments_data_product (id, data_product_id, user_id, role_id, decision, requested_by_id, requested_on, decided_by_id, decided_on, created_on, updated_on, deleted_at) VALUES ('437b00ab-7473-4a31-b5ff-f15794d9b56e', '97af957a-70c4-465d-95f2-f70c11af8da0', john_id, 'e43b6f7a-e776-49b2-9b51-117d8644d971', 'APPROVED', john_id, '2025-10-28 18:16:50.723993', john_id, '2025-10-28 18:16:50.72973', '2025-10-28 18:16:50.720213', '2025-10-28 18:16:50.728845', NULL);
INSERT INTO public.role_assignments_data_product (id, data_product_id, user_id, role_id, decision, requested_by_id, requested_on, decided_by_id, decided_on, created_on, updated_on, deleted_at) VALUES ('9ef6eaae-f46e-440a-8cd6-88d30de94516', '86b74246-734f-4cea-a984-3dd0d27fc565', john_id, 'e43b6f7a-e776-49b2-9b51-117d8644d971', 'APPROVED', john_id, '2025-10-28 18:19:20.46085', john_id, '2025-10-28 18:19:20.465528', '2025-10-28 18:19:20.458588', '2025-10-28 18:19:20.464641', NULL);
INSERT INTO public.role_assignments_data_product (id, data_product_id, user_id, role_id, decision, requested_by_id, requested_on, decided_by_id, decided_on, created_on, updated_on, deleted_at) VALUES ('884c0d5e-e442-4bdf-8a67-c0e752e80d86', '58b837a5-33d0-41cf-bf95-eb9af846f4d0', john_id, 'e43b6f7a-e776-49b2-9b51-117d8644d971', 'APPROVED', john_id, '2025-10-28 18:29:24.843296', john_id, '2025-10-28 18:29:24.848553', '2025-10-28 18:29:24.841102', '2025-10-28 18:29:24.847524', NULL);
INSERT INTO public.role_assignments_data_product (id, data_product_id, user_id, role_id, decision, requested_by_id, requested_on, decided_by_id, decided_on, created_on, updated_on, deleted_at) VALUES ('240dbbb2-ea7f-4900-8a02-30ec084e0a5d', 'ccdc13fa-4a1a-4dde-ad1c-efa0d58eafb7', john_id, 'e43b6f7a-e776-49b2-9b51-117d8644d971', 'APPROVED', john_id, '2025-10-28 18:34:32.318606', john_id, '2025-10-28 18:34:32.323823', '2025-10-28 18:34:32.316108', '2025-10-28 18:34:32.323078', NULL);
-- ------------------------------------------------------------------------------------------------
-- START of Insert dynamic dataset query stats
-- ------------------------------------------------------------------------------------------------
-- 1. Sales performance (adding 4 to test the other category aggregation)
-- Single-query daily consumer over the last six months
INSERT INTO public.dataset_query_stats_daily (date, dataset_id, consumer_data_product_id, query_count)
SELECT gs::date, sales_performance_model_output_port, revenue_dashboard, 1
FROM generate_series((CURRENT_DATE - INTERVAL '6 months')::date, CURRENT_DATE - 1, INTERVAL '1 day') AS gs;
-- -- Ten weekday queries for the last four months
INSERT INTO public.dataset_query_stats_daily (date, dataset_id, consumer_data_product_id, query_count)
SELECT gs::date, sales_performance_model_output_port, cash_flow_monitoring, 10
FROM generate_series((CURRENT_DATE - INTERVAL '4 months')::date, CURRENT_DATE - 1, INTERVAL '1 day') AS gs
WHERE EXTRACT(ISODOW FROM gs) BETWEEN 1 AND 5;
-- -- Weekly Monday pings (consumer #3)
INSERT INTO public.dataset_query_stats_daily (date, dataset_id, consumer_data_product_id, query_count)
SELECT gs::date, sales_performance_model_output_port, fraud_detection, 3
FROM generate_series((CURRENT_DATE - INTERVAL '5 months')::date, CURRENT_DATE - 1, INTERVAL '1 day') AS gs
WHERE EXTRACT(ISODOW FROM gs) = 1;
-- -- Mid-week bursts (consumer #4)
INSERT INTO public.dataset_query_stats_daily (date, dataset_id, consumer_data_product_id, query_count)
SELECT gs::date, sales_performance_model_output_port, financial_risk_assessment, 8
FROM generate_series((CURRENT_DATE - INTERVAL '4 months')::date, CURRENT_DATE - 1, INTERVAL '1 day') AS gs
WHERE EXTRACT(ISODOW FROM gs) = 3;
-- ------------------------------------------------------------------------------------------------
-- START of Insert data quality summary for half of the existing datasets
-- ------------------------------------------------------------------------------------------------
WITH dataset_selection AS (
-- Get up to 20 datasets and assign a row number for variety in data generation
SELECT id, name, ROW_NUMBER() OVER (ORDER BY id) as rn
FROM public.datasets
LIMIT 20
),
summary_generation AS (
SELECT
gen_random_uuid() as summary_id,
id as dataset_id,
name as dataset_name,
rn,
(ARRAY['success', 'failure', 'warning', 'error'])[((rn - 1) % 4) + 1] as status
FROM dataset_selection
)
INSERT INTO public.output_port_data_quality_summaries
(id, output_port_id, assets_with_checks, assets_with_issues, details_url, description, overall_status, created_at, dimensions)
SELECT
summary_id,
dataset_id,
10 + rn,
CASE WHEN status = 'success' THEN 0 ELSE (rn % 3) + 1 END,
'https://quality-tool.internal/view/' || dataset_id,
'Recursive CTE generated report for ' || dataset_name,
status,
NOW() - (rn || ' hours')::interval,
json_build_object('validity', lower(status), 'completeness', 'success')
FROM summary_generation;
-- 2. Generate the Technical Assets
WITH dataset_selection AS (
SELECT id, name, ROW_NUMBER() OVER (ORDER BY id) as rn FROM public.datasets LIMIT 20
),
summary_mapping AS (
-- We need to join back to the summaries we just created to get the IDs
SELECT s.id as summary_id, d.name as dataset_name, d.rn
FROM public.output_port_data_quality_summaries s
JOIN dataset_selection d ON s.output_port_id = d.id
)
INSERT INTO public.data_quality_technical_assets (name, status, data_quality_summary_id)
SELECT dataset_name || '_table', 'success', summary_id FROM summary_mapping
UNION ALL
SELECT dataset_name || '_view', 'warning', summary_id FROM summary_mapping;
end $$;