datahub/data-model/DDL/ETL_DDL/owner_metadata.sql

75 lines
3.3 KiB
MySQL
Raw Normal View History

2015-12-03 17:09:03 -08:00
--
-- Copyright 2015 LinkedIn Corp. All rights reserved.
--
-- Licensed under the Apache License, Version 2.0 (the "License");
-- you may not use this file except in compliance with the License.
-- You may obtain a copy of the License at
--
-- http://www.apache.org/licenses/LICENSE-2.0
--
-- Unless required by applicable law or agreed to in writing, software
-- distributed under the License is distributed on an "AS IS" BASIS,
-- WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
--
CREATE TABLE dataset_owner (
`dataset_id` INT UNSIGNED NOT NULL,
`dataset_urn` VARCHAR(200) NOT NULL,
`owner_id` VARCHAR(127) NOT NULL,
2015-12-07 15:27:20 -08:00
`app_id` SMALLINT NOT NULL COMMENT 'application id of the namespace',
2015-12-03 17:09:03 -08:00
`namespace` VARCHAR(127) COMMENT 'the namespace of the user',
`owner_type` VARCHAR(127) COMMENT 'Producer, Consumer, Stakeholder',
`owner_sub_type` VARCHAR(127) COMMENT 'DWH, UMP, BA, etc',
`db_ids` VARCHAR(127) COMMENT 'comma separated database ids',
`is_group` CHAR(1) COMMENT 'if owner is a group',
`is_active` CHAR(1) COMMENT 'if owner is active',
`is_deleted` CHAR(1) COMMENT 'if owner has been removed from the dataset',
`sort_id` SMALLINT COMMENT '0 = primary owner, order by priority/importance',
`source_time` INT UNSIGNED COMMENT 'the source time in epoch',
`created_time` INT UNSIGNED COMMENT 'the create time in epoch',
`modified_time` INT UNSIGNED COMMENT 'the modified time in epoch',
wh_etl_exec_id BIGINT COMMENT 'wherehows etl execution id that modified this record',
2015-12-07 15:27:20 -08:00
PRIMARY KEY (`dataset_id`, `owner_id`, `app_id`),
UNIQUE KEY (`dataset_urn`, `owner_id`, `app_id`)
2015-12-03 17:09:03 -08:00
);
CREATE TABLE stg_dataset_owner (
`dataset_id` INT COMMENT 'dataset_id',
`dataset_urn` VARCHAR(200) NOT NULL,
`owner_id` VARCHAR(127) NOT NULL,
`sort_id` SMALLINT COMMENT '0 = primary owner, order by priority/importance',
`app_id` INT COMMENT 'application id of the namesapce',
`namespace` VARCHAR(127) COMMENT 'the namespace of the user',
`owner_type` VARCHAR(127) COMMENT 'Producer, Consumer, Stakeholder',
`owner_sub_type` VARCHAR(127) COMMENT 'DWH, UMP, BA, etc',
`is_group` CHAR(1) COMMENT 'if owner is a group',
`db_name` VARCHAR(127) COMMENT 'database name',
`db_id` INT COMMENT 'database id',
`is_active` CHAR(1) COMMENT 'if owner is active',
`source_time` INT UNSIGNED COMMENT 'the source event time in epoch',
`is_parent_urn` CHAR(1) DEFAULT 'N' COMMENT 'if the urn is a directory for datasets',
2015-12-07 15:27:20 -08:00
KEY (dataset_urn, owner_id, namespace, db_name),
KEY dataset_index (dataset_urn),
KEY db_name_index (db_name)
2015-12-03 17:09:03 -08:00
);
CREATE TABLE stg_dataset_owner_unmatched (
`dataset_urn` VARCHAR(200) NOT NULL,
`owner_id` VARCHAR(127) NOT NULL,
`sort_id` SMALLINT COMMENT '0 = primary owner, order by priority/importance',
`app_id` INT COMMENT 'application id of the namesapce',
`namespace` VARCHAR(127) COMMENT 'the namespace of the user',
`owner_type` VARCHAR(127) COMMENT 'Producer, Consumer, Stakeholder',
`owner_sub_type` VARCHAR(127) COMMENT 'DWH, UMP, BA, etc',
`is_group` CHAR(1) COMMENT 'if owner is a group',
`db_name` VARCHAR(127) COMMENT 'database name',
`db_id` INT COMMENT 'database id',
`is_active` CHAR(1) COMMENT 'if owner is active',
`source_time` INT UNSIGNED COMMENT 'the source event time in epoch',
2015-12-07 15:27:20 -08:00
KEY (dataset_urn, owner_id, namespace, db_name),
KEY dataset_index (dataset_urn),
KEY db_name_index (db_name)
2015-12-03 17:09:03 -08:00
);