--
-- Copyright 2015 LinkedIn Corp. All rights reserved.
--
-- Licensed under the Apache License, Version 2.0 (the "License");
-- you may not use this file except in compliance with the License.
-- You may obtain a copy of the License at
--
-- http://www.apache.org/licenses/LICENSE-2.0
--
-- Unless required by applicable law or agreed to in writing, software
-- distributed under the License is distributed on an "AS IS" BASIS,
-- WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
--
-- create statements for dataset-related tables:
-- dict_dataset, dict_dataset_sample, dict_field_detail, dict_dataset_schema_history
-- staging table for dataset
-- Staging copy of dataset metadata, keyed by (urn, db_id).
-- The table is hash-partitioned on db_id into 8 partitions; db_id is part of the
-- primary key, which MySQL requires of a partitioning column. db_id carries no
-- explicit NOT NULL, but MySQL makes primary-key columns NOT NULL implicitly.
-- Text-heavy columns (schema, properties, fields) are utf8; the table default is latin1.
CREATE TABLE `stg_dict_dataset` (
  `name` VARCHAR(200) NOT NULL,
  `schema` MEDIUMTEXT CHARACTER SET utf8,
  `schema_type` VARCHAR(50) DEFAULT 'JSON' COMMENT 'JSON, Hive, DDL, XML, CSV',
  `properties` TEXT CHARACTER SET utf8,
  `fields` MEDIUMTEXT CHARACTER SET utf8,
  `db_id` SMALLINT UNSIGNED,
  `urn` VARCHAR(500) NOT NULL,
  `source` VARCHAR(50) NULL,
  `location_prefix` VARCHAR(200) NULL,
  `parent_name` VARCHAR(500) NULL
    COMMENT 'Schema Name for RDBMS, Group Name for Jobs/Projects/Tracking Datasets on HDFS',
  `storage_type` ENUM('Table', 'View', 'Avro', 'ORC', 'RC', 'Sequence', 'Flat File', 'JSON', 'BINARY_JSON', 'XML', 'Thrift', 'Parquet', 'Protobuff') NULL,
  `ref_dataset_name` VARCHAR(200) NULL,
  `ref_dataset_id` INT(11) UNSIGNED NULL
    COMMENT 'Refer to Master/Main dataset for Views/ExternalTables',
  `is_active` BOOLEAN NULL COMMENT 'is the dataset active / exist ?',
  `is_deprecated` BOOLEAN NULL COMMENT 'is the dataset deprecated by user ?',
  `dataset_type` VARCHAR(30) NULL
    COMMENT 'hdfs, hive, kafka, teradata, mysql, sqlserver, file, nfs, pinot, salesforce, oracle, db2, netezza, cassandra, hbase, qfs, zfs',
  `hive_serdes_class` VARCHAR(300) NULL,
  `is_partitioned` CHAR(1) NULL,
  `partition_layout_pattern_id` SMALLINT(6) NULL,
  `sample_partition_full_path` VARCHAR(256)
    COMMENT 'sample partition full path of the dataset',
  -- time columns are unsigned integers (presumably epoch seconds -- TODO confirm)
  `source_created_time` INT UNSIGNED NULL
    COMMENT 'source created time of the flow',
  `source_modified_time` INT UNSIGNED NULL
    COMMENT 'latest source modified time of the flow',
  `created_time` INT UNSIGNED COMMENT 'wherehows created time',
  `modified_time` INT UNSIGNED COMMENT 'latest wherehows modified',
  `wh_etl_exec_id` BIGINT COMMENT 'wherehows etl execution id that modified this record',
  PRIMARY KEY (`urn`, `db_id`)
)
  ENGINE = InnoDB
  DEFAULT CHARSET = latin1
  PARTITION BY HASH (db_id)
  PARTITIONS 8;
-- dataset table
-- Main dataset table: one row per dataset, with a surrogate auto-increment id
-- as primary key and a unique constraint on urn.
-- Text-heavy columns (schema, properties, fields) are utf8; the table default is latin1.
CREATE TABLE `dict_dataset` (
  `id` INT(11) UNSIGNED NOT NULL AUTO_INCREMENT,
  `name` VARCHAR(200) NOT NULL,
  `schema` MEDIUMTEXT CHARACTER SET utf8,
  `schema_type` VARCHAR(50) DEFAULT 'JSON'
    COMMENT 'JSON, Hive, DDL, XML, CSV',
  `properties` TEXT CHARACTER SET utf8,
  `fields` MEDIUMTEXT CHARACTER SET utf8,
  `urn` VARCHAR(500) NOT NULL,
  `source` VARCHAR(50) NULL
    COMMENT 'The original data source type (for dataset in data warehouse). Oracle, Kafka ...',
  `location_prefix` VARCHAR(200) NULL,
  `parent_name` VARCHAR(500) NULL
    COMMENT 'Schema Name for RDBMS, Group Name for Jobs/Projects/Tracking Datasets on HDFS',
  `storage_type` ENUM('Table', 'View', 'Avro', 'ORC', 'RC', 'Sequence', 'Flat File', 'JSON', 'BINARY_JSON', 'XML', 'Thrift', 'Parquet', 'Protobuff') NULL,
  `ref_dataset_id` INT(11) UNSIGNED NULL
    COMMENT 'Refer to Master/Main dataset for Views/ExternalTables',
  `is_active` BOOLEAN NULL COMMENT 'is the dataset active / exist ?',
  `is_deprecated` BOOLEAN NULL COMMENT 'is the dataset deprecated by user ?',
  `dataset_type` VARCHAR(30) NULL
    COMMENT 'hdfs, hive, kafka, teradata, mysql, sqlserver, file, nfs, pinot, salesforce, oracle, db2, netezza, cassandra, hbase, qfs, zfs',
  `hive_serdes_class` VARCHAR(300) NULL,
  `is_partitioned` CHAR(1) NULL,
  `partition_layout_pattern_id` SMALLINT(6) NULL,
  `sample_partition_full_path` VARCHAR(256)
    COMMENT 'sample partition full path of the dataset',
  -- time columns are unsigned integers (presumably epoch seconds -- TODO confirm)
  `source_created_time` INT UNSIGNED NULL
    COMMENT 'source created time of the flow',
  `source_modified_time` INT UNSIGNED NULL
    COMMENT 'latest source modified time of the flow',
  `created_time` INT UNSIGNED COMMENT 'wherehows created time',
  `modified_time` INT UNSIGNED COMMENT 'latest wherehows modified',
  `wh_etl_exec_id` BIGINT COMMENT 'wherehows etl execution id that modified this record',
  PRIMARY KEY (`id`),
  UNIQUE KEY `uq_dataset_urn` (`urn`)
)
  ENGINE = InnoDB
  DEFAULT CHARSET = latin1;
-- staging table for sample data
-- Staging table for dataset sample data, keyed by (db_id, urn).
-- ref_urn has its own secondary index. db_id carries no explicit NOT NULL, but
-- MySQL makes primary-key columns NOT NULL implicitly.
CREATE TABLE `stg_dict_dataset_sample` (
  `db_id` SMALLINT UNSIGNED,
  `urn` VARCHAR(200) NOT NULL DEFAULT '',
  `dataset_id` INT(11) NULL,
  `ref_urn` VARCHAR(200) NULL,
  `ref_id` INT(11) NULL,
  `data` MEDIUMTEXT,
  PRIMARY KEY (`db_id`, `urn`),
  KEY `ref_urn_key` (`ref_urn`)
)
  ENGINE = InnoDB
  DEFAULT CHARSET = utf8;
-- sample data table
-- Sample data per dataset: surrogate auto-increment id as primary key, and a
-- unique key on dataset_id so each dataset has at most one sample row.
CREATE TABLE `dict_dataset_sample` (
  `id` INT(11) NOT NULL AUTO_INCREMENT,
  `dataset_id` INT(11) NULL,
  `urn` VARCHAR(200) NULL,
  `ref_id` INT(11) NULL
    COMMENT 'Reference dataset id of which dataset that we fetch sample from. e.g. for tables we do not have permission, fetch sample data from DWH_STG correspond tables',
  `data` MEDIUMTEXT,
  `modified` DATETIME NULL,
  `created` DATETIME NULL,
  PRIMARY KEY (`id`),
  UNIQUE KEY `ak_dict_dataset_sample__datasetid` (`dataset_id`)
)
  ENGINE = InnoDB
  AUTO_INCREMENT = 0
  DEFAULT CHARSET = utf8;
-- staging table for field detail
-- Staging table for per-field (column) metadata, keyed by (urn, sort_id, db_id).
-- The table is hash-partitioned on db_id into 8 partitions; db_id is part of the
-- primary key, which MySQL requires of a partitioning column. db_id carries no
-- explicit NOT NULL, but MySQL makes primary-key columns NOT NULL implicitly.
CREATE TABLE `stg_dict_field_detail` (
  `db_id` SMALLINT UNSIGNED,
  `urn` VARCHAR(200) NOT NULL,
  `sort_id` SMALLINT(5) UNSIGNED NOT NULL,
  `parent_sort_id` SMALLINT(5) UNSIGNED NOT NULL,
  `parent_path` VARCHAR(200) NULL,
  `field_name` VARCHAR(100) NOT NULL,
  `field_label` VARCHAR(100) NULL,
  `data_type` VARCHAR(50) NOT NULL,
  `data_size` INT(10) UNSIGNED NULL,
  `data_precision` TINYINT(3) UNSIGNED NULL,
  `data_scale` TINYINT(3) UNSIGNED NULL,
  `is_nullable` CHAR(1) NULL,
  `is_indexed` CHAR(1) NULL,
  `is_partitioned` CHAR(1) NULL,
  `is_distributed` CHAR(1) NULL,
  `default_value` VARCHAR(200) NULL,
  `namespace` VARCHAR(200) NULL,
  `description` VARCHAR(1000) NULL,
  -- refreshed automatically by MySQL on every row update
  `last_modified` TIMESTAMP NOT NULL DEFAULT CURRENT_TIMESTAMP ON UPDATE CURRENT_TIMESTAMP,
  `dataset_id` INT UNSIGNED NULL COMMENT 'used to opitimize metadata ETL performance',
  -- prefix index: only the first 100 characters of description are indexed
  KEY `idx_stg_dict_field_detail__description` (`description`(100)),
  PRIMARY KEY (`urn`, `sort_id`, `db_id`)
)
  ENGINE = InnoDB
  DEFAULT CHARSET = latin1
  PARTITION BY HASH (db_id)
  PARTITIONS 8;
-- field detail table
-- Flattened fields/columns of each dataset, one row per field.
-- Primary key is the surrogate field_id. Two unique keys apply per dataset:
-- (dataset_id, parent_path, field_name) and (dataset_id, sort_id).
CREATE TABLE `dict_field_detail` (
  `field_id` INT(11) UNSIGNED NOT NULL AUTO_INCREMENT,
  `dataset_id` INT(11) UNSIGNED NOT NULL,
  `fields_layout_id` INT(11) UNSIGNED NOT NULL,
  `sort_id` SMALLINT(6) UNSIGNED NOT NULL,
  `parent_sort_id` SMALLINT(5) UNSIGNED NOT NULL,
  `parent_path` VARCHAR(200) NULL,
  `field_name` VARCHAR(100) NOT NULL,
  `field_label` VARCHAR(100) NULL,
  `data_type` VARCHAR(50) NOT NULL,
  `data_size` INT(10) UNSIGNED NULL,
  `data_precision` TINYINT(4) NULL
    COMMENT 'only in decimal type',
  `data_fraction` TINYINT(4) NULL
    COMMENT 'only in decimal type',
  -- NOTE(review): the comment below reads as if it describes `comment_ids`
  -- rather than `default_comment_id`; kept as-is -- confirm intended placement.
  `default_comment_id` INT(11) UNSIGNED NULL
    COMMENT 'a list of comment_id',
  `comment_ids` VARCHAR(500) NULL,
  `is_nullable` CHAR(1) NULL,
  `is_indexed` CHAR(1) NULL
    COMMENT 'only in RDBMS',
  `is_partitioned` CHAR(1) NULL
    COMMENT 'only in RDBMS',
  `is_distributed` TINYINT(4) NULL
    COMMENT 'only in RDBMS',
  `is_recursive` CHAR(1) NULL,
  `confidential_flags` VARCHAR(200) NULL,
  `default_value` VARCHAR(200) NULL,
  `namespace` VARCHAR(200) NULL,
  `java_data_type` VARCHAR(50) NULL
    COMMENT 'correspond type in java',
  `jdbc_data_type` VARCHAR(50) NULL
    COMMENT 'correspond type in jdbc',
  `pig_data_type` VARCHAR(50) NULL
    COMMENT 'correspond type in pig',
  `hcatalog_data_type` VARCHAR(50) NULL
    COMMENT 'correspond type in hcatalog',
  -- refreshed automatically by MySQL on every row update
  `modified` TIMESTAMP NOT NULL DEFAULT CURRENT_TIMESTAMP ON UPDATE CURRENT_TIMESTAMP,
  PRIMARY KEY (`field_id`),
  UNIQUE KEY `uix_dict_field__datasetid_parentpath_fieldname` (`dataset_id`, `parent_path`, `field_name`) USING BTREE,
  UNIQUE KEY `uix_dict_field__datasetid_sortid` (`dataset_id`, `sort_id`) USING BTREE
)
  ENGINE = InnoDB
  AUTO_INCREMENT = 0
  DEFAULT CHARSET = latin1
  COMMENT = 'Flattened Fields/Columns';
-- schema history
-- Schema history per dataset: at most one stored schema per (urn, modified_date),
-- enforced by the unique key. No table-level charset is declared, so the
-- database default applies; the `schema` column itself is utf8.
CREATE TABLE `dict_dataset_schema_history` (
  `id` INT(11) AUTO_INCREMENT NOT NULL,
  `dataset_id` INT(11) NULL,
  `urn` VARCHAR(200) NOT NULL,
  `modified_date` DATE NULL,
  `schema` MEDIUMTEXT CHARACTER SET utf8 NULL,
  PRIMARY KEY (`id`),
  UNIQUE KEY `uk_dict_dataset_schema_history__urn_modified` (`urn`, `modified_date`)
)
  ENGINE = InnoDB
  AUTO_INCREMENT = 0;
-- staging table of fields to comments mapping
-- Staging table mapping fields to comments, keyed by (field_id, comment_id, db_id).
-- The table is hash-partitioned on db_id into 8 partitions; db_id is part of the
-- primary key, which MySQL requires of a partitioning column.
CREATE TABLE `stg_dict_dataset_field_comment` (
  `field_id` INT(11) UNSIGNED NOT NULL,
  `comment_id` BIGINT(20) NOT NULL,
  `dataset_id` INT(11) UNSIGNED NOT NULL,
  `db_id` SMALLINT(6) UNSIGNED NOT NULL DEFAULT '0',
  PRIMARY KEY (`field_id`, `comment_id`, `db_id`)
)
  ENGINE = InnoDB
  DEFAULT CHARSET = utf8
  PARTITION BY HASH (db_id)
  PARTITIONS 8;
-- fields to comments mapping
-- Mapping of fields to comments, keyed by (field_id, comment_id), with a
-- secondary index on comment_id for lookups by comment.
-- is_default defaults to 0.
CREATE TABLE `dict_dataset_field_comment` (
  `field_id` INT(11) UNSIGNED NOT NULL,
  `comment_id` BIGINT(20) NOT NULL,
  `dataset_id` INT(11) UNSIGNED NOT NULL,
  `is_default` TINYINT(1) NULL DEFAULT '0',
  PRIMARY KEY (field_id, comment_id),
  KEY (comment_id)
)
  ENGINE = InnoDB;
-- dataset comments
-- Dataset-level comments. Each row carries its text, the authoring user_id, the
-- target dataset_id, and a comment_type category.
-- Indexed by user_id and dataset_id, with a full-text index on the comment text.
-- The table default is latin1; the `text` column itself is utf8.
CREATE TABLE comments (
  `id` INT(11) AUTO_INCREMENT NOT NULL,
  `text` TEXT CHARACTER SET utf8 NOT NULL,
  `user_id` INT(11) NOT NULL,
  `dataset_id` INT(11) NOT NULL,
  `created` DATETIME NULL,
  `modified` DATETIME NULL,
  `comment_type` ENUM('Description', 'Grain', 'Partition', 'ETL Schedule', 'DQ Issue', 'Question', 'Comment') NULL,
  PRIMARY KEY (id),
  KEY `user_id` (`user_id`) USING BTREE,
  KEY `dataset_id` (`dataset_id`) USING BTREE,
  FULLTEXT KEY `fti_comment` (`text`)
)
  ENGINE = InnoDB
  CHARACTER SET latin1
  COLLATE latin1_swedish_ci
  AUTO_INCREMENT = 0;
-- field comments
-- Field-level comments. `comment` is indexed twice: a 100-character prefix
-- B-tree index (comment_key) and a full-text index (fti_comment).
-- comment_crc32_checksum holds a 4-byte CRC32 (presumably of `comment` -- TODO confirm).
CREATE TABLE `field_comments` (
  `id` INT(11) UNSIGNED NOT NULL AUTO_INCREMENT,
  `user_id` INT(11) NOT NULL DEFAULT '0',
  `comment` VARCHAR(4000) NOT NULL,
  -- NOTE(review): `created` is the first TIMESTAMP column and has no explicit
  -- DEFAULT; with explicit_defaults_for_timestamp disabled MySQL assigns it
  -- DEFAULT CURRENT_TIMESTAMP ON UPDATE CURRENT_TIMESTAMP -- confirm that is intended.
  `created` TIMESTAMP NOT NULL,
  -- refreshed automatically by MySQL on every row update
  `modified` TIMESTAMP NOT NULL DEFAULT CURRENT_TIMESTAMP ON UPDATE CURRENT_TIMESTAMP,
  `comment_crc32_checksum` INT(11) UNSIGNED NULL COMMENT '4-byte CRC32',
  PRIMARY KEY (`id`),
  KEY `comment_key` (`comment`(100)),
  FULLTEXT KEY `fti_comment` (`comment`)
)
  ENGINE = InnoDB
  AUTO_INCREMENT = 0
  DEFAULT CHARSET = utf8;
-- dict_dataset_instance
-- Deployed instances of a dataset, keyed by (dataset_id, db_id, version_sort_id).
-- The table is hash-partitioned on db_id into eight named partitions (p0..p7);
-- db_id is part of the primary key, which MySQL requires of a partitioning column.
-- data_center, server_cluster and slice default to '*'.
CREATE TABLE dict_dataset_instance (
  dataset_id INT(11) UNSIGNED NOT NULL,
  db_id SMALLINT(6) UNSIGNED COMMENT 'FK to cfg_database' NOT NULL DEFAULT '0',
  deployment_tier ENUM('local', 'grid', 'dev', 'int', 'ei', 'ei2', 'ei3', 'qa', 'stg', 'prod') NOT NULL DEFAULT 'dev',
  data_center VARCHAR(30) COMMENT 'data center code: lva1, ltx1, dc2, dc3...' NULL DEFAULT '*',
  server_cluster VARCHAR(150) COMMENT 'sfo1-bigserver, jfk3-sqlserver03' NULL DEFAULT '*',
  slice VARCHAR(50) COMMENT 'virtual group/tenant id/instance tag' NOT NULL DEFAULT '*',
  is_active BOOLEAN NULL COMMENT 'is the dataset active / exist ?',
  is_deprecated BOOLEAN NULL COMMENT 'is the dataset deprecated by user ?',
  native_name VARCHAR(250) NOT NULL,
  logical_name VARCHAR(250) NOT NULL,
  version VARCHAR(30) COMMENT '1.2.3 or 0.3.131' NULL,
  -- sortable numeric encoding of `version`; see the column comment for the layout
  version_sort_id BIGINT(20) COMMENT '4-digit for each version number: 000100020003, 000000030131' NOT NULL DEFAULT '0',
  schema_text MEDIUMTEXT CHARACTER SET utf8 NULL,
  ddl_text MEDIUMTEXT CHARACTER SET utf8 NULL,
  instance_created_time INT(10) UNSIGNED COMMENT 'source instance created time' NULL,
  created_time INT(10) UNSIGNED COMMENT 'wherehows created time' NULL,
  modified_time INT(10) UNSIGNED COMMENT 'latest wherehows modified' NULL,
  wh_etl_exec_id BIGINT(20) COMMENT 'wherehows etl execution id that modified this record' NULL,
  PRIMARY KEY (dataset_id, db_id, version_sort_id)
)
  ENGINE = InnoDB
  CHARACTER SET latin1
  COLLATE latin1_swedish_ci
  AUTO_INCREMENT = 0
  PARTITION BY HASH (db_id)
  (
    PARTITION p0,
    PARTITION p1,
    PARTITION p2,
    PARTITION p3,
    PARTITION p4,
    PARTITION p5,
    PARTITION p6,
    PARTITION p7
  );
-- secondary indexes on dict_dataset_instance
-- B-tree lookup index on the logical dataset name.
CREATE INDEX logical_name USING BTREE
  ON dict_dataset_instance (logical_name);

-- Composite B-tree index on deployment location; server_cluster is the leading column.
CREATE INDEX server_cluster USING BTREE
  ON dict_dataset_instance (server_cluster, deployment_tier, data_center, slice);

-- B-tree lookup index on the native dataset name.
CREATE INDEX native_name USING BTREE
  ON dict_dataset_instance (native_name);
-- staging table for dict_dataset_instance
-- Staging table for dataset instances, keyed by (dataset_urn, db_id).
-- The table is hash-partitioned on db_id into eight named partitions (p0..p7);
-- db_id is part of the primary key, which MySQL requires of a partitioning column.
-- data_center, server_cluster and slice default to '*'.
CREATE TABLE stg_dict_dataset_instance (
  dataset_urn VARCHAR(200) NOT NULL,
  db_id SMALLINT(6) UNSIGNED NOT NULL DEFAULT '0',
  deployment_tier ENUM('local', 'grid', 'dev', 'int', 'ei', 'ei2', 'ei3', 'qa', 'stg', 'prod') NOT NULL DEFAULT 'dev',
  data_center VARCHAR(30) COMMENT 'data center code: lva1, ltx1, dc2, dc3...' NULL DEFAULT '*',
  server_cluster VARCHAR(150) COMMENT 'sfo1-bigserver' NULL DEFAULT '*',
  slice VARCHAR(50) COMMENT 'virtual group/tenant id/instance tag' NOT NULL DEFAULT '*',
  is_active BOOLEAN NULL COMMENT 'is the dataset active / exist ?',
  is_deprecated BOOLEAN NULL COMMENT 'is the dataset deprecated by user ?',
  native_name VARCHAR(250) NOT NULL,
  logical_name VARCHAR(250) NOT NULL,
  version VARCHAR(30) COMMENT '1.2.3 or 0.3.131' NULL,
  schema_text MEDIUMTEXT CHARACTER SET utf8 NULL,
  ddl_text MEDIUMTEXT CHARACTER SET utf8 NULL,
  instance_created_time INT(10) UNSIGNED COMMENT 'source instance created time' NULL,
  created_time INT(10) UNSIGNED COMMENT 'wherehows created time' NULL,
  wh_etl_exec_id BIGINT(20) COMMENT 'wherehows etl execution id that modified this record' NULL,
  dataset_id INT(11) UNSIGNED NULL,
  abstract_dataset_urn VARCHAR(200) NULL,
  PRIMARY KEY (dataset_urn, db_id)
)
  ENGINE = InnoDB
  CHARACTER SET latin1
  COLLATE latin1_swedish_ci
  AUTO_INCREMENT = 0
  PARTITION BY HASH (db_id)
  (
    PARTITION p0,
    PARTITION p1,
    PARTITION p2,
    PARTITION p3,
    PARTITION p4,
    PARTITION p5,
    PARTITION p6,
    PARTITION p7
  );
-- secondary index on stg_dict_dataset_instance
-- Composite B-tree index on deployment location; server_cluster is the leading column.
CREATE INDEX server_cluster USING BTREE
  ON stg_dict_dataset_instance (server_cluster, deployment_tier, data_center, slice);