-
Notifications
You must be signed in to change notification settings - Fork 15
/
Copy pathtamr-config.yml.tmpl
93 lines (82 loc) · 3.75 KB
/
tamr-config.yml.tmpl
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
---
# RDS
TAMR_PERSISTENCE_DB_USER: ${rds_pg_username}
TAMR_PERSISTENCE_DB_URL: jdbc:postgresql://${rds_pg_hostname}:${rds_pg_db_port}/${rds_pg_dbname}
TAMR_PERSISTENCE_DB_PASS: ${rds_pg_password}
TAMR_PERSISTENCE_DB_PORT: ${rds_pg_db_port}
# HBase
TAMR_REMOTE_HBASE_ENABLED: true
TAMR_HBASE_REMOTE_DOWNLOAD_ENABLED: true
TAMR_CONNECTION_INFO_TYPE: hbase-site
TAMR_HBASE_NAMESPACE: ${hbase_namespace}
TAMR_HBASE_COMPRESSION: snappy
TAMR_HBASE_CONFIG_URIS: s3://${tamr_data_bucket}/${hbase_config_path}hbase-site.xml
# HBase - Properties
TAMR_HBASE_STORAGE_MODE: ${hbase_storage_mode}
TAMR_HBASE_NUMBER_OF_REGIONS: ${hbase_number_of_regions}
TAMR_HBASE_NUMBER_OF_SALT_VALUES: ${hbase_number_of_salt_values}
%{ if ephemeral_spark_configured }
# Spark
TAMR_REMOTE_SPARK_ENABLED: true
TAMR_JOB_SPARK_CLUSTER : emr-ephemeral
TAMR_JOB_EMR_CLUSTER_ID: ${spark_emr_cluster_id}
TAMR_DATASET_EMR_LOG_URI: ${spark_cluster_log_uri}
TAMR_DATASET_EMR_RELEASE: ${emr_release_label}
TAMR_DATASET_EMR_INSTANCE_PROFILE: ${emr_instance_profile_name}
TAMR_DATASET_EMR_SERVICE_ROLE: ${emr_service_role_name}
TAMR_DATASET_EMR_KEY_NAME: ${emr_key_pair_name}
TAMR_DATASET_EMR_SUBNET_ID: ${emr_subnet_id}
TAMR_DATASET_EMR_MASTER_INSTANCE_TYPE: ${master_instance_type}
TAMR_DATASET_EMR_MASTER_VOLUME_COUNT: ${master_ebs_volumes_count}
TAMR_DATASET_EMR_MASTER_VOLUME_SIZE: ${master_ebs_size}
TAMR_DATASET_EMR_MASTER_VOLUME_TYPE: ${master_ebs_type}
TAMR_DATASET_EMR_CORE_VOLUME_COUNT: ${core_ebs_volumes_count}
TAMR_DATASET_EMR_CORE_VOLUME_SIZE: ${core_ebs_size}
TAMR_DATASET_EMR_CORE_VOLUME_TYPE: ${core_ebs_type}
TAMR_DATASET_EMR_INSTANCE_COUNT: ${core_group_instance_count}
TAMR_DATASET_EMR_INSTANCE_TYPE: ${core_instance_type}
TAMR_DATASET_EMR_ACCESS_SECURITY_GROUP: ${emr_service_access_sg_id}
TAMR_DATASET_EMR_MASTER_SECURITY_GROUP: ${emr_managed_master_sg_id}
TAMR_DATASET_EMR_MASTER_SECURITY_GROUP_ADDITIONAL: ${emr_additional_master_sg_id}
TAMR_DATASET_EMR_WORKER_SECURITY_GROUP: ${emr_managed_core_sg_id}
TAMR_DATASET_EMR_WORKER_SECURITY_GROUP_ADDITIONAL: ${emr_additional_core_sg_id}
TAMR_EMRFS_DYNAMO_TABLE: ${emrfs_dynamodb_table_name}
TAMR_DATASET_EMR_ROOT_VOLUME_SIZE: ${emr_root_volume_size}
TAMR_DATASET_EMR_CLUSTER_NAME_PREFIX: ${emr_cluster_name_prefix}
TAMR_DATASET_EMR_CLUSTER_TAGS: ${emr_cluster_tags}
TAMR_DATASET_EMR_SECURITY_CONFIGURATION: ${emr_security_configuration}
%{ endif }
# Spark - Scale
TAMR_JOB_SPARK_DRIVER_MEM: ${spark_driver_memory}
TAMR_JOB_SPARK_EXECUTOR_INSTANCES: ${spark_executor_instances}
TAMR_JOB_SPARK_EXECUTOR_MEM: ${spark_executor_memory}
TAMR_JOB_SPARK_EXECUTOR_CORES: ${spark_executor_cores}
TAMR_JOB_SPARK_CONFIG_OVERRIDES: "${tamr_spark_config_override}"
TAMR_JOB_SPARK_PROPS: "${tamr_spark_properties_override}"
# Elasticsearch
TAMR_ES_ENABLED: ${es_enabled}
TAMR_REMOTE_ES_ENABLED: ${remote_es_enabled}
TAMR_ES_APIHOST: ${es_api_host}
TAMR_ES_HEALTH_CHECK_METADATA: false
TAMR_ES_SSL_ENABLED: ${es_ssl_enabled}
# FileSystem
TAMR_UNIFY_DATA_DIR: s3://${tamr_data_bucket}/${tamr_data_path}
TAMR_FS_URI: s3://${tamr_data_bucket}
# ESP
TAMR_STORAGE_PROVIDERS: '${tamr_external_storage_providers}'
# Misc
TAMR_BIGQUERY_ENABLED: false
# Backup Config
TAMR_FILE_BASED_HBASE_BACKUP_ENABLED: ${tamr_file_based_hbase_backup_enabled}
TAMR_BACKUP_AWS_CLI_ENABLED: ${tamr_backup_aws_cli_enabled}
TAMR_UNIFY_BACKUP_ES: ${tamr_unify_backup_es}
TAMR_UNIFY_BACKUP_AWS_ROLE_BASED_ACCESS: ${tamr_unify_backup_aws_role_based_access}
TAMR_UNIFY_BACKUP_URI: s3://${tamr_data_bucket}/${tamr_unify_backup_path}
TAMR_BACKUP_S3DISTCP_ENABLED: ${tamr_backup_s3distcp_enabled}
TAMR_BACKUP_EMR_CLUSTER_ID: ${tamr_backup_emr_cluster_id}
# DMS Config
APPS_DMS_ENABLED: ${apps_dms_enabled}
APPS_DMS_DEFAULT_CLOUD_PROVIDER: ${apps_dms_default_cloud_provider}
%{ for k, v in additional_templated_variables }
${k}: ${v}
%{ endfor }