-
Notifications
You must be signed in to change notification settings - Fork 15
/
variables.tf
381 lines (312 loc) · 9.11 KB
/
variables.tf
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
variable "config_template_path" {
  # Optional string input; falls back to "./tamr-config.yml" when unset.
  description = "Path to Tamr config template."
  type        = string
  default     = "./tamr-config.yml"
}
variable "rendered_config_path" {
  # Optional string input; the default is the empty string.
  description = "If provided, the populated Tamr config will be output to this path. Include a file name (E.g. /path/to/config.yml). NOTE: Any required parent directories will be created automatically, and any existing file with the given name will be overwritten."
  type        = string
  default     = ""
}
variable "ephemeral_spark_configured" {
  # Required boolean input: no default is declared, so callers must set it.
  description = "True if EMR was configured for ephemeral spark clusters."
  type        = bool
}
variable "additional_templated_variables" {
  # Optional map of string values; defaults to an empty map.
  description = "Mapping of additional Tamr variables (not included in template) to its value."
  type        = map(string)
  default     = {}
}
#
# RDS
#
variable "rds_pg_hostname" {
  # Required string input: no default is declared.
  description = "Hostname of RDS postgres instance."
  type        = string
}
variable "rds_pg_dbname" {
  # Optional string input; defaults to "doit".
  description = "RDS postgres database name."
  type        = string
  default     = "doit"
}
variable "rds_pg_username" {
  # Optional string input; defaults to "tamr".
  description = "Master username for RDS postgres database instance."
  type        = string
  default     = "tamr"
}
variable "rds_pg_password" {
  # Required string input: no default is declared.
  # NOTE(review): this credential is not marked `sensitive`. Adding
  # `sensitive = true` would redact it in plan output, but any module output
  # derived from it would then also need to be marked sensitive — confirm
  # against the module's outputs before changing.
  description = "Master password for RDS postgres database instance."
  type        = string
}
variable "rds_pg_db_port" {
  # Optional numeric input; defaults to 5432.
  description = "The RDS postgres database port."
  type        = number
  default     = 5432
}
#
# HBase
#
variable "hbase_namespace" {
  # Optional string input; defaults to "tamr".
  # A description was added so this input is documented like the other
  # variables in this file (and shows up in generated module docs).
  description = "Namespace to use in HBase."
  type        = string
  default     = "tamr"
}
variable "tamr_data_bucket" {
  # Required string input: no default is declared.
  description = "Name of Tamr root directory bucket."
  type        = string
}
variable "hbase_config_path" {
  # Optional string input; defaults to "config/hbase/conf.dist/" (note the
  # trailing slash in the default).
  description = "Path to HBase configuration in EMR root directory bucket."
  type        = string
  default     = "config/hbase/conf.dist/"
}
#
# HBase - properties
#
variable "hbase_storage_mode" {
  # Optional string input; defaults to "SHARED". The allowed values listed in
  # the description are not enforced by a validation block here.
  description = "Storage mode for HBase. Valid values: `SHARED`, `DEDICATED`"
  type        = string
  default     = "SHARED"
}
variable "hbase_number_of_regions" {
  # Optional input declared as a string (not a number); defaults to "1000".
  description = "Number of regions to create by default in HBase"
  type        = string
  default     = "1000"
}
variable "hbase_number_of_salt_values" {
  # Optional input declared as a string (not a number); defaults to "1000".
  # The ">= hbase_number_of_regions" constraint in the description is
  # documentation only; nothing in this block enforces it.
  description = "Number of distinct salt values to be used for prefixing row keys in HBase tables. Must be >= hbase_number_of_regions"
  type        = string
  default     = "1000"
}
#
# Spark
#
variable "spark_emr_cluster_id" {
  # Optional string input; the default is the empty string.
  description = "Spark cluster ID. Value will not be used if deployment is spinning up ephemeral Spark clusters."
  type        = string
  default     = ""
}
variable "spark_cluster_log_uri" {
  # Required string input: no default is declared.
  description = "The path to the S3 location where logs for the Spark cluster are stored."
  type        = string
}
#
# Spark - Scale
#
variable "spark_driver_memory" {
  # Optional string input; defaults to "5G".
  # A description was added so this input is documented like the other
  # variables in this file.
  description = "Amount of memory to allocate to the Spark driver (e.g. `5G`)."
  type        = string
  default     = "5G"
}
variable "spark_executor_instances" {
  # Optional numeric input; defaults to 2.
  # A description was added so this input is documented like the other
  # variables in this file.
  description = "Number of Spark executor instances."
  type        = number
  default     = 2
}
variable "spark_executor_memory" {
  # Optional string input; defaults to "8G".
  # A description was added so this input is documented like the other
  # variables in this file.
  description = "Amount of memory to allocate to each Spark executor (e.g. `8G`)."
  type        = string
  default     = "8G"
}
variable "spark_executor_cores" {
  # Optional numeric input; defaults to 2.
  # A description was added so this input is documented like the other
  # variables in this file.
  description = "Number of cores to allocate to each Spark executor."
  type        = number
  default     = 2
}
variable "tamr_spark_config_override" {
  # Optional input; the default is the empty string. The description speaks of
  # a "list", but the declared type is a plain string.
  description = "A list of spark config overrides. If not set all jobs will run with the default spark settings. Used for setting job-by-job spark resource settings."
  type        = string
  default     = ""
}
variable "tamr_spark_properties_override" {
  # Optional string input; the default is the empty string.
  description = "JSON blob of spark properties to override. If not set, will use a default set of properties that should work for most use cases."
  type        = string
  default     = ""
}
#
# Elasticsearch
#
variable "es_domain_endpoint" {
  # Required string input: no default is declared.
  description = "Endpoint of Elasticsearch domain."
  type        = string
}
variable "es_enabled" {
  # Optional boolean input; defaults to true.
  description = "Whether or not to enable Elasticsearch by setting TAMR_ES_ENABLED flag"
  type        = bool
  default     = true
}
#
# FileSystem
#
variable "tamr_data_path" {
  # Optional string input; defaults to "tamr/unify-data".
  # The description previously pointed at a `tamr_bucket_name` input, which
  # this file does not declare; the root directory bucket input is
  # `tamr_data_bucket`.
  description = "Path in root directory bucket (bucket provided for tamr_data_bucket input) to write data to."
  type        = string
  default     = "tamr/unify-data"
}
#
# ESP
#
variable "tamr_external_storage_providers" {
  # Optional string input; the default is the empty string.
  description = "Filesystem connection information for external storage providers."
  type        = string
  default     = ""
}
#
# Ephemeral Spark
#
variable "emr_release_label" {
  # Optional string input; defaults to "emr-5.29.0".
  description = "The release label for the Amazon EMR release."
  type        = string
  default     = "emr-5.29.0"
}
variable "emr_instance_profile_name" {
  # Optional string input; the default is the empty string.
  description = "Name of instance profile for EMR EC2 instances."
  type        = string
  default     = ""
}
variable "emr_service_role_name" {
  # Optional string input; the default is the empty string.
  description = "Name of IAM service role for EMR cluster."
  type        = string
  default     = ""
}
variable "emr_key_pair_name" {
  # Optional string input; the default is the empty string.
  description = "Name of the Key Pair that will be attached to the EMR EC2 instances."
  type        = string
  default     = ""
}
variable "emr_subnet_id" {
  # Optional string input; the default is the empty string.
  description = "ID of the subnet where the EMR cluster will be created."
  type        = string
  default     = ""
}
variable "master_instance_type" {
  # Optional string input; the default is the empty string.
  description = "The EC2 instance type of the master nodes."
  type        = string
  default     = ""
}
variable "master_ebs_volumes_count" {
  # Optional input declared as a string (not a number); the default is the
  # empty string.
  description = "Number of volumes to attach to the master nodes."
  type        = string
  default     = ""
}
variable "master_ebs_size" {
  # Optional input declared as a string (not a number); the default is the
  # empty string.
  description = "The master EBS volume size, in gibibytes (GiB)."
  type        = string
  default     = ""
}
variable "master_ebs_type" {
  # Optional string input; the default is the empty string. The options named
  # in the description are not enforced by a validation block here.
  description = "Type of volumes to attach to the master nodes. Valid options are gp2, io1, standard and st1."
  type        = string
  default     = ""
}
variable "core_ebs_volumes_count" {
  # Optional input declared as a string (not a number); the default is the
  # empty string.
  description = "Number of volumes to attach to the core nodes."
  type        = string
  default     = ""
}
variable "core_ebs_size" {
  # Optional input declared as a string (not a number); the default is the
  # empty string.
  description = "The core EBS volume size, in gibibytes (GiB)."
  type        = string
  default     = ""
}
variable "core_ebs_type" {
  # Optional string input; the default is the empty string. The options named
  # in the description are not enforced by a validation block here.
  description = "Type of volumes to attach to the core nodes. Valid options are gp2, io1, standard and st1."
  type        = string
  default     = ""
}
variable "core_group_instance_count" {
  # Optional input declared as a string (not a number); the default is the
  # empty string.
  description = "Number of Amazon EC2 instances used to execute the job flow."
  type        = string
  default     = ""
}
variable "core_instance_type" {
  # Optional string input; the default is the empty string.
  description = "The EC2 instance type of the core nodes."
  type        = string
  default     = ""
}
variable "emr_service_access_sg_id" {
  # Optional string input; the default is the empty string.
  description = "Security group ID of EMR Service Access Security Group."
  type        = string
  default     = ""
}
variable "emr_managed_master_sg_id" {
  # Optional string input; the default is the empty string.
  description = "Security group ID of the EMR Managed Master Security Group."
  type        = string
  default     = ""
}
variable "emr_additional_master_sg_id" {
  # Optional string input; the default is the empty string.
  description = "Security group ID of the EMR Additional Master Security Group."
  type        = string
  default     = ""
}
variable "emr_managed_core_sg_id" {
  # Optional string input; the default is the empty string.
  description = "Security group ID of the EMR Managed Core Security Group."
  type        = string
  default     = ""
}
variable "emr_additional_core_sg_id" {
  # Optional string input; the default is the empty string.
  description = "Security group ID of the EMR Additional Core Security Group."
  type        = string
  default     = ""
}
variable "emrfs_dynamodb_table_name" {
  # Optional string input; the default is the empty string.
  description = "Name for the EMRFS DynamoDB table."
  type        = string
  default     = ""
}
variable "emr_root_volume_size" {
  # Optional input declared as a string (not a number); defaults to "10".
  description = "The size, in GiB, of the EBS root device volume of the Linux AMI that is used for each EMR EC2 instance."
  type        = string
  default     = "10"
}
variable "emr_tags" {
  # Optional map of string values; defaults to an empty map.
  description = "Map of tags to add to new resources in EMR"
  type        = map(string)
  default     = {}
}
variable "emr_cluster_name_prefix" {
  # Optional string input; defaults to "tamr-emr-" (note the trailing hyphen
  # in the default).
  description = "A prefix to add to the name of created EMR Spark clusters"
  type        = string
  default     = "tamr-emr-"
}
variable "emr_security_configuration" {
  # Optional string input; the default is the empty string.
  description = "Security configuration to attach to created EMR Spark clusters. Supported in Tamr v2022.009.0 and later."
  type        = string
  default     = ""
}
#
# Backup Config
#
variable "tamr_file_based_hbase_backup_enabled" {
  # Optional boolean input; defaults to true.
  description = "Whether to backup contents of HBase root directory to backup path"
  type        = bool
  default     = true
}
variable "tamr_unify_backup_es" {
  # Optional boolean input; defaults to false.
  description = "Defines whether or not to back up Elasticsearch"
  type        = bool
  default     = false
}
variable "tamr_unify_backup_aws_role_based_access" {
  # Optional boolean input; defaults to true.
  description = "Set to `true` if Tamr should use EC2 instance profile (role-based) credentials instead of static credentials"
  type        = bool
  default     = true
}
variable "tamr_unify_backup_path" {
  # Optional string input; defaults to "tamr/backups".
  description = "Identifies the path for storing backup files"
  type        = string
  default     = "tamr/backups"
}
variable "tamr_backup_emr_cluster_id" {
  # Optional string input; the default is the empty string.
  description = "ID of the static EMR cluster to run s3distcp on when backing up to or restoring from S3."
  type        = string
  default     = ""
}
#
# DMS Config
#
variable "apps_dms_enabled" {
  # Optional boolean input; defaults to true.
  description = "Set to `true` to enable the Data Movement Service (DMS)"
  type        = bool
  default     = true
}
variable "apps_dms_default_cloud_provider" {
  # Optional string input; defaults to "s3".
  description = "Defines the default cloud service provider for DMS when `APPS_DMS_ENABLED` is set to `true`"
  type        = string
  default     = "s3"
}