Skip to content

Commit

Permalink
Update 43-aws-glue-job-rentsense.tf
Browse files Browse the repository at this point in the history
Editing the Terraform for rentsense to accommodate the new script. I presume it is fine in the same file?
  • Loading branch information
daroclark authored May 15, 2024
1 parent 24d7502 commit e60caff
Showing 1 changed file with 48 additions and 0 deletions.
48 changes: 48 additions & 0 deletions terraform/etl/43-aws-glue-job-rentsense.tf
Original file line number Diff line number Diff line change
Expand Up @@ -47,5 +47,53 @@ module "rentsense_output_to_landing_S3" {
}

}

# Glue job for the Rentsense former-tenant outputs, instantiated from the
# shared aws-glue-job module. The job script and the crawler settings below
# both point at the same refined-zone prefix: housing/rentsense-ft.
module "rentsense_former_tenant_output_to_refined_S3" {
  source = "../modules/aws-glue-job"

  # Environment flags forwarded from the root locals.
  is_production_environment = local.is_production_environment
  is_live_environment       = local.is_live_environment

  # Job identity and the script it runs.
  job_name    = "${local.short_identifier_prefix}Rentsense former tenant outputs to refined S3"
  script_name = "rentsense_former_tenants_to_refined"

  # Shared buckets, IAM role and helper artefacts supplied to the module.
  glue_scripts_bucket_id     = module.glue_scripts_data_source.bucket_id
  glue_temp_bucket_id        = module.glue_temp_storage_data_source.bucket_id
  spark_ui_output_storage_id = module.spark_ui_output_storage_data_source.bucket_id
  glue_role_arn              = data.aws_iam_role.glue_role.arn
  helper_module_key          = data.aws_s3_object.helpers.key
  pydeequ_zip_key            = data.aws_s3_object.pydeequ.key

  # Runtime sizing and retry policy.
  glue_version                   = "4.0"
  glue_job_worker_type           = "G.1X"
  number_of_workers_for_glue_job = 8
  max_retries                    = 3

  # Upstream crawler name, read from an SSM parameter.
  # NOTE(review): presumably the module starts this job once that crawler
  # finishes - confirm in ../modules/aws-glue-job.
  triggered_by_crawler = data.aws_ssm_parameter.ingest_housing_interim_finance_database_to_housing_raw_zone_crawler_name.value

  # Arguments passed through to the Glue job.
  job_parameters = {
    "--job-bookmark-option"     = "job-bookmark-enable"
    "--enable-glue-datacatalog" = "true"
    "--s3_bucket"               = module.refined_zone_data_source.bucket_id
    "--s3_bucket_target"        = "s3://${module.refined_zone_data_source.bucket_id}/housing/rentsense-ft"
    "--s3_landing"              = module.landing_zone_data_source.bucket_id
    "--source_raw_database"     = module.department_housing_data_source.raw_zone_catalog_database_name
    "--source_catalog_database" = module.department_housing_data_source.refined_zone_catalog_database_name
  }

  # Glob patterns handed to the module as crawler exclusions.
  glue_crawler_excluded_blobs = [
    "*.json",
    "*.txt",
    "*.zip",
    "*.xlsx",
    "**/*.csv",
    "**.csv.gz",
  ]

  # Crawler settings: target the same S3 prefix the job writes to
  # (--s3_bucket_target) and register tables in the housing refined-zone
  # catalog database.
  crawler_details = {
    database_name      = module.department_housing_data_source.refined_zone_catalog_database_name
    s3_target_location = "s3://${module.refined_zone_data_source.bucket_id}/housing/rentsense-ft"
    table_prefix       = null

    # NOTE(review): TableLevelConfiguration = 4 presumably places tables one
    # folder below housing/rentsense-ft - confirm against the Glue crawler docs.
    configuration = jsonencode({
      Version = 1.0
      Grouping = {
        TableLevelConfiguration = 4
      }
    })
  }
}




0 comments on commit e60caff

Please sign in to comment.