Skip to content
This repository has been archived by the owner on Aug 16, 2022. It is now read-only.

feat: Added glue dev endpoints #1361

Merged
merged 4 commits into from
Aug 3, 2022
Merged
Show file tree
Hide file tree
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
20 changes: 20 additions & 0 deletions client/mocks/glue.go

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

1 change: 1 addition & 0 deletions client/services.go
Original file line number Diff line number Diff line change
Expand Up @@ -752,6 +752,7 @@ type GlueClient interface {
GetTags(ctx context.Context, params *glue.GetTagsInput, optFns ...func(*glue.Options)) (*glue.GetTagsOutput, error)
GetWorkflow(ctx context.Context, params *glue.GetWorkflowInput, optFns ...func(*glue.Options)) (*glue.GetWorkflowOutput, error)
ListWorkflows(ctx context.Context, params *glue.ListWorkflowsInput, optFns ...func(*glue.Options)) (*glue.ListWorkflowsOutput, error)
GetDevEndpoints(ctx context.Context, params *glue.GetDevEndpointsInput, optFns ...func(*glue.Options)) (*glue.GetDevEndpointsOutput, error)
}

//go:generate mockgen -package=mocks -destination=./mocks/kinesis.go . KinesisClient
Expand Down
35 changes: 35 additions & 0 deletions docs/tables/aws_glue_dev_endpoints.md
Original file line number Diff line number Diff line change
@@ -0,0 +1,35 @@

# Table: aws_glue_dev_endpoints
A development endpoint where a developer can remotely debug extract, transform, and load (ETL) scripts
## Columns
| Name | Type | Description |
| ------------- | ------------- | ----- |
|account_id|text|The AWS Account ID of the resource.|
|region|text|The AWS Region of the resource.|
|arn|text|The Amazon Resource Name (ARN) of the workflow.|
|tags|jsonb|Resource tags.|
|arguments|jsonb|A map of arguments used to configure the DevEndpoint|
|availability_zone|text|The AWS Availability Zone where this DevEndpoint is located|
|created_timestamp|timestamp without time zone|The point in time at which this DevEndpoint was created|
|name|text|The name of the DevEndpoint|
|extra_jars_s3_path|text|The path to one or more Java jar files in an S3 bucket that should be loaded in your DevEndpoint|
|extra_python_libs_s3_path|text|The paths to one or more Python libraries in an Amazon S3 bucket that should be loaded in your DevEndpoint|
|failure_reason|text|The reason for a current failure in this DevEndpoint|
|glue_version|text|Glue version determines the versions of Apache Spark and Python that Glue supports|
|last_modified_timestamp|timestamp without time zone|The point in time at which this DevEndpoint was last modified|
|last_update_status|text|The status of the last update|
|number_of_nodes|bigint|The number of Glue Data Processing Units (DPUs) allocated to this DevEndpoint|
|number_of_workers|bigint|The number of workers of a defined workerType that are allocated to the development endpoint|
|private_address|text|A private IP address to access the DevEndpoint within a VPC if the DevEndpoint is created within one|
|public_address|text|The public IP address used by this DevEndpoint|
|public_key|text|The public key to be used by this DevEndpoint for authentication|
|public_keys|text[]|A list of public keys to be used by the DevEndpoints for authentication|
|role_arn|text|The Amazon Resource Name (ARN) of the IAM role used in this DevEndpoint|
|security_configuration|text|The name of the SecurityConfiguration structure to be used with this DevEndpoint|
|security_group_ids|text[]|A list of security group identifiers used in this DevEndpoint|
|status|text|The current status of this DevEndpoint|
|subnet_id|text|The subnet ID for this DevEndpoint|
|vpc_id|text|The ID of the virtual private cloud (VPC) used by this DevEndpoint|
|worker_type|text|The type of predefined worker that is allocated to the development endpoint Accepts a value of Standard, G1X, or G2X * For the Standard worker type, each worker provides 4 vCPU, 16 GB of memory and a 50GB disk, and 2 executors per worker * For the G1X worker type, each worker maps to 1 DPU (4 vCPU, 16 GB of memory, 64 GB disk), and provides 1 executor per worker|
|yarn_endpoint_address|text|The YARN endpoint address used by this DevEndpoint|
|zeppelin_remote_spark_interpreter_port|bigint|The Apache Zeppelin port for the remote Apache Spark interpreter|
1 change: 1 addition & 0 deletions resources/provider/provider.go
Original file line number Diff line number Diff line change
Expand Up @@ -168,6 +168,7 @@ func Provider() *provider.Provider {
"emr.block_public_access_configs": emr.EmrBlockPublicAccessConfigs(),
"emr.clusters": emr.EmrClusters(),
"fsx.backups": fsx.FsxBackups(),
"glue.dev_endpoints": glue.DevEndpoints(),
"glue.workflows": glue.Workflows(),
"guardduty.detectors": guardduty.GuarddutyDetectors(),
"iam.accounts": iam.IamAccounts(),
Expand Down
229 changes: 229 additions & 0 deletions resources/services/glue/dev_endpoints.go
Original file line number Diff line number Diff line change
@@ -0,0 +1,229 @@
package glue

import (
"context"

"github.com/aws/aws-sdk-go-v2/aws"
"github.com/aws/aws-sdk-go-v2/service/glue"
"github.com/aws/aws-sdk-go-v2/service/glue/types"
"github.com/cloudquery/cq-provider-aws/client"
"github.com/cloudquery/cq-provider-sdk/provider/diag"
"github.com/cloudquery/cq-provider-sdk/provider/schema"
)

//go:generate cq-gen --resource dev_endpoints --config dev_endpoints.hcl --output .
func DevEndpoints() *schema.Table {
return &schema.Table{
Name: "aws_glue_dev_endpoints",
Description: "A development endpoint where a developer can remotely debug extract, transform, and load (ETL) scripts",
Resolver: fetchGlueDevEndpoints,
Multiplex: client.ServiceAccountRegionMultiplexer("glue"),
IgnoreError: client.IgnoreAccessDeniedServiceDisabled,
DeleteFilter: client.DeleteAccountRegionFilter,
Options: schema.TableCreationOptions{PrimaryKeys: []string{"arn"}},
Columns: []schema.Column{
{
Name: "account_id",
Description: "The AWS Account ID of the resource.",
Type: schema.TypeString,
Resolver: client.ResolveAWSAccount,
},
{
Name: "region",
Description: "The AWS Region of the resource.",
Type: schema.TypeString,
Resolver: client.ResolveAWSRegion,
},
{
Name: "arn",
Description: "The Amazon Resource Name (ARN) of the workflow.",
Type: schema.TypeString,
Resolver: resolveGlueDevEndpointArn,
},
{
Name: "tags",
Description: "Resource tags.",
Type: schema.TypeJSON,
Resolver: resolveGlueDevEndpointTags,
},
{
Name: "arguments",
Description: "A map of arguments used to configure the DevEndpoint",
Type: schema.TypeJSON,
},
{
Name: "availability_zone",
Description: "The AWS Availability Zone where this DevEndpoint is located",
Type: schema.TypeString,
},
{
Name: "created_timestamp",
Description: "The point in time at which this DevEndpoint was created",
Type: schema.TypeTimestamp,
},
{
Name: "name",
Description: "The name of the DevEndpoint",
Type: schema.TypeString,
Resolver: schema.PathResolver("EndpointName"),
},
{
Name: "extra_jars_s3_path",
Description: "The path to one or more Java jar files in an S3 bucket that should be loaded in your DevEndpoint",
Type: schema.TypeString,
},
{
Name: "extra_python_libs_s3_path",
Description: "The paths to one or more Python libraries in an Amazon S3 bucket that should be loaded in your DevEndpoint",
Type: schema.TypeString,
},
{
Name: "failure_reason",
Description: "The reason for a current failure in this DevEndpoint",
Type: schema.TypeString,
},
{
Name: "glue_version",
Description: "Glue version determines the versions of Apache Spark and Python that Glue supports",
Type: schema.TypeString,
},
{
Name: "last_modified_timestamp",
Description: "The point in time at which this DevEndpoint was last modified",
Type: schema.TypeTimestamp,
},
{
Name: "last_update_status",
Description: "The status of the last update",
Type: schema.TypeString,
},
{
Name: "number_of_nodes",
Description: "The number of Glue Data Processing Units (DPUs) allocated to this DevEndpoint",
Type: schema.TypeBigInt,
},
{
Name: "number_of_workers",
Description: "The number of workers of a defined workerType that are allocated to the development endpoint",
Type: schema.TypeBigInt,
},
{
Name: "private_address",
Description: "A private IP address to access the DevEndpoint within a VPC if the DevEndpoint is created within one",
Type: schema.TypeString,
},
{
Name: "public_address",
Description: "The public IP address used by this DevEndpoint",
Type: schema.TypeString,
},
{
Name: "public_key",
Description: "The public key to be used by this DevEndpoint for authentication",
Type: schema.TypeString,
},
{
Name: "public_keys",
Description: "A list of public keys to be used by the DevEndpoints for authentication",
Type: schema.TypeStringArray,
},
{
Name: "role_arn",
Description: "The Amazon Resource Name (ARN) of the IAM role used in this DevEndpoint",
Type: schema.TypeString,
},
{
Name: "security_configuration",
Description: "The name of the SecurityConfiguration structure to be used with this DevEndpoint",
Type: schema.TypeString,
},
{
Name: "security_group_ids",
Description: "A list of security group identifiers used in this DevEndpoint",
Type: schema.TypeStringArray,
},
{
Name: "status",
Description: "The current status of this DevEndpoint",
Type: schema.TypeString,
},
{
Name: "subnet_id",
Description: "The subnet ID for this DevEndpoint",
Type: schema.TypeString,
},
{
Name: "vpc_id",
Description: "The ID of the virtual private cloud (VPC) used by this DevEndpoint",
Type: schema.TypeString,
},
{
Name: "worker_type",
Description: "The type of predefined worker that is allocated to the development endpoint Accepts a value of Standard, G1X, or G2X * For the Standard worker type, each worker provides 4 vCPU, 16 GB of memory and a 50GB disk, and 2 executors per worker * For the G1X worker type, each worker maps to 1 DPU (4 vCPU, 16 GB of memory, 64 GB disk), and provides 1 executor per worker",
amanenk marked this conversation as resolved.
Show resolved Hide resolved
Type: schema.TypeString,
},
{
Name: "yarn_endpoint_address",
Description: "The YARN endpoint address used by this DevEndpoint",
Type: schema.TypeString,
},
{
Name: "zeppelin_remote_spark_interpreter_port",
Description: "The Apache Zeppelin port for the remote Apache Spark interpreter",
Type: schema.TypeBigInt,
},
},
}
}

// ====================================================================================================================
// Table Resolver Functions
// ====================================================================================================================

func fetchGlueDevEndpoints(ctx context.Context, meta schema.ClientMeta, parent *schema.Resource, res chan<- interface{}) error {
cl := meta.(*client.Client)
svc := cl.Services().Glue
input := glue.GetDevEndpointsInput{}
for {
result, err := svc.GetDevEndpoints(ctx, &input)
if err != nil {
if cl.IsNotFoundError(err) {
return nil
}
return diag.WrapError(err)
}
res <- result.DevEndpoints
if aws.ToString(result.NextToken) == "" {
break
}
input.NextToken = result.NextToken
}
return nil
}
func resolveGlueDevEndpointArn(ctx context.Context, meta schema.ClientMeta, resource *schema.Resource, c schema.Column) error {
cl := meta.(*client.Client)
arn := aws.String(devEndpointARN(cl, aws.ToString(resource.Item.(types.DevEndpoint).EndpointName)))
return diag.WrapError(resource.Set(c.Name, arn))
}
func resolveGlueDevEndpointTags(ctx context.Context, meta schema.ClientMeta, resource *schema.Resource, c schema.Column) error {
cl := meta.(*client.Client)
svc := cl.Services().Glue
result, err := svc.GetTags(ctx, &glue.GetTagsInput{
ResourceArn: aws.String(devEndpointARN(cl, aws.ToString(resource.Item.(types.DevEndpoint).EndpointName))),
})
if err != nil {
if cl.IsNotFoundError(err) {
return nil
}
return diag.WrapError(err)
}
return diag.WrapError(resource.Set(c.Name, result.Tags))
}

// ====================================================================================================================
// User Defined Helpers
// ====================================================================================================================

func devEndpointARN(cl *client.Client, name string) string {
return cl.ARN(client.GlueService, "devEndpoint", name)
}
55 changes: 55 additions & 0 deletions resources/services/glue/dev_endpoints.hcl
Original file line number Diff line number Diff line change
@@ -0,0 +1,55 @@
service = "aws"
output_directory = "."
add_generate = true


description_modifier "remove_read_only" {
words = [" This member is required."]
}

resource "aws" "glue" "dev_endpoints" {
path = "github.com/aws/aws-sdk-go-v2/service/glue/types.DevEndpoint"
ignoreError "IgnoreAccessDenied" {
path = "github.com/cloudquery/cq-provider-aws/client.IgnoreAccessDeniedServiceDisabled"
}
deleteFilter "AccountRegionFilter" {
path = "github.com/cloudquery/cq-provider-aws/client.DeleteAccountRegionFilter"
}
multiplex "AwsAccountRegion" {
path = "github.com/cloudquery/cq-provider-aws/client.ServiceAccountRegionMultiplexer"
params = ["glue"]
}
options {
primary_keys = ["arn"]
}
userDefinedColumn "account_id" {
description = "The AWS Account ID of the resource."
type = "string"
resolver "resolveAWSAccount" {
path = "github.com/cloudquery/cq-provider-aws/client.ResolveAWSAccount"
}
}
userDefinedColumn "region" {
type = "string"
description = "The AWS Region of the resource."
resolver "resolveAWSRegion" {
path = "github.com/cloudquery/cq-provider-aws/client.ResolveAWSRegion"
}
}
userDefinedColumn "arn" {
type = "string"
description = "The Amazon Resource Name (ARN) of the workflow."
generate_resolver = true
}

column "endpoint_name" {
rename = "name"
}


userDefinedColumn "tags" {
type = "json"
description = "Resource tags."
generate_resolver = true
}
}
Loading