Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

July 17, 2023 release -- config updates #295

Merged
merged 1 commit into from
Jul 17, 2023
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions config_templates/gretel/synthetics/amplify.yml
Original file line number Diff line number Diff line change
Expand Up @@ -16,3 +16,4 @@ models:
params:
num_records: null
target_size_mb: null
auto_transform_datetimes: True
13 changes: 7 additions & 6 deletions config_templates/gretel/synthetics/default.yml
Original file line number Diff line number Diff line change
@@ -1,17 +1,18 @@
# deprecated: This configuration will be deprecated soon. Please use the "synthetics/tabular-lstm" configuration.

schema_version: "1.0"
name: "default-config"
name: "tabular-lstm"
models:
- synthetics:
data_source: __tmp__
params:
epochs: 100
vocab_size: 20000
learning_rate: 0.01
validation_split: False
epochs: auto
vocab_size: auto
learning_rate: auto
batch_size: auto
rnn_units: auto
generate:
num_records: 5000
privacy_filters:
outliers: auto
similarity: auto
similarity: auto
5 changes: 3 additions & 2 deletions config_templates/gretel/synthetics/high-dimensionality.yml
Original file line number Diff line number Diff line change
Expand Up @@ -12,8 +12,9 @@ models:
generator_lr: 0.0001
discriminator_lr: .00033
batch_size: auto
auto_transform_datetimes: False
generate:
num_records: 5000
privacy_filters:
outliers: auto
similarity: auto
outliers: null # Set to "auto" for additional protections
similarity: null # Set to "auto" for additional protections
27 changes: 14 additions & 13 deletions config_templates/gretel/synthetics/low-record-count.yml
Original file line number Diff line number Diff line change
Expand Up @@ -4,16 +4,17 @@ schema_version: "1.0"
name: "low-record-count"
models:
- actgan:
data_source: __tmp__
params:
epochs: auto
generator_dim: [1024, 1024]
discriminator_dim: [1024, 1024]
generator_lr: 0.0001
discriminator_lr: .00033
batch_size: auto
generate:
num_records: 5000
privacy_filters:
outliers: auto
similarity: auto
data_source: __tmp__
params:
epochs: auto
generator_dim: [1024, 1024]
discriminator_dim: [1024, 1024]
generator_lr: 0.0001
discriminator_lr: .00033
batch_size: auto
auto_transform_datetimes: False
generate:
num_records: 5000
privacy_filters:
outliers: null # Set to "auto" for additional protections
similarity: null # Set to "auto" for additional protections
5 changes: 3 additions & 2 deletions config_templates/gretel/synthetics/tabular-actgan.yml
Original file line number Diff line number Diff line change
Expand Up @@ -12,8 +12,9 @@ models:
generator_lr: 0.0001
discriminator_lr: .00033
batch_size: auto
auto_transform_datetimes: False
generate:
num_records: 5000
privacy_filters:
outliers: auto
similarity: auto
outliers: null # Set to "auto" for additional protections
similarity: null # Set to "auto" for additional protections
22 changes: 5 additions & 17 deletions config_templates/gretel/synthetics/tabular-lstm-evaluate.yml
Original file line number Diff line number Diff line change
@@ -1,19 +1,10 @@
# Blueprint configuration for evaluating synthetic data on classification and regression models

### IMPORTANT: rename "target" to match the label/target header of your data ###

# See https://docs.gretel.ai/reference/evaluate/evaluate-tasks/classification and
# https://docs.gretel.ai/reference/evaluate/evaluate-tasks/regression
# for detailed info on all config options

# You can substitute any synthetic model. For example, to use the Gretel ACTGAN or TabularDP models,
# edit the default config and add the "evaluate" parameters below.

schema_version: "1.0"
name: "tabular-lstm-evaluate"
models:

# This config uses the Gretel LSTM model to generate synthetic data.
# You can substitute any synthetic model. For example, to use the Gretel ACTGAN model,
# copy the config from "tabular-actgan.yml"
- synthetics:
data_source: __tmp__
params:
Expand All @@ -28,14 +19,11 @@ models:
outliers: auto
similarity: auto
evaluate:

### Indicate classification or regression
task: classification

### IMPORTANT: rename to match the label/target header of your data
target: "y"
task: classification # Indicate classification or regression
target: "y" # The column in your dataset containing the desired label

### Optional metrics. See docs for all config options: https://docs.gretel.ai/reference/evaluate/evaluate-tasks/
### Optional metrics
# holdout: null
# metric: null
# models: null