-
Notifications
You must be signed in to change notification settings - Fork 17
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
- Loading branch information
1 parent
0c754f9
commit 9caa66e
Showing
24 changed files
with
128 additions
and
131 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,5 +1,5 @@ | ||
name: 'dbt_ml_preprocessing' | ||
version: '1.0.0' | ||
version: '1.0.1' | ||
|
||
require-dbt-version: ">=0.15.1" | ||
|
||
|
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
22 changes: 7 additions & 15 deletions
22
integration_tests/macros/quantile_transformer_model_macro.sql
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,24 +1,16 @@ | ||
-- macro is only supported in Snowflake | ||
{% macro snowflake__quantile_transformer_model_macro() %} | ||
with data as ( | ||
|
||
{{ dbt_ml_preprocessing.quantile_transformer( ref('data_quantile_transformer') ,'col_to_transform') }} | ||
|
||
) | ||
select * from data | ||
{% endmacro %} | ||
|
||
-- other adapters we generate an empty test result to force a test pass | ||
{% macro bigquery__quantile_transformer_model_macro() %} | ||
with data as ( | ||
|
||
{{ dbt_ml_preprocessing.quantile_transformer( ref('data_quantile_transformer') ,'col_to_transform') }} | ||
|
||
) | ||
select * from data | ||
{% endmacro %} | ||
|
||
-- other adapters we generate an empty test result to force a test pass | ||
-- macro not supported in other databases | ||
{% macro default__quantile_transformer_model_macro() %} | ||
select 1 as empty_result from (select 1) where 1=2 | ||
select 1 from (select 1) where 1=2 -- empty result set so that test passes | ||
{% endmacro %} | ||
|
||
-- macro not supported in sqlserver | ||
{% macro sqlserver__quantile_transformer_model_macro() %} | ||
select null as '1' where 1=2 -- empty result set so that test passes | ||
{% endmacro %} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,16 @@ | ||
{% macro default__standard_scaler_model_macro() %} | ||
with data as ( | ||
{{ dbt_ml_preprocessing.standard_scaler( ref('data_standard_scaler') ,['col_to_scale_1','col_to_scale_2']) }} | ||
) | ||
select id_col, | ||
col_to_scale_1, | ||
col_to_scale_2, | ||
round(col_to_scale_1_scaled,10) as col_to_scale_1_scaled, | ||
round(col_to_scale_2_scaled,10) as col_to_scale_2_scaled | ||
from data | ||
{% endmacro %} | ||
|
||
-- macro is not supported in mssql | ||
{% macro sqlserver__standard_scaler_model_macro() %} | ||
select null as '1' where 1=2 | ||
{% endmacro %} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
8 changes: 1 addition & 7 deletions
8
integration_tests/models/sql/test_k_bins_discretizer_50_bins.sql
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,10 +1,4 @@ | ||
{{ config(materialized='view') }} | ||
|
||
with data as ( | ||
{{ dbt_ml_preprocessing.k_bins_discretizer( ref('data_k_bins_discretizer') ,['col_to_bin_1'],n_bins=50) }} | ||
|
||
{{ dbt_ml_preprocessing.k_bins_discretizer( ref('data_k_bins_discretizer') ,['col_to_bin_1'],n_bins=50) }} | ||
|
||
) | ||
|
||
select * from data | ||
order by id_col |
9 changes: 1 addition & 8 deletions
9
integration_tests/models/sql/test_k_bins_discretizer_default_bins.sql
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,10 +1,3 @@ | ||
{{ config(materialized='view') }} | ||
|
||
with data as ( | ||
|
||
{{ dbt_ml_preprocessing.k_bins_discretizer( ref('data_k_bins_discretizer') ,['col_to_bin_1','col_to_bin_2']) }} | ||
|
||
) | ||
|
||
select * from data | ||
order by id_col | ||
{{ dbt_ml_preprocessing.k_bins_discretizer( ref('data_k_bins_discretizer') ,['col_to_bin_1','col_to_bin_2']) }} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,9 +1,4 @@ | ||
{{ config(materialized='table') }} -- as a table because Redshift can't handle the equality checker query when it's a view | ||
|
||
with data as ( | ||
{{ dbt_ml_preprocessing.label_encoder( ref('data_label_encoder') ,'col_to_label_encode') }} | ||
|
||
{{ dbt_ml_preprocessing.label_encoder( ref('data_label_encoder') ,'col_to_label_encode') }} | ||
|
||
) | ||
|
||
select * from data |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,9 +1,3 @@ | ||
{{ config(materialized='view') }} | ||
|
||
with data as ( | ||
|
||
{{ dbt_ml_preprocessing.max_abs_scaler( ref('data_max_abs_scaler') ,['col_to_scale']) }} | ||
|
||
) | ||
|
||
select * from data | ||
{{ dbt_ml_preprocessing.max_abs_scaler( ref('data_max_abs_scaler') ,['col_to_scale']) }} |
7 changes: 1 addition & 6 deletions
7
integration_tests/models/sql/test_max_abs_scaler_with_column_selection.sql
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,9 +1,4 @@ | ||
{{ config(materialized='view') }} | ||
|
||
with data as ( | ||
{{ dbt_ml_preprocessing.max_abs_scaler( ref('data_max_abs_scaler') ,['col_to_scale'],include_columns=['id_col']) }} | ||
|
||
{{ dbt_ml_preprocessing.max_abs_scaler( ref('data_max_abs_scaler') ,['col_to_scale'],include_columns=['id_col']) }} | ||
|
||
) | ||
|
||
select * from data |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,9 +1,3 @@ | ||
{{ config(materialized='view') }} | ||
|
||
with data as ( | ||
|
||
{{ dbt_ml_preprocessing.min_max_scaler( ref('data_max_abs_scaler') ,['col_to_scale']) }} | ||
|
||
) | ||
|
||
select * from data | ||
{{ dbt_ml_preprocessing.min_max_scaler( ref('data_max_abs_scaler') ,['col_to_scale']) }} |
8 changes: 1 addition & 7 deletions
8
integration_tests/models/sql/test_min_max_scaler_with_column_selection.sql
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,9 +1,3 @@ | ||
{{ config(materialized='view') }} | ||
|
||
with data as ( | ||
|
||
{{ dbt_ml_preprocessing.min_max_scaler( ref('data_max_abs_scaler') ,['col_to_scale'],include_columns=['id_col']) }} | ||
|
||
) | ||
|
||
select * from data | ||
{{ dbt_ml_preprocessing.min_max_scaler( ref('data_max_abs_scaler') ,['col_to_scale'],include_columns=['id_col']) }} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,9 +1,3 @@ | ||
{{ config(materialized='view') }} | ||
|
||
with data as ( | ||
|
||
{{ dbt_ml_preprocessing.normalizer( ref('data_normalizer') ,['col1','col2','col3','col4']) }} | ||
|
||
) | ||
|
||
select * from data | ||
{{ dbt_ml_preprocessing.normalizer( ref('data_normalizer') ,['col1','col2','col3','col4']) }} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,9 +1,3 @@ | ||
{{ config(materialized='view') }} | ||
|
||
with data as ( | ||
|
||
{{ dbt_ml_preprocessing.one_hot_encoder( ref('data_one_hot_encoder') ,'column_to_encode',handle_unknown='ignore') }} | ||
|
||
) | ||
|
||
select * from data | ||
{{ dbt_ml_preprocessing.one_hot_encoder( ref('data_one_hot_encoder') ,'column_to_encode',handle_unknown='ignore') }} |
6 changes: 1 addition & 5 deletions
6
integration_tests/models/sql/test_one_hot_encoder_category_selected.sql
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,12 +1,8 @@ | ||
{{ config(materialized='view') }} | ||
|
||
with data as ( | ||
|
||
{{ dbt_ml_preprocessing.one_hot_encoder( source_table=ref('data_one_hot_encoder'), | ||
{{ dbt_ml_preprocessing.one_hot_encoder( source_table=ref('data_one_hot_encoder'), | ||
source_column='column_to_encode', | ||
categories=['A','B'], | ||
handle_unknown='ignore') }} | ||
|
||
) | ||
|
||
select * from data |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,9 +1,3 @@ | ||
{{ config(materialized='view') }} | ||
|
||
with data as ( | ||
|
||
{{ dbt_ml_preprocessing.robust_scaler( ref('data_robust_scaler') ,['col_to_scale']) }} | ||
|
||
) | ||
|
||
select * from data | ||
{{ dbt_ml_preprocessing.robust_scaler( ref('data_robust_scaler') ,['col_to_scale']) }} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,14 +1,5 @@ | ||
{{ config(materialized='view') }} | ||
{{ config(materialized='table') }} | ||
|
||
with data as ( | ||
|
||
{{ dbt_ml_preprocessing.standard_scaler( ref('data_standard_scaler') ,['col_to_scale_1','col_to_scale_2']) }} | ||
|
||
) | ||
|
||
select id_col, | ||
col_to_scale_1, | ||
col_to_scale_2, | ||
round(col_to_scale_1_scaled,10) as col_to_scale_1_scaled, | ||
round(col_to_scale_2_scaled,10) as col_to_scale_2_scaled | ||
from data | ||
-- test model is generated by adapter-specific macro, | ||
-- because the standard_scaler is not supported by all DBs | ||
{{ adapter.dispatch('standard_scaler_model_macro')() }} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Oops, something went wrong.