74
74
"tests" ,
75
75
"fixture_data" ,
76
76
"outliering" ,
77
- "winsorisation " ,
77
+ "winsorise " ,
78
78
f"{ scenario_category } _scenarios" ,
79
79
"*_input.csv" ,
80
80
)
94
94
def test_input_not_a_dataframe ():
95
95
with pytest .raises (TypeError ):
96
96
# noinspection PyTypeChecker
97
- outliering .winsorisation ("not_a_dataframe" , * params )
97
+ outliering .winsorise ("not_a_dataframe" , * params )
98
98
99
99
100
100
# --- Test if params not strings ---
@@ -106,7 +106,7 @@ def test_params_not_string(fxt_load_test_csv):
106
106
dataframe_columns ,
107
107
dataframe_types ,
108
108
"outliering" ,
109
- "winsorisation " ,
109
+ "winsorise " ,
110
110
"unit" ,
111
111
"basic_functionality" ,
112
112
)
@@ -120,7 +120,7 @@ def test_params_not_string(fxt_load_test_csv):
120
120
outlier_weight_col ,
121
121
)
122
122
with pytest .raises (TypeError ):
123
- outliering .winsorisation (test_dataframe , * bad_params )
123
+ outliering .winsorise (test_dataframe , * bad_params )
124
124
125
125
126
126
# --- Test if params null ---
@@ -132,7 +132,7 @@ def test_params_null(fxt_load_test_csv):
132
132
dataframe_columns ,
133
133
dataframe_types ,
134
134
"outliering" ,
135
- "winsorisation " ,
135
+ "winsorise " ,
136
136
"unit" ,
137
137
"basic_functionality" ,
138
138
)
@@ -146,7 +146,7 @@ def test_params_null(fxt_load_test_csv):
146
146
outlier_weight_col ,
147
147
)
148
148
with pytest .raises (ValueError ):
149
- outliering .winsorisation (test_dataframe , * bad_params )
149
+ outliering .winsorise (test_dataframe , * bad_params )
150
150
151
151
152
152
# --- Test validation fail if mismatched calibration cols ---
@@ -158,7 +158,7 @@ def test_params_mismatched_calibration_cols(fxt_load_test_csv):
158
158
dataframe_columns ,
159
159
dataframe_types ,
160
160
"outliering" ,
161
- "winsorisation " ,
161
+ "winsorise " ,
162
162
"unit" ,
163
163
"basic_functionality" ,
164
164
)
@@ -173,7 +173,7 @@ def test_params_mismatched_calibration_cols(fxt_load_test_csv):
173
173
calibration_weight_col ,
174
174
)
175
175
with pytest .raises (TypeError ):
176
- outliering .winsorisation (test_dataframe , * bad_params )
176
+ outliering .winsorise (test_dataframe , * bad_params )
177
177
178
178
179
179
# --- Test validation fail if nulls in data ---
@@ -185,12 +185,12 @@ def test_dataframe_nulls_in_data(fxt_load_test_csv):
185
185
dataframe_columns ,
186
186
dataframe_types ,
187
187
"outliering" ,
188
- "winsorisation " ,
188
+ "winsorise " ,
189
189
"unit" ,
190
190
"null_value_present" ,
191
191
)
192
192
with pytest .raises (outliering .ValidationError ):
193
- outliering .winsorisation (test_dataframe , * params )
193
+ outliering .winsorise (test_dataframe , * params )
194
194
195
195
196
196
# --- Test if cols missing from input dataframe(s) ---
@@ -202,13 +202,13 @@ def test_dataframe_column_missing(fxt_load_test_csv):
202
202
dataframe_columns ,
203
203
dataframe_types ,
204
204
"outliering" ,
205
- "winsorisation " ,
205
+ "winsorise " ,
206
206
"unit" ,
207
207
"basic_functionality" ,
208
208
)
209
209
bad_dataframe = test_dataframe .drop (target_col )
210
210
with pytest .raises (outliering .ValidationError ):
211
- outliering .winsorisation (bad_dataframe , * params )
211
+ outliering .winsorise (bad_dataframe , * params )
212
212
213
213
214
214
# --- Test if output contents are as expected, both new columns and data ---
@@ -220,13 +220,13 @@ def test_dataframe_returned_as_expected(fxt_spark_session, fxt_load_test_csv):
220
220
dataframe_columns ,
221
221
dataframe_types ,
222
222
"outliering" ,
223
- "winsorisation " ,
223
+ "winsorise " ,
224
224
"unit" ,
225
225
"basic_functionality" ,
226
226
)
227
227
# Make sure that no extra columns pass through.
228
228
test_dataframe = test_dataframe .withColumn ("bonus_column" , lit (0 ))
229
- ret_val = outliering .winsorisation (test_dataframe , * params )
229
+ ret_val = outliering .winsorise (test_dataframe , * params )
230
230
# perform action on the dataframe to trigger lazy evaluation...
231
231
ret_val .count ()
232
232
# ...and then check
@@ -242,11 +242,11 @@ def test_dataframe_expected_columns(fxt_spark_session, fxt_load_test_csv):
242
242
dataframe_columns ,
243
243
dataframe_types ,
244
244
"outliering" ,
245
- "winsorisation " ,
245
+ "winsorise " ,
246
246
"unit" ,
247
247
"basic_functionality" ,
248
248
)
249
- ret_val = outliering .winsorisation (
249
+ ret_val = outliering .winsorise (
250
250
test_dataframe ,
251
251
* default_params ,
252
252
)
@@ -283,7 +283,7 @@ def test_calculations(fxt_load_test_csv, scenario_type, scenario):
283
283
dataframe_columns ,
284
284
dataframe_types ,
285
285
"outliering" ,
286
- "winsorisation " ,
286
+ "winsorise " ,
287
287
scenario_type ,
288
288
f"{ scenario } _input" ,
289
289
)
@@ -297,12 +297,12 @@ def test_calculations(fxt_load_test_csv, scenario_type, scenario):
297
297
dataframe_columns ,
298
298
dataframe_types ,
299
299
"outliering" ,
300
- "winsorisation " ,
300
+ "winsorise " ,
301
301
scenario_type ,
302
302
f"{ scenario } _output" ,
303
303
)
304
304
305
- ret_val = outliering .winsorisation (test_dataframe , * params , ** winsorisation_kwargs )
305
+ ret_val = outliering .winsorise (test_dataframe , * params , ** winsorisation_kwargs )
306
306
307
307
assert isinstance (ret_val , type (test_dataframe ))
308
308
sort_col_list = [reference_col , period_col ]
@@ -320,13 +320,13 @@ def test_winsorise_different_stratum_l_values_in_same_period_fails(fxt_load_test
320
320
dataframe_columns ,
321
321
dataframe_types ,
322
322
"outliering" ,
323
- "winsorisation " ,
323
+ "winsorise " ,
324
324
"unit" ,
325
325
"different_l_values_stratum_same_period" ,
326
326
)
327
327
328
328
with pytest .raises (outliering .ValidationError ):
329
- outliering .winsorisation (
329
+ outliering .winsorise (
330
330
test_dataframe ,
331
331
* default_params ,
332
332
)
@@ -340,12 +340,12 @@ def test_winsorise_different_stratum_l_values_in_different_periods_succeeds(
340
340
dataframe_columns ,
341
341
dataframe_types ,
342
342
"outliering" ,
343
- "winsorisation " ,
343
+ "winsorise " ,
344
344
"unit" ,
345
345
"different_l_values_stratum_different_periods" ,
346
346
)
347
347
348
- outliering .winsorisation (
348
+ outliering .winsorise (
349
349
test_dataframe ,
350
350
* default_params ,
351
351
)
0 commit comments