Linearly Transform a Numeric Target to Match Given Boundaries

Linearly transforms a numeric target of a TaskRegr so it is between lower and upper. The formula for this is $x' = offset + x * scale$, where $scale$ is $(upper - lower) / (max(x) - min(x))$ and $offset$ is $-min(x) * scale + lower$. The same transformation is applied during training and prediction.

Format

R6Class object inheriting from PipeOpTargetTrafo/PipeOp

Construction

PipeOpTargetTrafoScaleRange$new(id = "targettrafoscalerange", param_vals = list())

id :: character(1)
Identifier of resulting object, default "targettrafoscalerange".
param_vals :: named list
List of hyperparameter settings, overwriting the hyperparameter settings that would otherwise be set during construction. Default list().

Input and Output Channels

Input and output channels are inherited from PipeOpTargetTrafo.

State

The $state is a named list containing the slots $offset and $scale.

Parameters

The parameters are the parameters inherited from PipeOpTargetTrafo, as well as:

lower :: numeric(1)
Target value of smallest item of input target. Initialized to 0.
upper :: numeric(1)
Target value of greatest item of input target. Initialized to 1.

Internals

Overloads PipeOpTargetTrafo's .get_state(), .transform(), and .invert(). Should be used in combination with PipeOpTargetInvert.

Fields

Only fields inherited from PipeOp.

Methods

Only methods inherited from PipeOpTargetTrafo/PipeOp.

Examples

library(mlr3)
task = tsk("boston_housing")
po = PipeOpTargetTrafoScaleRange$new()

po$train(list(task))
#> $fun
#> NULL
#> 
#> $output
#> 
#> ── <TaskRegr> (506x18): Boston Housing Prices ──────────────────────────────────
#> • Target: cmedv.scaled
#> • Properties: -
#> • Features (17):
#>   • dbl (12): age, b, crim, dis, indus, lat, lon, lstat, nox, ptratio, rm, zn
#>   • int (3): rad, tax, tract
#>   • fct (2): chas, town
#> 
po$predict(list(task))
#> $fun
#> function (inputs) 
#> {
#>     assert_list(inputs, len = 1L, types = "Prediction")
#>     list(private$.invert(inputs[[1L]], predict_phase_state))
#> }
#> <bytecode: 0x556148458260>
#> <environment: 0x55615ba18b88>
#> 
#> $output
#> 
#> ── <TaskRegr> (506x18): Boston Housing Prices ──────────────────────────────────
#> • Target: cmedv.scaled
#> • Properties: -
#> • Features (17):
#>   • dbl (12): age, b, crim, dis, indus, lat, lon, lstat, nox, ptratio, rm, zn
#>   • int (3): rad, tax, tract
#>   • fct (2): chas, town
#> 

#syntactic sugar for a graph using ppl():
ttscalerange = ppl("targettrafo", trafo_pipeop = PipeOpTargetTrafoScaleRange$new(),
  graph = PipeOpLearner$new(LearnerRegrRpart$new()))
ttscalerange$train(task)
#> $targetinvert.output
#> NULL
#> 
ttscalerange$predict(task)
#> $targetinvert.output
#> 
#> ── <PredictionRegr> for 506 observations: ──────────────────────────────────────
#>  row_ids truth response
#>        1  24.0 24.53538
#>        2  21.6 26.91481
#>        3  34.7 32.96875
#>      ---   ---      ---
#>      504  23.9 24.53538
#>      505  22.0 24.53538
#>      506  19.0 20.96400
#> 
ttscalerange$state$regr.rpart
#> $model
#> n= 506 
#> 
#> node), split, n, deviance, yval
#>       * denotes terminal node
#> 
#>  1) root 506 21.0260400 0.3895301  
#>    2) town=Arlington,Ashland,Beverly,Boston Allston-Brighton,Boston Charlestown,Boston Dorchester,Boston Downtown,Boston East Boston,Boston Forest Hills,Boston Hyde Park,Boston Mattapan,Boston North End,Boston Roxbury,Boston Savin Hill,Boston South Boston,Boston West Roxbury,Braintree,Burlington,Cambridge,Chelsea,Danvers,Dedham,Everett,Framingham,Hamilton,Hanover,Holbrook,Hull,Lynn,Malden,Marshfield,Medford,Melrose,Middleton,Millis,Nahant,Natick,Norfolk,North Reading,Norwell,Norwood,Peabody,Pembroke,Quincy,Randolph,Reading,Revere,Rockland,Salem,Sargus,Scituate,Sharon,Somerville,Stoneham,Wakefield,Walpole,Waltham,Watertown,Weymouth,Wilmington,Winthrop,Woburn 400  7.5706490 0.3174944  
#>      4) lstat>=14.4 176  1.6065670 0.2189646  
#>        8) town=Boston Charlestown,Boston East Boston,Boston Forest Hills,Boston North End,Boston Roxbury,Boston Savin Hill,Boston South Boston,Chelsea,Lynn 93  0.4849460 0.1569654 *
#>        9) town=Arlington,Beverly,Boston Allston-Brighton,Boston Dorchester,Boston Downtown,Boston Hyde Park,Boston Mattapan,Cambridge,Everett,Framingham,Malden,Medford,Middleton,Norwood,Peabody,Quincy,Revere,Salem,Somerville,Waltham,Watertown 83  0.3635828 0.2884337 *
#>      5) lstat< 14.4 224  2.9129590 0.3949107  
#>       10) lstat>=4.63 215  0.9995600 0.3787494  
#>         20) lstat>=7.765 150  0.5226398 0.3547556 *
#>         21) lstat< 7.765 65  0.1912833 0.4341197 *
#>       11) lstat< 4.63 9  0.5157443 0.7809877 *
#>    3) town=Bedford,Belmont,Boston Back Bay,Boston Beacon Hill,Brookline,Canton,Cohasset,Concord,Dover,Duxbury,Hingham,Lexington,Lincoln,Lynnfield,Manchester,Marblehead,Medfield,Milton,Needham,Newton,Sherborn,Sudbury,Swampscott,Topsfield,Wayland,Wellesley,Wenham,Weston,Westwood,Winchester 106  3.5470870 0.6613627  
#>      6) rm< 7.437 82  1.5639410 0.5961518  
#>       12) crim< 4.12641 75  0.6617538 0.5730963  
#>         24) rm< 6.727 27  0.1925600 0.4869959 *
#>         25) rm>=6.727 48  0.1564460 0.6215278 *
#>       13) crim>=4.12641 7  0.4351788 0.8431746 *
#>      7) rm>=7.437 24  0.4430451 0.8841667 *
#> 
#> $param_vals
#> $param_vals$xval
#> [1] 0
#> 
#> 
#> $log
#> Empty data.table (0 rows and 3 cols): stage,class,msg
#> 
#> $train_time
#> [1] 0.007
#> 
#> $task_hash
#> [1] "88d153e8827d7aff"
#> 
#> $feature_names
#>  [1] "age"     "b"       "chas"    "crim"    "dis"     "indus"   "lat"    
#>  [8] "lon"     "lstat"   "nox"     "ptratio" "rad"     "rm"      "tax"    
#> [15] "town"    "tract"   "zn"     
#> 
#> $validate
#> NULL
#> 
#> $mlr3_version
#> [1] ‘1.1.0’
#> 
#> $data_prototype
#> Empty data.table (0 rows and 18 cols): cmedv.scaled,age,b,chas,crim,dis...
#> 
#> $task_prototype
#> Empty data.table (0 rows and 18 cols): cmedv.scaled,age,b,chas,crim,dis...
#> 
#> $train_task
#> 
#> ── <TaskRegr> (506x18): Boston Housing Prices ──────────────────────────────────
#> • Target: cmedv.scaled
#> • Properties: -
#> • Features (17):
#>   • dbl (12): age, b, crim, dis, indus, lat, lon, lstat, nox, ptratio, rm, zn
#>   • int (3): rad, tax, tract
#>   • fct (2): chas, town
#> 
#> attr(,"class")
#> [1] "learner_state" "list"