From 0d872ed33b43f9a953cc83c8ea158c5b24f0f102 Mon Sep 17 00:00:00 2001 From: "jeremie.desgagne.bouchard" Date: Wed, 7 Sep 2022 16:21:17 -0400 Subject: [PATCH 1/2] up --- src/MLJ.jl | 5 + src/find_split.jl | 163 ++++++++-------- src/fit.jl | 2 +- src/models.jl | 4 +- src/predict.jl | 2 +- test/monotonic.jl | 479 +++++++++++++++++++++++----------------------- test/runtests.jl | 1 + 7 files changed, 336 insertions(+), 320 deletions(-) diff --git a/src/MLJ.jl b/src/MLJ.jl index d70ae16f..4a201d48 100644 --- a/src/MLJ.jl +++ b/src/MLJ.jl @@ -140,6 +140,8 @@ EvoTreeRegressor is used to perform the following regression types: - `rowsample=1.0`: Proportion of rows that are sampled at each iteration to build the tree. Should be in `]0, 1]`. - `colsample=1.0`: Proportion of columns / features that are sampled at each iteration to build the tree. Should be in `]0, 1]`. - `nbins=32`: Number of bins into which each feature is quantized. Buckets are defined based on quantiles, hence resulting in equal weight bins. +- `monotone_constraints=Dict{Int, Int}()`: Specify monotonic constraints using a dict where the key is the feature index and the value the applicable constraint (-1=decreasing, 0=none, 1=increasing). + Only `:linear` and `:logistic` losses are supported at the moment. - `rng=123`: Either an integer used as a seed to the random number generator or an actual random number generator (`::Random.AbstractRNG`). - `metric::Symbol=:none`: Metric that is to be tracked during the training process. One of: `:none`, `:mse`, `:mae`, `:logloss`. - `device="cpu"`: Hardware device to use for computations. Can be either `"cpu"` or `"gpu"`. Only `:linear` and `:logistic` losses are supported on GPU. @@ -365,6 +367,7 @@ EvoTreeCount is used to perform Poisson probabilistic regression on count target - `rowsample=1.0`: Proportion of rows that are sampled at each iteration to build the tree. Should be `]0, 1]`. - `colsample=1.0`: Proportion of columns / features that are sampled at each iteration to build the tree. Should be `]0, 1]`. - `nbins=32`: Number of bins into which each feature is quantized. Buckets are defined based on quantiles, hence resulting in equal weight bins. +- `monotone_constraints=Dict{Int, Int}()`: Specify monotonic constraints using a dict where the key is the feature index and the value the applicable constraint (-1=decreasing, 0=none, 1=increasing). - `rng=123`: Either an integer used as a seed to the random number generator or an actual random number generator (`::Random.AbstractRNG`). - `metric::Symbol=:none`: Metric that is to be tracked during the training process. One of: `:none`, `:poisson`, `:mae`, `:mse`. - `device="cpu"`: Hardware device to use for computations. Only CPU is supported at the moment. @@ -485,6 +488,8 @@ EvoTreeGaussian is used to perform Gaussain probabilistic regression, fitting μ - `rowsample=1.0`: Proportion of rows that are sampled at each iteration to build the tree. Should be in `]0, 1]`. - `colsample=1.0`: Proportion of columns / features that are sampled at each iteration to build the tree. Should be in `]0, 1]`. - `nbins=32`: Number of bins into which each feature is quantized. Buckets are defined based on quantiles, hence resulting in equal weight bins. +- `monotone_constraints=Dict{Int, Int}()`: Specify monotonic constraints using a dict where the key is the feature index and the value the applicable constraint (-1=decreasing, 0=none, 1=increasing). + !Experimental feature: note that for Gaussian regression, constraints may not be enforce systematically. - `rng=123`: Either an integer used as a seed to the random number generator or an actual random number generator (`::Random.AbstractRNG`). - `metric::Symbol=:none`: Metric that is to be tracked during the training process. One of: `:none`, `:gaussian`. - `device="cpu"`: Hardware device to use for computations. Can be either `"cpu"` or `"gpu"`. diff --git a/src/find_split.jl b/src/find_split.jl index 1f84c6f2..db3f22fe 100644 --- a/src/find_split.jl +++ b/src/find_split.jl @@ -127,7 +127,7 @@ function update_hist!( 𝑖::AbstractVector{S}, 𝑗::AbstractVector{S}, K) where {L<:GradientRegression,T,S} - @inbounds @threads for j in 𝑗 + @threads for j in 𝑗 @inbounds @simd for i in 𝑖 hid = 3 * X_bin[i, j] - 2 hist[j][hid] += δ𝑤[1, i] @@ -150,7 +150,7 @@ function update_hist!( 𝑖::AbstractVector{S}, 𝑗::AbstractVector{S}, K) where {L<:GaussianRegression,T,S} - @inbounds @threads for j in 𝑗 + @threads for j in 𝑗 @inbounds @simd for i in 𝑖 hid = 5 * X_bin[i, j] - 4 hist[j][hid] += δ𝑤[1, i] @@ -175,8 +175,8 @@ function update_hist!( 𝑖::AbstractVector{S}, 𝑗::AbstractVector{S}, K) where {L,T,S} - @inbounds @threads for j in 𝑗 - @inbounds @simd for i in 𝑖 + @threads for j in 𝑗 + @inbounds for i in 𝑖 hid = (2 * K + 1) * (X_bin[i, j] - 1) for k = 1:(2*K+1) hist[j][hid+k] += δ𝑤[k, i] @@ -187,86 +187,91 @@ function update_hist!( end -""" - update_gains! - GradientRegression -""" -function update_gains!( - loss::L, - node::TrainNode{T}, - 𝑗::Vector{S}, - params::EvoTypes, K, monotone_constraints) where {L<:GradientRegression,T,S} - - @inbounds @threads for j in 𝑗 - node.hL[j][1] = node.h[j][1] - node.hL[j][2] = node.h[j][2] - node.hL[j][3] = node.h[j][3] - - node.hR[j][1] = node.∑[1] - node.h[j][1] - node.hR[j][2] = node.∑[2] - node.h[j][2] - node.hR[j][3] = node.∑[3] - node.h[j][3] - @inbounds for bin = 2:params.nbins - binid = 3 * bin - 2 - node.hL[j][binid] = node.hL[j][binid-3] + node.h[j][binid] - node.hL[j][binid+1] = node.hL[j][binid-2] + node.h[j][binid+1] - node.hL[j][binid+2] = node.hL[j][binid-1] + node.h[j][binid+2] - - node.hR[j][binid] = node.hR[j][binid-3] - node.h[j][binid] - node.hR[j][binid+1] = node.hR[j][binid-2] - node.h[j][binid+1] - node.hR[j][binid+2] = node.hR[j][binid-1] - node.h[j][binid+2] - - end - hist_gains_cpu!(loss, view(node.gains, :, j), node.hL[j], node.hR[j], params, K, monotone_constraints[j]) - end - return nothing -end +# """ +# update_gains! +# GradientRegression +# """ +# function update_gains!( +# loss::L, +# node::TrainNode{T}, +# 𝑗::Vector{S}, +# params::EvoTypes, K, monotone_constraints) where {L<:GradientRegression,T,S} + +# @threads for j in 𝑗 +# node.hL[j][1] = node.h[j][1] +# node.hL[j][2] = node.h[j][2] +# node.hL[j][3] = node.h[j][3] + +# node.hR[j][1] = node.∑[1] - node.h[j][1] +# node.hR[j][2] = node.∑[2] - node.h[j][2] +# node.hR[j][3] = node.∑[3] - node.h[j][3] +# @inbounds @simd for bin = 2:params.nbins +# binid = 3 * bin - 2 +# node.hL[j][binid] = node.hL[j][binid-3] + node.h[j][binid] +# node.hL[j][binid+1] = node.hL[j][binid-2] + node.h[j][binid+1] +# node.hL[j][binid+2] = node.hL[j][binid-1] + node.h[j][binid+2] + +# node.hR[j][binid] = node.hR[j][binid-3] - node.h[j][binid] +# node.hR[j][binid+1] = node.hR[j][binid-2] - node.h[j][binid+1] +# node.hR[j][binid+2] = node.hR[j][binid-1] - node.h[j][binid+2] -""" - update_gains! - GaussianRegression -""" -function update_gains!( - loss::L, - node::TrainNode{T}, - 𝑗::Vector{S}, - params::EvoTypes, K, monotone_constraints) where {L<:GaussianRegression,T,S} +# end +# hist_gains_cpu!(loss, view(node.gains, :, j), node.hL[j], node.hR[j], params, K, monotone_constraints[j]) +# end +# return nothing +# end - @inbounds @threads for j in 𝑗 - node.hL[j][1] = node.h[j][1] - node.hL[j][2] = node.h[j][2] - node.hL[j][3] = node.h[j][3] - node.hL[j][4] = node.h[j][4] - node.hL[j][5] = node.h[j][5] - - node.hR[j][1] = node.∑[1] - node.h[j][1] - node.hR[j][2] = node.∑[2] - node.h[j][2] - node.hR[j][3] = node.∑[3] - node.h[j][3] - node.hR[j][4] = node.∑[4] - node.h[j][4] - node.hR[j][5] = node.∑[5] - node.h[j][5] - @inbounds for bin in 2:params.nbins - binid = 5 * bin - 4 - node.hL[j][binid] = node.hL[j][binid-5] + node.h[j][binid] - node.hL[j][binid+1] = node.hL[j][binid-4] + node.h[j][binid+1] - node.hL[j][binid+2] = node.hL[j][binid-3] + node.h[j][binid+2] - node.hL[j][binid+3] = node.hL[j][binid-2] + node.h[j][binid+3] - node.hL[j][binid+4] = node.hL[j][binid-1] + node.h[j][binid+4] - - node.hR[j][binid] = node.hR[j][binid-5] - node.h[j][binid] - node.hR[j][binid+1] = node.hR[j][binid-4] - node.h[j][binid+1] - node.hR[j][binid+2] = node.hR[j][binid-3] - node.h[j][binid+2] - node.hR[j][binid+3] = node.hR[j][binid-2] - node.h[j][binid+3] - node.hR[j][binid+4] = node.hR[j][binid-1] - node.h[j][binid+4] +# """ +# update_gains! +# GaussianRegression +# """ +# function update_gains!( +# loss::L, +# node::TrainNode{T}, +# 𝑗::Vector{S}, +# params::EvoTypes, K, monotone_constraints) where {L<:GaussianRegression,T,S} + +# @threads for j in 𝑗 +# node.hL[j][1] = node.h[j][1] +# node.hL[j][2] = node.h[j][2] +# node.hL[j][3] = node.h[j][3] +# node.hL[j][4] = node.h[j][4] +# node.hL[j][5] = node.h[j][5] + +# node.hR[j][1] = node.∑[1] - node.h[j][1] +# node.hR[j][2] = node.∑[2] - node.h[j][2] +# node.hR[j][3] = node.∑[3] - node.h[j][3] +# node.hR[j][4] = node.∑[4] - node.h[j][4] +# node.hR[j][5] = node.∑[5] - node.h[j][5] +# @inbounds @simd for bin in 2:params.nbins +# binid = 5 * bin - 4 +# node.hL[j][binid] = node.hL[j][binid-5] + node.h[j][binid] +# node.hL[j][binid+1] = node.hL[j][binid-4] + node.h[j][binid+1] +# node.hL[j][binid+2] = node.hL[j][binid-3] + node.h[j][binid+2] +# node.hL[j][binid+3] = node.hL[j][binid-2] + node.h[j][binid+3] +# node.hL[j][binid+4] = node.hL[j][binid-1] + node.h[j][binid+4] + +# node.hR[j][binid] = node.hR[j][binid-5] - node.h[j][binid] +# node.hR[j][binid+1] = node.hR[j][binid-4] - node.h[j][binid+1] +# node.hR[j][binid+2] = node.hR[j][binid-3] - node.h[j][binid+2] +# node.hR[j][binid+3] = node.hR[j][binid-2] - node.h[j][binid+3] +# node.hR[j][binid+4] = node.hR[j][binid-1] - node.h[j][binid+4] - end - hist_gains_cpu!(loss, view(node.gains, :, j), node.hL[j], node.hR[j], params, K, monotone_constraints[j]) - end - return nothing -end +# end +# hist_gains_cpu!(loss, view(node.gains, :, j), node.hL[j], node.hR[j], params, K, monotone_constraints[j]) +# end +# return nothing +# end """ - update_gains! - Generic fallback + update_gains!( + loss::L, + node::TrainNode{T}, + 𝑗::Vector{S}, + params::EvoTypes, K, monotone_constraints) where {L,T,S} + +Generic fallback """ function update_gains!( loss::L, @@ -283,7 +288,7 @@ function update_gains!( end @inbounds for bin in 2:params.nbins - @inbounds for k = 1:KK + @inbounds @simd for k = 1:KK binid = KK * (bin - 1) node.hL[j][binid+k] = node.hL[j][binid-KK+k] + node.h[j][binid+k] node.hR[j][binid+k] = node.hR[j][binid-KK+k] - node.h[j][binid+k] diff --git a/src/fit.jl b/src/fit.jl index 101d2a7e..f4d823af 100644 --- a/src/fit.jl +++ b/src/fit.jl @@ -67,7 +67,7 @@ function init_evotree(params::EvoTypes{T,U,S}, X::AbstractMatrix, Y::AbstractVec # monotone constraints vector monotone_constraints = zeros(Int32, X_size[2]) - for (k, v) in params.monotone_constraints + hasproperty(params, :monotone_constraints) && for (k, v) in params.monotone_constraints monotone_constraints[k] = v end diff --git a/src/models.jl b/src/models.jl index 7b5427af..1540584c 100644 --- a/src/models.jl +++ b/src/models.jl @@ -163,6 +163,8 @@ function EvoTreeCount(; kwargs...) if args[:loss] != :poisson error("Invalid loss: $(args[:loss]). Only `:poisson` is supported by EvoTreeCount.") + else + args[:loss] = Poisson() end args[:rng] = mk_rng(args[:rng])::Random.AbstractRNG @@ -330,7 +332,7 @@ function EvoTreeGaussian(; kwargs...) args[:rng] = mk_rng(args[:rng])::Random.AbstractRNG - model = EvoTreeCount( + model = EvoTreeGaussian( args[:loss], args[:nrounds], args[:T](args[:lambda]), diff --git a/src/predict.jl b/src/predict.jl index 5893bc81..6a0154c8 100644 --- a/src/predict.jl +++ b/src/predict.jl @@ -103,7 +103,7 @@ function pred_scalar_cpu!(::S, ∑::Vector{T}, params::EvoTypes, K) where {S<:Ga end # prediction in Leaf - MultiClassRegression -function pred_leaf_cpu!(::S, pred, n, ∑::Vector{T}, params::EvoTypes, K) where {S<:MultiClassRegression,T} +function pred_leaf_cpu!(::S, pred, n, ∑::Vector{T}, params::EvoTypes, K, δ𝑤, 𝑖) where {S<:MultiClassRegression,T} @inbounds for k = 1:K pred[k, n] = -params.eta * ∑[k] / (∑[k+K] + params.lambda * ∑[2*K+1]) end diff --git a/test/monotonic.jl b/test/monotonic.jl index eed93271..7db4c413 100644 --- a/test/monotonic.jl +++ b/test/monotonic.jl @@ -1,238 +1,241 @@ -using Revise -using Statistics -using StatsBase: sample -using EvoTrees -using EvoTrees: sigmoid, logit - -# prepare a dataset -features = rand(10_000) .* 2.5 -X = reshape(features, (size(features)[1], 1)) -Y = sin.(features) .* 0.5 .+ 0.5 -Y = logit(Y) + randn(size(Y)) .* 0.2 -Y = sigmoid(Y) -𝑖 = collect(1:size(X, 1)) -seed = 123 - -# train-eval split -𝑖_sample = sample(𝑖, size(𝑖, 1), replace=false) -train_size = 0.8 -𝑖_train = 𝑖_sample[1:floor(Int, train_size * size(𝑖, 1))] -𝑖_eval = 𝑖_sample[floor(Int, train_size * size(𝑖, 1))+1:end] - -X_train, X_eval = X[𝑖_train, :], X[𝑖_eval, :] -Y_train, Y_eval = Y[𝑖_train], Y[𝑖_eval] - -###################################### -### Linear - CPU -###################################### -# benchmark -params1 = EvoTreeRegressor( - device="cpu", - loss=:linear, metric=:mse, - nrounds=200, nbins=32, - lambda=1.0, gamma=0.0, eta=0.05, - max_depth=6, min_weight=0.0, - rowsample=0.5, colsample=1.0, rng=seed) - -model = fit_evotree(params1, X_train, Y_train, X_eval=X_eval, Y_eval=Y_eval, print_every_n=25); -preds_ref = predict(model, X_train); - -# monotonic constraint -params1 = EvoTreeRegressor( - device="cpu", - loss=:linear, metric=:mse, - nrounds=200, nbins=32, - lambda=1.0, gamma=0.0, eta=0.5, - max_depth=6, min_weight=0.0, - monotone_constraints=Dict(1 => 1), - rowsample=0.5, colsample=1.0, rng=seed) - -model = fit_evotree(params1, X_train, Y_train, X_eval=X_eval, Y_eval=Y_eval, print_every_n=25); -preds_mono = predict(model, X_train); - -using Plots -using Colors -x_perm = sortperm(X_train[:, 1]) -plot(X_train, Y_train, msize=1, mcolor="gray", mswidth=0, background_color=RGB(1, 1, 1), seriestype=:scatter, xaxis=("feature"), yaxis=("target"), legend=true, label="") -plot!(X_train[:, 1][x_perm], preds_ref[x_perm], color="navy", linewidth=1.5, label="Reference") -plot!(X_train[:, 1][x_perm], preds_mono[x_perm], color="red", linewidth=1.5, label="Monotonic") - - -###################################### -### Linear - GPU -###################################### -# benchmark -params1 = EvoTreeRegressor( - device="gpu", - loss=:linear, metric=:mse, - nrounds=200, nbins=32, - lambda=1.0, gamma=0.0, eta=0.05, - max_depth=6, min_weight=0.0, - rowsample=0.5, colsample=1.0, rng=seed) - -model = fit_evotree(params1, X_train, Y_train, X_eval=X_eval, Y_eval=Y_eval, print_every_n=25); -preds_ref = predict(model, X_train); - -# monotonic constraint -params1 = EvoTreeRegressor( - device="gpu", - loss=:linear, metric=:mse, - nrounds=200, nbins=32, - lambda=1.0, gamma=0.0, eta=0.5, - max_depth=6, min_weight=0.0, - monotone_constraints=Dict(1 => 1), - rowsample=0.5, colsample=1.0, rng=seed) - -model = fit_evotree(params1, X_train, Y_train, X_eval=X_eval, Y_eval=Y_eval, print_every_n=25); -preds_mono = predict(model, X_train); - -using Plots -using Colors -x_perm = sortperm(X_train[:, 1]) -plot(X_train, Y_train, msize=1, mcolor="gray", mswidth=0, background_color=RGB(1, 1, 1), seriestype=:scatter, xaxis=("feature"), yaxis=("target"), legend=true, label="") -plot!(X_train[:, 1][x_perm], preds_ref[x_perm], color="navy", linewidth=1.5, label="Reference") -plot!(X_train[:, 1][x_perm], preds_mono[x_perm], color="red", linewidth=1.5, label="Monotonic") - - -###################################### -### Logistic - CPU -###################################### -# benchmark -params1 = EvoTreeRegressor( - device="cpu", - loss=:logistic, metric=:logloss, - nrounds=200, nbins=32, - lambda=0.05, gamma=0.0, eta=0.05, - max_depth=6, min_weight=0.0, - rowsample=0.5, colsample=1.0, rng=seed) - -model = fit_evotree(params1, X_train, Y_train, X_eval=X_eval, Y_eval=Y_eval, print_every_n=25); -preds_ref = predict(model, X_train); - -# monotonic constraint -params1 = EvoTreeRegressor( - device="cpu", - loss=:logistic, metric=:logloss, - nrounds=200, nbins=32, - lambda=0.05, gamma=0.0, eta=0.05, - max_depth=6, min_weight=0.0, - monotone_constraints=Dict(1 => 1), - rowsample=0.5, colsample=1.0, rng=seed) - -model = fit_evotree(params1, X_train, Y_train, X_eval=X_eval, Y_eval=Y_eval, print_every_n=25); -preds_mono = predict(model, X_train); - -using Plots -using Colors -x_perm = sortperm(X_train[:, 1]) -plot(X_train, Y_train, msize=1, mcolor="gray", mswidth=0, background_color=RGB(1, 1, 1), seriestype=:scatter, xaxis=("feature"), yaxis=("target"), legend=true, label="") -plot!(X_train[:, 1][x_perm], preds_ref[x_perm], color="navy", linewidth=1.5, label="Reference") -plot!(X_train[:, 1][x_perm], preds_mono[x_perm], color="red", linewidth=1.5, label="Monotonic") - - -###################################### -### Logistic - GPU -###################################### -# benchmark -params1 = EvoTreeRegressor( - device="gpu", - loss=:logistic, metric=:logloss, - nrounds=200, nbins=32, - lambda=0.05, gamma=0.0, eta=0.05, - max_depth=6, min_weight=0.0, - rowsample=0.5, colsample=1.0, rng=seed) - -model = fit_evotree(params1, X_train, Y_train, X_eval=X_eval, Y_eval=Y_eval, print_every_n=25); -preds_ref = predict(model, X_train); - -# monotonic constraint -params1 = EvoTreeRegressor( - device="gpu", - loss=:logistic, metric=:logloss, - nrounds=200, nbins=32, - lambda=0.05, gamma=0.0, eta=0.05, - max_depth=6, min_weight=0.0, - monotone_constraints=Dict(1 => 1), - rowsample=0.5, colsample=1.0, rng=seed) - -model = fit_evotree(params1, X_train, Y_train, X_eval=X_eval, Y_eval=Y_eval, print_every_n=25); -preds_mono = predict(model, X_train); - -using Plots -using Colors -x_perm = sortperm(X_train[:, 1]) -plot(X_train, Y_train, msize=1, mcolor="gray", mswidth=0, background_color=RGB(1, 1, 1), seriestype=:scatter, xaxis=("feature"), yaxis=("target"), legend=true, label="") -plot!(X_train[:, 1][x_perm], preds_ref[x_perm], color="navy", linewidth=1.5, label="Reference") -plot!(X_train[:, 1][x_perm], preds_mono[x_perm], color="red", linewidth=1.5, label="Monotonic") - - -###################################### -### Gaussian - CPU -###################################### -# linear - benchmark -params1 = EvoTreeGaussian( - device="cpu", - metric=:gaussian, - nrounds=200, nbins=32, - lambda=1.0, gamma=0.0, eta=0.05, - max_depth=6, min_weight=0.0, - rowsample=0.5, colsample=1.0, rng=seed) - -model = fit_evotree(params1, X_train, Y_train, X_eval=X_eval, Y_eval=Y_eval, print_every_n=25); -preds_ref = predict(model, X_train); - -# monotonic constraint -params1 = EvoTreeGaussian( - device="cpu", - metric=:gaussian, - nrounds=200, nbins=32, - lambda=1.0, gamma=0.0, eta=0.5, - max_depth=6, min_weight=0.0, - monotone_constraints=Dict(1 => 1), - rowsample=0.5, colsample=1.0, rng=seed) - -model = fit_evotree(params1, X_train, Y_train, X_eval=X_eval, Y_eval=Y_eval, print_every_n=25); -preds_mono = predict(model, X_train); - -using Plots -using Colors -x_perm = sortperm(X_train[:, 1]) -plot(X_train, Y_train, msize=1, mcolor="gray", mswidth=0, background_color=RGB(1, 1, 1), seriestype=:scatter, xaxis=("feature"), yaxis=("target"), legend=true, label="") -plot!(X_train[:, 1][x_perm], preds_ref[x_perm], color="navy", linewidth=1.5, label="Reference") -plot!(X_train[:, 1][x_perm], preds_mono[x_perm], color="red", linewidth=1.5, label="Monotonic") - - -###################################### -### Gaussian - GPU -###################################### -# linear - benchmark -params1 = EvoTreeGaussian( - device="gpu", - metric=:gaussian, - nrounds=200, nbins=32, - lambda=1.0, gamma=0.0, eta=0.05, - max_depth=6, min_weight=0.0, - rowsample=0.5, colsample=1.0, rng=seed) - -model = fit_evotree(params1, X_train, Y_train, X_eval=X_eval, Y_eval=Y_eval, print_every_n=25); -preds_ref = predict(model, X_train); - -# monotonic constraint -params1 = EvoTreeGaussian( - device="gpu", - metric=:gaussian, - nrounds=200, nbins=32, - lambda=1.0, gamma=0.0, eta=0.5, - max_depth=6, min_weight=0.0, - monotone_constraints=Dict(1 => 1), - rowsample=0.5, colsample=1.0, rng=seed) - -model = fit_evotree(params1, X_train, Y_train, X_eval=X_eval, Y_eval=Y_eval, print_every_n=25); -preds_mono = predict(model, X_train); - -using Plots -using Colors -x_perm = sortperm(X_train[:, 1]) -plot(X_train, Y_train, msize=1, mcolor="gray", mswidth=0, background_color=RGB(1, 1, 1), seriestype=:scatter, xaxis=("feature"), yaxis=("target"), legend=true, label="") -plot!(X_train[:, 1][x_perm], preds_ref[x_perm], color="navy", linewidth=1.5, label="Reference") -plot!(X_train[:, 1][x_perm], preds_mono[x_perm], color="red", linewidth=1.5, label="Monotonic") +@testset "Monotonic Constraints" begin + + using Statistics + using StatsBase: sample + using EvoTrees + using EvoTrees: sigmoid, logit + + # prepare a dataset + features = rand(10_000) .* 2.5 + X = reshape(features, (size(features)[1], 1)) + Y = sin.(features) .* 0.5 .+ 0.5 + Y = logit(Y) + randn(size(Y)) .* 0.2 + Y = sigmoid(Y) + 𝑖 = collect(1:size(X, 1)) + seed = 123 + + # train-eval split + 𝑖_sample = sample(𝑖, size(𝑖, 1), replace=false) + train_size = 0.8 + 𝑖_train = 𝑖_sample[1:floor(Int, train_size * size(𝑖, 1))] + 𝑖_eval = 𝑖_sample[floor(Int, train_size * size(𝑖, 1))+1:end] + + X_train, X_eval = X[𝑖_train, :], X[𝑖_eval, :] + Y_train, Y_eval = Y[𝑖_train], Y[𝑖_eval] + + ###################################### + ### Linear - CPU + ###################################### + # benchmark + params1 = EvoTreeRegressor( + device="cpu", + loss=:linear, metric=:mse, + nrounds=200, nbins=32, + lambda=1.0, gamma=0.0, eta=0.05, + max_depth=6, min_weight=0.0, + rowsample=0.5, colsample=1.0, rng=seed) + + model = fit_evotree(params1, X_train, Y_train, X_eval=X_eval, Y_eval=Y_eval, print_every_n=25) + preds_ref = predict(model, X_train) + + # monotonic constraint + params1 = EvoTreeRegressor( + device="cpu", + loss=:linear, metric=:mse, + nrounds=200, nbins=32, + lambda=1.0, gamma=0.0, eta=0.5, + max_depth=6, min_weight=0.0, + monotone_constraints=Dict(1 => 1), + rowsample=0.5, colsample=1.0, rng=seed) + + model = fit_evotree(params1, X_train, Y_train, X_eval=X_eval, Y_eval=Y_eval, print_every_n=25) + preds_mono = predict(model, X_train) + + # using Plots + # using Colors + # x_perm = sortperm(X_train[:, 1]) + # plot(X_train, Y_train, msize=1, mcolor="gray", mswidth=0, background_color=RGB(1, 1, 1), seriestype=:scatter, xaxis=("feature"), yaxis=("target"), legend=true, label="") + # plot!(X_train[:, 1][x_perm], preds_ref[x_perm], color="navy", linewidth=1.5, label="Reference") + # plot!(X_train[:, 1][x_perm], preds_mono[x_perm], color="red", linewidth=1.5, label="Monotonic") + + + ###################################### + ### Linear - GPU + ###################################### + # benchmark + # params1 = EvoTreeRegressor( + # device="gpu", + # loss=:linear, metric=:mse, + # nrounds=200, nbins=32, + # lambda=1.0, gamma=0.0, eta=0.05, + # max_depth=6, min_weight=0.0, + # rowsample=0.5, colsample=1.0, rng=seed) + + # model = fit_evotree(params1, X_train, Y_train, X_eval=X_eval, Y_eval=Y_eval, print_every_n=25); + # preds_ref = predict(model, X_train); + + # # monotonic constraint + # params1 = EvoTreeRegressor( + # device="gpu", + # loss=:linear, metric=:mse, + # nrounds=200, nbins=32, + # lambda=1.0, gamma=0.0, eta=0.5, + # max_depth=6, min_weight=0.0, + # monotone_constraints=Dict(1 => 1), + # rowsample=0.5, colsample=1.0, rng=seed) + + # model = fit_evotree(params1, X_train, Y_train, X_eval=X_eval, Y_eval=Y_eval, print_every_n=25); + # preds_mono = predict(model, X_train); + + # using Plots + # using Colors + # x_perm = sortperm(X_train[:, 1]) + # plot(X_train, Y_train, msize=1, mcolor="gray", mswidth=0, background_color=RGB(1, 1, 1), seriestype=:scatter, xaxis=("feature"), yaxis=("target"), legend=true, label="") + # plot!(X_train[:, 1][x_perm], preds_ref[x_perm], color="navy", linewidth=1.5, label="Reference") + # plot!(X_train[:, 1][x_perm], preds_mono[x_perm], color="red", linewidth=1.5, label="Monotonic") + + + ###################################### + ### Logistic - CPU + ###################################### + # benchmark + params1 = EvoTreeRegressor( + device="cpu", + loss=:logistic, metric=:logloss, + nrounds=200, nbins=32, + lambda=0.05, gamma=0.0, eta=0.05, + max_depth=6, min_weight=0.0, + rowsample=0.5, colsample=1.0, rng=seed) + + model = fit_evotree(params1, X_train, Y_train, X_eval=X_eval, Y_eval=Y_eval, print_every_n=25) + preds_ref = predict(model, X_train) + + # monotonic constraint + params1 = EvoTreeRegressor( + device="cpu", + loss=:logistic, metric=:logloss, + nrounds=200, nbins=32, + lambda=0.05, gamma=0.0, eta=0.05, + max_depth=6, min_weight=0.0, + monotone_constraints=Dict(1 => 1), + rowsample=0.5, colsample=1.0, rng=seed) + + model = fit_evotree(params1, X_train, Y_train, X_eval=X_eval, Y_eval=Y_eval, print_every_n=25) + preds_mono = predict(model, X_train) + + # using Plots + # using Colors + # x_perm = sortperm(X_train[:, 1]) + # plot(X_train, Y_train, msize=1, mcolor="gray", mswidth=0, background_color=RGB(1, 1, 1), seriestype=:scatter, xaxis=("feature"), yaxis=("target"), legend=true, label="") + # plot!(X_train[:, 1][x_perm], preds_ref[x_perm], color="navy", linewidth=1.5, label="Reference") + # plot!(X_train[:, 1][x_perm], preds_mono[x_perm], color="red", linewidth=1.5, label="Monotonic") + + + ###################################### + ### Logistic - GPU + ###################################### + # benchmark + # params1 = EvoTreeRegressor( + # device="gpu", + # loss=:logistic, metric=:logloss, + # nrounds=200, nbins=32, + # lambda=0.05, gamma=0.0, eta=0.05, + # max_depth=6, min_weight=0.0, + # rowsample=0.5, colsample=1.0, rng=seed) + + # model = fit_evotree(params1, X_train, Y_train, X_eval=X_eval, Y_eval=Y_eval, print_every_n=25); + # preds_ref = predict(model, X_train); + + # # monotonic constraint + # params1 = EvoTreeRegressor( + # device="gpu", + # loss=:logistic, metric=:logloss, + # nrounds=200, nbins=32, + # lambda=0.05, gamma=0.0, eta=0.05, + # max_depth=6, min_weight=0.0, + # monotone_constraints=Dict(1 => 1), + # rowsample=0.5, colsample=1.0, rng=seed) + + # model = fit_evotree(params1, X_train, Y_train, X_eval=X_eval, Y_eval=Y_eval, print_every_n=25); + # preds_mono = predict(model, X_train); + + # using Plots + # using Colors + # x_perm = sortperm(X_train[:, 1]) + # plot(X_train, Y_train, msize=1, mcolor="gray", mswidth=0, background_color=RGB(1, 1, 1), seriestype=:scatter, xaxis=("feature"), yaxis=("target"), legend=true, label="") + # plot!(X_train[:, 1][x_perm], preds_ref[x_perm], color="navy", linewidth=1.5, label="Reference") + # plot!(X_train[:, 1][x_perm], preds_mono[x_perm], color="red", linewidth=1.5, label="Monotonic") + + + ###################################### + ### Gaussian - CPU + ###################################### + # linear - benchmark + params1 = EvoTreeGaussian( + device="cpu", + metric=:gaussian, + nrounds=200, nbins=32, + lambda=1.0, gamma=0.0, eta=0.05, + max_depth=6, min_weight=0.0, + rowsample=0.5, colsample=1.0, rng=seed) + + model = fit_evotree(params1, X_train, Y_train, X_eval=X_eval, Y_eval=Y_eval, print_every_n=25) + preds_ref = predict(model, X_train) + + # monotonic constraint + params1 = EvoTreeGaussian( + device="cpu", + metric=:gaussian, + nrounds=200, nbins=32, + lambda=1.0, gamma=0.0, eta=0.5, + max_depth=6, min_weight=0.0, + monotone_constraints=Dict(1 => 1), + rowsample=0.5, colsample=1.0, rng=seed) + + model = fit_evotree(params1, X_train, Y_train, X_eval=X_eval, Y_eval=Y_eval, print_every_n=25) + preds_mono = predict(model, X_train) + + # using Plots + # using Colors + # x_perm = sortperm(X_train[:, 1]) + # plot(X_train, Y_train, msize=1, mcolor="gray", mswidth=0, background_color=RGB(1, 1, 1), seriestype=:scatter, xaxis=("feature"), yaxis=("target"), legend=true, label="") + # plot!(X_train[:, 1][x_perm], preds_ref[x_perm], color="navy", linewidth=1.5, label="Reference") + # plot!(X_train[:, 1][x_perm], preds_mono[x_perm], color="red", linewidth=1.5, label="Monotonic") + + + ###################################### + ### Gaussian - GPU + ###################################### + # linear - benchmark + # params1 = EvoTreeGaussian( + # device="gpu", + # metric=:gaussian, + # nrounds=200, nbins=32, + # lambda=1.0, gamma=0.0, eta=0.05, + # max_depth=6, min_weight=0.0, + # rowsample=0.5, colsample=1.0, rng=seed) + + # model = fit_evotree(params1, X_train, Y_train, X_eval=X_eval, Y_eval=Y_eval, print_every_n=25); + # preds_ref = predict(model, X_train); + + # # monotonic constraint + # params1 = EvoTreeGaussian( + # device="gpu", + # metric=:gaussian, + # nrounds=200, nbins=32, + # lambda=1.0, gamma=0.0, eta=0.5, + # max_depth=6, min_weight=0.0, + # monotone_constraints=Dict(1 => 1), + # rowsample=0.5, colsample=1.0, rng=seed) + + # model = fit_evotree(params1, X_train, Y_train, X_eval=X_eval, Y_eval=Y_eval, print_every_n=25); + # preds_mono = predict(model, X_train); + + # using Plots + # using Colors + # x_perm = sortperm(X_train[:, 1]) + # plot(X_train, Y_train, msize=1, mcolor="gray", mswidth=0, background_color=RGB(1, 1, 1), seriestype=:scatter, xaxis=("feature"), yaxis=("target"), legend=true, label="") + # plot!(X_train[:, 1][x_perm], preds_ref[x_perm], color="navy", linewidth=1.5, label="Reference") + # plot!(X_train[:, 1][x_perm], preds_mono[x_perm], color="red", linewidth=1.5, label="Monotonic") + +end \ No newline at end of file diff --git a/test/runtests.jl b/test/runtests.jl index 1e8c073e..d9137d0e 100644 --- a/test/runtests.jl +++ b/test/runtests.jl @@ -7,6 +7,7 @@ using Test @testset "Internal API" begin include("core.jl") + include("monotonic.jl") end @testset "MLJ" begin From 937d27daebd706b7614eecb2059de1c814ff404f Mon Sep 17 00:00:00 2001 From: "jeremie.desgagne.bouchard" Date: Thu, 8 Sep 2022 11:52:28 -0400 Subject: [PATCH 2/2] monotonic --- Project.toml | 2 +- src/find_split.jl | 100 +--------------------------------------------- 2 files changed, 3 insertions(+), 99 deletions(-) diff --git a/Project.toml b/Project.toml index 612e7063..96b0ab4b 100644 --- a/Project.toml +++ b/Project.toml @@ -1,7 +1,7 @@ name = "EvoTrees" uuid = "f6006082-12f8-11e9-0c9c-0d5d367ab1e5" authors = ["jeremiedb "] -version = "0.10.0" +version = "0.10.1" [deps] BSON = "fbb218c0-5317-5bc6-957e-2ee96dd4b1f0" diff --git a/src/find_split.jl b/src/find_split.jl index db3f22fe..1a7cb8f8 100644 --- a/src/find_split.jl +++ b/src/find_split.jl @@ -26,25 +26,6 @@ function binarize(X, edges) return X_bin end -""" - Non Allocating split_set! - Take a view into left and right placeholders. Right ids are assigned at the end of the length of the current node set. -""" -# function split_set!(left::V, right::V, 𝑖, X_bin::Matrix{S}, feat, cond_bin::S, offset) where {S,V} -# left_count = 0 -# right_count = 0 -# @inbounds for i in 1:length(𝑖) -# @inbounds if X_bin[𝑖[i], feat] <= cond_bin -# left_count += 1 -# left[offset + left_count] = 𝑖[i] -# else -# right[offset + length(𝑖) - right_count] = 𝑖[i] -# right_count += 1 -# end -# end -# return (view(left, (offset + 1):(offset + left_count)), view(right, (offset + length(𝑖)):-1:(offset + left_count + 1))) -# end - """ Multi-threaded split_set! Take a view into left and right placeholders. Right ids are assigned at the end of the length of the current node set. @@ -178,7 +159,7 @@ function update_hist!( @threads for j in 𝑗 @inbounds for i in 𝑖 hid = (2 * K + 1) * (X_bin[i, j] - 1) - for k = 1:(2*K+1) + for k in 1:(2*K+1) hist[j][hid+k] += δ𝑤[k, i] end end @@ -187,83 +168,6 @@ function update_hist!( end -# """ -# update_gains! -# GradientRegression -# """ -# function update_gains!( -# loss::L, -# node::TrainNode{T}, -# 𝑗::Vector{S}, -# params::EvoTypes, K, monotone_constraints) where {L<:GradientRegression,T,S} - -# @threads for j in 𝑗 -# node.hL[j][1] = node.h[j][1] -# node.hL[j][2] = node.h[j][2] -# node.hL[j][3] = node.h[j][3] - -# node.hR[j][1] = node.∑[1] - node.h[j][1] -# node.hR[j][2] = node.∑[2] - node.h[j][2] -# node.hR[j][3] = node.∑[3] - node.h[j][3] -# @inbounds @simd for bin = 2:params.nbins -# binid = 3 * bin - 2 -# node.hL[j][binid] = node.hL[j][binid-3] + node.h[j][binid] -# node.hL[j][binid+1] = node.hL[j][binid-2] + node.h[j][binid+1] -# node.hL[j][binid+2] = node.hL[j][binid-1] + node.h[j][binid+2] - -# node.hR[j][binid] = node.hR[j][binid-3] - node.h[j][binid] -# node.hR[j][binid+1] = node.hR[j][binid-2] - node.h[j][binid+1] -# node.hR[j][binid+2] = node.hR[j][binid-1] - node.h[j][binid+2] - -# end -# hist_gains_cpu!(loss, view(node.gains, :, j), node.hL[j], node.hR[j], params, K, monotone_constraints[j]) -# end -# return nothing -# end - -# """ -# update_gains! -# GaussianRegression -# """ -# function update_gains!( -# loss::L, -# node::TrainNode{T}, -# 𝑗::Vector{S}, -# params::EvoTypes, K, monotone_constraints) where {L<:GaussianRegression,T,S} - -# @threads for j in 𝑗 -# node.hL[j][1] = node.h[j][1] -# node.hL[j][2] = node.h[j][2] -# node.hL[j][3] = node.h[j][3] -# node.hL[j][4] = node.h[j][4] -# node.hL[j][5] = node.h[j][5] - -# node.hR[j][1] = node.∑[1] - node.h[j][1] -# node.hR[j][2] = node.∑[2] - node.h[j][2] -# node.hR[j][3] = node.∑[3] - node.h[j][3] -# node.hR[j][4] = node.∑[4] - node.h[j][4] -# node.hR[j][5] = node.∑[5] - node.h[j][5] -# @inbounds @simd for bin in 2:params.nbins -# binid = 5 * bin - 4 -# node.hL[j][binid] = node.hL[j][binid-5] + node.h[j][binid] -# node.hL[j][binid+1] = node.hL[j][binid-4] + node.h[j][binid+1] -# node.hL[j][binid+2] = node.hL[j][binid-3] + node.h[j][binid+2] -# node.hL[j][binid+3] = node.hL[j][binid-2] + node.h[j][binid+3] -# node.hL[j][binid+4] = node.hL[j][binid-1] + node.h[j][binid+4] - -# node.hR[j][binid] = node.hR[j][binid-5] - node.h[j][binid] -# node.hR[j][binid+1] = node.hR[j][binid-4] - node.h[j][binid+1] -# node.hR[j][binid+2] = node.hR[j][binid-3] - node.h[j][binid+2] -# node.hR[j][binid+3] = node.hR[j][binid-2] - node.h[j][binid+3] -# node.hR[j][binid+4] = node.hR[j][binid-1] - node.h[j][binid+4] - -# end -# hist_gains_cpu!(loss, view(node.gains, :, j), node.hL[j], node.hR[j], params, K, monotone_constraints[j]) -# end -# return nothing -# end - - """ update_gains!( loss::L, @@ -288,7 +192,7 @@ function update_gains!( end @inbounds for bin in 2:params.nbins - @inbounds @simd for k = 1:KK + @inbounds for k = 1:KK binid = KK * (bin - 1) node.hL[j][binid+k] = node.hL[j][binid-KK+k] + node.h[j][binid+k] node.hR[j][binid+k] = node.hR[j][binid-KK+k] - node.h[j][binid+k]