~ajf/root/LossFunction_8cxx_source.html

 // @(#)root/tmva $Id$

 // Author: Andreas Hoecker, Peter Speckmayer, Joerg Stelzer, Helge Voss, Jan Therhaag


 /**********************************************************************************

  * Project: TMVA - a Root-integrated toolkit for multivariate data analysis       *

  * Package: TMVA                                                                  *

  * Class  : LossFunction                                                          *

  * Web    : http://tmva.sourceforge.net                                           *

  *                                                                                *

  * Description:                                                                   *

  *      Implementation (see header for description)                               *

  *                                                                                *

  * Authors (alphabetical):                                                        *

  *      Andreas Hoecker <Andreas.Hocker@cern.ch> - CERN, Switzerland              *

  *      Peter Speckmayer <Peter.Speckmayer@cern.ch> - CERN, Switzerland           *

  *      Joerg Stelzer   <Joerg.Stelzer@cern.ch>  - CERN, Switzerland              *

  *      Jan Therhaag       <Jan.Therhaag@cern.ch>     - U of Bonn, Germany        *

  *      Helge Voss      <Helge.Voss@cern.ch>     - MPI-K Heidelberg, Germany      *

  *                                                                                *

  * Copyright (c) 2005-2011:                                                       *

  *      CERN, Switzerland                                                         *

  *      U. of Victoria, Canada                                                    *

  *      MPI-K Heidelberg, Germany                                                 *

  *      U. of Bonn, Germany                                                       *

  *                                                                                *

  * Redistribution and use in source and binary forms, with or without             *

  * modification, are permitted according to the terms listed in LICENSE           *

  * (http://mva.sourceforge.net/license.txt)                                       *

  **********************************************************************************/


 /*! \class TMVA::HuberLossFunction

 \ingroup TMVA


 Huber Loss Function.


 */


 #include "TMVA/LossFunction.h"

 #include "TMVA/Config.h"


 #include "TMVA/MsgLogger.h"


 #include "Rtypes.h"

 #include "TMath.h"

 #include <iostream>


 // multithreading only if the compilation flag is turned on

 #ifdef R__USE_IMT

 #include <ROOT/TThreadExecutor.hxx>

 #include "ROOT/TSeq.hxx"

 #endif


 ////////////////////////////////////////////////////////////////////////////////

 /// huber constructor


 TMVA::HuberLossFunction::HuberLossFunction(){

     fTransitionPoint = -9999;

     fSumOfWeights = -9999;

     fQuantile = 0.7;      // the quantile value determines the bulk of the data, e.g. 0.7 defines

                           // the core as the first 70% and the tails as the last 30%

 }


 TMVA::HuberLossFunction::HuberLossFunction(Double_t quantile){

     fSumOfWeights = -9999;

     fTransitionPoint = -9999;

     fQuantile = quantile;

 }


 ////////////////////////////////////////////////////////////////////////////////

 /// huber destructor


 TMVA::HuberLossFunction::~HuberLossFunction(){


 }


 ////////////////////////////////////////////////////////////////////////////////

 /// figure out the residual that determines the separation between the

 /// "core" and the "tails" of the residuals distribution


 void TMVA::HuberLossFunction::Init(std::vector<LossFunctionEventInfo>& evs){


    // Calculate the residual that separates the core and the tails

    SetSumOfWeights(evs);

    SetTransitionPoint(evs);

 }


 ////////////////////////////////////////////////////////////////////////////////

 /// huber, calculate the sum of weights for the events in the vector


 // Multithreaded version of HuberLossFunction::CalculateSumOfWeights

 #ifdef R__USE_IMT

 Double_t TMVA::HuberLossFunction::CalculateSumOfWeights(const std::vector<LossFunctionEventInfo>& evs){

    // need a lambda function to pass to TThreadExecutor::MapReduce

    auto mapFunc = [&evs](UInt_t i) { return evs[i].weight; };

    auto redFunc = [](const std::vector<Double_t> &a) { return std::accumulate(a.begin(), a.end(), 0.0); };


    return TMVA::Config::Instance().GetThreadExecutor().MapReduce(

       mapFunc, ROOT::TSeqU(evs.size()), redFunc, TMVA::Config::Instance().GetThreadExecutor().GetPoolSize());

 }


 // Standard version of HuberLossFunction::CalculateSumOfWeights

 #else

 Double_t TMVA::HuberLossFunction::CalculateSumOfWeights(const std::vector<LossFunctionEventInfo>& evs){


    // Calculate the sum of the weights

    Double_t sumOfWeights = 0;

    for(UInt_t i = 0; i<evs.size(); i++)

       sumOfWeights+=evs[i].weight;


    return sumOfWeights;

 }

 #endif


 ////////////////////////////////////////////////////////////////////////////////

 /// huber, determine the quantile for a given input


 Double_t TMVA::HuberLossFunction::CalculateQuantile(std::vector<LossFunctionEventInfo>& evs, Double_t whichQuantile, Double_t sumOfWeights, bool abs){


    // use a lambda function to tell the vector how to sort the LossFunctionEventInfo data structures

    // (sort them in ascending order of residual magnitude) if abs is true

    // otherwise sort them in ascending order of residual

    if(abs)

       std::sort(evs.begin(), evs.end(), [](LossFunctionEventInfo a, LossFunctionEventInfo b){

                                            return TMath::Abs(a.trueValue-a.predictedValue) < TMath::Abs(b.trueValue-b.predictedValue); });

    else

       std::sort(evs.begin(), evs.end(), [](LossFunctionEventInfo a, LossFunctionEventInfo b){

                                            return (a.trueValue-a.predictedValue) < (b.trueValue-b.predictedValue); });

    UInt_t i = 0;

    Double_t temp = 0.0;

    while(i<evs.size()-1 && temp <= sumOfWeights*whichQuantile){

       temp += evs[i].weight;

       i++;

    }

    // edge cases

    // Output warning for low return values

    if(whichQuantile == 0) i=0;             // assume 0th quantile to mean the 0th entry in the ordered series


    // usual returns

    if(abs) return TMath::Abs(evs[i].trueValue-evs[i].predictedValue);

    else return evs[i].trueValue-evs[i].predictedValue;

 }


 ////////////////////////////////////////////////////////////////////////////////

 /// huber, determine the transition point using the values for fQuantile and fSumOfWeights

 /// which presumably have already been set


 void TMVA::HuberLossFunction::SetTransitionPoint(std::vector<LossFunctionEventInfo>& evs){

    fTransitionPoint = CalculateQuantile(evs, fQuantile, fSumOfWeights, true);


    // if the transition point corresponding to the quantile is 0 then the loss function will not function

    // the quantile was chosen too low. Let's use the first nonzero residual as the transition point instead.

    if(fTransitionPoint == 0){

       // evs should already be sorted according to the magnitude of the residuals, since CalculateQuantile does this

       for(UInt_t i=0; i<evs.size(); i++){

          Double_t residual = TMath::Abs(evs[i].trueValue - evs[i].predictedValue);

          if(residual != 0){

             fTransitionPoint = residual;

             break;

          }

       }

    }


    // Let the user know that the transition point is zero and the loss function won't work properly

    if(fTransitionPoint == 0){

       //std::cout << "The residual transition point for the Huber loss function corresponding to quantile, " << fQuantile << ", is zero."

       //<< " This implies that all of the residuals are zero and the events have been predicted perfectly. Perhaps the regression is too complex"

       //<< " for the amount of data." << std::endl;

    }

 }


 ////////////////////////////////////////////////////////////////////////////////

 /// huber, set the sum of weights given a collection of events


 void TMVA::HuberLossFunction::SetSumOfWeights(std::vector<LossFunctionEventInfo>& evs){

    fSumOfWeights = CalculateSumOfWeights(evs);

 }


 ////////////////////////////////////////////////////////////////////////////////

 /// huber,  determine the loss for a single event


 Double_t TMVA::HuberLossFunction::CalculateLoss(LossFunctionEventInfo& e){

    // If the huber loss function is uninitialized then assume a group of one

    // and initialize the transition point and weights for this single event

    if(fSumOfWeights == -9999){

       std::vector<LossFunctionEventInfo> evs{e};

       SetSumOfWeights(evs);

       SetTransitionPoint(evs);

    }


    Double_t residual = TMath::Abs(e.trueValue - e.predictedValue);

    Double_t loss = 0;

    // Quadratic loss in terms of the residual for small residuals

    if(residual <= fTransitionPoint) loss = 0.5*residual*residual;

    // Linear loss for large residuals, so that the tails don't dominate the net loss calculation

    else loss = fQuantile*residual - 0.5*fQuantile*fQuantile;

    return e.weight*loss;

 }


 ////////////////////////////////////////////////////////////////////////////////

 /// huber, determine the net loss for a collection of events


 Double_t TMVA::HuberLossFunction::CalculateNetLoss(std::vector<LossFunctionEventInfo>& evs){

    // Initialize the Huber Loss Function so that we can calculate the loss.

    // The loss for each event depends on the other events in the group

    // that define the cutoff quantile (fTransitionPoint).

    SetSumOfWeights(evs);

    SetTransitionPoint(evs);


    Double_t netloss = 0;

    for(UInt_t i=0; i<evs.size(); i++)

        netloss+=CalculateLoss(evs[i]);

    return netloss;

    // should get a function to return the average loss as well

    // return netloss/fSumOfWeights

 }


 ////////////////////////////////////////////////////////////////////////////////

 /// huber, determine the mean loss for a collection of events


 Double_t TMVA::HuberLossFunction::CalculateMeanLoss(std::vector<LossFunctionEventInfo>& evs){

    // Initialize the Huber Loss Function so that we can calculate the loss.

    // The loss for each event depends on the other events in the group

    // that define the cutoff quantile (fTransitionPoint).

    SetSumOfWeights(evs);

    SetTransitionPoint(evs);


    Double_t netloss = 0;

    for(UInt_t i=0; i<evs.size(); i++)

        netloss+=CalculateLoss(evs[i]);

    return netloss/fSumOfWeights;

 }


 /*! \class TMVA::HuberLossFunctionBDT

 \ingroup TMVA


 Huber BDT Loss Function.


 */


 TMVA::HuberLossFunctionBDT::HuberLossFunctionBDT(){

 }


 ////////////////////////////////////////////////////////////////////////////////

 /// huber BDT, initialize the targets and prepare for the regression


 void TMVA::HuberLossFunctionBDT::Init(std::map<const TMVA::Event*, LossFunctionEventInfo>& evinfomap, std::vector<double>& boostWeights){

 // Run this once before building the forest. Set initial prediction to weightedMedian.


    std::vector<LossFunctionEventInfo> evinfovec(evinfomap.size());

    for (auto &e: evinfomap){

       evinfovec.push_back(LossFunctionEventInfo(e.second.trueValue, e.second.predictedValue, e.first->GetWeight()));

    }


    // Calculates fSumOfWeights and fTransitionPoint with the current residuals

    SetSumOfWeights(evinfovec);

    Double_t weightedMedian = CalculateQuantile(evinfovec, 0.5, fSumOfWeights, false);


    //Store the weighted median as a first boosweight for later use

    boostWeights.push_back(weightedMedian);

    for (auto &e: evinfomap ) {

       // set the initial prediction for all events to the median

       e.second.predictedValue += weightedMedian;

    }

 }


 ////////////////////////////////////////////////////////////////////////////////

 /// huber BDT, set the targets for a collection of events


 // Multithreaded version of HuberLossFunctionBDT::SetTargets

 #ifdef R__USE_IMT

 void TMVA::HuberLossFunctionBDT::SetTargets(std::vector<const TMVA::Event*>& evs, std::map< const TMVA::Event*, LossFunctionEventInfo >& evinfomap){


    std::vector<LossFunctionEventInfo> eventvec(evs.size());


    // first we need to copy the events from evs into eventvec since we require a vector of LossFunctionEventInfo

    // for SetSumOfWeights and SetTransitionPoint. We use TThreadExecutor to implement the copy in parallel

    // need a lambda function to pass to TThreadExecutor::Map

    auto fcopy = [&eventvec, &evs, &evinfomap](UInt_t i) {

       eventvec[i] = LossFunctionEventInfo(evinfomap[evs[i]].trueValue, evinfomap[evs[i]].predictedValue, evs[i]->GetWeight());

    };


    TMVA::Config::Instance().GetThreadExecutor().Foreach(fcopy, ROOT::TSeqU(evs.size()), TMVA::Config::Instance().GetThreadExecutor().GetPoolSize());


    // Recalculate the residual that separates the "core" of the data and the "tails"

    // This residual is the quantile given by fQuantile, defaulted to 0.7

    // the quantile corresponding to 0.5 would be the usual median

    SetSumOfWeights(eventvec); // This was already set in init, but may change if there is subsampling for each tree

    SetTransitionPoint(eventvec);


    // ok now set the targets in parallel

    // need a lambda function to pass to TThreadExecutor::Map

    auto f = [this, &evinfomap](const TMVA::Event* ev) {

       const_cast<TMVA::Event*>(ev)->SetTarget(0, Target(evinfomap[ev]));

    };


    TMVA::Config::Instance().GetThreadExecutor().Foreach(f, evs, TMVA::Config::Instance().GetThreadExecutor().GetPoolSize());

 }


 // Standard version of HuberLossFunctionBDT::SetTargets

 #else

 void TMVA::HuberLossFunctionBDT::SetTargets(std::vector<const TMVA::Event*>& evs, std::map< const TMVA::Event*, LossFunctionEventInfo >& evinfomap){


    std::vector<LossFunctionEventInfo> eventvec(evs.size());

    for (std::vector<const TMVA::Event*>::const_iterator e=evs.begin(); e!=evs.end();e++){

       eventvec.push_back(LossFunctionEventInfo(evinfomap[*e].trueValue, evinfomap[*e].predictedValue, (*e)->GetWeight()));

    }


    // Recalculate the residual that separates the "core" of the data and the "tails"

    // This residual is the quantile given by fQuantile, defaulted to 0.7

    // the quantile corresponding to 0.5 would be the usual median

    SetSumOfWeights(eventvec); // This was already set in init, but may change if there is subsampling for each tree

    SetTransitionPoint(eventvec);


    for (std::vector<const TMVA::Event*>::const_iterator e=evs.begin(); e!=evs.end();e++) {

          const_cast<TMVA::Event*>(*e)->SetTarget(0,Target(evinfomap[*e]));

    }

 }

 #endif


 ////////////////////////////////////////////////////////////////////////////////

 /// huber BDT, set the target for a single event


 Double_t TMVA::HuberLossFunctionBDT::Target(LossFunctionEventInfo& e){

     Double_t residual = e.trueValue - e.predictedValue;

     // The weight/target relationships are taken care of in the tmva decision tree operations so we don't need to worry about that here

     if(TMath::Abs(residual) <= fTransitionPoint) return residual;

     else return fTransitionPoint*(residual<0?-1.0:1.0);

 }


 ////////////////////////////////////////////////////////////////////////////////

 /// huber BDT, determine the fit value for the terminal node based upon the

 /// events in the terminal node


 Double_t TMVA::HuberLossFunctionBDT::Fit(std::vector<LossFunctionEventInfo>& evs){

 // The fit in the terminal node for huber is basically the median of the residuals.

 // Then you add the average difference from the median to that.

 // The tails are discounted. If a residual is in the tails then we just use the

 // cutoff residual that sets the "core" and the "tails" instead of the large residual.

 // So we get something between least squares (mean as fit) and absolute deviation (median as fit).

    Double_t sumOfWeights = CalculateSumOfWeights(evs);

    Double_t shift=0,diff= 0;

    Double_t residualMedian = CalculateQuantile(evs,0.5,sumOfWeights, false);

    for(UInt_t j=0;j<evs.size();j++){

       Double_t residual = evs[j].trueValue - evs[j].predictedValue;

       diff = residual-residualMedian;

       // if we are using weights then I'm not sure why this isn't weighted

       shift+=1.0/evs.size()*((diff<0)?-1.0:1.0)*TMath::Min(fTransitionPoint,fabs(diff));

       // I think this should be

       // shift+=evs[j].weight/sumOfWeights*((diff<0)?-1.0:1.0)*TMath::Min(fTransitionPoint,fabs(diff));

       // not sure why it was originally coded like this

    }

    return (residualMedian + shift);


 }


 /*! \class TMVA::LeastSquaresLossFunction

 \ingroup TMVA


 Least Squares Loss Function.


 */


 // Constructor and destructor are in header file. They don't do anything.


 ////////////////////////////////////////////////////////////////////////////////

 /// least squares ,  determine the loss for a single event


 Double_t TMVA::LeastSquaresLossFunction::CalculateLoss(LossFunctionEventInfo& e){

    Double_t residual = (e.trueValue - e.predictedValue);

    Double_t loss = 0;

    loss = residual*residual;

    return e.weight*loss;

 }


 ////////////////////////////////////////////////////////////////////////////////

 /// least squares , determine the net loss for a collection of events


 Double_t TMVA::LeastSquaresLossFunction::CalculateNetLoss(std::vector<LossFunctionEventInfo>& evs){

    Double_t netloss = 0;

    for(UInt_t i=0; i<evs.size(); i++)

        netloss+=CalculateLoss(evs[i]);

    return netloss;

    // should get a function to return the average loss as well

    // return netloss/fSumOfWeights

 }


 ////////////////////////////////////////////////////////////////////////////////

 /// least squares , determine the mean loss for a collection of events


 Double_t TMVA::LeastSquaresLossFunction::CalculateMeanLoss(std::vector<LossFunctionEventInfo>& evs){

    Double_t netloss = 0;

    Double_t sumOfWeights = 0;

    for(UInt_t i=0; i<evs.size(); i++){

        sumOfWeights+=evs[i].weight;

        netloss+=CalculateLoss(evs[i]);

    }

    // return the weighted mean

    return netloss/sumOfWeights;

 }


 /*! \class TMVA::LeastSquaresLossFunctionBDT

 \ingroup TMVA


 Least Squares BDT Loss Function.


 */


 // Constructor and destructor defined in header. They don't do anything.


 ////////////////////////////////////////////////////////////////////////////////

 /// least squares BDT, initialize the targets and prepare for the regression


 void TMVA::LeastSquaresLossFunctionBDT::Init(std::map<const TMVA::Event*, LossFunctionEventInfo>& evinfomap, std::vector<double>& boostWeights){

 // Run this once before building the forest. Set initial prediction to the weightedMean


    std::vector<LossFunctionEventInfo> evinfovec(evinfomap.size());

    for (auto &e: evinfomap){

       evinfovec.push_back(LossFunctionEventInfo(e.second.trueValue, e.second.predictedValue, e.first->GetWeight()));

    }


    // Initial prediction for least squares is the weighted mean

    Double_t weightedMean = Fit(evinfovec);


    //Store the weighted median as a first boosweight for later use

    boostWeights.push_back(weightedMean);

    for (auto &e: evinfomap ) {

       // set the initial prediction for all events to the median

       e.second.predictedValue += weightedMean;

    }

 }


 ////////////////////////////////////////////////////////////////////////////////

 /// least squares BDT, set the targets for a collection of events


 // Multithreaded version of LeastSquaresLossFunctionBDT::SetTargets

 #ifdef R__USE_IMT

 void TMVA::LeastSquaresLossFunctionBDT::SetTargets(std::vector<const TMVA::Event*>& evs, std::map< const TMVA::Event*, LossFunctionEventInfo >& evinfomap) {


    // need a lambda function to pass to TThreadExecutor::Map

    auto f = [this, &evinfomap](const TMVA::Event* ev) {

       const_cast<TMVA::Event*>(ev)->SetTarget(0, Target(evinfomap[ev]));

    };


    TMVA::Config::Instance().GetThreadExecutor().Foreach(f, evs, TMVA::Config::Instance().GetThreadExecutor().GetPoolSize());

 }

 // Standard version of LeastSquaresLossFunctionBDT::SetTargets

 #else

 void TMVA::LeastSquaresLossFunctionBDT::SetTargets(std::vector<const TMVA::Event*>& evs, std::map< const TMVA::Event*, LossFunctionEventInfo >& evinfomap){


    for (std::vector<const TMVA::Event*>::const_iterator e=evs.begin(); e!=evs.end();e++) {

          const_cast<TMVA::Event*>(*e)->SetTarget(0,Target(evinfomap[*e]));

    }

 }

 #endif


 ////////////////////////////////////////////////////////////////////////////////

 /// least squares BDT, set the target for a single event


 Double_t TMVA::LeastSquaresLossFunctionBDT::Target(LossFunctionEventInfo& e){

     Double_t residual = e.trueValue - e.predictedValue;

     // The weight/target relationships are taken care of in the tmva decision tree operations. We don't need to worry about that here

     // and we return the residual instead of the weight*residual.

     return residual;

 }


 ////////////////////////////////////////////////////////////////////////////////

 /// huber BDT, determine the fit value for the terminal node based upon the

 /// events in the terminal node


 Double_t TMVA::LeastSquaresLossFunctionBDT::Fit(std::vector<LossFunctionEventInfo>& evs){

 // The fit in the terminal node for least squares is the weighted average of the residuals.

    Double_t sumOfWeights = 0;

    Double_t weightedResidualSum = 0;

    for(UInt_t j=0;j<evs.size();j++){

       sumOfWeights += evs[j].weight;

       Double_t residual = evs[j].trueValue - evs[j].predictedValue;

       weightedResidualSum += evs[j].weight*residual;

    }

    Double_t weightedMean = weightedResidualSum/sumOfWeights;


    // return the weighted mean

    return weightedMean;

 }


 /*! \class TMVA::AbsoluteDeviationLossFunction

 \ingroup TMVA


 Absolute Deviation Loss Function.


 */


 // Constructors in the header. They don't do anything.


 ////////////////////////////////////////////////////////////////////////////////

 /// absolute deviation,  determine the loss for a single event


 Double_t TMVA::AbsoluteDeviationLossFunction::CalculateLoss(LossFunctionEventInfo& e){

    Double_t residual = e.trueValue - e.predictedValue;

    return e.weight*TMath::Abs(residual);

 }


 ////////////////////////////////////////////////////////////////////////////////

 /// absolute deviation, determine the net loss for a collection of events


 Double_t TMVA::AbsoluteDeviationLossFunction::CalculateNetLoss(std::vector<LossFunctionEventInfo>& evs){


    Double_t netloss = 0;

    for(UInt_t i=0; i<evs.size(); i++)

        netloss+=CalculateLoss(evs[i]);

    return netloss;

 }


 ////////////////////////////////////////////////////////////////////////////////

 /// absolute deviation, determine the mean loss for a collection of events


 Double_t TMVA::AbsoluteDeviationLossFunction::CalculateMeanLoss(std::vector<LossFunctionEventInfo>& evs){

    Double_t sumOfWeights = 0;

    Double_t netloss = 0;

    for(UInt_t i=0; i<evs.size(); i++){

        sumOfWeights+=evs[i].weight;

        netloss+=CalculateLoss(evs[i]);

    }

    return netloss/sumOfWeights;

 }


 /*! \class TMVA::AbsoluteDeviationLossFunctionBDT

 \ingroup TMVA


 Absolute Deviation BDT Loss Function.


 */


 ////////////////////////////////////////////////////////////////////////////////

 /// absolute deviation BDT, initialize the targets and prepare for the regression


 void TMVA::AbsoluteDeviationLossFunctionBDT::Init(std::map<const TMVA::Event*, LossFunctionEventInfo>& evinfomap, std::vector<double>& boostWeights){

 // Run this once before building the forest. Set initial prediction to weightedMedian.


    std::vector<LossFunctionEventInfo> evinfovec(evinfomap.size());

    for (auto &e: evinfomap){

       evinfovec.push_back(LossFunctionEventInfo(e.second.trueValue, e.second.predictedValue, e.first->GetWeight()));

    }


    Double_t weightedMedian = Fit(evinfovec);


    //Store the weighted median as a first boostweight for later use

    boostWeights.push_back(weightedMedian);

    for (auto &e: evinfomap ) {

       // set the initial prediction for all events to the median

       e.second.predictedValue += weightedMedian;

    }

 }


 ////////////////////////////////////////////////////////////////////////////////

 /// absolute deviation BDT, set the targets for a collection of events


 // Multithreaded version of AbsoluteDeviationLossFunctionBDT::SetTargets

 #ifdef R__USE_IMT

 void TMVA::AbsoluteDeviationLossFunctionBDT::SetTargets(std::vector<const TMVA::Event*>& evs, std::map< const TMVA::Event*, LossFunctionEventInfo >& evinfomap){

    // need a lambda function to pass to TThreadExecutor::Map

    auto f = [this, &evinfomap](const TMVA::Event* ev) {

          const_cast<TMVA::Event*>(ev)->SetTarget(0, Target(evinfomap[ev]));

    };


    TMVA::Config::Instance().GetThreadExecutor().Foreach(f, evs, TMVA::Config::Instance().GetThreadExecutor().GetPoolSize());

 }

 // Standard version of AbsoluteDeviationLossFunctionBDT::SetTargets

 #else

 void TMVA::AbsoluteDeviationLossFunctionBDT::SetTargets(std::vector<const TMVA::Event*>& evs, std::map< const TMVA::Event*, LossFunctionEventInfo >& evinfomap){


    for (std::vector<const TMVA::Event*>::const_iterator e=evs.begin(); e!=evs.end();e++) {

          const_cast<TMVA::Event*>(*e)->SetTarget(0,Target(evinfomap[*e]));

    }

 }

 #endif


 ////////////////////////////////////////////////////////////////////////////////

 /// absolute deviation BDT, set the target for a single event


 Double_t TMVA::AbsoluteDeviationLossFunctionBDT::Target(LossFunctionEventInfo& e){

 // The target is the sign of the residual.

     Double_t residual = e.trueValue - e.predictedValue;

     // The weight/target relationships are taken care of in the tmva decision tree operations so we don't need to worry about that here

     return (residual<0?-1.0:1.0);

 }


 ////////////////////////////////////////////////////////////////////////////////

 /// absolute deviation BDT, determine the fit value for the terminal node based upon the

 /// events in the terminal node


 Double_t TMVA::AbsoluteDeviationLossFunctionBDT::Fit(std::vector<LossFunctionEventInfo>& evs){

 // For Absolute Deviation, the fit in each terminal node is the weighted residual median.


    // use a lambda function to tell the vector how to sort the LossFunctionEventInfo data structures

    // sort in ascending order of residual value

    std::sort(evs.begin(), evs.end(), [](LossFunctionEventInfo a, LossFunctionEventInfo b){

                                         return (a.trueValue-a.predictedValue) < (b.trueValue-b.predictedValue); });


    // calculate the sum of weights, used in the weighted median calculation

    Double_t sumOfWeights = 0;

    for(UInt_t j=0; j<evs.size(); j++)

       sumOfWeights+=evs[j].weight;


    // get the index of the weighted median

    UInt_t i = 0;

    Double_t temp = 0.0;

    while(i<evs.size() && temp <= sumOfWeights*0.5){

       temp += evs[i].weight;

       i++;

    }

    if (i >= evs.size()) return 0.; // prevent uncontrolled memory access in return value calculation


    // return the median residual

    return evs[i].trueValue-evs[i].predictedValue;

 }

Rtypes.h

Config.h

LossFunction.h

TSeq.hxx

MsgLogger.h

TThreadExecutor.hxx

TMath.h