/*!
 *
 * \brief      Leave-one-out error
 *
 * \author     T.Glasmachers
 * \date       2011
 *
 * \par Copyright 1995-2017 Shark Development Team
 *
 * This file is part of Shark.
 * <http://shark-ml.org/>
 *
 * Shark is free software: you can redistribute it and/or modify
 * it under the terms of the GNU Lesser General Public License as published
 * by the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * Shark is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public License
 * along with Shark. If not, see <http://www.gnu.org/licenses/>.
 *
 */
#ifndef SHARK_OBJECTIVEFUNCTIONS_LOOERROR_H
#define SHARK_OBJECTIVEFUNCTIONS_LOOERROR_H

#include <shark/ObjectiveFunctions/AbstractObjectiveFunction.h>
#include <shark/Models/AbstractModel.h>
#include <shark/ObjectiveFunctions/Loss/AbstractLoss.h>
#include <shark/Algorithms/Trainers/AbstractTrainer.h>
#include <shark/Data/DataView.h>
#include <boost/range/algorithm_ext/iota.hpp>

namespace shark {

///
/// \brief Leave-one-out error objective function.
///
/// \par
/// The leave-one-out measure is the average prediction performance of
/// a learning machine on a dataset, where each sample is predicted by
/// a machine trained on all but the sample to be predicted. This is an
/// extreme form of cross-validation, with a fold size of one.
///
/// \par
/// In general the leave-one-out error is costly to compute, since it
/// requires training of a large number of learning machines. However,
/// certain machines allow for a more efficient implementation. Refer
/// to LooErrorCSvm for an example.
///
template<class ModelTypeT, class LabelType = typename ModelTypeT::OutputType>
class LooError : public AbstractObjectiveFunction< RealVector, double >
{
public:
    typedef ModelTypeT ModelType;
    typedef typename ModelType::InputType InputType;
    typedef typename ModelType::OutputType OutputType;
    typedef LabeledData<InputType, LabelType> DatasetType;
    typedef AbstractTrainer<ModelType, LabelType> TrainerType;
    typedef AbstractLoss<LabelType, OutputType> LossType;

    ///
    /// \brief Constructor.
    ///
    /// \param dataset Full data set for leave-one-out.
    /// \param model Model built on subsets of the data.
    /// \param trainer Trainer for learning on each subset.
    /// \param loss Loss function for judging the validation output.
    /// \param meta Meta object with parameters that influence the process, typically a trainer.
    LooError(
        DatasetType const& dataset,
        ModelType* model,
        TrainerType* trainer,
        LossType* loss,
        IParameterizable<>* meta = NULL)
    : m_dataset(dataset)
    , mep_meta(meta)
    , mep_model(model)
    , mep_trainer(trainer)
    , mep_loss(loss)
    {
        m_features |= HAS_VALUE;
    }

    /// \brief From INameable: return the class name.
    std::string name() const {
        return "LooError<"
            + mep_model->name() + ","
            + mep_trainer->name() + ","
            + mep_loss->name() + ">";
    }

    std::size_t numberOfVariables() const {
        return mep_meta->numberOfParameters();
    }

    /// Evaluate the leave-one-out error:
    /// train sub-models, evaluate the objective,
    /// return the average.
    double eval() const {
        this->m_evaluationCounter++;
        std::size_t ell = m_dataset.size();
        double sum = 0.0;
        // indices of the current training subset; initially {1, ..., ell-1},
        // so that sample 0 is the first one to be held out
        std::vector<std::size_t> indices(ell - 1);
        boost::iota(indices, 1);
        for (std::size_t i = 0; i < ell; i++) {
            // train on all samples except i
            DatasetType train = toDataset(subset(m_dataset, indices));
            mep_trainer->train(*mep_model, train);
            // predict the held-out sample and accumulate its loss
            OutputType validation = (*mep_model)(m_dataset[i].input);
            sum += mep_loss->eval(m_dataset[i].label, validation);
            // re-admit sample i so that the next round holds out sample i+1
            if (i < ell - 1) indices[i] = i;
        }
        return sum / ell;
    }

    /// Evaluate the leave-one-out error for the given
    /// parameters passed to the meta object (typically
    /// these parameters need to be optimized in a model
    /// selection procedure).
    double eval(const RealVector& parameters) const {
        SHARK_ASSERT(mep_meta != NULL);
        mep_meta->setParameterVector(parameters);
        return eval();
    }

protected:
    DataView<DatasetType const> m_dataset;
    IParameterizable<>* mep_meta;
    ModelType* mep_model;
    TrainerType* mep_trainer;
    LossType* mep_loss;
};

}
#endif
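/*
 * A minimal usage sketch of LooError, assuming Shark's LinearModel,
 * LinearRegression trainer, and SquaredLoss; the particular combination
 * below is an illustration of the intended call pattern, not a usage
 * prescribed by this header:
 *
 *   #include <shark/ObjectiveFunctions/LooError.h>
 *   #include <shark/Models/LinearModel.h>
 *   #include <shark/Algorithms/Trainers/LinearRegression.h>
 *   #include <shark/ObjectiveFunctions/Loss/SquaredLoss.h>
 *   #include <iostream>
 *   #include <vector>
 *
 *   using namespace shark;
 *
 *   int main() {
 *       // toy regression data: five one-dimensional points on the line y = 2x
 *       std::vector<RealVector> x(5, RealVector(1)), y(5, RealVector(1));
 *       for (std::size_t i = 0; i != 5; i++) {
 *           x[i](0) = double(i);
 *           y[i](0) = 2.0 * i;
 *       }
 *       RegressionDataset data = createLabeledDataFromRange(x, y);
 *
 *       LinearModel<> model;       // retrained on each leave-one-out fold
 *       LinearRegression trainer;  // trains the sub-models
 *       SquaredLoss<> loss;        // judges each held-out prediction
 *       LooError<LinearModel<> > loo(data, &model, &trainer, &loss);
 *       std::cout << "leave-one-out error: " << loo.eval() << std::endl;
 *   }
 */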