// -*- C++ -*-

// RepeatSplitter.h
//
// Copyright (C) 2003 Olivier Delalleau
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are met:
//
//  1. Redistributions of source code must retain the above copyright
//     notice, this list of conditions and the following disclaimer.
//
//  2. Redistributions in binary form must reproduce the above copyright
//     notice, this list of conditions and the following disclaimer in the
//     documentation and/or other materials provided with the distribution.
//
//  3. The name of the authors may not be used to endorse or promote
//     products derived from this software without specific prior written
//     permission.
//
// THIS SOFTWARE IS PROVIDED BY THE AUTHORS ``AS IS'' AND ANY EXPRESS OR
// IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
// OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN
// NO EVENT SHALL THE AUTHORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED
// TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
// PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
// LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
// NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
// SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
//
// This file is part of the PLearn library.
For more information on the PLearn 00033 // library, go to the PLearn Web site at www.plearn.org 00034 00035 /* ******************************************************* 00036 * $Id: RepeatSplitter.h,v 1.7 2004/04/01 18:04:35 tihocan Exp $ 00037 ******************************************************* */ 00038 00041 #ifndef RepeatSplitter_INC 00042 #define RepeatSplitter_INC 00043 00044 #include "Splitter.h" 00045 00046 namespace PLearn { 00047 using namespace std; 00048 00049 class RepeatSplitter: public Splitter 00050 { 00051 typedef Splitter inherited; 00052 00053 protected: 00054 00055 // ********************* 00056 // * protected options * 00057 // ********************* 00058 00061 TMat<int> indices; 00062 00064 int last_n; 00065 00066 public: 00067 00068 // ************************ 00069 // * public build options * 00070 // ************************ 00071 00072 bool do_not_shuffle_first; 00073 real force_proportion; 00074 int n; 00075 long seed; 00076 int shuffle; 00077 PP<Splitter> to_repeat; 00078 00079 // **************** 00080 // * Constructors * 00081 // **************** 00082 00083 RepeatSplitter(); 00084 00085 00086 // ****************** 00087 // * Object methods * 00088 // ****************** 00089 00091 virtual void setDataSet(VMat the_dataset); 00092 00093 private: 00095 // (Please implement in .cc) 00096 void build_(); 00097 00098 protected: 00100 // (Please implement in .cc) 00101 static void declareOptions(OptionList& ol); 00102 00103 public: 00104 // simply calls inherited::build() then build_() 00105 virtual void build(); 00106 00108 virtual void makeDeepCopyFromShallowCopy(map<const void*, void*>& copies); 00109 00111 PLEARN_DECLARE_OBJECT(RepeatSplitter); 00112 00113 00114 // ******************************** 00115 // * Splitter methods * 00116 // * (must be implemented in .cc) * 00117 // ******************************** 00118 00120 virtual int nsplits() const; 00121 00123 virtual int nSetsPerSplit() const; 00124 00126 virtual TVec<VMat> 
getSplit(int i=0); 00127 00128 }; 00129 00130 // Declares a few other classes and functions related to this class 00131 DECLARE_OBJECT_PTR(RepeatSplitter); 00132 00133 } // end of namespace PLearn 00134 00135 #endif