Skip to content
Snippets Groups Projects
Select Git revision
  • master
1 result

goDT.m

Blame
  • Andrew Cohen's avatar
    Andrew Cohen authored
    6467363a
    History
    goDT.m 3.37 KiB
    % 
    % /******************************************************************************
    % 
    % This program, "NCDM", the associated MATLAB scripts and all 
    % provided data, are copyright (C) 2013-2014 Andrew R. Cohen and Paul
    % M. B. Vitanyi.  All rights reserved.
    % 
    % This program uses bzip2 compressor as a static library.
    % See the file SRC\C\bz2static\LICENSE.txt for details on that software.
    % 
    % This software may be referenced as:
    % 
    % A.R.Cohen and P.M.B. Vitanyi, "Normalized Compression Distance of Multisets 
    % with Applications," IEEE Transactions on Pattern Analysis and Machine 
    % Intelligence. 2014. In Press. Also arXiv:1212.5711.  
    % 
    % Redistribution and use in source and binary forms, with or without
    % modification, are permitted provided that the following conditions
    % are met:
    % 
    % 1. Redistributions of source code must retain the above copyright
    %    notice, this list of conditions and the following disclaimer.
    % 
    % 2. The origin of this software must not be misrepresented; you must 
    %    not claim that you wrote the original software.  If you use this 
    %    software in a product, an acknowledgment in the product 
    %    documentation would be appreciated but is not required.
    % 
    % 3. Altered source versions must be plainly marked as such, and must
    %    not be misrepresented as being the original software.
    % 
    % 4. The name of the author may not be used to endorse or promote 
    %    products derived from this software without specific prior written 
    %    permission.
    % 
    % THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS
    % OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
    % WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
    % ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY
    % DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
    % DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE
    % GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
    % INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
    % WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
    % NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
    % SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
    % 
    % Andrew R. Cohen acohen@coe.drexel.edu
    % Paul M. B. Vitanyi Paul.Vitanyi@cwi.nl
    % NCDM  version 1.0 of 13 March 2013
    % NCDM  version 2.0 (release) November 2014
    % 
    % ******************************************************************************/
    
    % goDT: trains and evaluates ensembles of random-subspace discriminant classifiers
    
    function res=goDT(rgTrain,rgTest)
    % GODT  Train and score random-subspace discriminant ensembles.
    %
    %   res = goDT(rgTrain,rgTest) sweeps a small grid of ensemble settings,
    %   fits one ensemble per setting on rgTrain and scores it on rgTest.
    %
    %   Inputs
    %     rgTrain - numeric matrix; column 1 holds the class label, the
    %               remaining columns hold the predictors.
    %     rgTest  - numeric matrix with the same column layout as rgTrain.
    %
    %   Output
    %     res - one row per evaluated setting:
    %           [nLearn  npred  accuracy  cvAccuracy]
    %           nLearn     : number of learners in the ensemble (10, 12, 14)
    %           npred      : predictors sampled per learner ('NPredToSample')
    %           accuracy   : fraction of rgTest rows predicted correctly
    %           cvAccuracy : 1 - kfoldLoss of crossval(ens) on the training data
    %
    %   The predictor sweep is 3000:1000:5000, clamped to the number of
    %   predictor columns actually present (duplicates removed), because
    %   fitensemble rejects 'NPredToSample' values above that count.
    %
    %   Requires the Statistics (and Machine Learning) Toolbox.
    %   NOTE(review): fitensemble is superseded by fitcensemble in newer
    %   MATLAB releases; kept here for compatibility with the original code.
    
    trainData = rgTrain(:,2:end);
    trainLabel = rgTrain(:,1);
    
    testData = rgTest(:,2:end);
    testLabel = rgTest(:,1);
    
    nPredictors = size(trainData,2);
    if nPredictors < 1
        error('goDT:noPredictors', ...
            'rgTrain must contain a label column followed by at least one predictor column.');
    end
    if size(testData,2) ~= nPredictors
        error('goDT:columnMismatch', ...
            'rgTrain and rgTest must have the same number of columns (%d vs %d).', ...
            size(rgTrain,2), size(rgTest,2));
    end
    
    % Diagnostic: report the data dimensions explicitly instead of relying on
    % an unsuppressed expression.
    fprintf(1,'test data: %d x %d, train data: %d x %d\n',size(testData),size(trainData));
    
    nLearnList = [10 12 14];
    % Clamp the sweep so it never asks for more predictors than exist.
    npredList = unique(min(3000:1000:5000, nPredictors));
    
    % Preallocate the result table; 'row' tracks how many rows are filled.
    res = zeros(numel(nLearnList)*numel(npredList),4);
    row = 0;
    for nLearn = nLearnList
        for npred = npredList
            tic
            ens = fitensemble(trainData,trainLabel,'subspace',nLearn,'discriminant','NPredToSample',npred);
    
            % Hold-out accuracy on the test set.
            pred = predict(ens,testData);
            accuracy = mean(pred==testLabel);
    
            % Cross-validated accuracy on the training set (default partition).
            cvEns = crossval(ens);
            cvAccuracy = 1-kfoldLoss(cvEns);
    
            row = row+1;
            res(row,:) = [nLearn npred accuracy cvAccuracy];
    
            % Best cross-validated accuracy seen so far in the sweep.
            best = max(res(1:row,4));
            fprintf(1,'discriminant ensemble (%d,%d): accuracy=%.4f,cvAccuracy=%.4f best=%.4f\n',nLearn,npred,accuracy,cvAccuracy,best);
    
            toc
    
        end
    end