source: prdatasets/arcene.m @ 153

Last change on this file since 153 was 150, checked in by bduin, 5 years ago
File size: 1.4 KB
RevLine 
[142]1%ARCENE Cancer recognition based on mass spectra
2%PRTools UCI dataset import, 100+100+700 objects, 10000 features, 2 classes
3%
4%  [TRAIN,VALID,TEST] = ARCENE
5%   TRAIN_VALID  = ARCENE
6%
7%DESCRIPTION
8%This command downloads one of the UCI data sets, converts it into PRTools
9%format and stores it locally for future use. Consult the <a href="http://archive.ics.uci.edu/ml/datasets/Arcene">related website</a>
10%for further information. Please make the appropriate references in
11%publications that make use of this dataset.
12%
13%The training set (100 objects) and the validation set (100 objects) are
14%labeled. The test set (700 objects) is unlabeled. The order of the
15%original features (spectral bands) is randomized. Moreover, the set is
16%merged with a large number of random features. See the dataset <a href="http://archive.ics.uci.edu/ml/datasets/Arcene">website</a>.
17%
[150]18%SEE ALSO <a href="http://prtools.tudelft.nl/prtools/">PRTools Guide</a>, <a href="http://archive.ics.uci.edu/ml/">UCI Website</a>
[142]19%PRTOOLS, DATASETS
20
[150]21% Copyright: R.P.W. Duin
[142]22
function [a,b,c] = arcene

% Label files for the train / validation / test parts. The third entry is
% 0 instead of a file name; the test set is unlabeled.
% NOTE(review): the validation labels path has no 'ARCENE/' prefix, unlike
% the other files -- presumably this mirrors the layout of the UCI
% archive; verify before changing it.
labfiles = {'ARCENE/arcene_train.labels','arcene_valid.labels',0};

% Data files for the train / validation / test parts.
datfiles = {'ARCENE/arcene_train.data', ...
            'ARCENE/arcene_valid.data', ...
            'ARCENE/arcene_test.data'};

% use old call
% NOTE(review): the meaning of the positional arguments ([3,3,18], ' ',
% and the empty placeholders) is defined by pr_download_uci -- see there.
[a,b,c] = pr_download_uci('Arcene',datfiles,[],[],[3,3,18],[],[],' ',labfiles);

% Reset the label list of the third (test) dataset to empty.
c = setlablist(c,[]);

% With two or more outputs requested, the three sets are returned as is.
if nargout >= 2
  return
end

% Otherwise return training and validation sets stacked into one dataset.
a = setname([a;b],'Arcene Mass Spectra');
35
36
37
Note: See TracBrowser for help on using the repository browser.