-
Notifications
You must be signed in to change notification settings - Fork 4
/
Copy pathExp1_huge_dataset.m
82 lines (72 loc) · 3.08 KB
/
Exp1_huge_dataset.m
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
function res_mean=Test_huge_dataset(data_name)
addpath('./methods');
addpath('./utils');
rand('state', 0)
totally=tic();
%% Parameters ----------
options = parameters(data_name);
train_fraction=0.7;
labeled_fraction=0.1;
%% Load Data ----------
dataset_path=['./datasets/', data_name];
[y, X]=libsvmread(dataset_path);
if length(y)>200000
y=y(1:200000);
X=X(1:200000,:);
end
%% Data split ----------
global X_train y_train X_test y_test labeled_idx sample_idx K_ms K_ts K_mm K_tm K_ns K_ss L
all_idx=randperm(length(y), length(y));
test_idx=all_idx(1:ceil((1-train_fraction)*length(all_idx)));
X_test=X(test_idx,:);
y_test=y(test_idx);
train_idx=setdiff(all_idx,test_idx);
X_train=X(train_idx,:);
y_train=y(train_idx);
clear X;
clear all_idx;
clear train_idx;
clear test_idx;
%% Generating grapha Laplacian L and predefinition of kernel----------
L=construct_laplacian_graph(data_name, X_train, options.NN);
kernel=load_kernel(data_name, length(y), options.KernelParam);
times=5;
res_RLS=[];
res_LapRLS=[];
res_LapRLS_pcg=[];
res_nystrom=[];
res_nystrom_pcg=[];
for t=1:times
%% Preprocess ----------
train_size=length(y_train);
labeled_unsorted=randperm(train_size, ceil(labeled_fraction*train_size));
unlabeled_idx=setdiff(1:train_size, labeled_unsorted);
labeled_idx=setdiff(1:train_size, unlabeled_idx);
sample_idx=1:ceil(4*sqrt(train_size));
K_ns=kernel(X_train, 1:length(y_train), X_train, sample_idx, i, 'kns');
K_mm=kernel(X_train, labeled_idx, X_train, labeled_idx, i, 'kmm');
K_ms=K_ns(labeled_idx,:);
K_ss=K_ns(sample_idx,:);
K_ts=kernel(X_test, 1:length(y_test), X_train, sample_idx, i, 'kts');
K_tm=kernel(X_test, 1:length(y_test), X_train, labeled_idx, i, 'ktm');
vectors = struct('labeled_idx',labeled_idx, ...
'unlabeled_idx',unlabeled_idx, ...
'sample_idx',sample_idx,...
'y_train',y_train,...
'y_test',y_test);
result=zeros(5,4);
[result(1,1), result(1,2), result(1,3), result(1,4)] = Method_RLS(K_mm, K_tm, vectors, options);
[result(4,1), result(4,2), result(4,3), result(4,4)] = Method_LapRLS_Nystrom1(K_ns, K_ms, K_ss, K_ts, L, vectors, options);
[result(5,1), result(5,2), result(5,3), result(5,4)] = Method_LapRLS_Nystrom_PCG1(K_ns, K_ms, K_ss, K_ts, L, vectors, options);
res_RLS=[res_RLS;result(1,:)];
res_LapRLS=[res_LapRLS;result(2,:)];
res_LapRLS_pcg=[res_LapRLS_pcg;result(3,:)];
res_nystrom=[res_nystrom;result(4,:)];
res_nystrom_pcg=[res_nystrom_pcg;result(5,:)];
disp(result);
end
res_mean=[mean(res_RLS); mean(res_LapRLS); mean(res_LapRLS_pcg); mean(res_nystrom); mean(res_nystrom_pcg)];
save(['./result/',data_name], 'res_mean', 'res_RLS', 'res_LapRLS', 'res_LapRLS_pcg', 'res_nystrom', 'res_nystrom_pcg');
disp(['totally cost ', num2str(toc(totally))]);
disp(res_mean);
end