-
Notifications
You must be signed in to change notification settings - Fork 5
/
Copy pathcaffe_train_net.m
99 lines (80 loc) · 3.56 KB
/
caffe_train_net.m
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
%% Description
% The training wrapper for caffe
% [ best_accuracy, best_iter, stat ] = caffe_train_net( solver_filename, best_snapshot_prefix, gpu_mode, save_intermediate_best )
%
% Runs the solver in chunks of test_interval iterations until max_iter is
% reached. After every chunk the 'accuracy' and 'loss' blobs are read and,
% whenever the accuracy improves, the current net is saved as the new best
% snapshot.
%
% --- INPUTS
% solver_filename        = filename of the solver used
% best_snapshot_prefix   = prefix (with the full path) for the best snapshots
% gpu_mode               = gpu or cpu mode:
%                            0 = cpu
%                            1 = gpu
% save_intermediate_best = if true, keep every snapshot that improved on
%                          the previous best; if false, delete the previous
%                          best snapshot each time a better one is saved
%
% --- OUTPUTS
% best_accuracy = best accuracy
% best_iter     = iteration at which the best accuracy was observed
% stat          = other statistics, a struct with fields:
%                   accuracy           - vector of accuracies observed
%                   iterations         - iterations at which they were observed
%                   loss               - 'loss' blob of the training net per step
%                   loss_test          - 'loss' blob of the first test net per step
%                   best_snapshot_name - file name of the last best snapshot saved
%% Remarks:
% if you don't want to save intermediate results set max_iter property of
% the solver to some very high value
function [ best_accuracy, best_iter, stat ] = caffe_train_net( solver_filename, best_snapshot_prefix, gpu_mode, save_intermediate_best )
    %% Execution
    caffe.reset_all();
    if gpu_mode
        caffe.set_mode_gpu();
    else
        caffe.set_mode_cpu();
    end

    % Read the loop parameters from the solver definition. str2double is
    % used instead of str2num so that file content is never passed to eval.
    solver_props = caffe_read_solverprototxt(solver_filename);
    test_interval = str2double(solver_props.test_interval);
    max_iter = str2double(solver_props.max_iter);
    if ~(isfinite(test_interval) && test_interval > 0)
        % A zero/invalid interval would make solver.step() a no-op and the
        % training loop below would never terminate.
        error('caffe_train_net:invalidTestInterval', ...
            '%s : test_interval in %s must be a positive number', mfilename, solver_filename);
    end
    if ~isfinite(max_iter)
        error('caffe_train_net:invalidMaxIter', ...
            '%s : max_iter in %s must be a number', mfilename, solver_filename);
    end

    % Make sure the destination folder exists. The folder part is empty
    % when the prefix has no directory component (snapshots then go to the
    % current folder), and mkdir('') would fail.
    snapshot_folder = fileparts(best_snapshot_prefix);
    if ~isempty(snapshot_folder) && ~exist(snapshot_folder, 'dir')
        fprintf('%s : creating folder %s ... \n', mfilename, snapshot_folder);
        mkdir(snapshot_folder);
    end

    %Load the solver
    fprintf('%s : Loading solver = %s ... \n', mfilename, solver_filename);
    solver = caffe.Solver(solver_filename);

    %Init vars
    % The loop below advances test_interval iterations per step until
    % max_iter is reached, i.e. it runs ceil(max_iter / test_interval) times.
    steps_num = max(0, ceil(max_iter / test_interval));
    stat.accuracy = zeros([1, steps_num]);
    stat.iterations = zeros([1, steps_num]);
    stat.loss = zeros([1, steps_num]);
    stat.loss_test = zeros([1, steps_num]);
    stat.best_snapshot_name = '';
    % Initial value is only returned if the loop never runs; the first step
    % always replaces it because no snapshot has been saved yet.
    best_accuracy = solver.test_nets(1).blobs('accuracy').get_data();
    best_iter = 0;

    %Iterate
    step_i = 0;
    while solver.iter < max_iter
        step_i = step_i + 1;
        solver.step(test_interval);

        % NOTE(review): these blobs hold whatever the nets computed last;
        % whether the test net was evaluated at exactly this iteration
        % depends on the solver's own test schedule - confirm.
        stat.accuracy(step_i) = solver.test_nets(1).blobs('accuracy').get_data();
        stat.loss(step_i) = solver.net(1).blobs('loss').get_data();
        stat.loss_test(step_i) = solver.test_nets(1).blobs('loss').get_data();
        stat.iterations(step_i) = solver.iter;

        % Save on improvement, and unconditionally on the first step.
        if stat.accuracy(step_i) > best_accuracy || isempty(stat.best_snapshot_name)
            best_accuracy = stat.accuracy(step_i);
            best_iter = solver.iter;
            prev_best_snapshot_name = stat.best_snapshot_name;
            stat.best_snapshot_name = [best_snapshot_prefix sprintf('__iter_%06d__acc_%5.3f.caffemodel', best_iter, best_accuracy) ];
            solver.net.save(stat.best_snapshot_name);

            % Keep only the latest best snapshot unless asked otherwise.
            if ~save_intermediate_best && ~isempty(prev_best_snapshot_name) ...
                    && exist(prev_best_snapshot_name, 'file') == 2
                delete(prev_best_snapshot_name);
            end
        end

        fprintf('Iter = %d TRAIN: loss = %e VAL: Accuracy: cur = %f best: %f (iter: %d) \n', ...
            solver.iter, stat.loss(step_i), stat.accuracy(step_i), best_accuracy, best_iter );
    end
end