Multi_Matrix_Factorization/Train.m at master · 134579/Multi_Matrix_Factorization · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
% function [ converge, factors ] = Train( matrixes , R , iteration , descentRate , logfile )
function [ converge, factors ] = Train( matrixes , param )
%TRAIN Jointly factorize several matrices by batch gradient descent.
%
%% input parameters
% matrixes : array of matrix objects. Each element is read through the
%            members UIdx / VIdx (indices of the row / column factor it
%            shares), data (only its size is used here), weight (scalar
%            multiplier of its loss and gradient) and the methods
%            getLoss(U,V) and getGradient(U,V).
% param    : struct with the fields
%   iteration   : number of gradient-descent iterations to run
%   R           : size of factor (number of columns of every factor
%                 matrix), e.g. 10 20 100 500...
%   descentRate : initial step size, e.g. 0.001 0.0001; multiplied by 0.8
%                 whenever the total loss increased in the previous step
%   factorNorm  : array of regularizer objects, one per factor, providing
%                 getNorm(F) and getGradient(F)
%   normWeight  : regularization weight per factor; its length must equal
%                 the number of factors
%   logfile     : path prefix. The text log is appended to [logfile '.txt']
%                 and workspace checkpoints go to [logfile '<iter>.mat']
%
%% return value
% converge : 1 when all iterations were executed, 0 when the input was
%            rejected or the loss became NaN
% factors  : cell array of factor matrices; empty ({}) when the input was
%            rejected before the factors could be initialized
%
% NOTE: local variable names are kept stable on purpose, because the
% periodic save() below dumps the whole workspace into the checkpoint.

%% initialize
iteration=param.iteration;
R=param.R;
descentRate=param.descentRate;
factorNorm=param.factorNorm;
normWeight=param.normWeight;
logfile=param.logfile;

converge=0;
factors={};		% assigned up front so that every early return is well defined

fp=fopen(strcat(logfile,'.txt'),'a');
if fp==-1
	% fail here with a clear message instead of at the first fprintf(fp,...)
	error('Train:logOpenFailed','cannot open log file %s.txt',logfile);
end
nFactor=0;		% number of factors
nMatrix=length(matrixes);		% number of matrices

%% number of factors = largest factor index referenced by any matrix
for i=1:nMatrix
	if nFactor < matrixes(i).UIdx
		nFactor = matrixes(i).UIdx;
	end
	if nFactor < matrixes(i).VIdx
		nFactor = matrixes(i).VIdx;
	end
end

if nFactor~=length(normWeight)
	disp('regweight and factors must be same-lengthed');
	fclose(fp);
	return
end

%% initialize size of factors (-1 marks "not seen yet")
sizeFactor=-1*ones(nFactor,1);
for i=1:nMatrix
	[m, n]=size(matrixes(i).data);
	if sizeFactor(matrixes(i).UIdx)==-1
		sizeFactor(matrixes(i).UIdx)=m;
	else
		if sizeFactor(matrixes(i).UIdx)~=m
			disp('error!!same dimension in different matrix must be equal')
			fclose(fp);
			return
		end
	end
	if sizeFactor(matrixes(i).VIdx)==-1
		sizeFactor(matrixes(i).VIdx)=n;
	else
		if sizeFactor(matrixes(i).VIdx)~=n
			disp('error!!same dimension in different matrix must be equal')
			fclose(fp);
			return
		end
	end
end

%% initialize random factor matrix
factors = initilizeFactor(sizeFactor,R);

%% begin loop

times=0;
losshis=0; % loss history, one entry per iteration
while times < iteration
	times=times+1;

	% checkpoint the whole workspace every 20 iterations up to iteration 200
	if times<=200 && mod(times,20)==0
		save(strcat(logfile,int2str(times),'.mat'));
	end

	%% set descent rate
	if times>2
		% shrink the step when the previous update made the loss worse
		if losshis(times-1)>losshis(times-2)
			descentRate=descentRate*0.8;
		end
		% diverged: stop, leaving converge at 0
		if isnan(losshis(times-1))
			fclose(fp);
			return
		end
	end

	fprintf(1,'%d: rate:%f\n',times,descentRate);
	fprintf(fp,'%d: rate:%f\n',times,descentRate);

	%% calculate loss
	% weighted reconstruction loss of every matrix
	loss1=zeros(nMatrix,1);
	for i=1:nMatrix
		uindex=matrixes(i).UIdx;
		vindex=matrixes(i).VIdx;
		loss1(i)=matrixes(i).weight*matrixes(i).getLoss(factors{uindex},factors{vindex});
		fprintf(fp,'%d ',loss1(i));
		fprintf(1,'%d ',loss1(i));
	end

	% weighted regularization term of every factor
	loss2=zeros(nFactor,1);
	for i=1:nFactor
		loss2(i)=normWeight(i)*factorNorm(i).getNorm(factors{i});
		fprintf(fp,'%d ',loss2(i));
		fprintf(1,'%d ',loss2(i));
	end

	fprintf(fp,'\n');
	fprintf(1,'\n');
	losshis(times)=sum(loss1)+sum(loss2);

	%% allocate gradient space
	gradient=cell(nFactor,1);
	for i=1:nFactor
		gradient{i}=zeros(sizeFactor(i),R);
	end
	%% calculate gradient
	% a factor shared by several matrices accumulates all their gradients
	for i=1:nMatrix
		uindex=matrixes(i).UIdx;

		vindex=matrixes(i).VIdx;
		[gradientU, gradientV]=matrixes(i).getGradient(factors{uindex},factors{vindex});
		gradient{uindex}=gradient{uindex}+matrixes(i).weight*gradientU;
		fprintf(1,'%d:matrix %d gradU:%d\n',uindex,i,norm(matrixes(i).weight*gradientU));
		fprintf(fp,'%d:matrix %d gradU:%d\n',uindex,i,norm(matrixes(i).weight*gradientU));
		gradient{vindex}=gradient{vindex}+matrixes(i).weight*gradientV;
		fprintf(1,'%d:matrix %d gradV:%d\n',vindex,i,norm(matrixes(i).weight*gradientV));
		fprintf(fp,'%d:matrix %d gradV:%d\n',vindex,i,norm(matrixes(i).weight*gradientV));
	end

	% gradient of norm
	for i=1:nFactor
		grad=factorNorm(i).getGradient(factors{i});
		gradient{i}=gradient{i}+normWeight(i)*grad;

		fprintf(1,'factor %d grad:%d\n',i,norm(normWeight(i)*grad));
		fprintf(fp,'factor %d grad:%d\n',i,norm(normWeight(i)*grad));
	end
	%% update factor matrix
	for i=1:nFactor
		factors{i}=factors{i}-descentRate*gradient{i};
	end
end

fclose(fp);
converge=1;
end