Context Navigation

straux1.m @ 706

Revision 706, 14.6 kB (checked in by smidl, 15 years ago)
eol-native
Property svn:eol-style set to `native`

Rev	Line
function [strout, rgrsout, statistics] = straux1(L, d, nu, L0, d0, nu0, belief, nbest, max_nrep, lambda, order_k);
% STRAUX1 Structure estimation based on LD decomposition.
%
% This m/mex file is internally called by facstr, IT IS NOT TO BE CALLED
% BY USER!! Documentation given for reference.
%
% [strout, rgrsout, statistics] = straux1(L, d, nu, L0, d0, nu0, belief, nbest, max_nrep, lambda, order_k);
%
% Inputs:
% L        : actual LD decomposition based on data (matrix L)
% d        : actual LD decomposition based on data (diagonal d)
% nu       : actual data amount
% L0       : prior information (matrix L)
% d0       : prior information (diagonal d)
% nu0      : prior data amount
% belief   : user's belief on maximum structure items
%            (1 items must be present, 2 items are probably present,
%             4 items must not be present, 3 items are probably not present);
%            2 and 3 are treated the same. Row or column vector; default [].
% nbest    : how many "best" regressors are maintained
%            (default 2 when the second output is requested, otherwise 1)
% max_nrep : maximal number of random starts in the search for the best
%            structure (default 3)
% lambda   : stopping rule threshold (default 0.75)
% order_k  : order of k (default 2)
%
% Outputs:
% strout     : estimated structure of the regressor (richest is 2:length(d))
% rgrsout    : the maintained structures, sorted by descending loglikelihood
% statistics : search statistics (only filled when requested)
%
% Design     : L. Tesar
% Updated    : Feb-Apr 2003
% Project    : post-ProDaCTool
% References : (only local inline functions)
%
% Todo: in add_new, we need to implement structure comparison, instead of
%       loglikelihood comparison: ~any(logliks == new.loglik)

% randun seed stuff:
%global SEED
%SEED = randn('seed');

% Argument checking:
if nargin < 6, error('Incorrect number of input parameters in straux1'); end;
if nargin < 7, belief = []; end;   % Don't believe anybody.
if nargin < 8;
    if nargout >= 2;
        nbest = 2;
    else
        % If we don't need the second output it is better to avoid
        % calculating it at all, because it is very costly (5x slowdown).
        nbest = 1;
    end;
end;
if nargin <  9, max_nrep = 3;    end;
if nargin < 10, lambda   = 0.75; end;
if nargin < 11, order_k  = 2;    end;
% Arguments were just checked.

n_data = length(d);

% Force a row vector: the for-loops over belief_in/belief_out (here and in
% sestrremove) iterate over columns, so a column vector would be processed
% as one single multi-element item.
belief = belief(:)';

belief_out = find(belief==4)+1; % items we never put into the regressor
belief_in  = find(belief==1)+1; % items we always keep in the regressor

full.d0     = d0;
full.nu0    = nu0;
full.L0     = L0;
full.L      = L;
full.d      = d;
full.nu     = nu;
full.strL   = 1:n_data;  % Current structure of L and d
full.strRgr = 2:n_data;  % Structure elements currently inside regressor (after regressand)
full.strMis = [];        % Structure elements currently outside regressor (before regressand)
full.posit1 = 1;         % regressand position
full.nbits  = floor(log2(bitmax))-1; % number of bits available in double
full.bitstr = str_bitset(zeros(1,floor(n_data/full.nbits)+1),full.strRgr,full.nbits);
full.loglik = seloglik1(full);       % loglikelihood

% construct full and empty structure
full  = sestrremove(full,belief_out);
empty = sestrremove(full,setdiff(full.strRgr,belief_in));

% stopping rule calculation:
local_max = [];  % bit strings of the distinct local maxima found so far
muto      = 0;   % number of distinct local maxima found so far

% statistics:
cputime0 = cputime;
if nargout >= 3;
    mutos    = zeros(1,max_nrep+2);
    maxmutos = zeros(1,max_nrep+2);
end;
% ----------------------

% For stopping-rule calculation
%so = 2^(n_data -1-length(belief_in)- length(belief_out)); % do we use this ?
% ----------------------

all_str = 1:n_data;

global_best = full;

% MAIN LOOP is here.
for n_start = -1:max_nrep;
    to = n_start+2;  % 1-based index of the current start

    if n_start == -1;
        % start from the full structure
        last = full;
    elseif n_start == 0;
        % start from the empty structure
        last = empty;
    else
        % start from random structure
        last_str = find([ 0 floor(2*randun(1,n_data-1))]); % random, sorted vector of indexes
        last = sestrremove(full,setdiff(all_str,[1 last_str empty.strRgr]));
    end;

    % DEBUGging print:
    %fprintf('STRUCTURE generated in loop %2i was %s\n', n_start, strPrintstr(last));

    % The loop is repeated until likelihood stops growing (break condition
    % used at the end).
    while 1;

        % This structure is going to hold the best neighbour
        best = last;

        % Nesting by removing elements (enpoorment)
        for removed_item = setdiff(last.strRgr,belief_in);
            new = sestrremove(last,removed_item);
            if nbest > 1;
                global_best = add_new(global_best,new,nbest);
            end;
            if new.loglik > best.loglik;
                best = new;
            end;
        end;

        % Nesting by adding elements (enrichment)
        for added_item = setdiff(last.strMis,belief_out);
            new = sestrinsert(last,added_item);
            if nbest > 1;
                global_best = add_new(global_best,new,nbest);
            end;
            if new.loglik > best.loglik;
                best = new;
            end;
        end;

        % Break condition if likelihood does not change.
        if best.loglik <= last.loglik;
            break;
        else
            % Making best structure last structure.
            last = best;
        end;

    end;

    % DEBUGging print:
    %fprintf('STRUCTURE found (local maxima) in loop %2i was %s randun_seed=%11lu randun_counter=%4lu\n', n_start, strPrintstr(best), randn('seed'), RANDUN_COUNTER);

    % Collecting of the best structure in case we don't need the second output
    if nbest <= 1;
        if best.loglik > global_best.loglik;
            global_best = best;
        end;
    end;

    % uniqueness of the structure found
    if ~ismember(best.bitstr,local_max,'rows');
        local_max = [local_max ; best.bitstr];
        muto = muto + 1;
    end;

    % stopping rule threshold for this start
    maxmuto = (to-order_k-1)/lambda-to+1;

    % do statistics if necessary; recorded BEFORE the stopping test so that
    % the entry of the final start is not left at zero when we break.
    if nargout >= 3;
        mutos(to)    = muto;
        maxmutos(to) = maxmuto;
    end;

    % stopping rule (only applied to random starts):
    if to > 2;
        if maxmuto >= muto;
            % fprintf('*');
            break;
        end;
    end;
end;

% Aftermath: The best structure was in: global_best

% Updating loglikelihoods: we have to add the constant stuff
for f = 1:length(global_best);
    global_best(f).loglik = global_best(f).loglik + seloglik2(global_best(f));
end;

% Making first output parameter:
[lik, i] = max([global_best.loglik]);
best   = global_best(i);
strout = best.strRgr;

% Making the second output parameter (descending loglikelihood)
[lik, i] = sort([global_best.loglik]);
rgrsout  = global_best(i(length(i):-1:1));

if (nargout >= 3);
    statistics.allstrs         = 2^(n_data -1-length(belief_in) - length(belief_out));
    statistics.nrand           = to-2;
    statistics.unique          = muto;
    statistics.to              = to;
    statistics.cputime_seconds = cputime - cputime0;
    statistics.itemspeed       = statistics.to / statistics.cputime_seconds;
    statistics.muto            = muto;
    statistics.mutos           = mutos;
    statistics.maxmutos        = maxmutos;
end;

% randun seed stuff:
%randn('seed',SEED);

% --------------------- END of MAIN program --------------------
	220
	221	% This is needed for bitstr manipulations
	222	function out = str_bitset(in,ns,nbits)
	223	out = in;
	224	for n = ns;
	225	index = 1+floor((n-2)/nbits);
	226	bitindex = 1+rem(n-2,nbits);
	227	out(index) = bitset(out(index),bitindex);
	228	end;
	229	function out = str_bitres(in,ns,nbits)
	230	out = in;
	231	for n = ns;
	232	index = 1+floor((n-2)/nbits);
	233	bitindex = 1+rem(n-2,nbits);
	234	mask = bitset(0,bitindex);
	235	out(index) = bitxor(bitor(out(index),mask),mask);
	236	end;
	237
	238	function out = strPrintstr(in)
	239	out = '0';
	240	nbits = in.nbits;
	241	for f = 2:length(in.d0);
	242	index = 1+floor((f-2)/nbits);
	243	bitindex = 1+rem(f-2,nbits);
	244	if bitget(in.bitstr(index),bitindex);
	245	out(f) = '1';
	246	else;
	247	out(f) = '0';
	248	end;
	249	end;
	250
	251	function global_best_out = add_new(global_best,new,nbest)
	252	% Eventually add to global best, but do not go over nbest values
	253	% Also avoids repeating things, which makes this function awfully slow
	254	if length(global_best)>=nbest;
	255	logliks = [global_best.loglik];
	256	[loglik i] = min(logliks);
	257	global_best_out = global_best;
	258	if loglik<new.loglik;
	259	% if ~any(logliks == new.loglik);
	260	addit=1;
	261	for f = [global_best.bitstr];
	262	if f == new.bitstr;
	263	addit = 0;
	264	break;
	265	end;
	266	end;
	267	if addit;
	268	global_best_out(i) = new;
	269	% DEBUGging print:
	270	% fprintf('ADDED structure, add_new: %s, loglik=%g\n', strPrintstr(new), new.loglik);
	271	end;
	272	end;
	273	else;
	274	global_best_out = [global_best new];
	275	end;
	276
	277	function out = sestrremove(in,removed_elements);
	278	% Removes elements from regressor
	279	n_strL = length(in.strL);
	280	out = in;
	281	for f=removed_elements;
	282	posit1 = find(out.strL==1);
	283	positf = find(out.strL==f);
	284	for g=(positf-1):-1:posit1;
	285	% BEGIN: We are swapping g and g+1 NOW!!!!
	286	[out.L, out.d] = seswapudl(out.L, out.d, g);
	287	[out.L0, out.d0] = seswapudl(out.L0, out.d0, g);
	288	out.strL([g g+1]) = [out.strL(g+1) out.strL(g)];
	289	% END
	290	end;
	291	end;
	292	out.posit1 = find(out.strL==1);
	293	out.strRgr = out.strL((out.posit1+1):n_strL);
	294	out.strMis = out.strL(1:(out.posit1-1));
	295	out.bitstr = str_bitres(out.bitstr,removed_elements,out.nbits);
	296	out.loglik = seloglik1(out);
	297
	298	function out = sestrinsert(in,inserted_elements);
	299	% Moves elements into regressor
	300	n_strL = length(in.strL);
	301	out = in;
	302	for f=inserted_elements;
	303	posit1 = find(out.strL==1);
	304	positf = find(out.strL==f);
	305	for g=positf:(posit1-1);
	306	% BEGIN: We are swapping g and g+1 NOW!!!!
	307	[out.L, out.d] = seswapudl(out.L, out.d, g);
	308	[out.L0, out.d0] = seswapudl(out.L0, out.d0, g);
	309	out.strL([g g+1]) = [out.strL(g+1) out.strL(g)];
	310	% END
	311	end;
	312	end;
	313	out.posit1 = find(out.strL==1);
	314	out.strRgr = out.strL((out.posit1+1):n_strL);
	315	out.strMis = out.strL(1:(out.posit1-1));
	316	out.bitstr = str_bitset(out.bitstr,inserted_elements,out.nbits);
	317	out.loglik = seloglik1(out);
	318
	319	%
	320	% seloglik_real = seloglik1 + seloglik2
	321	%
	322
	323	function l = seloglik1(in)
	324	% This is the loglikelihood (non-constant part) - this should be used in
	325	% frequent computation
	326	len = length(in.d);
	327	p1 = in.posit1;
	328
	329	i1 = -0.5in.nu log(in.d (p1)) -0.5*sum(log(in.d ((p1+1):len)));
	330	i0 = -0.5in.nu0log(in.d0(p1)) -0.5*sum(log(in.d0((p1+1):len)));
	331	l = i1-i0;
	332
	333	% DEBUGGing print:
	334	% fprintf('SELOGLIK1: str=%s loglik=%g\n', strPrintstr(in), l);
	335
	336
	337	function l = seloglik2(in)
	338	% This is the loglikelihood (constant part) - this should be added to
	339	% everything at the end. It needs some computation, so it is useless to
	340	% make it for all the stuff
	341	logpi = log(pi);
	342
	343	i1 = gammaln(in.nu /2) - 0.5in.nu logpi;
	344	i0 = gammaln(in.nu0/2) - 0.5in.nu0logpi;
	345	l = i1-i0;
	346
	347
	348	function [Lout, dout] = seswapudl(L,d,i);
	349	%SESWAPUDL swaps information matrix in decomposition V=L^T diag(d) L
	350	%
	351	% [Lout, dout] = seswapudl(L,d,i);
	352	%
	353	% L : lower triangular matrix with 1's on diagonal of the decomposistion
	354	% d : diagonal vector of diagonal matrix of the decomposition
	355	% i : index of line to be swapped with the next one
	356	% Lout : output lower triangular matrix
	357	% dout : output diagional vector of diagonal matrix D
	358	%
	359	% Description:
	360	% Lout' * diag(dout) * Lout = P(i,i+1) * L' * diag(d) * L * P(i,i+1);
	361	%
	362	% Where permutation matrix P(i,j) permutates columns if applied from the
	363	% right and line if applied from the left.
	364	%
	365	% Note: naming:
	366	% se = structure estimation
	367	% lite = light, simple
	368	% udl = UDL, or more precisely, L'DL, also called as ld
	369	%
	370	% Design : L. Tesar
	371	% Updated : Feb 2003
	372	% Project : post-ProDaCTool
	373	% Reference: sedydr
	374
	375	j = i+1;
	376
	377	pomd = d(i);
	378	d(i) = d(j);
	379	d(j) = pomd;
	380
	381	pomL = L(i,:);
	382	L(i,:) = L(j,:);
	383	L(j,:) = pomL;
	384
	385	pomL = L(:,i);
	386	L(:,i) = L(:,j);
	387	L(:,j) = pomL;
	388
	389	% We must be working with LINES of matrix L !
	390
	391	r = L(i,:)';
	392	f = L(j,:)';
	393	Dr = d(i);
	394	Df = d(j);
	395
	396	[r, f, Dr, Df] = sedydr(r, f, Dr, Df, j);
	397
	398	r0 = r(i);
	399	Dr = Drr0r0;
	400	r = r/r0;
	401
	402	L(i,:) = r';
	403	L(j,:) = f';
	404	d(i) = Dr;
	405	d(j) = Df;
	406
	407	L(i,i) = 1;
	408	L(j,j) = 1;
	409
	410	Lout = L;
	411	dout = d;
	412
	413	function [rout, fout, Drout, Dfout, kr] = sedydr(r,f,Dr,Df,R,jl,jh);
	414	%SEDYDR dyadic reduction, performs transformation of sum of 2 dyads
	415	%
	416	% [rout, fout, Drout, Dfout, kr] = sedydr(r,f,Dr,Df,R,jl,jh);
	417	% [rout, fout, Drout, Dfout] = sedydr(r,f,Dr,Df,R);
	418	%
	419	% Description: dyadic reduction, performs transformation of sum of
	420	% 2 dyads rDrr'+ fDff' so that the element of r pointed by R is zeroed
	421	%
	422	% r : column vector of reduced dyad
	423	% f : column vector of reducing dyad
	424	% Dr : scalar with weight of reduced dyad
	425	% Df : scalar with weight of reducing dyad
	426	% R : scalar number giving 1 based index to the element of r,
	427	% which is to be reduced to
	428	% zero; the corresponding element of f is assumed to be 1.
	429	% jl : lower index of the range within which the dyads are
	430	% modified (can be omitted, then everything is updated)
	431	% jh : upper index of the range within which the dyads are
	432	% modified (can be omitted then everything is updated)
	433	% rout,fout,Drout,dfout : resulting two dyads
	434	% kr : coefficient used in the transformation of r
	435	% rnew = r + kr*f
	436	%
	437	% Description: dyadic reduction, performs transformation of sum of
	438	% 2 dyads rDrr'+ fDff' so that the element of r indexed by R is zeroed
	439	% Remark1: Constant mzero means machine zero and should be modified
	440	% according to the precision of particular machine
	441	% Remark2: jl and jh are, in fact, obsolete. It takes longer time to
	442	% compute them compared to plain version. The reason is that we
	443	% are doing vector operations in m-file. Other reason is that
	444	% we need to copy whole vector anyway. It can save half of time for
	445	% c-file, if you use it correctly. (please do tests)
	446	%
	447	% Note: naming:
	448	% se = structure estimation
	449	% dydr = dyadic reduction
	450	%
	451	% Original Fortran design: V. Peterka 17-7-89
	452	% Modified for c-language: probably R. Kulhavy
	453	% Modified for m-language: L. Tesar 2/2003
	454	% Updated: Feb 2003
	455	% Project: post-ProDaCTool
	456	% Reference: none
	457
	458	if nargin<6;
	459	update_whole=1;
	460	else
	461	update_whole=0;
	462	end;
	463
	464	mzero = 1e-32;
	465
	466	if Dr<mzero;
	467	Dr=0;
	468	end;
	469
	470	r0 = r(R);
	471	kD = Df;
	472	kr = r0 * Dr;
	473	Dfout = kD + r0 * kr;
	474
	475	if Dfout > mzero;
	476	kD = kD / Dfout;
	477	kr = kr / Dfout;
	478	else;
	479	kD = 1;
	480	kr = 0;
	481	end;
	482
	483	Drout = Dr * kD;
	484
	485	% Try to uncomment marked stuff (*) if in numerical problems, but I don't
	486	% think it can make any difference for normal healthy floating-point unit
	487	if update_whole;
	488	rout = r - r0*f;
	489	% rout(R) = 0; % * could be needed for some nonsense cases(or numeric reasons?), normally not
	490	fout = f + kr*rout;
	491	% fout(R) = 1; % * could be needed for some nonsense cases(or numeric reasons?), normally not
	492	else;
	493	rout = r;
	494	fout = f;
	495	rout(jl:jh) = r(jl:jh) - r0 * f(jl:jh);
	496	rout(R) = 0;
	497	fout(jl:jh) = f(jl:jh) + kr * rout(jl:jh);
	498	end;
	499
	500
	501
	502
	503
	504

Note: See TracBrowser for help on using the browser.

Context Navigation

root/library/utia_legacy/ticket_12/straux1.m @ 706

Download in other formats: