Context Navigation

source: trunk/sources/HeuristicLab.ExtLibs/HeuristicLab.ALGLIB/2.3.0/ALGLIB-2.3.0/logit.cs @ 2806

Visit:

Last change on this file since 2806 was 2806, checked in by gkronber, 15 years ago
Added plugin for new version of ALGLIB. #875 (Update ALGLIB sources)
File size: 60.8 KB

Rev	Line
[2806]	1	/*************************************************************************
	2	Copyright (c) 2008, Sergey Bochkanov (ALGLIB project).
	3
	4	>>> SOURCE LICENSE >>>
	5	This program is free software; you can redistribute it and/or modify
	6	it under the terms of the GNU General Public License as published by
	7	the Free Software Foundation (www.fsf.org); either version 2 of the
	8	License, or (at your option) any later version.
	9
	10	This program is distributed in the hope that it will be useful,
	11	but WITHOUT ANY WARRANTY; without even the implied warranty of
	12	MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
	13	GNU General Public License for more details.
	14
	15	A copy of the GNU General Public License is available at
	16	http://www.fsf.org/licensing/licenses
	17
	18	>>> END OF LICENSE >>>
	19	*************************************************************************/
	20
	21	using System;
	22
	23	namespace alglib
	24	{
	25	public class logit
	26	{
	//
	// Multinomial logit model. Everything is kept in one flat array W
	// (layout as written by mnltrainh/mnlpack and read by mnliexp):
	//   W[0]  - total length of W
	//   W[1]  - format version (logitvnum)
	//   W[2]  - NVars
	//   W[3]  - NClasses
	//   W[4]  - offset of the coefficient table
	// followed by (NVars+1)*(NClasses-1) coefficients and NClasses
	// scratch cells that mnliexp overwrites on every evaluation.
	//
	public struct logitmodel
	{
		public double[] w;
	}
	31
	32
	//
	// Persistent state of the mnlmcsrch line search, which is driven through
	// repeated calls (the caller re-evaluates the function between calls).
	// Field order is kept exactly as in the original declaration.
	//
	public struct logitmcstate
	{
		// brackt is cleared and stage1 is set when a new search starts;
		// once brackt is true, [stx, sty] is used as the step interval.
		public bool brackt, stage1;

		// Set to 1 at the start of a search.
		// NOTE(review): presumably a status code of the step-update routine - confirm.
		public int infoc;

		// Directional derivatives: dginit is g's at the base point and
		// dgtest = ftol*dginit; dgx/dgy belong to the interval endpoints.
		// NOTE(review): the *m variants look like "modified function" values - confirm.
		public double dg, dgm, dginit, dgtest, dgx, dgxm, dgy, dgym;

		// Function values: finit is F at the base point; fx/fy belong to the
		// interval endpoints stx/sty.
		public double finit, ftest1, fm, fx, fxm, fy, fym;

		// stx - best step so far, sty - other endpoint of the interval of
		// uncertainty; stmin/stmax - bounds for the current trial step.
		public double stx, sty, stmin, stmax;

		// width starts as stpmax-stpmin, width1 as width/0.5.
		public double width, width1;

		// Extrapolation factor (set to 4.0) used for stmax while not bracketed.
		public double xtrapf;
	}
	61
	62
	63	/*************************************************************************
	64	MNLReport structure contains information about training process:
	65	* NGrad - number of gradient calculations
	66	* NHess - number of Hessian calculations
	67	*************************************************************************/
	// Training report filled by mnltrainh: how many gradient (ngrad) and
	// Hessian (nhess) evaluations the optimizer performed.
	public struct mnlreport
	{
		public int ngrad, nhess;
	}
	73
	74
	75
	76
	//
	// Settings of the mnlmcsrch line search (see its header comment):
	//   xtol          - stop when the relative width of the interval of uncertainty is at most xtol
	//   ftol, gtol    - tolerances of the sufficient decrease / directional derivative conditions
	//   maxfev        - limit on function evaluations per search
	//   stpmin/stpmax - lower and upper bounds for the step
	//
	public const double xtol = 100*AP.Math.MachineEpsilon;
	public const double ftol = 1.0E-4;
	public const double gtol = 0.3;
	public const int maxfev = 20;
	public const double stpmin = 0.01;
	public const double stpmax = 100000.0;

	// Model format version; stored in W[1] and checked by every routine that reads a model.
	public const int logitvnum = 6;
	84
	85
	86	/*************************************************************************
	87	This subroutine trains logit model.
	88
	89	INPUT PARAMETERS:
	90	XY - training set, array[0..NPoints-1,0..NVars]
	91	First NVars columns store values of independent
	92	variables, next column stores number of class (from 0
	93	to NClasses-1) which dataset element belongs to. Fractional
	94	values are rounded to nearest integer.
	95	NPoints - training set size, NPoints>=1
	96	NVars - number of independent variables, NVars>=1
	97	NClasses - number of classes, NClasses>=2
	98
	99	OUTPUT PARAMETERS:
	100	Info - return code:
	101	* -2, if there is a point with class number
	102	outside of [0..NClasses-1].
	103	* -1, if incorrect parameters were passed
	104	(NPoints<NVars+2, NVars<1, NClasses<2).
	105	* 1, if task has been solved
	106	LM - model built
	107	Rep - training report
	108
	109	-- ALGLIB --
	110	Copyright 10.09.2008 by Bochkanov Sergey
	111	*************************************************************************/
	//
	// Trains a multinomial logit model.
	//
	//   xy       - training set, array[0..npoints-1, 0..nvars]; the last column is the
	//              class index (rounded to the nearest integer)
	//   npoints  - number of rows, must be >= nvars+2
	//   nvars    - number of independent variables, >= 1
	//   nclasses - number of classes, >= 2
	//   info     - out: -1 for bad sizes, -2 for a class index outside [0, nclasses-1],
	//              1 on success
	//   lm       - out: trained model (untouched when info < 0)
	//   rep      - out: gradient/Hessian evaluation counters
	//
	// Optimization runs in two stages: a fixed number of steepest-descent line
	// searches, then Newton steps (falling back to the gradient when the Cholesky
	// solve fails) until a Newton line search stops with code 2, 4 or 6.
	//
	public static void mnltrainh(ref double[,] xy,
		int npoints,
		int nvars,
		int nclasses,
		ref int info,
		ref logitmodel lm,
		ref mnlreport rep)
	{
		const double decay = 0.001;
		int i = 0;
		int j = 0;
		int k = 0;
		int ssize = 0;
		bool allsame = false;
		int offs = 0;
		int wdim = 0;
		double v = 0;
		double s = 0;
		mlpbase.multilayerperceptron network = new mlpbase.multilayerperceptron();
		int nin = 0;
		int nout = 0;
		int wcount = 0;
		double e = 0;
		double[] g = new double[0];
		double[,] h = new double[0,0];
		bool spd = false;
		double[] wdir = new double[0];
		double[] work = new double[0];
		logitmcstate mcstate = new logitmcstate();
		int mcinfo = 0;
		int solverinfo = 0;
		densesolver.densesolverreport solverrep = new densesolver.densesolverreport();

		//
		// Test for inputs
		//
		if( npoints<nvars+2 || nvars<1 || nclasses<2 )
		{
			info = -1;
			return;
		}
		for(i=0; i<=npoints-1; i++)
		{
			k = (int)Math.Round(xy[i,nvars]);
			if( k<0 || k>=nclasses )
			{
				info = -2;
				return;
			}
		}
		info = 1;

		//
		// Initialize report
		//
		rep.ngrad = 0;
		rep.nhess = 0;

		//
		// Allocate model: 5 header cells, coefficient table, NClasses scratch cells
		//
		offs = 5;
		wdim = (nvars+1)*(nclasses-1);
		ssize = offs+wdim+nclasses;
		lm.w = new double[ssize];
		lm.w[0] = ssize;
		lm.w[1] = logitvnum;
		lm.w[2] = nvars;
		lm.w[3] = nclasses;
		lm.w[4] = offs;

		//
		// Degenerate case: all outputs are equal.
		// The model is built directly: zero slopes and a huge constant term
		// which makes the only observed class certain.
		//
		allsame = true;
		for(i=1; i<=npoints-1; i++)
		{
			if( (int)Math.Round(xy[i,nvars])!=(int)Math.Round(xy[i-1,nvars]) )
			{
				allsame = false;
			}
		}
		if( allsame )
		{
			for(i=0; i<=wdim-1; i++)
			{
				lm.w[offs+i] = 0;
			}
			v = -(2*Math.Log(AP.Math.MinRealNumber));
			k = (int)Math.Round(xy[0,nvars]);
			if( k==nclasses-1 )
			{
				// The last class is the reference one: push all others down.
				for(i=0; i<=nclasses-2; i++)
				{
					lm.w[offs+i*(nvars+1)+nvars] = -v;
				}
			}
			else
			{
				for(i=0; i<=nclasses-2; i++)
				{
					if( i==k )
					{
						lm.w[offs+i*(nvars+1)+nvars] = +v;
					}
					else
					{
						lm.w[offs+i*(nvars+1)+nvars] = 0;
					}
				}
			}
			return;
		}

		//
		// General case.
		// Prepare task and network. Allocate space.
		//
		mlpbase.mlpcreatec0(nvars, nclasses, ref network);
		mlpbase.mlpinitpreprocessor(ref network, ref xy, npoints);
		mlpbase.mlpproperties(ref network, ref nin, ref nout, ref wcount);
		for(i=0; i<=wcount-1; i++)
		{
			network.weights[i] = (2*AP.Math.RandomReal()-1)/nvars;
		}
		g = new double[wcount];
		h = new double[wcount, wcount];
		wdir = new double[wcount];
		work = new double[wcount];

		//
		// First stage: optimize in gradient direction.
		//
		for(k=0; k<=wcount/3+10; k++)
		{
			mlpbase.mlpgradnbatch(ref network, ref xy, npoints, ref e, ref g);
			mnladddecay(network.weights, wcount, decay, ref e, g);
			rep.ngrad = rep.ngrad+1;
			for(i=0; i<=wcount-1; i++)
			{
				wdir[i] = -g[i];
			}
			mnllinesearch(ref network, ref xy, npoints, wcount, decay, ref e, ref g, ref wdir, ref work, ref mcstate, ref rep);
		}

		//
		// Second stage: use Hessian when we are close to the minimum
		//
		while( true )
		{

			//
			// Calculate and update E/G/H
			//
			mlpbase.mlphessiannbatch(ref network, ref xy, npoints, ref e, ref g, ref h);
			mnladddecay(network.weights, wcount, decay, ref e, g);
			for(k=0; k<=wcount-1; k++)
			{
				h[k,k] = h[k,k]+decay;
			}
			rep.nhess = rep.nhess+1;

			//
			// Select step direction.
			// NOTE: lower-triangle Cholesky is used because it is much faster
			//       than the upper-triangle version. As in the original code,
			//       only the solver's status decides whether H is treated as
			//       positive definite; the factorization's own result is not used.
			//
			trfac.spdmatrixcholesky(ref h, wcount, false);
			densesolver.spdmatrixcholeskysolve(ref h, wcount, false, ref g, ref solverinfo, ref solverrep, ref wdir);
			spd = solverinfo>0;
			if( spd )
			{
				// H is positive definite: step in Newton direction.
				for(i=0; i<=wcount-1; i++)
				{
					wdir[i] = -wdir[i];
				}
			}
			else
			{
				// H is indefinite: step in gradient direction.
				for(i=0; i<=wcount-1; i++)
				{
					wdir[i] = -g[i];
				}
			}

			//
			// Optimize in WDir direction; stop after a Newton step whose line
			// search ended with code 2, 4 or 6 (see mnlmcsrch INFO codes).
			//
			mcinfo = mnllinesearch(ref network, ref xy, npoints, wcount, decay, ref e, ref g, ref wdir, ref work, ref mcstate, ref rep);
			if( spd && (mcinfo==2 || mcinfo==4 || mcinfo==6) )
			{
				break;
			}
		}

		//
		// Convert from NN format to MNL format:
		// copy weights, undo the input standardization, flip the constant terms.
		//
		for(i=0; i<=wcount-1; i++)
		{
			lm.w[offs+i] = network.weights[i];
		}
		for(k=0; k<=nvars-1; k++)
		{
			s = network.columnsigmas[k];
			if( s==0 )
			{
				s = 1;
			}
			for(i=0; i<=nclasses-2; i++)
			{
				j = offs+(nvars+1)*i;
				v = lm.w[j+k];
				lm.w[j+k] = v/s;
				lm.w[j+nvars] = lm.w[j+nvars]+v*network.columnmeans[k]/s;
			}
		}
		for(k=0; k<=nclasses-2; k++)
		{
			j = offs+(nvars+1)*k+nvars;
			lm.w[j] = -lm.w[j];
		}
	}


	// Adds the weight-decay regularizer to an error value and its gradient:
	// e += 0.5*decay*(w,w) and g += decay*w over the first wcount weights.
	private static void mnladddecay(double[] weights,
		int wcount,
		double decay,
		ref double e,
		double[] g)
	{
		double v = 0.0;
		for(int i=0; i<=wcount-1; i++)
		{
			v += weights[i]*weights[i];
		}
		e = e+0.5*decay*v;
		for(int i=0; i<=wcount-1; i++)
		{
			g[i] = g[i]+decay*weights[i];
		}
	}


	// Normalizes wdir (its length becomes the initial step), then drives one
	// mnlmcsrch line search, re-evaluating the regularized error/gradient each
	// time the search asks for it. Returns the search's INFO code.
	private static int mnllinesearch(ref mlpbase.multilayerperceptron network,
		ref double[,] xy,
		int npoints,
		int wcount,
		double decay,
		ref double e,
		ref double[] g,
		ref double[] wdir,
		ref double[] work,
		ref logitmcstate mcstate,
		ref mnlreport rep)
	{
		double v = 0.0;
		double wstep = 0;
		int mcinfo = 0;
		int mcnfev = 0;
		int mcstage = 0;

		for(int i=0; i<=wcount-1; i++)
		{
			v += wdir[i]*wdir[i];
		}
		wstep = Math.Sqrt(v);
		v = 1/Math.Sqrt(v);
		for(int i=0; i<=wcount-1; i++)
		{
			wdir[i] = v*wdir[i];
		}
		mnlmcsrch(wcount, ref network.weights, ref e, ref g, ref wdir, ref wstep, ref mcinfo, ref mcnfev, ref work, ref mcstate, ref mcstage);
		while( mcstage!=0 )
		{
			mlpbase.mlpgradnbatch(ref network, ref xy, npoints, ref e, ref g);
			mnladddecay(network.weights, wcount, decay, ref e, g);
			rep.ngrad = rep.ngrad+1;
			mnlmcsrch(wcount, ref network.weights, ref e, ref g, ref wdir, ref wstep, ref mcinfo, ref mcnfev, ref work, ref mcstate, ref mcstage);
		}
		return mcinfo;
	}
	445
	446
	447	/*************************************************************************
	448	Processing
	449
	450	INPUT PARAMETERS:
	451	LM - logit model, passed by non-constant reference
	452	(some fields of structure are used as temporaries
	453	when calculating model output).
	454	X - input vector, array[0..NVars-1].
	455
	456	OUTPUT PARAMETERS:
	457	Y - result, array[0..NClasses-1]
	458	Vector of posterior probabilities for classification task.
	459	Subroutine does not allocate memory for this vector, it is
	460	responsibility of a caller to allocate it. Array must be
	461	at least [0..NClasses-1].
	462
	463	-- ALGLIB --
	464	Copyright 10.09.2008 by Bochkanov Sergey
	465	*************************************************************************/
	//
	// Evaluates the model on X and writes the posterior probabilities of all
	// classes into Y (Y must already have at least NClasses elements).
	// The scratch tail of lm.w is overwritten by mnliexp during the call.
	//
	public static void mnlprocess(ref logitmodel lm,
		ref double[] x,
		ref double[] y)
	{
		System.Diagnostics.Debug.Assert((double)(lm.w[1])==(double)(logitvnum), "MNLProcess: unexpected model version");
		int varcount = (int)Math.Round(lm.w[2]);
		int classcount = (int)Math.Round(lm.w[3]);
		int coefstart = (int)Math.Round(lm.w[4]);

		// Fill the scratch cells with the (shifted) exponents of the linear outputs.
		mnliexp(ref lm.w, ref x);

		// Normalize the exponents so that they sum to one.
		int expstart = coefstart+(varcount+1)*(classcount-1);
		double total = 0;
		for(int c=0; c<classcount; c++)
		{
			total = total+lm.w[expstart+c];
		}
		for(int c=0; c<classcount; c++)
		{
			y[c] = lm.w[expstart+c]/total;
		}
	}
	493
	494
	495	/*************************************************************************
	496	Unpacks coefficients of logit model. Logit model have form:
	497
	498	P(class=i) = S(i) / (S(0) + S(1) + ... +S(M-1))
	499	S(i) = Exp(A[i,0]*X[0] + ... + A[i,N-1]*X[N-1] + A[i,N]), when i<M-1
	500	S(M-1) = 1
	501
	502	INPUT PARAMETERS:
	503	LM - logit model in ALGLIB format
	504
	505	OUTPUT PARAMETERS:
	506	A - coefficients, array[0..NClasses-2,0..NVars]
	507	NVars - number of independent variables
	508	NClasses - number of classes
	509
	510	-- ALGLIB --
	511	Copyright 10.09.2008 by Bochkanov Sergey
	512	*************************************************************************/
	//
	// Extracts the coefficient table of a model into a freshly allocated
	// matrix A[0..NClasses-2, 0..NVars] and reports NVars/NClasses.
	//
	public static void mnlunpack(ref logitmodel lm,
		ref double[,] a,
		ref int nvars,
		ref int nclasses)
	{
		System.Diagnostics.Debug.Assert((double)(lm.w[1])==(double)(logitvnum), "MNLUnpack: unexpected model version");
		nvars = (int)Math.Round(lm.w[2]);
		nclasses = (int)Math.Round(lm.w[3]);
		int coefstart = (int)Math.Round(lm.w[4]);
		int rowlen = nvars+1;
		a = new double[nclasses-1, rowlen];
		for(int row=0; row<nclasses-1; row++)
		{
			// Row "row" of the table occupies rowlen consecutive cells of W.
			int src = coefstart+row*rowlen;
			for(int col=0; col<rowlen; col++)
			{
				a[row,col] = lm.w[src+col];
			}
		}
	}
	537
	538
	539	/*************************************************************************
	540	"Packs" coefficients and creates logit model in ALGLIB format (MNLUnpack
	541	reversed).
	542
	543	INPUT PARAMETERS:
	544	A - model (see MNLUnpack)
	545	NVars - number of independent variables
	546	NClasses - number of classes
	547
	548	OUTPUT PARAMETERS:
	549	LM - logit model.
	550
	551	-- ALGLIB --
	552	Copyright 10.09.2008 by Bochkanov Sergey
	553	*************************************************************************/
	//
	// Builds a model from a coefficient matrix (inverse of mnlunpack).
	//
	//   a        - coefficients, array[0..nclasses-2, 0..nvars]
	//   nvars    - number of independent variables
	//   nclasses - number of classes
	//   lm       - out: model whose W array is allocated and filled here
	//
	public static void mnlpack(ref double[,] a,
		int nvars,
		int nclasses,
		ref logitmodel lm)
	{
		int offs = 5;
		int rowlen = nvars+1;
		int ssize = offs+rowlen*(nclasses-1)+nclasses;
		int i = 0;
		int j = 0;

		// Header: length, version, sizes, offset of the coefficient table.
		lm.w = new double[ssize];
		lm.w[0] = ssize;
		lm.w[1] = logitvnum;
		lm.w[2] = nvars;
		lm.w[3] = nclasses;
		lm.w[4] = offs;

		// Coefficient rows are stored one after another, rowlen cells each.
		for(i=0; i<=nclasses-2; i++)
		{
			for(j=0; j<=nvars; j++)
			{
				lm.w[offs+i*rowlen+j] = a[i,j];
			}
		}
	}
	584
	585
	586	/*************************************************************************
	587	Copying of LogitModel structure
	588
	589	INPUT PARAMETERS:
	590	LM1 - original
	591
	592	OUTPUT PARAMETERS:
	593	LM2 - copy
	594
	595	-- ALGLIB --
	596	Copyright 15.03.2009 by Bochkanov Sergey
	597	*************************************************************************/
	//
	// Copies model lm1 into lm2. The number of copied cells is taken from
	// lm1.w[0]. The copy is assembled in a temporary array first, so calling
	// the routine with the same variable for both arguments keeps the model
	// intact instead of replacing it with zeros.
	//
	public static void mnlcopy(ref logitmodel lm1,
		ref logitmodel lm2)
	{
		int k = (int)Math.Round(lm1.w[0]);
		double[] copy = new double[k];
		for(int i=0; i<=k-1; i++)
		{
			copy[i] = lm1.w[i];
		}
		lm2.w = copy;
	}
	611
	612
	613	/*************************************************************************
	614	Serialization of LogitModel structure
	615
	616	INPUT PARAMETERS:
	617	LM - original
	618
	619	OUTPUT PARAMETERS:
	620	RA - array of real numbers which stores model,
	621	array[0..RLen-1]
	622	RLen - RA length
	623
	624	-- ALGLIB --
	625	Copyright 15.03.2009 by Bochkanov Sergey
	626	*************************************************************************/
	//
	// Serializes a model into a real array: RA[0] holds the format version,
	// RA[1..] holds a copy of lm.w (lm.w[0] cells). RLen receives RA's length.
	//
	public static void mnlserialize(ref logitmodel lm,
		ref double[] ra,
		ref int rlen)
	{
		int wlen = (int)Math.Round(lm.w[0]);
		rlen = wlen+1;
		ra = new double[rlen];
		ra[0] = logitvnum;
		for(int src=0; src<wlen; src++)
		{
			ra[src+1] = lm.w[src];
		}
	}
	643
	644
	645	/*************************************************************************
	646	Unserialization of LogitModel structure
	647
	648	INPUT PARAMETERS:
	649	RA - real array which stores model
	650
	651	OUTPUT PARAMETERS:
	652	LM - restored model
	653
	654	-- ALGLIB --
	655	Copyright 15.03.2009 by Bochkanov Sergey
	656	*************************************************************************/
	//
	// Restores a model from an array produced by mnlserialize:
	// RA[0] must be the format version, RA[1] is the length of the W array
	// (it is also W[0]), and RA[1..] is copied into lm.w.
	//
	public static void mnlunserialize(ref double[] ra,
		ref logitmodel lm)
	{
		System.Diagnostics.Debug.Assert((int)Math.Round(ra[0])==logitvnum, "MNLUnserialize: incorrect array!");
		int wlen = (int)Math.Round(ra[1]);
		lm.w = new double[wlen];
		for(int dst=0; dst<wlen; dst++)
		{
			lm.w[dst] = ra[dst+1];
		}
	}
	671
	672
	673	/*************************************************************************
	674	Average cross-entropy (in bits per element) on the test set
	675
	676	INPUT PARAMETERS:
	677	LM - logit model
	678	XY - test set
	679	NPoints - test set size
	680
	681	RESULT:
	682	CrossEntropy/(NPoints*ln(2)).
	683
	684	-- ALGLIB --
	685	Copyright 10.09.2008 by Bochkanov Sergey
	686	*************************************************************************/
	//
	// Average cross-entropy (in bits per element) of the model on a test set.
	//
	//   lm      - logit model
	//   xy      - test set; column NVars holds the class index
	//   npoints - test set size
	//
	// Returns CrossEntropy/(npoints*ln(2)). A non-positive predicted probability
	// of the true class is replaced by AP.Math.MinRealNumber before the logarithm.
	//
	public static double mnlavgce(ref logitmodel lm,
		ref double[,] xy,
		int npoints)
	{
		double result = 0;
		int nvars = 0;
		int nclasses = 0;
		int i = 0;
		int j = 0;
		int cls = 0;
		double p = 0;
		double[] workx = new double[0];
		double[] worky = new double[0];

		System.Diagnostics.Debug.Assert((double)(lm.w[1])==(double)(logitvnum), "MNLAvgCE: unexpected model version");
		nvars = (int)Math.Round(lm.w[2]);
		nclasses = (int)Math.Round(lm.w[3]);
		workx = new double[nvars];
		worky = new double[nclasses];
		result = 0;
		for(i=0; i<=npoints-1; i++)
		{
			cls = (int)Math.Round(xy[i,nvars]);
			System.Diagnostics.Debug.Assert(cls>=0 && cls<nclasses, "MNLAvgCE: incorrect class number!");

			//
			// Process
			//
			for(j=0; j<=nvars-1; j++)
			{
				workx[j] = xy[i,j];
			}
			mnlprocess(ref lm, ref workx, ref worky);

			//
			// Accumulate -ln(P(true class))
			//
			p = worky[cls];
			if( p>0 )
			{
				result = result-Math.Log(p);
			}
			else
			{
				result = result-Math.Log(AP.Math.MinRealNumber);
			}
		}
		result = result/(npoints*Math.Log(2));
		return result;
	}
	729
	730
	731	/*************************************************************************
	732	Relative classification error on the test set
	733
	734	INPUT PARAMETERS:
	735	LM - logit model
	736	XY - test set
	737	NPoints - test set size
	738
	739	RESULT:
	740	percent of incorrectly classified cases.
	741
	742	-- ALGLIB --
	743	Copyright 10.09.2008 by Bochkanov Sergey
	744	*************************************************************************/
	//
	// Relative classification error: the number of misclassified rows
	// (see mnlclserror) divided by npoints.
	//
	public static double mnlrelclserror(ref logitmodel lm,
		ref double[,] xy,
		int npoints)
	{
		int misclassified = mnlclserror(ref lm, ref xy, npoints);
		return (double)(misclassified)/(double)(npoints);
	}
	754
	755
	756	/*************************************************************************
	757	RMS error on the test set
	758
	759	INPUT PARAMETERS:
	760	LM - logit model
	761	XY - test set
	762	NPoints - test set size
	763
	764	RESULT:
	765	root mean square error (error when estimating posterior probabilities).
	766
	767	-- ALGLIB --
	768	Copyright 30.08.2008 by Bochkanov Sergey
	769	*************************************************************************/
	//
	// RMS error on the test set: runs mnlallerrors and returns its "rms" figure.
	//
	public static double mnlrmserror(ref logitmodel lm,
		ref double[,] xy,
		int npoints)
	{
		double relcls = 0, avgce = 0, rms = 0, avg = 0, avgrel = 0;

		System.Diagnostics.Debug.Assert((int)Math.Round(lm.w[1])==logitvnum, "MNLRMSError: Incorrect MNL version!");
		mnlallerrors(ref lm, ref xy, npoints, ref relcls, ref avgce, ref rms, ref avg, ref avgrel);
		return rms;
	}
	786
	787
	788	/*************************************************************************
	789	Average error on the test set
	790
	791	INPUT PARAMETERS:
	792	LM - logit model
	793	XY - test set
	794	NPoints - test set size
	795
	796	RESULT:
	797	average error (error when estimating posterior probabilities).
	798
	799	-- ALGLIB --
	800	Copyright 30.08.2008 by Bochkanov Sergey
	801	*************************************************************************/
	//
	// Average error on the test set: runs mnlallerrors and returns its "avg" figure.
	//
	//   lm      - logit model
	//   xy      - test set
	//   npoints - test set size
	//
	public static double mnlavgerror(ref logitmodel lm,
		ref double[,] xy,
		int npoints)
	{
		double result = 0;
		double relcls = 0;
		double avgce = 0;
		double rms = 0;
		double avg = 0;
		double avgrel = 0;

		// The message names this routine (it used to say "MNLRMSError").
		System.Diagnostics.Debug.Assert((int)Math.Round(lm.w[1])==logitvnum, "MNLAvgError: Incorrect MNL version!");
		mnlallerrors(ref lm, ref xy, npoints, ref relcls, ref avgce, ref rms, ref avg, ref avgrel);
		result = avg;
		return result;
	}
	818
	819
	820	/*************************************************************************
	821	Average relative error on the test set
	822
	823	INPUT PARAMETERS:
	824	LM - logit model
	825	XY - test set
	826	NPoints - test set size
	827
	828	RESULT:
	829	average relative error (error when estimating posterior probabilities).
	830
	831	-- ALGLIB --
	832	Copyright 30.08.2008 by Bochkanov Sergey
	833	*************************************************************************/
	//
	// Average relative error on the test set: runs mnlallerrors and returns
	// its "avgrel" figure.
	//
	//   lm    - logit model
	//   xy    - test set
	//   ssize - test set size (number of rows of xy to process)
	//
	public static double mnlavgrelerror(ref logitmodel lm,
		ref double[,] xy,
		int ssize)
	{
		double result = 0;
		double relcls = 0;
		double avgce = 0;
		double rms = 0;
		double avg = 0;
		double avgrel = 0;

		// The message names this routine (it used to say "MNLRMSError").
		System.Diagnostics.Debug.Assert((int)Math.Round(lm.w[1])==logitvnum, "MNLAvgRelError: Incorrect MNL version!");
		mnlallerrors(ref lm, ref xy, ssize, ref relcls, ref avgce, ref rms, ref avg, ref avgrel);
		result = avgrel;
		return result;
	}
	850
	851
	852	/*************************************************************************
	853	Classification error on test set = MNLRelClsError*NPoints
	854
	855	-- ALGLIB --
	856	Copyright 10.09.2008 by Bochkanov Sergey
	857	*************************************************************************/
	//
	// Counts the rows of the test set whose most probable class (first maximum
	// of the posterior vector) differs from the class stored in column NVars.
	//
	public static int mnlclserror(ref logitmodel lm,
		ref double[,] xy,
		int npoints)
	{
		System.Diagnostics.Debug.Assert((double)(lm.w[1])==(double)(logitvnum), "MNLClsError: unexpected model version");
		int varcount = (int)Math.Round(lm.w[2]);
		int classcount = (int)Math.Round(lm.w[3]);
		double[] features = new double[varcount];
		double[] posterior = new double[classcount];
		int errors = 0;

		for(int row=0; row<npoints; row++)
		{
			// Evaluate the model on this row.
			for(int col=0; col<varcount; col++)
			{
				features[col] = xy[row,col];
			}
			mnlprocess(ref lm, ref features, ref posterior);

			// Pick the class with the largest posterior probability;
			// ties keep the lowest index.
			int best = 0;
			for(int c=1; c<classcount; c++)
			{
				if( (double)(posterior[c])>(double)(posterior[best]) )
				{
					best = c;
				}
			}

			// Compare with the recorded class.
			if( best!=(int)Math.Round(xy[row,varcount]) )
			{
				errors = errors+1;
			}
		}
		return errors;
	}
	912
	913
	914	/*************************************************************************
	915	Internal subroutine. Places exponents of the anti-overflow shifted
	916	internal linear outputs into the service part of the W array.
	917	*************************************************************************/
	//
	// Internal subroutine. Computes the linear output of every class for input
	// X, shifts the outputs by their maximum (to avoid overflow) and stores the
	// exponents in the NClasses scratch cells at the end of W.
	//
	//   w - model array (see logitmodel); its scratch cells are overwritten
	//   x - input vector, at least NVars elements
	//
	private static void mnliexp(ref double[] w,
		ref double[] x)
	{
		int nvars = 0;
		int nclasses = 0;
		int offs = 0;
		int rowlen = 0;
		int row = 0;
		int i = 0;
		int j = 0;
		int i1 = 0;
		double v = 0;
		double mx = 0;

		System.Diagnostics.Debug.Assert((double)(w[1])==(double)(logitvnum), "LOGIT: unexpected model version");
		nvars = (int)Math.Round(w[2]);
		nclasses = (int)Math.Round(w[3]);
		offs = (int)Math.Round(w[4]);
		rowlen = nvars+1;
		i1 = offs+rowlen*(nclasses-1);

		// Linear outputs of classes 0..NClasses-2: dot product plus constant term.
		for(i=0; i<=nclasses-2; i++)
		{
			row = offs+i*rowlen;
			v = 0.0;
			for(j=0; j<=nvars-1; j++)
			{
				v += w[row+j]*x[j];
			}
			w[i1+i] = v+w[row+nvars];
		}

		// The last class is the reference one: its linear output is fixed at 0,
		// so the maximum found below is never negative.
		w[i1+nclasses-1] = 0;
		mx = 0;
		for(i=i1; i<=i1+nclasses-1; i++)
		{
			mx = Math.Max(mx, w[i]);
		}
		for(i=i1; i<=i1+nclasses-1; i++)
		{
			w[i] = Math.Exp(w[i]-mx);
		}
	}
	957
	958
	959	/*************************************************************************
	960	Calculation of all types of errors
	961
	962	-- ALGLIB --
	963	Copyright 30.08.2008 by Bochkanov Sergey
	964	*************************************************************************/
	//
	// Computes all error measures in one pass: every row is evaluated with
	// mnlprocess and fed to the bdss.dserr* accumulator; the five finished
	// figures are then read from its buffer in the order
	// relcls, avgce, rms, avg, avgrel.
	//
	private static void mnlallerrors(ref logitmodel lm,
		ref double[,] xy,
		int npoints,
		ref double relcls,
		ref double avgce,
		ref double rms,
		ref double avg,
		ref double avgrel)
	{
		System.Diagnostics.Debug.Assert((int)Math.Round(lm.w[1])==logitvnum, "MNL unit: Incorrect MNL version!");
		int varcount = (int)Math.Round(lm.w[2]);
		int classcount = (int)Math.Round(lm.w[3]);
		double[] features = new double[varcount];
		double[] posterior = new double[classcount];
		double[] desired = new double[1];
		double[] buf = new double[0];

		bdss.dserrallocate(classcount, ref buf);
		for(int row=0; row<npoints; row++)
		{
			for(int col=0; col<varcount; col++)
			{
				features[col] = xy[row,col];
			}
			mnlprocess(ref lm, ref features, ref posterior);

			// The accumulator receives the recorded class as a one-element vector.
			desired[0] = xy[row,varcount];
			bdss.dserraccumulate(ref buf, ref posterior, ref desired);
		}
		bdss.dserrfinish(ref buf);

		relcls = buf[0];
		avgce = buf[1];
		rms = buf[2];
		avg = buf[3];
		avgrel = buf[4];
	}
	1007
	1008
	1009	/*************************************************************************
	1010	THE PURPOSE OF MCSRCH IS TO FIND A STEP WHICH SATISFIES A SUFFICIENT
	1011	DECREASE CONDITION AND A CURVATURE CONDITION.
	1012
	1013	AT EACH STAGE THE SUBROUTINE UPDATES AN INTERVAL OF UNCERTAINTY WITH
	1014	ENDPOINTS STX AND STY. THE INTERVAL OF UNCERTAINTY IS INITIALLY CHOSEN
	1015	SO THAT IT CONTAINS A MINIMIZER OF THE MODIFIED FUNCTION
	1016
	1017	F(X+STP*S) - F(X) - FTOL*STP*(GRADF(X)'S).
	1018
	1019	IF A STEP IS OBTAINED FOR WHICH THE MODIFIED FUNCTION HAS A NONPOSITIVE
	1020	FUNCTION VALUE AND NONNEGATIVE DERIVATIVE, THEN THE INTERVAL OF
	1021	UNCERTAINTY IS CHOSEN SO THAT IT CONTAINS A MINIMIZER OF F(X+STP*S).
	1022
	1023	THE ALGORITHM IS DESIGNED TO FIND A STEP WHICH SATISFIES THE SUFFICIENT
	1024	DECREASE CONDITION
	1025
	1026	F(X+STP*S) .LE. F(X) + FTOL*STP*(GRADF(X)'S),
	1027
	1028	AND THE CURVATURE CONDITION
	1029
	1030	ABS(GRADF(X+STP*S)'S)) .LE. GTOL*ABS(GRADF(X)'S).
	1031
	1032	IF FTOL IS LESS THAN GTOL AND IF, FOR EXAMPLE, THE FUNCTION IS BOUNDED
	1033	BELOW, THEN THERE IS ALWAYS A STEP WHICH SATISFIES BOTH CONDITIONS.
	1034	IF NO STEP CAN BE FOUND WHICH SATISFIES BOTH CONDITIONS, THEN THE
	1035	ALGORITHM USUALLY STOPS WHEN ROUNDING ERRORS PREVENT FURTHER PROGRESS.
	1036	IN THIS CASE STP ONLY SATISFIES THE SUFFICIENT DECREASE CONDITION.
	1037
	1038	PARAMETERS DESCRIPTION
	1039
	1040	N IS A POSITIVE INTEGER INPUT VARIABLE SET TO THE NUMBER OF VARIABLES.
	1041
	1042	X IS AN ARRAY OF LENGTH N. ON INPUT IT MUST CONTAIN THE BASE POINT FOR
	1043	THE LINE SEARCH. ON OUTPUT IT CONTAINS X+STP*S.
	1044
	1045	F IS A VARIABLE. ON INPUT IT MUST CONTAIN THE VALUE OF F AT X. ON OUTPUT
	1046	IT CONTAINS THE VALUE OF F AT X + STP*S.
	1047
	1048	G IS AN ARRAY OF LENGTH N. ON INPUT IT MUST CONTAIN THE GRADIENT OF F AT X.
	1049	ON OUTPUT IT CONTAINS THE GRADIENT OF F AT X + STP*S.
	1050
	1051	S IS AN INPUT ARRAY OF LENGTH N WHICH SPECIFIES THE SEARCH DIRECTION.
	1052
	1053	STP IS A NONNEGATIVE VARIABLE. ON INPUT STP CONTAINS AN INITIAL ESTIMATE
	1054	OF A SATISFACTORY STEP. ON OUTPUT STP CONTAINS THE FINAL ESTIMATE.
	1055
	1056	FTOL AND GTOL ARE NONNEGATIVE INPUT VARIABLES. TERMINATION OCCURS WHEN THE
	1057	SUFFICIENT DECREASE CONDITION AND THE DIRECTIONAL DERIVATIVE CONDITION ARE
	1058	SATISFIED.
	1059
	1060	XTOL IS A NONNEGATIVE INPUT VARIABLE. TERMINATION OCCURS WHEN THE RELATIVE
	1061	WIDTH OF THE INTERVAL OF UNCERTAINTY IS AT MOST XTOL.
	1062
	1063	STPMIN AND STPMAX ARE NONNEGATIVE INPUT VARIABLES WHICH SPECIFY LOWER AND
	1064	UPPER BOUNDS FOR THE STEP.
	1065
	1066	MAXFEV IS A POSITIVE INTEGER INPUT VARIABLE. TERMINATION OCCURS WHEN THE
	1067	NUMBER OF CALLS TO FCN IS AT LEAST MAXFEV BY THE END OF AN ITERATION.
	1068
	1069	INFO IS AN INTEGER OUTPUT VARIABLE SET AS FOLLOWS:
	1070	INFO = 0 IMPROPER INPUT PARAMETERS.
	1071
	1072	INFO = 1 THE SUFFICIENT DECREASE CONDITION AND THE
	1073	DIRECTIONAL DERIVATIVE CONDITION HOLD.
	1074
	1075	INFO = 2 RELATIVE WIDTH OF THE INTERVAL OF UNCERTAINTY
	1076	IS AT MOST XTOL.
	1077
	1078	INFO = 3 NUMBER OF CALLS TO FCN HAS REACHED MAXFEV.
	1079
	1080	INFO = 4 THE STEP IS AT THE LOWER BOUND STPMIN.
	1081
	1082	INFO = 5 THE STEP IS AT THE UPPER BOUND STPMAX.
	1083
	1084	INFO = 6 ROUNDING ERRORS PREVENT FURTHER PROGRESS.
	1085	THERE MAY NOT BE A STEP WHICH SATISFIES THE
	1086	SUFFICIENT DECREASE AND CURVATURE CONDITIONS.
	1087	TOLERANCES MAY BE TOO SMALL.
	1088
	1089	NFEV IS AN INTEGER OUTPUT VARIABLE SET TO THE NUMBER OF CALLS TO FCN.
	1090
	1091	WA IS A WORK ARRAY OF LENGTH N.
	1092
	1093	ARGONNE NATIONAL LABORATORY. MINPACK PROJECT. JUNE 1983
	1094	JORGE J. MORE', DAVID J. THUENTE
	1095	*************************************************************************/
	//
	// One step of the More-Thuente line search along direction S, written as a
	// resumable state machine driven by STAGE:
	//   * call with STAGE = 0 to start a new search;
	//   * on return with STAGE = 4 the trial point WA + STP*S has been written
	//     to X; the caller is expected to store the function value and the
	//     gradient at X in F and G and call again, leaving STATE, WA, STP and
	//     NFEV untouched;
	//   * on return with STAGE = 0 the search is over and INFO holds the
	//     termination code (INFO = 0 means the input was rejected or S is not
	//     a descent direction).
	// The tolerances ftol, gtol, xtol, the step bounds stpmin, stpmax and the
	// evaluation limit maxfev are not parameters; they are read from members
	// declared outside this method.
	//
	// NOTE: the explicit (double) casts inside comparisons are retained on
	// purpose. An explicit cast rounds the operand to 64-bit precision, which
	// keeps tests such as stp==stpmax independent of wider intermediate
	// precision.
	//
	private static void mnlmcsrch(int n,
		ref double[] x,
		ref double f,
		ref double[] g,
		ref double[] s,
		ref double stp,
		ref int info,
		ref int nfev,
		ref double[] wa,
		ref logitmcstate state,
		ref int stage)
	{
		const double p5 = 0.5;
		const double p66 = 0.66;
		double v = 0;
		int i_ = 0;

		//
		// Extrapolation factor used while the minimum is not bracketed.
		//
		state.xtrapf = 4.0;

		//
		// Main cycle: each pass dispatches on STAGE.
		//
		while( true )
		{
			if( stage==0 )
			{

				//
				// Fresh search: go to initialization.
				//
				stage = 2;
				continue;
			}
			if( stage==2 )
			{
				state.infoc = 1;
				info = 0;

				//
				// Check the input parameters for errors.
				//
				if( n<=0 | (double)(stp)<=(double)(0) | (double)(ftol)<(double)(0) | (double)(gtol)<(double)(0) | (double)(xtol)<(double)(0) | (double)(stpmin)<(double)(0) | (double)(stpmax)<(double)(stpmin) | maxfev<=0 )
				{
					stage = 0;
					return;
				}

				//
				// Compute the initial gradient in the search direction
				// and check that S is a descent direction.
				//
				v = 0.0;
				for(i_=0; i_<=n-1;i_++)
				{
					v += g[i_]*s[i_];
				}
				state.dginit = v;
				if( (double)(state.dginit)>=(double)(0) )
				{
					stage = 0;
					return;
				}

				//
				// Initialize the search state and remember the starting
				// point in WA so that every trial point is WA + STP*S.
				//
				state.brackt = false;
				state.stage1 = true;
				nfev = 0;
				state.finit = f;
				state.dgtest = ftol*state.dginit;
				state.width = stpmax-stpmin;
				state.width1 = state.width/p5;
				for(i_=0; i_<=n-1;i_++)
				{
					wa[i_] = x[i_];
				}

				//
				// STX, FX, DGX hold the step, function value and directional
				// derivative at the best step found so far.
				// STY, FY, DGY hold the same quantities at the other endpoint
				// of the interval of uncertainty.
				// STP, F, DG hold them at the current step.
				//
				state.stx = 0;
				state.fx = state.finit;
				state.dgx = state.dginit;
				state.sty = 0;
				state.fy = state.finit;
				state.dgy = state.dginit;

				stage = 3;
				continue;
			}
			if( stage==3 )
			{

				//
				// Start of iteration.
				//
				// Set the minimum and maximum steps to correspond
				// to the present interval of uncertainty.
				//
				if( state.brackt )
				{
					if( (double)(state.stx)<(double)(state.sty) )
					{
						state.stmin = state.stx;
						state.stmax = state.sty;
					}
					else
					{
						state.stmin = state.sty;
						state.stmax = state.stx;
					}
				}
				else
				{
					state.stmin = state.stx;
					state.stmax = stp+state.xtrapf*(stp-state.stx);
				}

				//
				// Force the step to be within the bounds STPMAX and STPMIN.
				//
				if( (double)(stp)>(double)(stpmax) )
				{
					stp = stpmax;
				}
				if( (double)(stp)<(double)(stpmin) )
				{
					stp = stpmin;
				}

				//
				// If an unusual termination is to occur then let
				// STP be the lowest point obtained so far.
				//
				if( state.brackt & ((double)(stp)<=(double)(state.stmin) | (double)(stp)>=(double)(state.stmax)) | nfev>=maxfev-1 | state.infoc==0 | state.brackt & (double)(state.stmax-state.stmin)<=(double)(xtol*state.stmax) )
				{
					stp = state.stx;
				}

				//
				// Build the trial point X = WA + STP*S and hand control back
				// to the caller, who evaluates the function and gradient there.
				//
				for(i_=0; i_<=n-1;i_++)
				{
					x[i_] = wa[i_];
				}
				for(i_=0; i_<=n-1;i_++)
				{
					x[i_] = x[i_] + stp*s[i_];
				}

				stage = 4;
				return;
			}
			if( stage==4 )
			{

				//
				// Re-entry after an evaluation: F and G now describe the
				// trial point. Compute the directional derivative there.
				//
				info = 0;
				nfev = nfev+1;
				v = 0.0;
				for(i_=0; i_<=n-1;i_++)
				{
					v += g[i_]*s[i_];
				}
				state.dg = v;
				state.ftest1 = state.finit+stp*state.dgtest;

				//
				// Test for convergence. The checks are ordered so that a
				// later one overrides an earlier one; INFO = 1 (success)
				// therefore has the highest priority.
				//
				if( state.brackt & ((double)(stp)<=(double)(state.stmin) | (double)(stp)>=(double)(state.stmax)) | state.infoc==0 )
				{
					info = 6;
				}
				if( (double)(stp)==(double)(stpmax) & (double)(f)<=(double)(state.ftest1) & (double)(state.dg)<=(double)(state.dgtest) )
				{
					info = 5;
				}
				if( (double)(stp)==(double)(stpmin) & ((double)(f)>(double)(state.ftest1) | (double)(state.dg)>=(double)(state.dgtest)) )
				{
					info = 4;
				}
				if( nfev>=maxfev )
				{
					info = 3;
				}
				if( state.brackt & (double)(state.stmax-state.stmin)<=(double)(xtol*state.stmax) )
				{
					info = 2;
				}
				if( (double)(f)<=(double)(state.ftest1) & (double)(Math.Abs(state.dg))<=(double)(-(gtol*state.dginit)) )
				{
					info = 1;
				}

				//
				// Check for termination.
				//
				if( info!=0 )
				{
					stage = 0;
					return;
				}

				//
				// In the first stage we seek a step for which the modified
				// function has a nonpositive value and nonnegative derivative.
				//
				if( state.stage1 & (double)(f)<=(double)(state.ftest1) & (double)(state.dg)>=(double)(Math.Min(ftol, gtol)*state.dginit) )
				{
					state.stage1 = false;
				}

				//
				// A modified function is used to predict the step only if
				// we have not obtained a step for which the modified
				// function has a nonpositive function value and nonnegative
				// derivative, and if a lower function value has been
				// obtained but the decrease is not sufficient.
				//
				if( state.stage1 & (double)(f)<=(double)(state.fx) & (double)(f)>(double)(state.ftest1) )
				{

					//
					// Define the modified function and derivative values.
					//
					state.fm = f-stp*state.dgtest;
					state.fxm = state.fx-state.stx*state.dgtest;
					state.fym = state.fy-state.sty*state.dgtest;
					state.dgm = state.dg-state.dgtest;
					state.dgxm = state.dgx-state.dgtest;
					state.dgym = state.dgy-state.dgtest;

					//
					// Update the interval of uncertainty and compute the
					// new step using the modified values.
					//
					mnlmcstep(ref state.stx, ref state.fxm, ref state.dgxm, ref state.sty, ref state.fym, ref state.dgym, ref stp, state.fm, state.dgm, ref state.brackt, state.stmin, state.stmax, ref state.infoc);

					//
					// Map the modified values back to values of F.
					//
					state.fx = state.fxm+state.stx*state.dgtest;
					state.fy = state.fym+state.sty*state.dgtest;
					state.dgx = state.dgxm+state.dgtest;
					state.dgy = state.dgym+state.dgtest;
				}
				else
				{

					//
					// Update the interval of uncertainty and compute the
					// new step using the unmodified values.
					//
					mnlmcstep(ref state.stx, ref state.fx, ref state.dgx, ref state.sty, ref state.fy, ref state.dgy, ref stp, f, state.dg, ref state.brackt, state.stmin, state.stmax, ref state.infoc);
				}

				//
				// Force a sufficient decrease in the size of the
				// interval of uncertainty: bisect if it did not shrink enough.
				//
				if( state.brackt )
				{
					if( (double)(Math.Abs(state.sty-state.stx))>=(double)(p66*state.width1) )
					{
						stp = state.stx+p5*(state.sty-state.stx);
					}
					state.width1 = state.width;
					state.width = Math.Abs(state.sty-state.stx);
				}

				stage = 3;
				continue;
			}

			//
			// Any other STAGE value would previously spin in this loop
			// forever; report it instead.
			//
			throw new ArgumentOutOfRangeException("stage", "mnlmcsrch: stage must be 0, 2, 3 or 4");
		}
	}
	1396
	1397
	//
	// Computes a safeguarded trial step for the line search and updates the
	// interval of uncertainty.
	//
	//   stx, fx, dx   step, function value and derivative at the best step so
	//                 far; overwritten with the current point when the current
	//                 function value is not higher than fx.
	//   sty, fy, dy   the same quantities at the other endpoint of the interval.
	//   stp           on entry the current step, on exit the new trial step.
	//   fp, dp        function value and derivative at the current step.
	//   brackt        set to true once the minimum has been bracketed.
	//   stmin, stmax  bounds the new step is clamped to.
	//   info          on exit the number (1..4) of the case that produced the
	//                 step, or 0 when the input was rejected; in that case
	//                 nothing else is modified.
	//
	private static void mnlmcstep(ref double stx,
		ref double fx,
		ref double dx,
		ref double sty,
		ref double fy,
		ref double dy,
		ref double stp,
		double fp,
		double dp,
		ref bool brackt,
		double stmin,
		double stmax,
		ref int info)
	{
		bool bound = false;
		double gamma = 0;
		double p = 0;
		double q = 0;
		double r = 0;
		double s = 0;
		double sgnd = 0;
		double stpc = 0;
		double stpf = 0;
		double stpq = 0;
		double theta = 0;
		double ts = 0;

		info = 0;

		//
		// Check the input parameters for errors: a bracketed step must lie
		// strictly inside (stx, sty), the derivative at stx must point
		// towards stp, and the bounds must be ordered.
		//
		if( brackt & ((double)(stp)<=(double)(Math.Min(stx, sty)) | (double)(stp)>=(double)(Math.Max(stx, sty))) | (double)(dx*(stp-stx))>=(double)(0) | (double)(stmax)<(double)(stmin) )
		{
			return;
		}

		//
		// Determine if the derivatives have opposite sign.
		// dx cannot be zero here: the check above already rejected it.
		//
		sgnd = dp*(dx/Math.Abs(dx));

		if( (double)(fp)>(double)(fx) )
		{

			//
			// First case. A higher function value.
			// The minimum is bracketed. If the cubic step is closer
			// to stx than the quadratic step, the cubic step is taken,
			// else the average of the cubic and quadratic steps is taken.
			//
			info = 1;
			bound = true;
			theta = 3*(fx-fp)/(stp-stx)+dx+dp;
			s = Math.Max(Math.Abs(theta), Math.Max(Math.Abs(dx), Math.Abs(dp)));
			ts = theta/s;
			gamma = s*Math.Sqrt(ts*ts-dx/s*(dp/s));
			if( (double)(stp)<(double)(stx) )
			{
				gamma = -gamma;
			}
			p = gamma-dx+theta;
			q = gamma-dx+gamma+dp;
			r = p/q;
			stpc = stx+r*(stp-stx);
			stpq = stx+dx/((fx-fp)/(stp-stx)+dx)/2*(stp-stx);
			if( (double)(Math.Abs(stpc-stx))<(double)(Math.Abs(stpq-stx)) )
			{
				stpf = stpc;
			}
			else
			{
				stpf = stpc+(stpq-stpc)/2;
			}
			brackt = true;
		}
		else if( (double)(sgnd)<(double)(0) )
		{

			//
			// Second case. A lower function value and derivatives of
			// opposite sign. The minimum is bracketed. If the cubic
			// step is closer to stx than the quadratic (secant) step,
			// the cubic step is taken, else the quadratic step is taken.
			//
			info = 2;
			bound = false;
			theta = 3*(fx-fp)/(stp-stx)+dx+dp;
			s = Math.Max(Math.Abs(theta), Math.Max(Math.Abs(dx), Math.Abs(dp)));
			ts = theta/s;
			gamma = s*Math.Sqrt(ts*ts-dx/s*(dp/s));
			if( (double)(stp)>(double)(stx) )
			{
				gamma = -gamma;
			}
			p = gamma-dp+theta;
			q = gamma-dp+gamma+dx;
			r = p/q;
			stpc = stp+r*(stx-stp);
			stpq = stp+dp/(dp-dx)*(stx-stp);
			if( (double)(Math.Abs(stpc-stp))>(double)(Math.Abs(stpq-stp)) )
			{
				stpf = stpc;
			}
			else
			{
				stpf = stpq;
			}
			brackt = true;
		}
		else if( (double)(Math.Abs(dp))<(double)(Math.Abs(dx)) )
		{

			//
			// Third case. A lower function value, derivatives of the
			// same sign, and the magnitude of the derivative decreases.
			// The cubic step is only used if the cubic tends to infinity
			// in the direction of the step or if the minimum of the cubic
			// is beyond stp. Otherwise the cubic step is defined to be
			// either stmin or stmax. The quadratic (secant) step is also
			// computed and if the minimum is bracketed then the step
			// closest to stp is taken, else the step farthest away is taken.
			//
			info = 3;
			bound = true;
			theta = 3*(fx-fp)/(stp-stx)+dx+dp;
			s = Math.Max(Math.Abs(theta), Math.Max(Math.Abs(dx), Math.Abs(dp)));

			//
			// The case gamma = 0 only arises if the cubic does not tend
			// to infinity in the direction of the step.
			//
			ts = theta/s;
			gamma = s*Math.Sqrt(Math.Max(0.0, ts*ts-dx/s*(dp/s)));
			if( (double)(stp)>(double)(stx) )
			{
				gamma = -gamma;
			}
			p = gamma-dp+theta;
			q = gamma+(dx-dp)+gamma;
			r = p/q;
			if( (double)(r)<(double)(0) & (double)(gamma)!=(double)(0) )
			{
				stpc = stp+r*(stx-stp);
			}
			else
			{
				if( (double)(stp)>(double)(stx) )
				{
					stpc = stmax;
				}
				else
				{
					stpc = stmin;
				}
			}
			stpq = stp+dp/(dp-dx)*(stx-stp);
			if( brackt )
			{
				if( (double)(Math.Abs(stp-stpc))<(double)(Math.Abs(stp-stpq)) )
				{
					stpf = stpc;
				}
				else
				{
					stpf = stpq;
				}
			}
			else
			{
				if( (double)(Math.Abs(stp-stpc))>(double)(Math.Abs(stp-stpq)) )
				{
					stpf = stpc;
				}
				else
				{
					stpf = stpq;
				}
			}
		}
		else
		{

			//
			// Fourth case. A lower function value, derivatives of the
			// same sign, and the magnitude of the derivative does
			// not decrease. If the minimum is not bracketed, the step
			// is either stmin or stmax, else the cubic step is taken.
			//
			info = 4;
			bound = false;
			if( brackt )
			{
				theta = 3*(fp-fy)/(sty-stp)+dy+dp;
				s = Math.Max(Math.Abs(theta), Math.Max(Math.Abs(dy), Math.Abs(dp)));
				ts = theta/s;
				gamma = s*Math.Sqrt(ts*ts-dy/s*(dp/s));
				if( (double)(stp)>(double)(sty) )
				{
					gamma = -gamma;
				}
				p = gamma-dp+theta;
				q = gamma-dp+gamma+dy;
				r = p/q;
				stpc = stp+r*(sty-stp);
				stpf = stpc;
			}
			else
			{
				if( (double)(stp)>(double)(stx) )
				{
					stpf = stmax;
				}
				else
				{
					stpf = stmin;
				}
			}
		}

		//
		// Update the interval of uncertainty. This update does not
		// depend on the new step or the case analysis above.
		//
		if( (double)(fp)>(double)(fx) )
		{
			sty = stp;
			fy = fp;
			dy = dp;
		}
		else
		{
			if( (double)(sgnd)<(double)(0.0) )
			{
				sty = stx;
				fy = fx;
				dy = dx;
			}
			stx = stp;
			fx = fp;
			dx = dp;
		}

		//
		// Compute the new step and safeguard it: clamp to [stmin, stmax],
		// and for the "bound" cases keep it within 0.66 of the interval
		// measured from stx.
		//
		stpf = Math.Min(stmax, stpf);
		stpf = Math.Max(stmin, stpf);
		stp = stpf;
		if( brackt & bound )
		{
			if( (double)(sty)>(double)(stx) )
			{
				stp = Math.Min(stx+0.66*(sty-stx), stp);
			}
			else
			{
				stp = Math.Max(stx+0.66*(sty-stx), stp);
			}
		}
	}
	1659	}
	1660	}

Note: See TracBrowser for help on using the repository browser.

Download in other formats:

Update cookies preferences