using System;
using System.Linq;
using System.Runtime.InteropServices;
using HeuristicLab.Analysis;
using HeuristicLab.Common;
using HeuristicLab.Core;
using HeuristicLab.Data;
using HeuristicLab.Encodings.SymbolicExpressionTreeEncoding;
using HeuristicLab.Optimization;
using HeuristicLab.Parameters;
using HeuristicLab.Persistence.Default.CompositeSerializers.Storable;
using HeuristicLab.Problems.DataAnalysis;
using HeuristicLab.Problems.DataAnalysis.Symbolic;
using HeuristicLab.Problems.DataAnalysis.Symbolic.Regression;

namespace HeuristicLab.Algorithms.DataAnalysis.Glmnet {
  [Item("Elastic-net Linear Regression (LR)", "Linear regression with elastic-net regularization (wrapper for glmnet)")]
  [Creatable(CreatableAttribute.Categories.DataAnalysisRegression, Priority = 110)]
  [StorableClass]
  public sealed class ElasticNetLinearRegression : FixedDataAnalysisAlgorithm<IRegressionProblem> {
    private const string PenaltyParameterName = "Penalty";
    private const string LogLambdaParameterName = "Log10(Lambda)";
    #region parameters
    public IFixedValueParameter<DoubleValue> PenaltyParameter {
      get { return (IFixedValueParameter<DoubleValue>)Parameters[PenaltyParameterName]; }
    }
    public IValueParameter<DoubleValue> LogLambdaParameter {
      get { return (IValueParameter<DoubleValue>)Parameters[LogLambdaParameterName]; }
    }
    #endregion
    #region properties
    public double Penalty {
      get { return PenaltyParameter.Value.Value; }
      set { PenaltyParameter.Value.Value = value; }
    }
    public DoubleValue LogLambda {
      get { return LogLambdaParameter.Value; }
      set { LogLambdaParameter.Value = value; }
    }
    #endregion
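
    // Note: the Penalty parameter corresponds to glmnet's mixing parameter alpha. A sketch of the
    // standard glmnet formulation (not restated in the native docs below): for n training rows the
    // solver minimizes
    //   1/(2n) * sum_i (y_i - b0 - x_i'b)^2 + lambda * (alpha * ||b||_1 + (1 - alpha)/2 * ||b||_2^2),
    // so Penalty = 0.0 yields ridge regression and Penalty = 1.0 yields the lasso.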

    [StorableConstructor]
    private ElasticNetLinearRegression(bool deserializing) : base(deserializing) { }
    private ElasticNetLinearRegression(ElasticNetLinearRegression original, Cloner cloner)
      : base(original, cloner) {
    }
    public ElasticNetLinearRegression()
      : base() {
      Problem = new RegressionProblem();
      Parameters.Add(new FixedValueParameter<DoubleValue>(PenaltyParameterName, "Penalty factor for balancing between ridge (0.0) and lasso (1.0) regression", new DoubleValue(0.5)));
      Parameters.Add(new OptionalValueParameter<DoubleValue>(LogLambdaParameterName, "Optional: the value of log10(lambda) for which to calculate an elastic-net solution. LogLambda == null => calculate the whole path of all lambdas"));
    }

    [StorableHook(HookType.AfterDeserialization)]
    private void AfterDeserialization() { }

    public override IDeepCloneable Clone(Cloner cloner) {
      return new ElasticNetLinearRegression(this, cloner);
    }

    protected override void Run() {
      if (LogLambda == null) {
        CreateSolutionPath();
      } else {
        CreateSolution(LogLambda.Value);
      }
    }

    private void CreateSolution(double logLambda) {
      double trainNMSE;
      double testNMSE;
      var coeff = CreateElasticNetLinearRegressionSolution(Problem.ProblemData, Penalty, Math.Pow(10, logLambda), out trainNMSE, out testNMSE);
      Results.Add(new Result("NMSE (train)", new DoubleValue(trainNMSE)));
      Results.Add(new Result("NMSE (test)", new DoubleValue(testNMSE)));

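      // The linear model b0 + sum_i(w_i * x_i) is encoded as a symbolic expression tree
      // (root -> start -> addition node) with one weighted variable node per non-zero
      // coefficient and a constant node for the intercept, so the solution can be displayed
      // and evaluated by the existing symbolic regression infrastructure.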
      // copied from LR => TODO: reuse code (but skip coefficients = 0.0)
      ISymbolicExpressionTree tree = new SymbolicExpressionTree(new ProgramRootSymbol().CreateTreeNode());
      ISymbolicExpressionTreeNode startNode = new StartSymbol().CreateTreeNode();
      tree.Root.AddSubtree(startNode);
      ISymbolicExpressionTreeNode addition = new Addition().CreateTreeNode();
      startNode.AddSubtree(addition);

      int col = 0;
      foreach (string column in Problem.ProblemData.AllowedInputVariables) {
        if (!coeff[col].IsAlmost(0.0)) {
          VariableTreeNode vNode = (VariableTreeNode)new HeuristicLab.Problems.DataAnalysis.Symbolic.Variable().CreateTreeNode();
          vNode.VariableName = column;
          vNode.Weight = coeff[col];
          addition.AddSubtree(vNode);
        }
        col++;
      }

      if (!coeff[coeff.Length - 1].IsAlmost(0.0)) {
        ConstantTreeNode cNode = (ConstantTreeNode)new Constant().CreateTreeNode();
        cNode.Value = coeff[coeff.Length - 1];
        addition.AddSubtree(cNode);
      }

      SymbolicRegressionSolution solution = new SymbolicRegressionSolution(
        new SymbolicRegressionModel(Problem.ProblemData.TargetVariable, tree, new SymbolicDataAnalysisExpressionTreeInterpreter()),
        (IRegressionProblemData)Problem.ProblemData.Clone());
      solution.Model.Name = "Elastic-net Linear Regression Model";
      solution.Name = "Elastic-net Linear Regression Solution";

      Results.Add(new Result(solution.Name, solution.Description, solution));
    }

    private void CreateSolutionPath() {
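      // Produces two results: a data table with the (standardized) coefficient path of each
      // input variable over the lambda sequence, and a scatter plot of training and test NMSE
      // over log10(lambda).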
      double[] lambda;
      double[] trainNMSE;
      double[] testNMSE;
      double[,] coeff;
      double[] intercept;
      RunElasticNetLinearRegression(Problem.ProblemData, Penalty, out lambda, out trainNMSE, out testNMSE, out coeff, out intercept);

      var coeffTable = new DataTable("Coefficient Paths", "The paths of standardized coefficient values over different lambda values");
      var nLambdas = lambda.Length;
      var nCoeff = coeff.GetLength(1);
      var dataRows = new DataRow[nCoeff];
      var allowedVars = Problem.ProblemData.AllowedInputVariables.ToArray();
      for (int i = 0; i < nCoeff; i++) {
        var coeffId = allowedVars[i];
        // coefficients are returned on the original variable scales; multiplying by the variable's
        // standard deviation yields standardized coefficients that are comparable across variables
        double sigma = Problem.ProblemData.Dataset.GetDoubleValues(coeffId).StandardDeviation();
        var path = Enumerable.Range(0, nLambdas).Select(r => coeff[r, i] * sigma).ToArray();
        dataRows[i] = new DataRow(coeffId, coeffId, path);
        coeffTable.Rows.Add(dataRows[i]);
      }

      Results.Add(new Result(coeffTable.Name, coeffTable.Description, coeffTable));

      var nmsePlot = new ScatterPlot("NMSE", "Path of NMSE values over different lambda values");
      nmsePlot.VisualProperties.YAxisMaximumAuto = false;
      nmsePlot.VisualProperties.YAxisMinimumAuto = false;
      nmsePlot.VisualProperties.XAxisMaximumAuto = false;
      nmsePlot.VisualProperties.XAxisMinimumAuto = false;

      nmsePlot.VisualProperties.YAxisMinimumFixedValue = 0;
      nmsePlot.VisualProperties.YAxisMaximumFixedValue = 1.0;
      nmsePlot.VisualProperties.XAxisTitle = "Log10(Lambda)";
      nmsePlot.VisualProperties.YAxisTitle = "Normalized mean of squared errors (NMSE)";
      nmsePlot.Rows.Add(new ScatterPlotDataRow("NMSE (train)", "Path of NMSE values over different lambda values", lambda.Zip(trainNMSE, (l, v) => new Point2D<double>(Math.Log10(l), v))));
      nmsePlot.Rows.Add(new ScatterPlotDataRow("NMSE (test)", "Path of NMSE values over different lambda values", lambda.Zip(testNMSE, (l, v) => new Point2D<double>(Math.Log10(l), v))));
      if (lambda.Length > 2) {
        // lambda values are returned in decreasing order; the second entry is used as the upper
        // axis bound, presumably because glmnet reports an extrapolated ersatz value for the
        // first (largest) lambda of an automatically determined path
        nmsePlot.VisualProperties.XAxisMinimumFixedValue = Math.Floor(Math.Log10(lambda.Last()));
        nmsePlot.VisualProperties.XAxisMaximumFixedValue = Math.Ceiling(Math.Log10(lambda.Skip(1).First()));
      }
      nmsePlot.Rows["NMSE (train)"].VisualProperties.PointSize = 5;
      nmsePlot.Rows["NMSE (test)"].VisualProperties.PointSize = 5;

      Results.Add(new Result(nmsePlot.Name, nmsePlot.Description, nmsePlot));
    }

    public static double[] CreateElasticNetLinearRegressionSolution(IRegressionProblemData problemData, double penalty, double lambda,
      out double trainNMSE, out double testNMSE,
      double coeffLowerBound = double.NegativeInfinity, double coeffUpperBound = double.PositiveInfinity) {
      double[] trainNMSEs;
      double[] testNMSEs;
      // run for exactly one lambda
      var coeffs = CreateElasticNetLinearRegressionSolution(problemData, penalty, new double[] { lambda }, out trainNMSEs, out testNMSEs, coeffLowerBound, coeffUpperBound);
      trainNMSE = trainNMSEs[0];
      testNMSE = testNMSEs[0];
      return coeffs[0];
    }
    public static double[][] CreateElasticNetLinearRegressionSolution(IRegressionProblemData problemData, double penalty, double[] lambda,
      out double[] trainNMSEs, out double[] testNMSEs,
      double coeffLowerBound = double.NegativeInfinity, double coeffUpperBound = double.PositiveInfinity,
      int maxVars = -1) {
      // run for multiple user-supplied lambdas
      double[,] coeff;
      double[] intercept;
      RunElasticNetLinearRegression(problemData, penalty, lambda.Length, 1.0, lambda, out lambda, out trainNMSEs, out testNMSEs, out coeff, out intercept, coeffLowerBound, coeffUpperBound, maxVars);

      int nRows = intercept.Length;
      int nCols = coeff.GetLength(1) + 1;
      double[][] sols = new double[nRows][];
      for (int solIdx = 0; solIdx < nRows; solIdx++) {
        sols[solIdx] = new double[nCols];
        for (int cIdx = 0; cIdx < nCols - 1; cIdx++) {
          sols[solIdx][cIdx] = coeff[solIdx, cIdx];
        }
        sols[solIdx][nCols - 1] = intercept[solIdx];
      }
      return sols;
    }
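
    // Minimal usage sketch for the single-lambda overload (hypothetical variable names; assumes
    // an IRegressionProblemData instance pd is available):
    //   double trainNMSE, testNMSE;
    //   double[] coeff = CreateElasticNetLinearRegressionSolution(pd, penalty: 0.5, lambda: 0.1,
    //     out trainNMSE, out testNMSE);
    //   // one weight per allowed input variable; coeff[coeff.Length - 1] is the intercept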

    public static void RunElasticNetLinearRegression(IRegressionProblemData problemData, double penalty,
      out double[] lambda, out double[] trainNMSE, out double[] testNMSE, out double[,] coeff, out double[] intercept,
      double coeffLowerBound = double.NegativeInfinity, double coeffUpperBound = double.PositiveInfinity,
      int maxVars = -1
      ) {
      double[] userLambda = new double[0];
      // automatically determine lambda values (maximum 100 different lambda values)
      RunElasticNetLinearRegression(problemData, penalty, 100, 0.0, userLambda, out lambda, out trainNMSE, out testNMSE, out coeff, out intercept, coeffLowerBound, coeffUpperBound, maxVars);
    }

    /// <summary>
    /// Elastic net with squared-error-loss for dense predictor matrix, runs the full path of all lambdas
    /// </summary>
    /// <param name="problemData">Predictor matrix x and target vector y</param>
    /// <param name="penalty">Penalty for balance between ridge (0.0) and lasso (1.0) regression</param>
    /// <param name="nlam">Maximum number of lambda values (default 100)</param>
    /// <param name="flmin">User control of lambda values (&lt; 1.0 => minimum lambda = flmin * (largest lambda value), >= 1.0 => use supplied lambda values)</param>
    /// <param name="ulam">User-supplied lambda values</param>
    /// <param name="lambda">Output lambda values</param>
    /// <param name="trainNMSE">Vector of normalized mean of squared error (NMSE = Variance(res) / Variance(y)) values on the training set for each set of coefficients along the path</param>
    /// <param name="testNMSE">Vector of normalized mean of squared error (NMSE = Variance(res) / Variance(y)) values on the test set for each set of coefficients along the path</param>
    /// <param name="coeff">Vector of coefficient vectors for each solution along the path</param>
    /// <param name="intercept">Vector of intercepts for each solution along the path</param>
    /// <param name="coeffLowerBound">Optional lower bound for all coefficients</param>
    /// <param name="coeffUpperBound">Optional upper bound for all coefficients</param>
    /// <param name="maxVars">Maximum allowed number of variables in each solution along the path (-1 => all variables are allowed)</param>
    private static void RunElasticNetLinearRegression(IRegressionProblemData problemData, double penalty,
      int nlam, double flmin, double[] ulam, out double[] lambda, out double[] trainNMSE, out double[] testNMSE, out double[,] coeff, out double[] intercept,
      double coeffLowerBound = double.NegativeInfinity, double coeffUpperBound = double.PositiveInfinity,
      int maxVars = -1
      ) {
      if (penalty < 0.0 || penalty > 1.0) throw new ArgumentException("0 <= penalty <= 1", "penalty");

      double[,] trainX;
      double[,] testX;

      double[] trainY;
      double[] testY;
      int numTrainObs, numTestObs;
      int numVars;
      PrepareData(problemData, out trainX, out trainY, out numTrainObs, out testX, out testY, out numTestObs, out numVars);

      int ka = 1; // => covariance updating algorithm
      double parm = penalty;
      double[] w = Enumerable.Repeat(1.0, numTrainObs).ToArray(); // all observations have the same weight
      int[] jd = new int[1]; // jd(1) = 0 => use all variables (do not exclude any)
      double[] vp = Enumerable.Repeat(1.0, numVars).ToArray(); // all predictor variables are penalized equally (vp(j) = 0 would leave variable j unpenalized)
      double[,] cl = new double[numVars, 2]; // use the same bounds for all coefficients
      for (int i = 0; i < numVars; i++) {
        cl[i, 0] = coeffLowerBound;
        cl[i, 1] = coeffUpperBound;
      }

      int ne = maxVars > 0 ? maxVars : numVars;
      int nx = numVars;
      double thr = 1.0e-5; // default value as recommended in glmnet
      int isd = 1; // => regression on standardized predictor variables
      int intr = 1; // => do include intercept in model
      int maxit = 100000; // default value as recommended in glmnet
      // outputs
      int lmu = -1;
      double[,] ca;
      int[] ia;
      int[] nin;
      int nlp = -99;
      int jerr = -99;
      double[] trainR2;
      elnet(ka, parm, numTrainObs, numVars, trainX, trainY, w, jd, vp, cl, ne, nx, nlam, flmin, ulam, thr, isd, intr, maxit, out lmu, out intercept, out ca, out ia, out nin, out trainR2, out lambda, out nlp, out jerr);

      trainNMSE = new double[lmu]; // elnet reports R**2 on the training set; NMSE = 1 - R**2
      testNMSE = new double[lmu];
      coeff = new double[lmu, numVars];
      for (int solIdx = 0; solIdx < lmu; solIdx++) {
        trainNMSE[solIdx] = 1.0 - trainR2[solIdx];

        // extract the compressed coefficients of this solution
        int selectedNin = nin[solIdx];
        double[] coefficients;
        double[] selectedCa = new double[nx];
        for (int i = 0; i < nx; i++) {
          selectedCa[i] = ca[solIdx, i];
        }

        // apply to the test set to calculate test NMSE values for each lambda step
        double[] fn;
        modval(intercept[solIdx], selectedCa, ia, selectedNin, numTestObs, testX, out fn);
        OnlineCalculatorError error;
        var nmse = OnlineNormalizedMeanSquaredErrorCalculator.Calculate(testY, fn, out error);
        if (error != OnlineCalculatorError.None) nmse = double.MaxValue;
        testNMSE[solIdx] = nmse;

        // uncompress coefficients
        uncomp(numVars, selectedCa, ia, selectedNin, out coefficients);
        for (int i = 0; i < coefficients.Length; i++) {
          coeff[solIdx, i] = coefficients[i];
        }
      }
    }

    private static void PrepareData(IRegressionProblemData problemData, out double[,] trainX, out double[] trainY, out int numTrainObs,
      out double[,] testX, out double[] testY, out int numTestObs, out int numVars) {
      numVars = problemData.AllowedInputVariables.Count();
      numTrainObs = problemData.TrainingIndices.Count();
      numTestObs = problemData.TestIndices.Count();

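      // The native glmnet routines expect the predictor matrix x(no, ni) in Fortran column-major
      // order; a row-major C# [numVars, numObs] array has the same memory layout (the values of
      // each variable are contiguous), which is presumably why the matrices are built transposed here.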
      trainX = new double[numVars, numTrainObs];
      trainY = new double[numTrainObs];
      testX = new double[numVars, numTestObs];
      testY = new double[numTestObs];
      var ds = problemData.Dataset;
      var targetVar = problemData.TargetVariable;
      // train
      int rIdx = 0;
      foreach (var row in problemData.TrainingIndices) {
        int cIdx = 0;
        foreach (var var in problemData.AllowedInputVariables) {
          trainX[cIdx, rIdx] = ds.GetDoubleValue(var, row);
          cIdx++;
        }
        trainY[rIdx] = ds.GetDoubleValue(targetVar, row);
        rIdx++;
      }
      // test
      rIdx = 0;
      foreach (var row in problemData.TestIndices) {
        int cIdx = 0;
        foreach (var var in problemData.AllowedInputVariables) {
          testX[cIdx, rIdx] = ds.GetDoubleValue(var, row);
          cIdx++;
        }
        testY[rIdx] = ds.GetDoubleValue(targetVar, row);
        rIdx++;
      }
    }

    #region dllimport
    /// <summary>Wrapper for the elnet procedure in the glmnet library</summary>
    /// (see: https://cran.r-project.org/web/packages/glmnet/index.html)
    ///
    /// ka = algorithm flag
    ///      ka=1 => covariance updating algorithm
    ///      ka=2 => naive algorithm
    /// parm = penalty member index (0 <= parm <= 1)
    ///      = 0.0 => ridge
    ///      = 1.0 => lasso
    /// no = number of observations
    /// ni = number of predictor variables
    /// y(no) = response vector (overwritten)
    /// w(no) = observation weights (overwritten)
    /// jd(jd(1)+1) = predictor variable deletion flag
    ///      jd(1) = 0 => use all variables
    ///      jd(1) != 0 => do not use variables jd(2)...jd(jd(1)+1)
    /// vp(ni) = relative penalties for each predictor variable
    ///      vp(j) = 0 => jth variable unpenalized
    /// cl(2, ni) = interval constraints on coefficient values (overwritten)
    ///      cl(1, j) = lower bound for jth coefficient value (<= 0.0)
    ///      cl(2, j) = upper bound for jth coefficient value (>= 0.0)
    /// ne = maximum number of variables allowed to enter largest model
    ///      (stopping criterion)
    /// nx = maximum number of variables allowed to enter all models
    ///      along path (memory allocation, nx > ne)
    /// nlam = (maximum) number of lambda values
    /// flmin = user control of lambda values (>= 0)
    ///      flmin < 1.0 => minimum lambda = flmin * (largest lambda value)
    ///      flmin >= 1.0 => use supplied lambda values (see below)
    /// ulam(nlam) = user-supplied lambda values (ignored if flmin < 1.0)
    /// thr = convergence threshold for each lambda solution.
    ///      Iterations stop when the maximum reduction in the criterion value
    ///      as a result of each parameter update over a single pass
    ///      is less than thr times the null criterion value.
    ///      (suggested value, thr = 1.0e-5)
    /// isd = predictor variable standardization flag:
    ///      isd = 0 => regression on original predictor variables
    ///      isd = 1 => regression on standardized predictor variables
    ///      Note: output solutions always reference original
    ///      variables locations and scales.
    /// intr = intercept flag
    ///      intr = 0 / 1 => don't/do include intercept in model
    /// maxit = maximum allowed number of passes over the data for all lambda
    ///      values (suggested value, maxit = 100000)
    ///
    /// output:
    ///
    /// lmu = actual number of lambda values (solutions)
    /// a0(lmu) = intercept values for each solution
    /// ca(nx, lmu) = compressed coefficient values for each solution
    /// ia(nx) = pointers to compressed coefficients
    /// nin(lmu) = number of compressed coefficients for each solution
    /// rsq(lmu) = R**2 values for each solution
    /// alm(lmu) = lambda values corresponding to each solution
    /// nlp = actual number of passes over the data for all lambda values
    /// jerr = error flag:
    ///      jerr = 0 => no error
    ///      jerr > 0 => fatal error - no output returned
    ///           jerr < 7777 => memory allocation error
    ///           jerr = 7777 => all used predictors have zero variance
    ///           jerr = 10000 => maxval(vp) <= 0.0
    ///      jerr < 0 => non-fatal error - partial output:
    ///           solutions for larger lambdas (1:(k-1)) returned.
    ///           jerr = -k => convergence for kth lambda value not reached
    ///              after maxit (see above) iterations.
    ///           jerr = -10000 - k => number of non-zero coefficients along path
    ///              exceeds nx (see above) at kth lambda value.
    ///
    private static void elnet(
      int ka,
      double parm,
      int no,
      int ni,
      double[,] x,
      double[] y,
      double[] w,
      int[] jd,
      double[] vp,
      double[,] cl,
      int ne,
      int nx,
      int nlam,
      double flmin,
      double[] ulam,
      double thr,
      int isd,
      int intr,
      int maxit,
      // outputs
      out int lmu,
      out double[] a0,
      out double[,] ca,
      out int[] ia,
      out int[] nin,
      out double[] rsq,
      out double[] alm,
      out int nlp,
      out int jerr
      ) {
      // initialize output values and allocate arrays big enough
      a0 = new double[nlam];
      ca = new double[nlam, nx];
      ia = new int[nx];
      nin = new int[nlam];
      rsq = new double[nlam];
      alm = new double[nlam];
      nlp = -1;
      jerr = -1;
      lmu = -1;

      // load correct version of native dll based on process (x86/x64)
      if (Environment.Is64BitProcess) {
        elnet_x64(ref ka, ref parm, ref no, ref ni, x, y, w, jd, vp, cl, ref ne, ref nx, ref nlam, ref flmin, ulam, ref thr, ref isd, ref intr, ref maxit, ref lmu, a0, ca, ia, nin, rsq, alm, ref nlp, ref jerr);
      } else {
        elnet_x86(ref ka, ref parm, ref no, ref ni, x, y, w, jd, vp, cl, ref ne, ref nx, ref nlam, ref flmin, ulam, ref thr, ref isd, ref intr, ref maxit, ref lmu, a0, ca, ia, nin, rsq, alm, ref nlp, ref jerr);
      }
      // see the documentation of the jerr error flag above
      if (jerr != 0) {
        if (jerr > 0 && jerr < 7777) throw new InvalidOperationException("glmnet: memory allocation error");
        else if (jerr == 7777) throw new InvalidOperationException("glmnet: all used predictors have zero variance");
        else if (jerr == 10000) throw new InvalidOperationException("glmnet: maxval(vp) <= 0.0");
        else if (jerr < 0 && jerr > -10000) throw new InvalidOperationException(string.Format("glmnet: convergence for {0}th lambda value not reached after maxit iterations", -jerr));
        else if (jerr <= -10000) throw new InvalidOperationException(string.Format("glmnet: number of non-zero coefficients along path exceeds number of maximally allowed variables (nx) at {0}th lambda value", -jerr - 10000));
        else throw new InvalidOperationException(string.Format("glmnet: error {0}", jerr));
      }

      // resize arrays to the capacity that is actually necessary for the results
      // (the two-dimensional array ca cannot be resized; callers only read the first lmu rows)
      Array.Resize(ref a0, lmu);
      Array.Resize(ref nin, lmu);
      Array.Resize(ref rsq, lmu);
      Array.Resize(ref alm, lmu);
    }

    [DllImport("glmnet-x86.dll", EntryPoint = "elnet_", CallingConvention = CallingConvention.Cdecl)]
    private static extern void elnet_x86(
      ref int ka,
      ref double parm,
      ref int no,
      ref int ni,
      double[,] x,
      double[] y,
      double[] w,
      int[] jd,
      double[] vp,
      double[,] cl,
      ref int ne,
      ref int nx,
      ref int nlam,
      ref double flmin,
      double[] ulam,
      ref double thr,
      ref int isd,
      ref int intr,
      ref int maxit,
      // outputs:
      ref int lmu,
      [Out] double[] a0,
      [Out] double[,] ca,
      [Out] int[] ia,
      [Out] int[] nin,
      [Out] double[] rsq,
      [Out] double[] alm,
      ref int nlp,
      ref int jerr
      );
    [DllImport("glmnet-x64.dll", EntryPoint = "elnet_", CallingConvention = CallingConvention.Cdecl)]
    private static extern void elnet_x64(
      ref int ka,
      ref double parm,
      ref int no,
      ref int ni,
      double[,] x,
      double[] y,
      double[] w,
      int[] jd,
      double[] vp,
      double[,] cl,
      ref int ne,
      ref int nx,
      ref int nlam,
      ref double flmin,
      double[] ulam,
      ref double thr,
      ref int isd,
      ref int intr,
      ref int maxit,
      // outputs:
      ref int lmu,
      [Out] double[] a0,
      [Out] double[,] ca,
      [Out] int[] ia,
      [Out] int[] nin,
      [Out] double[] rsq,
      [Out] double[] alm,
      ref int nlp,
      ref int jerr
      );

    /// <summary>Wrapper for uncompressing the coefficient vector of a particular solution in glmnet</summary>
    /// (see: https://cran.r-project.org/web/packages/glmnet/index.html)
    ///
    /// call uncomp(ni, ca, ia, nin, a)
    ///
    /// input:
    ///
    /// ni = total number of predictor variables
    /// ca(nx) = compressed coefficient values for the solution
    /// ia(nx) = pointers to compressed coefficients
    /// nin = number of compressed coefficients for the solution
    ///
    /// output:
    ///
    /// a(ni) = uncompressed coefficient vector
    ///      referencing original variables
    ///
    private static void uncomp(int numVars, double[] ca, int[] ia, int nin, out double[] a) {
      a = new double[numVars];
      // load correct version of native dll based on process (x86/x64)
      if (Environment.Is64BitProcess) {
        uncomp_x64(ref numVars, ca, ia, ref nin, a);
      } else {
        uncomp_x86(ref numVars, ca, ia, ref nin, a);
      }
    }
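
    // Sketch of the compressed format (following the glmnet documentation above, with 1-based
    // Fortran indices in ia): for k = 1..nin, a(ia(k)) = ca(k) and all other entries of a are zero,
    // i.e. ia maps each stored coefficient back to its original variable index.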

    [DllImport("glmnet-x86.dll", EntryPoint = "uncomp_", CallingConvention = CallingConvention.Cdecl)]
    private static extern void uncomp_x86(ref int numVars, double[] ca, int[] ia, ref int nin, [Out] double[] a);
    [DllImport("glmnet-x64.dll", EntryPoint = "uncomp_", CallingConvention = CallingConvention.Cdecl)]
    private static extern void uncomp_x64(ref int numVars, double[] ca, int[] ia, ref int nin, [Out] double[] a);

    private static void modval(double a0, double[] ca, int[] ia, int nin, int numObs, double[,] x, out double[] fn) {
      fn = new double[numObs];
      // load correct version of native dll based on process (x86/x64)
      if (Environment.Is64BitProcess) {
        modval_x64(ref a0, ca, ia, ref nin, ref numObs, x, fn);
      } else {
        modval_x86(ref a0, ca, ia, ref nin, ref numObs, x, fn);
      }
    }
    // evaluate linear model from compressed coefficients and
    // uncompressed predictor matrix:
    //
    // call modval(a0, ca, ia, nin, n, x, f)
    //
    // input:
    //
    // a0 = intercept
    // ca(nx) = compressed coefficient values for a solution
    // ia(nx) = pointers to compressed coefficients
    // nin = number of compressed coefficients for solution
    // n = number of predictor vectors (observations)
    // x(n, ni) = full (uncompressed) predictor matrix
    //
    // output:
    //
    // f(n) = model predictions, i.e. f(i) = a0 + sum over k = 1..nin of ca(k) * x(i, ia(k))
    [DllImport("glmnet-x86.dll", EntryPoint = "modval_", CallingConvention = CallingConvention.Cdecl)]
    private static extern void modval_x86(ref double a0, double[] ca, int[] ia, ref int nin, ref int numObs, double[,] x, [Out] double[] fn);
    [DllImport("glmnet-x64.dll", EntryPoint = "modval_", CallingConvention = CallingConvention.Cdecl)]
    private static extern void modval_x64(ref double a0, double[] ca, int[] ia, ref int nin, ref int numObs, double[,] x, [Out] double[] fn);

    #endregion
  }
}