Changeset 15482 for branches/HeuristicLab.EvolutionTracking/HeuristicLab.Problems.DataAnalysis.Symbolic/3.4/Tracking/SchemaDiversification/SchemaCreator.cs
- Timestamp:
- 11/21/17 16:00:15 (7 years ago)
- File:
-
- 1 edited
Legend:
- Unmodified
- Added
- Removed
-
branches/HeuristicLab.EvolutionTracking/HeuristicLab.Problems.DataAnalysis.Symbolic/3.4/Tracking/SchemaDiversification/SchemaCreator.cs
r15351 r15482 30 30 using HeuristicLab.Parameters; 31 31 using HeuristicLab.Persistence.Default.CompositeSerializers.Storable; 32 using HeuristicLab.PluginInfrastructure; 32 33 33 34 namespace HeuristicLab.Problems.DataAnalysis.Symbolic { 35 using Vertices = IEnumerable<IGenealogyGraphNode<ISymbolicExpressionTree>>; 36 34 37 [Item("SchemaCreator", "An operator that builds schemas based on the heredity relationship in the genealogy graph.")] 35 38 [StorableClass] … … 53 56 private const string StrictSchemaMatchingParameterName = "StrictSchemaMatching"; 54 57 private const string SchemaDefinitionParameterName = "SchemaDefinition"; 58 private const string SchemaManipulatorParameterName = "SchemaManipulator"; 55 59 #endregion 56 60 57 61 #region parameters 58 62 public IConstrainedValueParameter<ISymbolicExpressionTreeManipulator> SchemaManipulatorParameter { 63 get { return (IConstrainedValueParameter<ISymbolicExpressionTreeManipulator>)Parameters[SchemaManipulatorParameterName]; } 64 } 59 65 public IConstrainedValueParameter<StringValue> SchemaDefinitionParameter { 60 66 get { return (IConstrainedValueParameter<StringValue>)Parameters[SchemaDefinitionParameterName]; } … … 143 149 Parameters.Add(new FixedValueParameter<BoolValue>(UseAdaptiveReplacementRatioParameterName, new BoolValue(true))); 144 150 151 // add update rules 145 152 var replacementRatioUpdateRules = new ItemSet<StringValue>(new[] { 146 153 new StringValue("f(x) = x"), … … 155 162 Parameters.Add(replacementRatioUpdateRuleParameter); 156 163 157 var schemaDefinitions = new ItemSet<StringValue>(new[] { 158 new StringValue("="), 159 new StringValue("#"), 160 new StringValue("=,#") 161 }); 164 // add schema definitions 165 var schemaDefinitions = new ItemSet<StringValue>(new[] { "=", "#", "=,#" }.Select(x => new StringValue(x))); 162 166 var schemaDefinitionParameter = new ConstrainedValueParameter<StringValue>(SchemaDefinitionParameterName, schemaDefinitions); 163 167 schemaDefinitionParameter.Value = schemaDefinitions.First(); 164 168 Parameters.Add(schemaDefinitionParameter); 169 170 // use a separate set of manipulators in order to allow the user to specify different mutations for schemas 171 // and not be limited to the manipulator parameter for the whole algorithm 172 var manipulators = ApplicationManager.Manager.GetTypes(typeof(ISymbolicExpressionTreeManipulator)) 173 .Where(x => !typeof(IMultiOperator<ISymbolicExpressionTreeManipulator>).IsAssignableFrom(x) 174 && !typeof(ISymbolicExpressionTreeArchitectureAlteringOperator).IsAssignableFrom(x)) 175 .Select(x => (ISymbolicExpressionTreeManipulator)Activator.CreateInstance(x)).ToList(); 176 manipulators.Add(new MultiSymbolicExpressionTreeManipulator()); 177 178 // add individual manipulators 179 var manipulatorParameter = new ConstrainedValueParameter<ISymbolicExpressionTreeManipulator>(SchemaManipulatorParameterName, new ItemSet<ISymbolicExpressionTreeManipulator>(manipulators)); 180 // add a multi manipulator as well 181 manipulatorParameter.Value = manipulators.First(); 182 Parameters.Add(manipulatorParameter); 165 183 #endregion 166 184 … … 206 224 207 225 var replacementRule = ReplacementRatioUpdateRuleParameter.Value.Value; 226 var schemaManipulator = SchemaManipulatorParameter.Value; 208 227 209 228 var evaluateSchemas = new OperationCollection(); … … 218 237 219 238 List<ISymbolicExpressionTree> schemas; 220 var def = SchemaDefinitionParameter.Value.Value; 221 switch (def) { 239 switch (SchemaDefinitionParameter.Value.Value) { 222 240 case "=": 223 241 schemas = GenerateAnyNodeSchemas(vertices, MinimumSchemaLength, 0, StrictSchemaMatching).ToList(); … … 238 256 #region create schemas and add subscopes representing the individuals 239 257 foreach (var schema in schemas) { 240 evaluateSchemas.Add(ExecutionContext.CreateChildOperation(new SchemaEvaluator { Schema = schema, ReplacementRule = replacementRule }, ExecutionContext.Scope));258 evaluateSchemas.Add(ExecutionContext.CreateChildOperation(new SchemaEvaluator { Schema = schema, ReplacementRule = replacementRule, SchemaManipulator = schemaManipulator }, ExecutionContext.Scope)); 241 259 } 242 260 #endregion … … 257 275 258 276 #region schema generation 259 public static IEnumerable<ISymbolicExpressionTree> GenerateAnyNodeSchemas(IEnumerable<IGenealogyGraphNode<ISymbolicExpressionTree>> vertices, int minimumSchemaLength, int minOffspringCount = 1, bool strict = true) { 277 public static IEnumerable<ISymbolicExpressionTree> GenerateAnyNodeSchemas(Vertices vertices, int minimumSchemaLength, int minOffspringCount = 1, bool strict = true) { 278 return GenerateSchemas(vertices, ReplaceAnyNode, minimumSchemaLength, minOffspringCount, strict); 279 } 280 281 public static IEnumerable<ISymbolicExpressionTree> GenerateAnySubtreeSchemas(Vertices vertices, int minimumSchemaLength, int minOffspringCount = 1, bool strict = true) { 282 return GenerateSchemas(vertices, ReplaceAnySubtree, minimumSchemaLength, minOffspringCount, strict); 283 } 284 285 public static IEnumerable<ISymbolicExpressionTree> GenerateCombinedSchemas(Vertices vertices, int minimumSchemaLength, int minOffspringCount = 1, bool strict = true) { 286 return GenerateSchemas(vertices, ReplaceCombined, minimumSchemaLength, minOffspringCount, strict); 287 } 288 289 public static IEnumerable<ISymbolicExpressionTree> GenerateSchemas(Vertices vertices, Func<ISymbolicExpressionTree, ISymbolicExpressionTreeNode, int, bool> replaceFunc, int minimumSchemaLength, int minOffspringCount, bool strict = true) { 260 290 var anySubtreeSymbol = new AnySubtreeSymbol(); 261 var groups = vertices.GroupBy(x => x.Parents.First()).Where(g => g. Count() >= minOffspringCount).OrderByDescending(g => g.Count());291 var groups = vertices.GroupBy(x => x.Parents.First()).Where(g => g.Skip(minOffspringCount - 1).Any()).OrderByDescending(g => g.Count()); 262 292 var hash = new HashSet<string>(); 263 293 foreach (var g in groups) { … … 271 301 var indices = fragments.Select(x => x.Index1).Distinct().OrderByDescending(x => schema.Root.GetBranchLevel(nodes[x])); 272 302 foreach (var i in indices) { 273 var node = nodes[i]; 274 var anyNodeSymbol = new AnyNodeSymbol(node.Symbol.MinimumArity, node.Symbol.MaximumArity); 275 var replacement = anyNodeSymbol.CreateTreeNode(); 276 SchemaUtil.ReplaceSubtree(node, replacement, true); 277 replaced = true; 303 replaced |= replaceFunc(schema, nodes[i], minimumSchemaLength); 278 304 } 279 305 if (replaced) { … … 285 311 } 286 312 287 public static IEnumerable<ISymbolicExpressionTree> GenerateAnySubtreeSchemas(IEnumerable<IGenealogyGraphNode<ISymbolicExpressionTree>> vertices, int minimumSchemaLength, int minOffspringCount = 1, bool strict = true) { 313 // node replacement rules 314 private static bool ReplaceAnyNode(ISymbolicExpressionTree schema, ISymbolicExpressionTreeNode node, int minSchemaLength) { 315 var anyNodeSymbol = new AnyNodeSymbol(node.Symbol.MinimumArity, node.Symbol.MaximumArity); 316 var replacement = anyNodeSymbol.CreateTreeNode(); 317 SchemaUtil.ReplaceSubtree(node, replacement, true); 318 319 return true; 320 } 321 322 private static bool ReplaceAnySubtree(ISymbolicExpressionTree schema, ISymbolicExpressionTreeNode node, int minSchemaLength) { 323 if (schema.Length - node.GetLength() + 1 < minSchemaLength) 324 return false; 325 288 326 var anySubtreeSymbol = new AnySubtreeSymbol(); 289 var groups = vertices.GroupBy(x => x.Parents.First()).Where(g => g.Count() >= minOffspringCount).OrderByDescending(g => g.Count()); 290 var hash = new HashSet<string>(); 291 foreach (var g in groups) { 292 var parent = g.Key; 293 if (parent.Data.Length < minimumSchemaLength) 294 continue; 295 bool replaced = false; 296 var schema = (ISymbolicExpressionTree)parent.Data.Clone(); 297 var nodes = schema.IterateNodesPrefix().ToList(); 298 var fragments = g.Select(x => x.InArcs.Last().Data).Where(x => x != null).Cast<IFragment<ISymbolicExpressionTreeNode>>(); 299 var indices = fragments.Select(x => x.Index1).Distinct().OrderByDescending(x => schema.Root.GetBranchLevel(nodes[x])); 300 foreach (var i in indices) { 301 var node = nodes[i]; 302 // do not replace the node with a wildcard if it would result in a length < MinimumSchemaLength 303 if (schema.Length - node.GetLength() + 1 < minimumSchemaLength) 304 continue; 305 var replacement = anySubtreeSymbol.CreateTreeNode(); 306 SchemaUtil.ReplaceSubtree(node, replacement, false); 307 replaced = true; 308 } 309 if (replaced) { 310 var str = schema.Root.GetSubtree(0).GetSubtree(0).FormatToString(strict); 311 if (hash.Add(str)) 312 yield return schema; 313 } 314 } 315 } 316 317 public static IEnumerable<ISymbolicExpressionTree> GenerateCombinedSchemas(IEnumerable<IGenealogyGraphNode<ISymbolicExpressionTree>> vertices, int minimumSchemaLength, int minOffspringCount = 1, bool strict = true) { 318 var anySubtreeSymbol = new AnySubtreeSymbol(); 319 var groups = vertices.GroupBy(x => x.Parents.First()).Where(g => g.Count() >= minOffspringCount).OrderByDescending(g => g.Count()); 320 var hash = new HashSet<string>(); 321 foreach (var g in groups) { 322 var parent = g.Key; 323 if (parent.Data.Length < minimumSchemaLength) 324 continue; 325 bool replaced = false; 326 var schema = (ISymbolicExpressionTree)parent.Data.Clone(); 327 var nodes = schema.IterateNodesPrefix().ToList(); 328 var fragments = g.Select(x => x.InArcs.Last().Data).Where(x => x != null).Cast<IFragment<ISymbolicExpressionTreeNode>>(); 329 var indices = fragments.Select(x => x.Index1).Distinct().OrderByDescending(x => schema.Root.GetBranchLevel(nodes[x])); 330 foreach (var i in indices) { 331 var node = nodes[i]; 332 ISymbolicExpressionTreeNode replacement; 333 if (node.SubtreeCount > 0) { 334 replacement = new AnyNodeSymbol(node.Symbol.MinimumArity, node.Symbol.MaximumArity).CreateTreeNode(); 335 SchemaUtil.ReplaceSubtree(node, replacement, true); 336 } else { 337 replacement = anySubtreeSymbol.CreateTreeNode(); 338 SchemaUtil.ReplaceSubtree(node, replacement, false); 339 } 340 replaced = true; 341 } 342 if (replaced) { 343 var str = schema.Root.GetSubtree(0).GetSubtree(0).FormatToString(strict); 344 if (hash.Add(str)) 345 yield return schema; 346 } 347 } 327 var replacement = anySubtreeSymbol.CreateTreeNode(); 328 329 SchemaUtil.ReplaceSubtree(node, replacement, false); 330 return true; 331 } 332 333 private static bool ReplaceCombined(ISymbolicExpressionTree schema, ISymbolicExpressionTreeNode node, int minSchemaLength) { 334 ISymbol wildcard; 335 if (node.SubtreeCount > 0) 336 wildcard = new AnyNodeSymbol(node.Symbol.MinimumArity, node.Symbol.MaximumArity); 337 else 338 wildcard = new AnySubtreeSymbol(); 339 340 SchemaUtil.ReplaceSubtree(node, wildcard.CreateTreeNode(), node.SubtreeCount > 0); 341 return true; 348 342 } 349 343 #endregion
Note: See TracChangeset
for help on using the changeset viewer.