#region License Information /* HeuristicLab * Copyright (C) 2002-2018 Heuristic and Evolutionary Algorithms Laboratory (HEAL) * * This file is part of HeuristicLab. * * HeuristicLab is free software: you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation, either version 3 of the License, or * (at your option) any later version. * * HeuristicLab is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with HeuristicLab. If not, see . */ #endregion using System; using System.Collections.Generic; using System.Data.Linq; using System.Linq; using HeuristicLab.Services.Access.DataAccess; using HeuristicLab.Services.Hive.DataAccess; using HeuristicLab.Services.Hive.DataAccess.Manager; namespace HeuristicLab.Services.Hive { public class HiveStatisticsGenerator : IStatisticsGenerator { private const string UnknownUserName = "Unknown"; private static readonly TimeSpan SmallestTimeSpan = new TimeSpan(0, 5, 0); private static readonly TaskState[] CompletedStates = { TaskState.Finished, TaskState.Aborted, TaskState.Failed }; public void GenerateStatistics() { using (var pm = new PersistenceManager()) { pm.UseTransaction(() => { UpdateDimProjectTable(pm); pm.SubmitChanges(); }); pm.UseTransaction(() => { UpdateDimUserTable(pm); UpdateDimJobTable(pm); UpdateDimClientsTable(pm); pm.SubmitChanges(); }); DimTime time = null; pm.UseTransaction(() => { time = UpdateDimTimeTable(pm); pm.SubmitChanges(); }); if (time != null) { pm.UseTransaction(() => { UpdateFactClientInfoTable(time, pm); pm.SubmitChanges(); UpdateFactProjectInfoTable(time, pm); pm.SubmitChanges(); }); pm.UseTransaction(() => { UpdateFactTaskTable(pm); try { pm.SubmitChanges(); UpdateExistingDimJobs(pm); pm.SubmitChanges(); } catch (DuplicateKeyException e) { var logger = LogFactory.GetLogger(typeof(HiveStatisticsGenerator).Namespace); logger.Log(string.Format( @"Propable change from summertime to wintertime, resulting in overlapping times. On wintertime to summertime change, slave timeouts and a fact gap will occur. Exception Details: {0}", e)); } }); } pm.UseTransaction(() => { FlagJobsForDeletion(pm); pm.SubmitChanges(); }); } } private DimTime UpdateDimTimeTable(PersistenceManager pm) { var dimTimeDao = pm.DimTimeDao; var now = DateTime.Now; var timeEntry = new DimTime { Time = now, Minute = new DateTime(now.Year, now.Month, now.Day, now.Hour, now.Minute, 0), Hour = new DateTime(now.Year, now.Month, now.Day, now.Hour, 0, 0), Day = new DateTime(now.Year, now.Month, now.Day, 0, 0, 0), Month = new DateTime(now.Year, now.Month, 1, 0, 0, 0), Year = new DateTime(now.Year, 1, 1, 0, 0, 0) }; return dimTimeDao.Save(timeEntry); } private void UpdateDimUserTable(PersistenceManager pm) { var dimUserDao = pm.DimUserDao; var resourceDao = pm.ResourceDao; var jobDao = pm.JobDao; var existingUserIds = dimUserDao.GetAll().Select(x => x.UserId); var vaildResourceOwnerIds = resourceDao.GetResourcesWithValidOwner().Select(x => x.OwnerUserId.Value); var jobOwnerIds = jobDao.GetAll().Select(x => x.OwnerUserId); var newUserIds = vaildResourceOwnerIds .Union(jobOwnerIds) .Where(id => !existingUserIds.Contains(id)) .ToList(); dimUserDao.Save(newUserIds.Select(x => new DimUser { UserId = x, Name = GetUserName(x) })); } // add new projects // delete expired projects // update information of existing projects private void UpdateDimProjectTable(PersistenceManager pm) { var projectDao = pm.ProjectDao; var dimProjectDao = pm.DimProjectDao; var projects = projectDao.GetAll().ToList(); var dimProjects = dimProjectDao.GetAllOnlineProjects().ToList(); var onlineProjects = dimProjects.Where(x => projects.Select(y => y.ProjectId).Contains(x.ProjectId)); var addedProjects = projects.Where(x => !dimProjects.Select(y => y.ProjectId).Contains(x.ProjectId)); var removedProjects = dimProjects.Where(x => !projects.Select(y => y.ProjectId).Contains(x.ProjectId)); // set expiration time of removed projects foreach (var p in removedProjects) { p.DateExpired = DateTime.Now; } // add new projects dimProjectDao.Save(addedProjects.Select(x => new DimProject { ProjectId = x.ProjectId, ParentProjectId = x.ParentProjectId, Name = x.Name, Description = x.Description, OwnerUserId = x.OwnerUserId, StartDate = x.StartDate, EndDate = x.EndDate, DateCreated = x.DateCreated, DateExpired = null })); // expire project if its parent has changed and create a new entry // otherwise perform "normal" update foreach (var dimP in onlineProjects) { var p = projects.Where(x => x.ProjectId == dimP.ProjectId).SingleOrDefault(); if (p != null) { if (dimP.ParentProjectId == null ? p.ParentProjectId != null : dimP.ParentProjectId != p.ParentProjectId) { // or: (!object.Equals(dimP.ParentProjectId, p.ParentProjectId)) dimP.DateExpired = DateTime.Now; dimProjectDao.Save(new DimProject { ProjectId = p.ProjectId, ParentProjectId = p.ParentProjectId, Name = p.Name, Description = p.Description, OwnerUserId = p.OwnerUserId, StartDate = p.StartDate, EndDate = p.EndDate, DateCreated = p.DateCreated, DateExpired = null }); } else { dimP.Name = p.Name; dimP.Description = p.Description; dimP.OwnerUserId = p.OwnerUserId; dimP.StartDate = p.StartDate; dimP.EndDate = p.EndDate; } } } } private void UpdateDimJobTable(PersistenceManager pm) { var dimProjectDao = pm.DimProjectDao; var dimJobDao = pm.DimJobDao; var jobDao = pm.JobDao; var taskDao = pm.TaskDao; var dimJobIds = dimJobDao.GetAll().Select(x => x.JobId); var newJobs = jobDao.GetAll() .Where(x => !dimJobIds.Contains(x.JobId)) .Select(x => new { JobId = x.JobId, UserId = x.OwnerUserId, JobName = x.Name ?? string.Empty, DateCreated = x.DateCreated, ProjectId = dimProjectDao.GetLastValidIdByProjectId(x.ProjectId), TotalTasks = taskDao.GetAll().Count(y => y.JobId == x.JobId) }) .ToList(); dimJobDao.Save(newJobs.Select(x => new DimJob { JobId = x.JobId, JobName = x.JobName, UserId = x.UserId, UserName = GetUserName(x.UserId), DateCreated = x.DateCreated, ProjectId = x.ProjectId, TotalTasks = x.TotalTasks, CompletedTasks = 0, DateCompleted = null })); } private void UpdateExistingDimJobs(PersistenceManager pm) { var dimProjectDao = pm.DimProjectDao; var jobDao = pm.JobDao; var dimJobDao = pm.DimJobDao; var factTaskDao = pm.FactTaskDao; foreach (var dimJob in dimJobDao.GetNotCompletedJobs()) { var taskStates = factTaskDao.GetByJobId(dimJob.JobId) .GroupBy(x => x.TaskState) .Select(x => new { State = x.Key, Count = x.Count() }).ToList(); int totalTasks = 0, completedTasks = 0; foreach (var state in taskStates) { totalTasks += state.Count; if (CompletedStates.Contains(state.State)) { completedTasks += state.Count; } } var job = jobDao.GetById(dimJob.JobId); if (totalTasks == completedTasks) { var completeDate = factTaskDao.GetLastCompletedTaskFromJob(dimJob.JobId); if (completeDate == null) { if (job == null) { completeDate = DateTime.Now; } } dimJob.DateCompleted = completeDate; } if(job != null) { dimJob.JobName = job.Name; dimJob.ProjectId = dimProjectDao.GetLastValidIdByProjectId(job.ProjectId); } dimJob.TotalTasks = totalTasks; dimJob.CompletedTasks = completedTasks; } } private void FlagJobsForDeletion(PersistenceManager pm) { var jobDao = pm.JobDao; var jobs = jobDao.GetJobsReadyForDeletion(); foreach(var job in jobs) { job.State = JobState.DeletionPending; } } private void UpdateDimClientsTable(PersistenceManager pm) { var dimClientDao = pm.DimClientDao; var resourceDao = pm.ResourceDao; var resources = resourceDao.GetAll().ToList(); var dimClients = dimClientDao.GetAllOnlineClients().ToList(); var onlineClients = dimClients.Where(x => resources.Select(y => y.ResourceId).Contains(x.ResourceId)); var addedResources = resources.Where(x => !dimClients.Select(y => y.ResourceId).Contains(x.ResourceId)); var removedResources = dimClients.Where(x => !resources.Select(y => y.ResourceId).Contains(x.ResourceId)); // set expiration time of removed resources foreach(var r in removedResources) { r.DateExpired = DateTime.Now; } // add new resources dimClientDao.Save(addedResources.Select(x => new DimClient { ResourceId = x.ResourceId, ParentResourceId = x.ParentResourceId, Name = x.Name, ResourceType = x.ResourceType, DateCreated = DateTime.Now, DateExpired = null })); // expire client if its parent has changed and create a new entry // otherwise perform "normal" update foreach(var dimc in onlineClients) { var r = resources.Where(x => x.ResourceId == dimc.ResourceId).SingleOrDefault(); if(r != null) { if(dimc.ParentResourceId == null ? r.ParentResourceId != null : dimc.ParentResourceId != r.ParentResourceId) { var now = DateTime.Now; dimc.DateExpired = now; dimClientDao.Save(new DimClient { ResourceId = r.ResourceId, ParentResourceId = r.ParentResourceId, Name = r.Name, ResourceType = r.ResourceType, DateCreated = now, DateExpired = null }); } else { dimc.Name = r.Name; } } } } //// (1) for new slaves (not yet reported in Table DimClients) ... //// and modified slaves (name or parent resource changed) a new DimClient-entry is created //// (2) for already reported removed and modifid clients the expiration date is set //private void UpdateDimClientsTableOld(PersistenceManager pm) { // var dimClientDao = pm.DimClientDao; // var slaveDao = pm.SlaveDao; // var slaves = slaveDao.GetAll(); // var recentlyAddedClients = dimClientDao.GetAllOnlineClients(); // var slaveIds = slaves.Select(x => x.ResourceId); // var removedClientIds = recentlyAddedClients // .Where(x => !slaveIds.Contains(x.ResourceId)) // .Select(x => x.Id); // var modifiedClients = // from slave in slaves // join client in recentlyAddedClients on slave.ResourceId equals client.ResourceId // where (slave.Name != client.Name // || slave.ParentResourceId == null && client.ResourceGroupId != null // because both can be null and null comparison // || slave.ParentResourceId != null && client.ResourceGroupId == null // does return no entry on the sql server // || slave.ParentResourceId != client.ResourceGroupId // || ((slave.ParentResource != null) && slave.ParentResource.ParentResourceId != client.ResourceGroup2Id)) // select new { // SlaveId = slave.ResourceId, // ClientId = client.Id // }; // var clientIds = dimClientDao.GetAllOnlineClients().Select(x => x.ResourceId); // var modifiedClientIds = modifiedClients.Select(x => x.SlaveId); // var newClients = slaves // .Where(x => !clientIds.Contains(x.ResourceId) // || modifiedClientIds.Contains(x.ResourceId)) // .Select(x => new { // x.ResourceId, // x.Name, // ResourceGroupId = x.ParentResourceId, // GroupName = x.ParentResource != null ? x.ParentResource.Name : null, // ResourceGroup2Id = x.ParentResource != null ? x.ParentResource.ParentResourceId : null, // GroupName2 = x.ParentResource != null ? x.ParentResource.ParentResource != null ? x.ParentResource.ParentResource.Name : null : null // }) // .ToList(); // var clientsToUpdate = removedClientIds.Union(modifiedClients.Select(x => x.ClientId)); // dimClientDao.UpdateExpirationTime(clientsToUpdate, DateTime.Now); // dimClientDao.Save(newClients.Select(x => new DimClient { // ResourceId = x.ResourceId, // Name = x.Name, // ExpirationTime = null, // ResourceGroupId = x.ResourceGroupId, // GroupName = x.GroupName, // ResourceGroup2Id = x.ResourceGroup2Id, // GroupName2 = x.GroupName2 // })); //} private void UpdateFactClientInfoTable(DimTime newTime, PersistenceManager pm) { var factClientInfoDao = pm.FactClientInfoDao; var slaveDao = pm.SlaveDao; var dimClientDao = pm.DimClientDao; var newRawFactInfos = from s in slaveDao.GetAll() join c in dimClientDao.GetAllOnlineSlaves() on s.ResourceId equals c.ResourceId join lcf in factClientInfoDao.GetLastUpdateTimestamps() on c.ResourceId equals lcf.ResourceId into joinCf from cf in joinCf.DefaultIfEmpty() select new { ClientId = c.Id, UserId = s.OwnerUserId ?? Guid.Empty, TotalCores = s.Cores ?? 0, FreeCores = s.FreeCores ?? 0, TotalMemory = s.Memory ?? 0, FreeMemory = s.FreeMemory ?? 0, CpuUtilization = s.CpuUtilization, SlaveState = s.SlaveState, IsAllowedToCalculate = s.IsAllowedToCalculate, LastFactTimestamp = cf.Timestamp }; factClientInfoDao.Save( from x in newRawFactInfos.ToList() let duration = x.LastFactTimestamp != null ? (int)(newTime.Time - (DateTime)x.LastFactTimestamp).TotalSeconds : (int)SmallestTimeSpan.TotalSeconds select new FactClientInfo { ClientId = x.ClientId, DimTime = newTime, UserId = x.UserId, NumUsedCores = x.TotalCores - x.FreeCores, NumTotalCores = x.TotalCores, UsedMemory = x.TotalMemory - x.FreeMemory, TotalMemory = x.TotalMemory, CpuUtilization = Math.Round(x.CpuUtilization, 2), SlaveState = x.SlaveState, IdleTime = x.SlaveState == SlaveState.Idle && x.IsAllowedToCalculate ? duration : 0, UnavailableTime = x.SlaveState == SlaveState.Idle && !x.IsAllowedToCalculate ? duration : 0, OfflineTime = x.SlaveState == SlaveState.Offline ? duration : 0, IsAllowedToCalculate = x.IsAllowedToCalculate } ); } private void UpdateFactProjectInfoTable(DimTime newTime, PersistenceManager pm) { var factProjectInfoDao = pm.FactProjectInfoDao; var dimProjectDao = pm.DimProjectDao; var projectDao = pm.ProjectDao; var projectAvailabilityStats = projectDao.GetAvailabilityStatsPerProject(); var projectUsageStats = projectDao.GetUsageStatsPerProject(); var dimProjects = dimProjectDao.GetAllOnlineProjects().ToList(); factProjectInfoDao.Save( from dimp in dimProjects let aStats = projectAvailabilityStats.Where(x => x.ProjectId == dimp.ProjectId).SingleOrDefault() let uStats = projectUsageStats.Where(x => x.ProjectId == dimp.ProjectId).SingleOrDefault() select new FactProjectInfo { ProjectId = dimp.Id, DimTime = newTime, NumTotalCores = aStats != null ? aStats.Cores : 0, TotalMemory = aStats != null ? aStats.Memory : 0, NumUsedCores = uStats != null ? uStats.Cores : 0, UsedMemory = uStats != null ? uStats.Memory : 0 } ); } private void UpdateFactTaskTable(PersistenceManager pm) { var factTaskDao = pm.FactTaskDao; var taskDao = pm.TaskDao; var dimClientDao = pm.DimClientDao; var factTaskIds = factTaskDao.GetAll().Select(x => x.TaskId); var notFinishedFactTasks = factTaskDao.GetNotFinishedTasks(); //var notFinishedFactTasks = factTaskDao.GetNotFinishedTasks().Select(x => new { // x.TaskId, // x.LastClientId //}); // query several properties for all new and not finished tasks // in order to use them later either... // (1) to update the fact task entry of not finished tasks // (2) to insert a new fact task entry for new tasks var newAndNotFinishedTasks = (from task in taskDao.GetAllChildTasks() let stateLogs = task.StateLogs.OrderByDescending(x => x.DateTime) let lastSlaveId = stateLogs.First(x => x.SlaveId != null).SlaveId where (!factTaskIds.Contains(task.TaskId) || notFinishedFactTasks.Select(x => x.TaskId).Contains(task.TaskId)) join lastFactTask in notFinishedFactTasks on task.TaskId equals lastFactTask.TaskId into lastFactPerTask from lastFact in lastFactPerTask.DefaultIfEmpty() join client in dimClientDao.GetAllOnlineClients() on lastSlaveId equals client.ResourceId into clientsPerSlaveId from client in clientsPerSlaveId.DefaultIfEmpty() select new { TaskId = task.TaskId, JobId = task.JobId, Priority = task.Priority, CoresRequired = task.CoresNeeded, MemoryRequired = task.MemoryNeeded, State = task.State, StateLogs = stateLogs.OrderBy(x => x.DateTime), LastClientId = client != null ? client.Id : lastFact != null ? lastFact.LastClientId : (Guid?)null, NotFinishedTask = notFinishedFactTasks.Any(y => y.TaskId == task.TaskId) }).ToList(); // (1) update data of already existing facts // i.e. for all in newAndNotFinishedTasks where NotFinishedTask = true foreach (var notFinishedFactTask in notFinishedFactTasks) { var nfftUpdate = newAndNotFinishedTasks.Where(x => x.TaskId == notFinishedFactTask.TaskId).SingleOrDefault(); if(nfftUpdate != null) { var taskData = CalculateFactTaskData(nfftUpdate.StateLogs); notFinishedFactTask.StartTime = taskData.StartTime; notFinishedFactTask.EndTime = taskData.EndTime; notFinishedFactTask.LastClientId = nfftUpdate.LastClientId; notFinishedFactTask.Priority = nfftUpdate.Priority; notFinishedFactTask.CoresRequired = nfftUpdate.CoresRequired; notFinishedFactTask.MemoryRequired = nfftUpdate.MemoryRequired; notFinishedFactTask.NumCalculationRuns = taskData.CalculationRuns; notFinishedFactTask.NumRetries = taskData.Retries; notFinishedFactTask.WaitingTime = taskData.WaitingTime; notFinishedFactTask.CalculatingTime = taskData.CalculatingTime; notFinishedFactTask.TransferTime = taskData.TransferTime; notFinishedFactTask.TaskState = nfftUpdate.State; notFinishedFactTask.Exception = taskData.Exception; notFinishedFactTask.InitialWaitingTime = taskData.InitialWaitingTime; } } // (2) insert facts for new tasks // i.e. for all in newAndNotFinishedTasks where NotFinishedTask = false factTaskDao.Save( from x in newAndNotFinishedTasks where !x.NotFinishedTask let taskData = CalculateFactTaskData(x.StateLogs) select new FactTask { TaskId = x.TaskId, JobId = x.JobId, StartTime = taskData.StartTime, EndTime = taskData.EndTime, LastClientId = x.LastClientId, Priority = x.Priority, CoresRequired = x.CoresRequired, MemoryRequired = x.MemoryRequired, NumCalculationRuns = taskData.CalculationRuns, NumRetries = taskData.Retries, WaitingTime = taskData.WaitingTime, CalculatingTime = taskData.CalculatingTime, TransferTime = taskData.TransferTime, TaskState = x.State, Exception = taskData.Exception, InitialWaitingTime = taskData.InitialWaitingTime }); ////update data of already existing facts //foreach (var notFinishedTask in factTaskDao.GetNotFinishedTasks()) { // var ntc = newTasks.Where(x => x.TaskId == notFinishedTask.TaskId); // if (ntc.Any()) { // var x = ntc.Single(); // var taskData = CalculateFactTaskData(x.StateLogs); // notFinishedTask.StartTime = taskData.StartTime; // notFinishedTask.EndTime = taskData.EndTime; // notFinishedTask.LastClientId = x.LastClientId; // notFinishedTask.Priority = x.Priority; // notFinishedTask.CoresRequired = x.CoresRequired; // notFinishedTask.MemoryRequired = x.MemoryRequired; // notFinishedTask.NumCalculationRuns = taskData.CalculationRuns; // notFinishedTask.NumRetries = taskData.Retries; // notFinishedTask.WaitingTime = taskData.WaitingTime; // notFinishedTask.CalculatingTime = taskData.CalculatingTime; // notFinishedTask.TransferTime = taskData.TransferTime; // notFinishedTask.TaskState = x.State; // notFinishedTask.Exception = taskData.Exception; // notFinishedTask.InitialWaitingTime = taskData.InitialWaitingTime; // } //} } private string GetUserName(Guid userId) { try { // we cannot use the ServiceLocator.Instance.UserManager since the janitor service // is not hosted in the iis the MemberShip.GetUser method causes exceptions // needs to be further investigated current workaround: use the authenticationcontext // we could also connect to the access service to get the user name using (ASPNETAuthenticationDataContext dc = new ASPNETAuthenticationDataContext()) { var user = dc.aspnet_Users.SingleOrDefault(x => x.UserId == userId); return user != null ? user.UserName : UnknownUserName; } } catch (Exception) { return UnknownUserName; } } private class FactTaskData { public int CalculationRuns { get; set; } public int Retries { get; set; } public long CalculatingTime { get; set; } public long WaitingTime { get; set; } public long TransferTime { get; set; } public long InitialWaitingTime { get; set; } public string Exception { get; set; } public DateTime? StartTime { get; set; } public DateTime? EndTime { get; set; } } private FactTaskData CalculateFactTaskData(IEnumerable stateLogs) { var factTaskData = new FactTaskData(); var enumerator = stateLogs.GetEnumerator(); if (enumerator.MoveNext()) { StateLog current = enumerator.Current, first = current, prev = null; while (current != null) { var next = enumerator.MoveNext() ? enumerator.Current : null; int timeSpanInSeconds; if (next != null) { timeSpanInSeconds = (int)(next.DateTime - current.DateTime).TotalSeconds; } else { timeSpanInSeconds = (int)(DateTime.Now - current.DateTime).TotalSeconds; factTaskData.Exception = current.Exception; } switch (current.State) { case TaskState.Calculating: factTaskData.CalculatingTime += timeSpanInSeconds; factTaskData.CalculationRuns++; if (factTaskData.CalculationRuns == 1) { factTaskData.StartTime = current.DateTime; factTaskData.InitialWaitingTime = (int)(current.DateTime - first.DateTime).TotalSeconds; } if (prev != null && prev.State != TaskState.Transferring) { factTaskData.Retries++; } break; case TaskState.Waiting: factTaskData.WaitingTime += timeSpanInSeconds; break; case TaskState.Transferring: factTaskData.TransferTime += timeSpanInSeconds; break; case TaskState.Finished: case TaskState.Failed: case TaskState.Aborted: factTaskData.EndTime = current.DateTime; break; } prev = current; current = next; } } return factTaskData; } } }