/**
 * StonedMC
 *
 * Designed to properly split up a given tick among subsystems.
 * Note: if you read parts of this code and think "why is it doing it that way?",
 * odds are, there is a reason.
 *
 **/

// See initialization order in /code/game/world.dm
GLOBAL_REAL(Master, /datum/controller/master)

/datum/controller/master
	name = "Master"
	/// Are we processing (higher values increase the processing delay by n ticks)
	var/processing = TRUE
	/// How many times have we run
	var/iteration = 0
	/// Stack end detector to detect stack overflows that kill the MC's main loop
	var/datum/stack_end_detector/stack_end_detector
	/// world.time of last fire, for tracking lag outside of the MC
	var/last_run
	/// List of subsystems to process().
	var/list/subsystems
	/// Most recent init stage to complete init.
	var/static/init_stage_completed

	// Vars for keeping track of tick drift.
	var/init_timeofday
	var/init_time
	var/tickdrift = 0
	/// Tickdrift as of last tick, with no averaging going on
	var/olddrift = 0

	/// How long is the MC sleeping between runs, read only (set by Loop() based off of anti-tick-contention heuristics)
	var/sleep_delta = 1

	/// Only run ticker subsystems for the next n ticks.
	var/skip_ticks = 0

	/// Setting this to TRUE makes the MC main loop runtime (debugging aid).
	var/make_runtime = FALSE

	var/initializations_finished_with_no_players_logged_in //I wonder what this could be?

	/// The type of the last subsystem to be fire()'d.
	var/last_type_processed

	var/datum/controller/subsystem/queue_head //!Start of queue linked list
	var/datum/controller/subsystem/queue_tail //!End of queue linked list (used for appending to the list)
	var/queue_priority_count = 0 //Running total so that we don't have to loop thru the queue each run to split up the tick
	var/queue_priority_count_bg = 0 //Same, but for background subsystems

	var/map_loading = FALSE //!Are we loading in a new map?

	var/current_runlevel //!for scheduling different subsystems for different stages of the round

	var/sleep_offline_after_initializations = TRUE

	/// During initialization, will be the instanced subsystem that is currently initializing.
	/// Outside of initialization, returns null.
	var/current_initializing_subsystem = null

	/// The last decisecond we force dumped profiling information
	/// Used to avoid spamming profile reads since they can be expensive (string memes)
	var/last_profiled = 0

	var/static/restart_clear = 0
	var/static/restart_timeout = 0
	var/static/restart_count = 0

	var/static/random_seed

	/// Current tick limit, assigned before running a subsystem.
	/// Used by CHECK_TICK as well so that the procs subsystems call can obey that SS's tick limits.
	var/static/current_ticklimit = TICK_LIMIT_RUNNING

	/// Whether the Overview UI will update as fast as possible for viewers.
	var/overview_fast_update = FALSE

	/// Enables rolling usage averaging
	var/use_rolling_usage = FALSE
	/// How long to run our rolling usage averaging
	var/rolling_usage_length = 5 SECONDS
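// Hedged reference (illustration only): the tick macros used throughout this file
// live in the defines and are assumed to be shaped roughly like this:
//   #define TICK_CHECK ( TICK_USAGE > Master.current_ticklimit )
//   #define CHECK_TICK if(TICK_CHECK) stoplag()
// i.e. long-running procs call CHECK_TICK, which yields (via stoplag()) once they
// cross the budget RunQueue() assigned through current_ticklimit.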
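/datum/controller/master/New()
	// Ensure usr is null, to prevent any potential weirdness resulting from the MC having a usr if it's manually restarted.
	usr = null

	if(!config)
		config = new

	if(!random_seed)
#ifdef UNIT_TESTS
		random_seed = 29051994 // How about 22475?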
#else
		random_seed = rand(1, 1e9)
#endif
		rand_seed(random_seed)

	var/list/_subsystems = list()
	subsystems = _subsystems
	// Highlander-style: there can only be one! Kill off the old and replace it with the new.
	if (Master != src)
		if (istype(Master)) //If there is an existing MC take over his stuff and delete it
			Recover()
			qdel(Master)
			Master = src
		else
			//Code used for first master on game boot or if existing master got deleted
			Master = src
			var/list/subsystem_types = subtypesof(/datum/controller/subsystem)
			sortTim(subsystem_types, GLOBAL_PROC_REF(cmp_subsystem_init_stage))

			//Find any abandoned subsystem from the previous master (if there was any)
			var/list/existing_subsystems = list()
			for(var/global_var in global.vars)
				if (istype(global.vars[global_var], /datum/controller/subsystem))
					existing_subsystems += global.vars[global_var]

			//Either init a new SS or if an existing one was found use that
			for(var/I in subsystem_types)
				var/ss_idx = existing_subsystems.Find(I)
				if (ss_idx)
					_subsystems += existing_subsystems[ss_idx]
				else
					_subsystems += new I

	if(!GLOB)
		new /datum/controller/global_vars

/datum/controller/master/Destroy()
	..()
	// Tell qdel() to Del() this object.
	return QDEL_HINT_HARDDEL_NOW

/datum/controller/master/Shutdown()
	processing = FALSE
	sortTim(subsystems, GLOBAL_PROC_REF(cmp_subsystem_init))
	reverseRange(subsystems)
	for(var/datum/controller/subsystem/ss in subsystems)
		log_world("Shutting down [ss.name] subsystem...")
		if (ss.slept_count > 0)
			log_world("Warning: Subsystem `[ss.name]` slept [ss.slept_count] times.")
		ss.Shutdown()
	log_world("Shutdown complete")

ADMIN_VERB(cmd_controller_view_ui, R_SERVER|R_DEBUG, "Controller Overview", "View the current states of the Subsystem Controllers.", ADMIN_CATEGORY_DEBUG_INVESTIGATE)
	Master.tgui_interact(user.mob)

/datum/controller/master/tgui_status(mob/user, datum/tgui_state/state)
	if(!user.client?.holder?.check_for_rights(R_SERVER|R_DEBUG))
		return STATUS_CLOSE
	return STATUS_INTERACTIVE

/datum/controller/master/tgui_interact(mob/user, datum/tgui/ui)
	ui = SStgui.try_update_ui(user, src, ui)
	if(isnull(ui))
		ui = new /datum/tgui(user, src, "ControllerOverview")
		ui.open()
		use_rolling_usage = TRUE

/datum/controller/master/tgui_close(mob/user)
	var/valid_found = FALSE
	for(var/datum/tgui/open_ui as anything in open_tguis)
		if(open_ui.user == user)
			continue
		valid_found = TRUE
	if(!valid_found)
		use_rolling_usage = FALSE
	return ..()

/datum/controller/master/tgui_data(mob/user)
	var/list/data = list()

	var/list/subsystem_data = list()
	for(var/datum/controller/subsystem/subsystem as anything in subsystems)
		var/list/rolling_usage = subsystem.rolling_usage
		subsystem.prune_rolling_usage()

		// Then we sum
		var/sum = 0
		for(var/i in 2 to length(rolling_usage) step 2)
			sum += rolling_usage[i]
		var/average = sum / DS2TICKS(rolling_usage_length)

		subsystem_data += list(list(
			"name" = subsystem.name,
			"ref" = REF(subsystem),
			"init_order" = subsystem.init_order,
			"last_fire" = subsystem.last_fire,
			"next_fire" = subsystem.next_fire,
			"can_fire" = subsystem.can_fire,
			"doesnt_fire" = !!(subsystem.flags & SS_NO_FIRE),
			"cost_ms" = subsystem.cost,
			"tick_usage" = subsystem.tick_usage,
			"usage_per_tick" = average,
			"tick_overrun" = subsystem.tick_overrun,
			"initialized" = subsystem.initialized,
			"initialization_failure_message" = subsystem.initialization_failure_message,
		))
	data["subsystems"] = subsystem_data
	data["world_time"] = world.time
	data["map_cpu"] = world.map_cpu
	data["fast_update"] = overview_fast_update
	data["rolling_length"] = rolling_usage_length

	return data
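// Hedged sketch of the rolling_usage layout the summation above assumes: a flat
// list of (time-in-ticks, usage) pairs rather than an assoc list, which is why
// the loop reads every second element. Illustration only:
//   rolling_usage = list(tick_a, usage_a, tick_b, usage_b, ...)
// prune_rolling_usage() (defined on the subsystem) is assumed to drop pairs older
// than rolling_usage_length, so the average only covers the configured window.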
/datum/controller/master/tgui_act(action, list/params, datum/tgui/ui, datum/tgui_state/state)
	if(..())
		return TRUE

	switch(action)
		if("toggle_fast_update")
			overview_fast_update = !overview_fast_update
			return TRUE

		if("set_rolling_length")
			var/length = text2num(params["rolling_length"])
			if(!length || length < 0)
				return
			rolling_usage_length = length SECONDS
			return TRUE

		if("view_variables")
			var/datum/controller/subsystem/subsystem = locate(params["ref"]) in subsystems
			if(isnull(subsystem))
				to_chat(ui.user, span_warning("Failed to locate subsystem."))
				return
			SSadmin_verbs.dynamic_invoke_verb(ui.user, /datum/admin_verb/debug_variables, subsystem)
			return TRUE

/datum/controller/master/proc/check_and_perform_fast_update()
	PRIVATE_PROC(TRUE)
	set waitfor = FALSE

	if(!overview_fast_update)
		return

	var/static/already_updating = FALSE
	if(already_updating)
		return
	already_updating = TRUE
	SStgui.update_uis(src)
	already_updating = FALSE

// Returns 1 if we created a new mc, 0 if we couldn't due to a recent restart,
// -1 if we encountered a runtime trying to recreate it
/proc/Recreate_MC()
	. = -1 //so if we runtime, things know we failed
	if (world.time < Master.restart_timeout)
		return 0
	if (world.time > Master.restart_clear) //the clear window has passed, decay the failure count
		Master.restart_count *= 0.5
	var/delay = 50 * ++Master.restart_count
	Master.restart_timeout = world.time + delay
	Master.restart_clear = world.time + (delay * 2)
	if (Master) //Can only do this if master hasn't been deleted
		Master.processing = FALSE //stop ticking this one
	try
		new/datum/controller/master()
	catch
		return -1
	return 1
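// Worked example of the backoff above (illustration only):
//   1st failure: restart_count 0 -> 1, delay = 50ds: 5s restart timeout, 10s clear window
//   2nd failure inside the clear window: count -> 2, delay = 100ds (10s/20s),
//   so rapid consecutive failures escalate the lockout
//   a failure arriving after restart_clear halves the count first, so sporadic
//   one-off crashes don't inflate the timeout forever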
/datum/controller/master/Recover()
	var/msg = "## DEBUG: [time2text(world.timeofday, "DDD MMM DD hh:mm:ss YYYY", TIMEZONE_UTC)] MC restarted. Reports:\n"
	var/list/master_attributes = Master.vars
	var/list/filtered_variables = list(
		NAMEOF(src, name),
		NAMEOF(src, parent_type),
		NAMEOF(src, statclick),
		NAMEOF(src, tag),
		NAMEOF(src, type),
		NAMEOF(src, vars),
	)
	for (var/varname in master_attributes - filtered_variables)
		var/varval = master_attributes[varname]
		if (isdatum(varval)) // Check if it has a type var.
			var/datum/D = varval
			msg += "\t [varname] = [D]([D.type])\n"
		else
			msg += "\t [varname] = [varval]\n"
	log_world(msg)

	var/datum/controller/subsystem/BadBoy = Master.last_type_processed
	var/FireHim = FALSE
	if(istype(BadBoy))
		msg = null
		LAZYINITLIST(BadBoy.failure_strikes)
		switch(++BadBoy.failure_strikes[BadBoy.type])
			if(2)
				msg = "The [BadBoy.name] subsystem was the last to fire for 2 controller restarts. It will be recovered now and disabled if it happens again."
				FireHim = TRUE
			if(3)
				msg = "The [BadBoy.name] subsystem seems to be destabilizing the MC and will be put offline."
				BadBoy.flags |= SS_NO_FIRE
		if(msg)
			to_chat(GLOB.admins, span_boldannounce("[msg]"))
			log_world(msg)

	if (istype(Master.subsystems))
		if(FireHim)
			Master.subsystems += new BadBoy.type //NEW_SS_GLOBAL will remove the old one
		subsystems = Master.subsystems
		current_runlevel = Master.current_runlevel
		StartProcessing(10)
	else
		to_chat(world, span_boldannounce("The Master Controller is having some issues, we will need to re-initialize EVERYTHING"))
		Initialize(20, TRUE, FALSE)

// Please don't stuff random bullshit here,
// Make a subsystem, give it the SS_NO_FIRE flag, and do your work in its Initialize()
/datum/controller/master/Initialize(delay, init_sss, tgs_prime)
	set waitfor = 0
	if(delay)
		sleep(delay)
	if(init_sss)
		init_subtypes(/datum/controller/subsystem, subsystems)
	init_stage_completed = 0
	var/mc_started = FALSE

	to_chat(world, span_boldannounce("Initializing subsystems..."), MESSAGE_TYPE_DEBUG)

	var/list/stage_sorted_subsystems = new(INITSTAGE_MAX)
	for (var/i in 1 to INITSTAGE_MAX)
		stage_sorted_subsystems[i] = list()

	var/list/type_to_subsystem = list()
	for(var/datum/controller/subsystem/subsystem as anything in subsystems)
		type_to_subsystem[subsystem.type] = subsystem

	// Allows subsystems to declare other subsystems that must initialize after them.
	for(var/datum/controller/subsystem/subsystem as anything in subsystems)
		for(var/dependent_type as anything in subsystem.dependents)
			if(!ispath(dependent_type, /datum/controller/subsystem))
				stack_trace("ERROR: MC: subsystem `[subsystem.type]` has an invalid dependent: `[dependent_type]`. Skipping")
				continue
			var/datum/controller/subsystem/dependent = type_to_subsystem[dependent_type]
			dependent.dependencies |= subsystem.type
		subsystem.dependents = list()

	// Constructs a reverse-dependency graph.
	for(var/datum/controller/subsystem/subsystem as anything in subsystems)
		for(var/dependency_type as anything in subsystem.dependencies)
			if(!ispath(dependency_type, /datum/controller/subsystem))
				stack_trace("ERROR: MC: subsystem `[subsystem.type]` has an invalid dependency: `[dependency_type]`. Skipping")
				continue
			var/datum/controller/subsystem/dependency = type_to_subsystem[dependency_type]
			// Not a foolproof failsafe, likely to only prevent any immediate issues if this is only triggered once.
			if(subsystem.init_stage < dependency.init_stage)
				stack_trace("ERROR: MC: subsystem `[subsystem.type]` has an init_stage before one of its dependencies (Dependency: `[dependency.type]`, [subsystem.init_stage] < [dependency.init_stage])! Setting init_stage to [dependency.init_stage]")
				subsystem.init_stage = dependency.init_stage
			dependency.dependents += subsystem
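	// Illustrative sketch only (hypothetical subsystems, not part of this file):
	// the two declaration styles the loops above reconcile. A subsystem may name
	// what it needs (dependencies) or what must come after it (dependents); the
	// first loop folds the latter into the former.
	//   /datum/controller/subsystem/example_late
	//       dependencies = list(/datum/controller/subsystem/example_early)
	//   /datum/controller/subsystem/example_early
	//       dependents = list(/datum/controller/subsystem/example_late)
	// Either form produces the same init order: example_early, then example_late.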
	// Topological sorting algorithm
	var/list/counts = new(subsystems.len)
	var/list/unsorted_subsystems = list()
	var/index = 1
	for(var/datum/controller/subsystem/subsystem as anything in subsystems)
		counts[index] = length(subsystem.dependencies)
		subsystem.ordering_id = index
		if(counts[index] == 0)
			unsorted_subsystems += subsystem
		index += 1

	var/list/sorted_subsystems = list()
	while(length(unsorted_subsystems) > 0)
		var/datum/controller/subsystem/sub = unsorted_subsystems[unsorted_subsystems.len]
		unsorted_subsystems.len--
		sorted_subsystems += sub
		for(var/datum/controller/subsystem/dependent as anything in sub.dependents)
			counts[dependent.ordering_id] -= 1
			if(counts[dependent.ordering_id] == 0)
				unsorted_subsystems += dependent
	// Topological sorting algorithm end
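	// Worked example of the Kahn-style sort above (illustration only): with A
	// depending on nothing and B, C each depending on A, counts start as
	// (A:0, B:1, C:1), so only A seeds unsorted_subsystems. Popping A appends it
	// to sorted_subsystems and decrements B and C to 0, queueing both; the final
	// order (A, B, C) initializes dependencies first. Anything left out of
	// sorted_subsystems sits on a cycle, which the length check below reports.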
	if(length(subsystems) != length(sorted_subsystems))
		var/list/circular_dependency = subsystems.Copy() - sorted_subsystems
		var/list/debug_msg = list()
		var/list/usr_msg = list()
		for(var/datum/controller/subsystem/subsystem as anything in circular_dependency)
			usr_msg += "[subsystem.name]"

		var/list/datum/controller/subsystem/nodes = list(circular_dependency[1])
		var/list/loop = list()
		while(length(nodes) > 0)
			var/datum/controller/subsystem/node = nodes[nodes.len]
			nodes.len--
			if(node in loop)
				loop += node
				break
			loop += node
			for(var/datum/controller/subsystem/connected as anything in node.dependencies)
				nodes += type_to_subsystem[connected]

		var/loop_position = 0
		for(var/datum/controller/subsystem/node in loop)
			if(node == loop[loop.len])
				break
			loop_position++
		if(loop_position != 0)
			loop.Cut(1, loop_position + 1)
		for(var/datum/controller/subsystem/subsystem as anything in loop)
			debug_msg += "[subsystem.name]"

		// Can't initialize them if they have circular dependencies, there's no real failsafe here.
		stack_trace("ERROR: CRITICAL: MC: The following subsystems have circular dependencies: [jointext(debug_msg, " -> ")]")
		to_chat(world, span_bolddanger("CRITICAL: Failed to initialize [jointext(usr_msg, ", ")]"), MESSAGE_TYPE_DEBUG)

	for (var/datum/controller/subsystem/subsystem as anything in sorted_subsystems)
		var/subsystem_init_stage = subsystem.init_stage
		if (!isnum(subsystem_init_stage) || subsystem_init_stage < 1 || subsystem_init_stage > INITSTAGE_MAX || round(subsystem_init_stage) != subsystem_init_stage)
			stack_trace("ERROR: MC: subsystem `[subsystem.type]` has invalid init_stage: `[subsystem_init_stage]`. Setting to `[INITSTAGE_MAX]`")
			subsystem_init_stage = subsystem.init_stage = INITSTAGE_MAX
		stage_sorted_subsystems[subsystem_init_stage] += subsystem

	// Sort subsystems by display setting for easy access.
	var/evaluated_order = 1
	sortTim(subsystems, GLOBAL_PROC_REF(cmp_subsystem_display))
	var/start_timeofday = REALTIMEOFDAY
	for (var/current_init_stage in 1 to INITSTAGE_MAX)
		// Initialize subsystems.
		for (var/datum/controller/subsystem/subsystem in stage_sorted_subsystems[current_init_stage])
			subsystem.init_order = evaluated_order
			evaluated_order++
			init_subsystem(subsystem)
			CHECK_TICK
		current_initializing_subsystem = null
		init_stage_completed = current_init_stage
		if (!mc_started)
			mc_started = TRUE
			if (!current_runlevel)
				SetRunLevel(1) // Intentionally not using the defines here because the MC doesn't care about them
			// Loop.
			Master.StartProcessing(0)

	var/time = (REALTIMEOFDAY - start_timeofday) / 10
	var/msg = "Initializations complete within [time] second[time == 1 ? "" : "s"]!"
	to_chat(world, span_boldannounce("[msg]"), MESSAGE_TYPE_DEBUG)
	log_world(msg)

	if(world.system_type == MS_WINDOWS && CONFIG_GET(flag/toast_notification_on_init) && !length(GLOB.clients))
		world.shelleo("start /min powershell -ExecutionPolicy Bypass -File tools/initToast/initToast.ps1 -name \"[world.name]\" -icon %CD%\\icons\\virgoicon_16.png -port [world.port]")

	// Set world options.
	world.change_fps(CONFIG_GET(number/fps))
	var/initialized_tod = REALTIMEOFDAY

	if(tgs_prime)
		world.TgsInitializationComplete()

	if(sleep_offline_after_initializations)
		world.sleep_offline = TRUE
	sleep(1 TICKS)

	if(sleep_offline_after_initializations && CONFIG_GET(flag/resume_after_initializations))
		world.sleep_offline = FALSE
	initializations_finished_with_no_players_logged_in = initialized_tod < REALTIMEOFDAY - 10
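// Hedged sketch (hypothetical subsystem, shown commented out so nothing here
// compiles): the contract init_subsystem() below expects from an Initialize()
// override. setup_example_cache() is a stand-in for real work.
///datum/controller/subsystem/example_init/Initialize()
//	if(!setup_example_cache())
//		return SS_INIT_FAILURE // leaves the SS uninitialized and stops it firing
//	return SS_INIT_SUCCESS // logs "Initialized ... within n seconds!"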
/**
 * Initialize a given subsystem and handle the results.
 *
 * Arguments:
 * * subsystem - the subsystem to initialize.
 */
/datum/controller/master/proc/init_subsystem(datum/controller/subsystem/subsystem)
	var/static/list/valid_results = list(
		SS_INIT_FAILURE,
		SS_INIT_NONE,
		SS_INIT_SUCCESS,
		SS_INIT_NO_NEED,
		SS_INIT_NO_MESSAGE,
	)

	if ((subsystem.flags & SS_NO_INIT) || subsystem.initialized) //Don't init SSs with the corresponding flag or if they already are initialized
		subsystem.initialized = TRUE // set initialized to TRUE, because the value of initialized may still be checked on SS_NO_INIT subsystems as an "is this ready" check
		return

	current_initializing_subsystem = subsystem
	rustg_time_reset(SS_INIT_TIMER_KEY)

	var/result = subsystem.Initialize()

	// Capture end time
	var/time = rustg_time_milliseconds(SS_INIT_TIMER_KEY)
	var/seconds = round(time / 1000, 0.01)

	// Always update the blackbox tally regardless.
	// NOT IMPLEMENTED: SSblackbox.record_feedback("tally", "subsystem_initialize", time, subsystem.name)
	feedback_set_details("subsystem_initialize", "[time] [subsystem.name]")

	// Gave invalid return value.
	if(result && !(result in valid_results))
		WARNING("[subsystem.name] subsystem initialized, returning invalid result [result]. This is a bug.")

	// just returned ..() or didn't implement Initialize() at all
	if(result == SS_INIT_NONE)
		WARNING("[subsystem.name] subsystem does not implement Initialize() or it returns ..(). If the former is true, the SS_NO_INIT flag should be set for this subsystem.")

	if(result != SS_INIT_FAILURE)
		// Some form of success, implicit failure, or the SS is unused.
		subsystem.initialized = TRUE
		SEND_SIGNAL(subsystem, COMSIG_SUBSYSTEM_POST_INITIALIZE)
	else
		// The subsystem officially reports that it failed to init and wishes to be treated as such.
		subsystem.initialized = FALSE
		subsystem.can_fire = FALSE

	// The rest of this proc is printing the world log and chat message.
	var/message_prefix

	// If true, print the chat message with boldwarning text.
	var/chat_warning = FALSE

	switch(result)
		if(SS_INIT_FAILURE)
			message_prefix = "Failed to initialize [subsystem.name] subsystem after"
			chat_warning = TRUE
		if(SS_INIT_SUCCESS, SS_INIT_NO_MESSAGE)
			message_prefix = "Initialized [subsystem.name] subsystem within"
		if(SS_INIT_NO_NEED)
			// This SS is disabled or is otherwise shy.
			return
		else
			// SS_INIT_NONE or an invalid value.
			message_prefix = "Initialized [subsystem.name] subsystem with errors within"
			chat_warning = TRUE

	var/message = "[message_prefix] [seconds] second[seconds == 1 ? "" : "s"]!"
	var/chat_message = chat_warning ? span_boldwarning(message) : span_boldannounce(message)

	if(result != SS_INIT_NO_MESSAGE)
		to_chat(world, chat_message, MESSAGE_TYPE_DEBUG)
	log_world(message)

/datum/controller/master/proc/SetRunLevel(new_runlevel)
	var/old_runlevel = current_runlevel
	testing("MC: Runlevel changed from [isnull(old_runlevel) ? "NULL" : old_runlevel] to [new_runlevel]")

	current_runlevel = log(2, new_runlevel) + 1
	if(current_runlevel < 1)
		current_runlevel = old_runlevel
		CRASH("Attempted to set invalid runlevel: [new_runlevel]")

// Starts the mc, and sticks around to restart it if the loop ever ends.
/datum/controller/master/proc/StartProcessing(delay)
	set waitfor = 0
	if(delay)
		sleep(delay)
	testing("Master starting processing")
	var/started_stage
	var/rtn = -2
	do
		started_stage = init_stage_completed
		rtn = Loop(started_stage)
	while (rtn == MC_LOOP_RTN_NEWSTAGES && processing > 0 && started_stage < init_stage_completed)

	if (rtn >= MC_LOOP_RTN_GRACEFUL_EXIT || processing < 0)
		return //this was supposed to happen.

	//loop ended, restart the mc
	log_game("MC crashed or runtimed, restarting")
	message_admins("MC crashed or runtimed, restarting")
	var/rtn2 = Recreate_MC()
	if (rtn2 <= 0)
		log_game("Failed to recreate MC (Error code: [rtn2]), it's up to the failsafe now")
		message_admins("Failed to recreate MC (Error code: [rtn2]), it's up to the failsafe now")
		Failsafe.defcon = 2

// Main loop.
/datum/controller/master/proc/Loop(init_stage)
	. = -1
	//Prep the loop (most of this is because we want MC restarts to reset as much state as we can, and because local vars rock)
	//all this shit is here so that flag edits can be refreshed by restarting the MC. (and for speed)
	var/list/tickersubsystems = list()
	var/list/runlevel_sorted_subsystems = list(list()) //ensure we always have at least one runlevel
	var/timer = world.time
	for (var/thing in subsystems)
		var/datum/controller/subsystem/SS = thing
		if (SS.flags & SS_NO_FIRE)
			continue
		if (SS.init_stage > init_stage)
			continue
		SS.queued_time = 0
		SS.queue_next = null
		SS.queue_prev = null
		SS.state = SS_IDLE
		if ((SS.flags & (SS_TICKER|SS_BACKGROUND)) == SS_TICKER)
			tickersubsystems += SS
			// Timer subsystems aren't allowed to bunch up, so we offset them a bit
			timer += world.tick_lag * rand(0, 1)
			SS.next_fire = timer
			continue
		var/ss_runlevels = SS.runlevels
		var/added_to_any = FALSE
		for(var/I in 1 to GLOB.bitflags.len)
			if(ss_runlevels & GLOB.bitflags[I])
				while(runlevel_sorted_subsystems.len < I)
					runlevel_sorted_subsystems += list(list())
				runlevel_sorted_subsystems[I] += SS
				added_to_any = TRUE
		if(!added_to_any)
			WARNING("[SS.name] subsystem is not SS_NO_FIRE but also does not have any runlevels set!")

	queue_head = null
	queue_tail = null
	//these sort by lower priorities first to reduce the number of loops needed to add subsequent SS's to the queue
	//(higher subsystems will be sooner in the queue, adding them later in the loop means we don't have to loop thru them next queue add)
	sortTim(tickersubsystems, GLOBAL_PROC_REF(cmp_subsystem_priority))
	for(var/I in runlevel_sorted_subsystems)
		sortTim(I, GLOBAL_PROC_REF(cmp_subsystem_priority))
		I += tickersubsystems

	var/cached_runlevel = current_runlevel
	var/list/current_runlevel_subsystems = runlevel_sorted_subsystems[cached_runlevel]

	init_timeofday = REALTIMEOFDAY
	init_time = world.time

	iteration = 1
	var/error_level = 0
	var/sleep_delta = 1
	var/list/subsystems_to_check

	//setup the stack overflow detector
	stack_end_detector = new()
	var/datum/stack_canary/canary = stack_end_detector.prime_canary()
	canary.use_variable()

	//the actual loop.
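	// Hedged reference for the math below (illustration only): the MC averaging
	// macros are assumed to be the usual exponential moving averages, roughly:
	//   MC_AVERAGE_FAST(avg, cur) ~ 0.7*avg + 0.3*cur
	//   MC_AVERAGE_SLOW(avg, cur) ~ 0.9*avg + 0.1*cur
	// e.g. with tickdrift = 10 and a measured drift of 20 this tick,
	// MC_AVERAGE_FAST yields 0.7*10 + 0.3*20 = 13, smoothing one-tick spikes.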
	while (1)
		var/newdrift = ((REALTIMEOFDAY - init_timeofday) - (world.time - init_time)) / world.tick_lag
		tickdrift = max(0, MC_AVERAGE_FAST(tickdrift, newdrift))
		var/starting_tick_usage = TICK_USAGE

		if(newdrift - olddrift >= CONFIG_GET(number/drift_dump_threshold))
			AttemptProfileDump(CONFIG_GET(number/drift_profile_delay))
		olddrift = newdrift

		if (init_stage != init_stage_completed)
			return MC_LOOP_RTN_NEWSTAGES
		if (processing <= 0)
			current_ticklimit = TICK_LIMIT_RUNNING
			sleep(1 SECONDS)
			continue

		//Anti-tick-contention heuristics:
		if (init_stage == INITSTAGE_MAX)
			//if there are multiple sleeping procs running before us hogging the cpu, we have to run later.
			// (because sleeps are processed in the order received, longer sleeps are more likely to run first)
			if (starting_tick_usage > TICK_LIMIT_MC) //if there isn't enough time to bother doing anything this tick, sleep a bit.
				sleep_delta *= 2
				current_ticklimit = TICK_LIMIT_RUNNING * 0.5
				sleep(world.tick_lag * (processing * sleep_delta))
				continue

			//Byond resumed us late. assume it might have to do the same next tick
			if (last_run + CEILING(world.tick_lag * (processing * sleep_delta), world.tick_lag) < world.time)
				sleep_delta += 1

			sleep_delta = MC_AVERAGE_FAST(sleep_delta, 1) //decay sleep_delta
			if (starting_tick_usage > (TICK_LIMIT_MC*0.75)) //we ran 3/4 of the way into the tick
				sleep_delta += 1
		else
			sleep_delta = 1
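		// Worked example of the heuristic above (illustration only): at
		// processing = 1 and sleep_delta = 1 the MC runs roughly every tick. If it
		// keeps waking to a tick that's already past TICK_LIMIT_MC, sleep_delta
		// doubles (1 -> 2 -> 4...), spacing its runs further apart; the
		// MC_AVERAGE_FAST decay then walks it back toward 1 as contention clears.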
		//debug
		if (make_runtime)
			var/datum/controller/subsystem/SS
			SS.can_fire = 0

		if (!Failsafe || (Failsafe.processing_interval > 0 && (Failsafe.lasttick+(Failsafe.processing_interval*5)) < world.time))
			new/datum/controller/failsafe() // (re)Start the failsafe.

		//now do the actual stuff
		if (!skip_ticks)
			var/checking_runlevel = current_runlevel
			if(cached_runlevel != checking_runlevel)
				//reschedule subsystems
				var/list/old_subsystems = current_runlevel_subsystems
				cached_runlevel = checking_runlevel
				current_runlevel_subsystems = runlevel_sorted_subsystems[cached_runlevel]

				//now we'll go through all the subsystems we want to offset and give them a next_fire
				for(var/datum/controller/subsystem/SS as anything in current_runlevel_subsystems)
					//we only want to offset it if it's new and also behind
					if(SS.next_fire > world.time || (SS in old_subsystems))
						continue
					SS.next_fire = world.time + world.tick_lag * rand(0, DS2TICKS(min(SS.wait, 2 SECONDS)))

			subsystems_to_check = current_runlevel_subsystems
		else
			subsystems_to_check = tickersubsystems

		if (CheckQueue(subsystems_to_check) <= 0) //error processing queue
			stack_trace("MC: CheckQueue failed. Current error_level is [round(error_level, 0.25)]")
			if (!SoftReset(tickersubsystems, runlevel_sorted_subsystems))
				error_level++
				CRASH("MC: SoftReset() failed, exiting loop()")

			if (error_level < 2) //except for the first strike, stop incrementing our iteration so failsafe enters defcon
				iteration++
			else
				cached_runlevel = null //3 strikes, lets reset the runlevel lists
			current_ticklimit = TICK_LIMIT_RUNNING
			sleep((1 SECONDS) * error_level)
			error_level++
			continue

		if (queue_head)
			if (RunQueue() <= 0) //error running queue
				stack_trace("MC: RunQueue failed. Current error_level is [round(error_level, 0.25)]")
				if (error_level > 1) //skip the first error
					if (!SoftReset(tickersubsystems, runlevel_sorted_subsystems))
						error_level++
						CRASH("MC: SoftReset() failed, exiting loop()")

					if (error_level <= 2) //after 3 strikes stop incrementing our iteration so failsafe enters defcon
						iteration++
					else
						cached_runlevel = null //3 strikes, lets also reset the runlevel lists
					current_ticklimit = TICK_LIMIT_RUNNING
					sleep((1 SECONDS) * error_level)
					error_level++
					continue
				error_level++
		if (error_level > 0)
			error_level = max(MC_AVERAGE_SLOW(error_level-1, error_level), 0)

		if (!queue_head) //reset the counts if the queue is empty, in the off chance they get out of sync
			queue_priority_count = 0
			queue_priority_count_bg = 0

		iteration++
		last_run = world.time
		if (skip_ticks)
			skip_ticks--
		src.sleep_delta = MC_AVERAGE_FAST(src.sleep_delta, sleep_delta)

		// Force any verbs into overtime, to test how they perform under load
		// For local ONLY
#ifdef VERB_STRESS_TEST
		/// Target enough tick usage to only allow time for our maptick estimate and verb processing, and nothing else
		var/overtime_target = TICK_LIMIT_RUNNING
		// This will leave just enough cpu time for maptick, forcing verbs to run into overtime
		// Use this for testing the worst case scenario, when maptick is spiking and usage is otherwise completely consumed
#ifdef FORCE_VERB_OVERTIME
		overtime_target += TICK_BYOND_RESERVE
#endif
		CONSUME_UNTIL(overtime_target)
#endif

		if (init_stage != INITSTAGE_MAX)
			current_ticklimit = TICK_LIMIT_RUNNING * 2
		else
			current_ticklimit = TICK_LIMIT_RUNNING
			if (processing * sleep_delta <= world.tick_lag)
				current_ticklimit -= (TICK_LIMIT_RUNNING * 0.25) //reserve the tail 1/4 of the next tick for the mc if we plan on running next tick

		check_and_perform_fast_update()
		sleep(world.tick_lag * (processing * sleep_delta))

// This is what decides if something should run.
/datum/controller/master/proc/CheckQueue(list/subsystemstocheck)
	. = 0 //so the mc knows if we runtimed
	//we create our variables outside of the loops to save on overhead
	var/datum/controller/subsystem/SS
	var/SS_flags

	for (var/thing in subsystemstocheck)
		if (!thing)
			subsystemstocheck -= thing
		SS = thing
		if (SS.state != SS_IDLE)
			continue
		if (SS.can_fire <= 0)
			continue
		if (SS.next_fire > world.time)
			continue
		SS_flags = SS.flags
		if (SS_flags & SS_NO_FIRE)
			subsystemstocheck -= SS
			continue
		if ((SS_flags & (SS_TICKER|SS_KEEP_TIMING)) == SS_KEEP_TIMING && SS.last_fire + (SS.wait * 0.75) > world.time)
			continue
		if (SS.postponed_fires >= 1)
			SS.postponed_fires--
			SS.update_nextfire()
			continue
		SS.enqueue()
	. = 1
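// Hedged sketch of the queue RunQueue() walks below (illustration only).
// enqueue()/dequeue(), defined on /datum/controller/subsystem, are assumed to
// maintain a doubly linked list ordered by queued_priority, with foreground
// entries ahead of SS_BACKGROUND ones:
//   queue_head -> SS(prio 50) <-> SS(prio 25) <-> [BG] SS(prio 10) <- queue_tail
// queue_priority_count and queue_priority_count_bg track the priority sums of
// each half, so the tick split below needs no extra pass over the list.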
/// RunQueue - Run thru the queue of subsystems to run, running them while balancing out their allocated tick percentage
/// Returns 0 if runtimed, a negative number for logic errors, and a positive number if the operation completed without errors
/datum/controller/master/proc/RunQueue()
	. = 0
	var/datum/controller/subsystem/queue_node
	var/queue_node_flags
	var/queue_node_priority
	var/queue_node_paused

	var/current_tick_budget
	var/tick_percentage
	var/tick_remaining
	var/ran = TRUE //this is right
	var/bg_calc //have we switched current_tick_budget to background mode yet?
	var/tick_usage

	//keep running while we have stuff to run and we haven't gone over a tick
	// this is so subsystems paused earlier can use tick time that later subsystems never used
	while (ran && queue_head && TICK_USAGE < TICK_LIMIT_MC)
		ran = FALSE
		bg_calc = FALSE
		current_tick_budget = queue_priority_count
		queue_node = queue_head
		while (queue_node)
			if (ran && TICK_USAGE > TICK_LIMIT_RUNNING)
				break

			queue_node_flags = queue_node.flags
			queue_node_priority = queue_node.queued_priority

			if (!(queue_node_flags & SS_TICKER) && skip_ticks)
				queue_node = queue_node.queue_next
				continue

			if ((queue_node_flags & SS_BACKGROUND))
				if (!bg_calc)
					current_tick_budget = queue_priority_count_bg
					bg_calc = TRUE
			else if (bg_calc)
				//error state, do sane fallback behavior
				if (. == 0)
					log_world("MC: Queue logic failure, non-background subsystem queued to run after a background subsystem: [queue_node] queue_prev:[queue_node.queue_prev]")
				. = -1
				current_tick_budget = queue_priority_count //this won't even be right, but is the best we have.
				bg_calc = FALSE

			tick_remaining = TICK_LIMIT_RUNNING - TICK_USAGE

			if (queue_node_priority >= 0 && current_tick_budget > 0 && current_tick_budget >= queue_node_priority)
				//Give the subsystem a percentage of the remaining tick based on the remaining priority
				tick_percentage = tick_remaining * (queue_node_priority / current_tick_budget)
			else
				//error state
				if (. == 0)
					log_world("MC: tick_budget sync error. [json_encode(list(current_tick_budget, queue_priority_count, queue_priority_count_bg, bg_calc, queue_node, queue_node_priority))]")
				. = -1
				tick_percentage = tick_remaining //just because we lost track of priority calculations doesn't mean we can't try to finish off the run; if the error state persists, we don't want to stop ticks from happening

			tick_percentage = max(tick_percentage*0.5, tick_percentage-queue_node.tick_overrun)
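			// Worked example of the split above (illustration only): three
			// foreground subsystems queued with priorities 50, 30, 20 give
			// current_tick_budget = 100. The first gets 50/100 of the remaining
			// tick; the budget then drops to 50 and the next gets 30/50 of
			// whatever remains, so earlier entries can't starve later ones. The
			// max() above then docks subsystems that habitually overrun.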
			current_ticklimit = round(TICK_USAGE + tick_percentage)
			ran = TRUE
			queue_node_paused = (queue_node.state == SS_PAUSED || queue_node.state == SS_PAUSING)
			last_type_processed = queue_node

			queue_node.state = SS_RUNNING

			if(queue_node.profiler_focused)
				world.Profile(PROFILE_START)

			tick_usage = TICK_USAGE
			var/state = queue_node.ignite(queue_node_paused)
			tick_usage = TICK_USAGE - tick_usage

			if(use_rolling_usage)
				queue_node.prune_rolling_usage()
				// Rolling usage is an unrolled list whose order we know
				// OPTIMIZATION POSTING
				queue_node.rolling_usage += list(DS2TICKS(world.time), tick_usage)

			if(queue_node.profiler_focused)
				world.Profile(PROFILE_STOP)

			if (state == SS_RUNNING)
				state = SS_IDLE
			current_tick_budget -= queue_node_priority

			if (tick_usage < 0)
				tick_usage = 0
			queue_node.tick_overrun = max(0, MC_AVG_FAST_UP_SLOW_DOWN(queue_node.tick_overrun, tick_usage-tick_percentage))
			queue_node.state = state

			if (state == SS_PAUSED)
				queue_node.paused_ticks++
				queue_node.paused_tick_usage += tick_usage
				queue_node = queue_node.queue_next
				continue

			queue_node.ticks = MC_AVERAGE(queue_node.ticks, queue_node.paused_ticks)
			tick_usage += queue_node.paused_tick_usage

			queue_node.tick_usage = MC_AVERAGE_FAST(queue_node.tick_usage, tick_usage)
			queue_node.cost = MC_AVERAGE_FAST(queue_node.cost, TICK_DELTA_TO_MS(tick_usage))

			queue_node.paused_ticks = 0
			queue_node.paused_tick_usage = 0

			if (bg_calc)
				//update our running total
				queue_priority_count_bg -= queue_node_priority
			else
				queue_priority_count -= queue_node_priority

			queue_node.last_fire = world.time
			queue_node.times_fired++
			queue_node.update_nextfire()

			queue_node.queued_time = 0

			//remove from queue
			queue_node.dequeue()

			queue_node = queue_node.queue_next

	if (. == 0)
		. = 1

//resets the queue, and all subsystems, while filtering out the subsystem lists
// called if any mc's queue procs runtime or exit improperly.
/datum/controller/master/proc/SoftReset(list/ticker_SS, list/runlevel_SS)
	. = 0
	stack_trace("MC: SoftReset called, resetting MC queue state.")
	if (!istype(subsystems) || !istype(ticker_SS) || !istype(runlevel_SS))
		log_world("MC: SoftReset: Bad list contents: '[subsystems]' '[ticker_SS]' '[runlevel_SS]'")
		return
	var/subsystemstocheck = subsystems | ticker_SS
	for(var/I in runlevel_SS)
		subsystemstocheck |= I

	for (var/thing in subsystemstocheck)
		var/datum/controller/subsystem/SS = thing
		if (!SS || !istype(SS))
			//list(SS) is so if a list makes it in the subsystem list, we remove the list, not the contents
			subsystems -= list(SS)
			ticker_SS -= list(SS)
			for(var/I in runlevel_SS)
				I -= list(SS)
			log_world("MC: SoftReset: Found bad entry in subsystem list, '[SS]'")
			continue
		if (SS.queue_next && !istype(SS.queue_next))
			log_world("MC: SoftReset: Found bad data in subsystem queue, queue_next = '[SS.queue_next]'")
		SS.queue_next = null
		if (SS.queue_prev && !istype(SS.queue_prev))
			log_world("MC: SoftReset: Found bad data in subsystem queue, queue_prev = '[SS.queue_prev]'")
		SS.queue_prev = null
		SS.queued_priority = 0
		SS.queued_time = 0
		SS.state = SS_IDLE
	if (queue_head && !istype(queue_head))
		log_world("MC: SoftReset: Found bad data in subsystem queue, queue_head = '[queue_head]'")
	queue_head = null
	if (queue_tail && !istype(queue_tail))
		log_world("MC: SoftReset: Found bad data in subsystem queue, queue_tail = '[queue_tail]'")
	queue_tail = null
	queue_priority_count = 0
	queue_priority_count_bg = 0
	log_world("MC: SoftReset: Finished.")
	. = 1

/// Warns us that the end of tick byond map_update will be laggier than normal, so that we can just skip running subsystems this tick.
/datum/controller/master/proc/laggy_byond_map_update_incoming()
	if (!skip_ticks)
		skip_ticks = 1

/datum/controller/master/stat_entry(msg)
	msg = "(TickRate:[Master.processing]) (Iteration:[Master.iteration]) (TickLimit: [round(Master.current_ticklimit, 0.1)])"
	return msg

/datum/controller/master/StartLoadingMap()
	//disallow more than one map to load at once, multithreading it will just cause race conditions
	while(map_loading)
		stoplag()
	for(var/S in subsystems)
		var/datum/controller/subsystem/SS = S
		SS.StartLoadingMap()
	map_loading = TRUE

/datum/controller/master/StopLoadingMap(bounds = null)
	map_loading = FALSE
	for(var/S in subsystems)
		var/datum/controller/subsystem/SS = S
		SS.StopLoadingMap()

/datum/controller/master/proc/UpdateTickRate()
	if (!processing)
		return
	var/client_count = length(GLOB.clients)
	if (client_count < CONFIG_GET(number/mc_tick_rate/disable_high_pop_mc_mode_amount))
		processing = CONFIG_GET(number/mc_tick_rate/base_mc_tick_rate)
	else if (client_count > CONFIG_GET(number/mc_tick_rate/high_pop_mc_mode_amount))
		processing = CONFIG_GET(number/mc_tick_rate/high_pop_mc_tick_rate)

/datum/controller/master/proc/OnConfigLoad()
	for (var/thing in subsystems)
		var/datum/controller/subsystem/SS = thing
		SS.OnConfigLoad()

/// Attempts to dump our current profile info into a file, triggered if the MC thinks shit is going down
/// Accepts a delay in deciseconds of how long ago our last dump can be, this saves causing performance problems ourselves
/datum/controller/master/proc/AttemptProfileDump(delay)
	if(REALTIMEOFDAY - last_profiled <= delay)
		return FALSE
	last_profiled = REALTIMEOFDAY
	SSprofiler.DumpFile(allow_yield = FALSE)
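// Illustrative sketch only (hypothetical subsystem, shown commented out so
// nothing here compiles): the fields and behavior the scheduler above consumes.
// The flag/runlevel defines are the standard MC ones; pausing from fire() is how
// RunQueue() ends up resuming a subsystem with leftover tick budget via ignite().
///datum/controller/subsystem/example_background
//	name = "Example Background"
//	wait = 2 SECONDS
//	priority = 10
//	flags = SS_BACKGROUND | SS_KEEP_TIMING
//	runlevels = RUNLEVEL_GAME
//
///datum/controller/subsystem/example_background/fire(resumed)
//	for(var/datum/thing as anything in get_pending_work()) // hypothetical work source
//		process_one(thing) // hypothetical
//		if(TICK_CHECK) // over the budget RunQueue() set via current_ticklimit
//			pause() // resume from here next tick instead of overrunning
//			return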