bootstrap-vz/bootstrapvz/base/tasklist.py

"""The tasklist module contains the TaskList class.
"""

from bootstrapvz.common.exceptions import TaskListError
import logging
log = logging.getLogger(__name__)


class TaskList(object):
	"""Holds the tasks selected for a run, executes them in dependency order
	and keeps track of the tasks that have been completed.
	"""

	def __init__(self, tasks):
		# Filled by run(), in execution order
		self.tasks_completed = []
		self.tasks = tasks

	def run(self, info, dry_run=False):
		"""Orders the selected tasks and runs them one after another

		:param dict info: The bootstrap information object
		:param bool dry_run: When True the tasks are only stepped through, not run
		"""
		from bootstrapvz.common import tasks as common_tasks
		# The ordering is computed over every task we can find,
		# not only over the subset that is going to be run.
		provider = info.manifest.modules['provider']
		plugins = info.manifest.modules['plugins']
		known_tasks = set(get_all_tasks([common_tasks, provider] + plugins))
		# Reduce the ordering to the tasks selected for this run
		ordered_tasks = create_list(self.tasks, known_tasks)
		log.debug('Tasklist:\n\t' + '\n\t'.join(repr(task) for task in ordered_tasks))

		for task in ordered_tasks:
			# A description is optional, fall back to the string form of the task
			if hasattr(task, 'description'):
				announcement = task.description
			else:
				announcement = 'Running ' + str(task)
			log.info(announcement)
			if not dry_run:
				task.run(info)
			# Record the task as completed (e.g. for a later rollback after an error)
			self.tasks_completed.append(task)


def load_tasks(function, manifest, *args):
	"""Collects tasks by calling ``function`` on the provider and on every loaded plugin.

	The called function receives the taskset as its first argument, the manifest
	as its second argument and any additional arguments after that.
	The provider must have the function, plugins may omit it.

	:param str function: Name of the function to call
	:param Manifest manifest: The manifest
	:param list args: Additional arguments that should be passed to the function that is called
	:return: The taskset after the provider and the plugins have populated it
	:rtype: set
	"""
	taskset = set()
	# The provider is looked up without a default, so a missing function raises
	provider_fn = getattr(manifest.modules['provider'], function)
	provider_fn(taskset, manifest, *args)
	# Plugins that lack the function (or expose a non-callable of that name) are skipped
	plugin_fns = (getattr(plugin, function, None) for plugin in manifest.modules['plugins'])
	for plugin_fn in plugin_fns:
		if not callable(plugin_fn):
			continue
		plugin_fn(taskset, manifest, *args)
	return taskset


def create_list(taskset, all_tasks):
	"""Creates a list of all the tasks that should be run.

	The ordering is computed over ``all_tasks`` and afterwards narrowed down
	to the tasks in ``taskset``.

	:param set taskset: The tasks that should be run
	:param set all_tasks: All available tasks, must be a superset of ``taskset``
	:return: The tasks from ``taskset``, sorted according to their dependencies and phases
	:rtype: list
	:raises TaskListError: If ``all_tasks`` is not a superset of ``taskset``, if the ordering
	                       of a task conflicts with its phase or if the task graph contains cycles
	"""
	from bootstrapvz.common.phases import order
	# Make sure all_tasks is a superset of the resolved taskset
	if not all_tasks >= taskset:
		missing = ', '.join(map(str, taskset - all_tasks))
		msg = ('bootstrap-vz generated a list of all available tasks. '
		       'That list is not a superset of the tasks required for bootstrapping. '
		       'The tasks that were not found are: {tasks} '
		       '(This is an error in the code and not the manifest, please report this issue.)'
		       .format(tasks=missing))
		raise TaskListError(msg)

	# Create a graph over all tasks by creating a map of each tasks successors
	graph = {}
	for task in all_tasks:
		# Do a sanity check first
		check_ordering(task)
		# Start out with the successors mentioned in the task itself
		successors = set(task.successors)
		# Add all tasks that mention this task as a predecessor
		successors.update(succ for succ in all_tasks if task in succ.predecessors)
		# Phases that succeed the phase of this task
		succeeding_phases = order[order.index(task.phase) + 1:]
		# Add all tasks that are placed in one of the succeeding phases
		successors.update(succ for succ in all_tasks if succ.phase in succeeding_phases)
		graph[task] = successors

	# Use the strongly connected components algorithm to check for cycles in our task graph.
	# A component with a single node is not a cycle, so those are filtered out.
	cycles = [component for component in strongly_connected_components(graph)
	          if len(component) > 1]
	for cycle in cycles:
		log.debug('Cycle:\n' + ', '.join(map(repr, cycle)))
	if cycles:
		msg = ('{num} cycles were found in the tasklist, '
		       'consult the logfile for more information.'.format(num=len(cycles)))
		raise TaskListError(msg)

	# Run a topological sort on the graph, returning an ordered list
	sorted_tasks = topological_sort(graph)

	# Filter out any tasks not in the tasklist.
	# We want to maintain ordering, so we don't use set intersection.
	# A real list is returned so that callers can iterate over the result more than once.
	return [task for task in sorted_tasks if task in taskset]


def get_all_tasks(modules):
	"""Gets a list of all task classes in the given packages

	:param list modules: Imported packages that should be searched for task classes
	:return: A list of all tasks in the packages
	:rtype: list
	"""
	import itertools
	import os.path
	# NOTE(review): implicit relative import, only resolvable on Python 2;
	# presumably refers to the sibling module of this file - confirm before porting.
	from task import Task

	# One generator of classes per package
	generators = [get_all_classes(os.path.dirname(module.__file__), module.__name__ + '.')
	              for module in modules]
	classes = itertools.chain.from_iterable(generators)

	# Only return classes that are tasks (excluding the superclass Task itself).
	# The result is materialized so that it really is a list, as documented.
	return [cls for cls in classes if issubclass(cls, Task) and cls is not Task]


def get_all_classes(path=None, prefix='', excludes=()):
	""" Given a path to a package, this function retrieves all the classes in it

	:param str path: Path to the package
	:param str prefix: Name of the package followed by a dot
	:param list excludes: List of str; modules whose names start with one of them are ignored
	:return: A generator that yields classes
	:rtype: generator
	:raises TaskListError: If a module that is not excluded cannot be inspected.
	"""
	import pkgutil
	import importlib
	import inspect

	# str.startswith() accepts a tuple of prefixes (an empty tuple never matches)
	excluded_prefixes = tuple(excludes)

	def is_excluded(module_name):
		return module_name.startswith(excluded_prefixes)

	def walk_error(module_name):
		# Called by the walker for packages it fails to import
		if not is_excluded(module_name):
			raise TaskListError('Unable to inspect module ' + module_name)

	for _, module_name, _ in pkgutil.walk_packages([path], prefix, walk_error):
		if is_excluded(module_name):
			continue
		module = importlib.import_module(module_name)
		for _, obj in inspect.getmembers(module, inspect.isclass):
			# We only want classes that are defined in the module, and not imported ones
			if obj.__module__ == module_name:
				yield obj


def check_ordering(task):
	"""Checks the ordering of a task in relation to other tasks and their phases.

	This function checks for a subset of what the strongly connected components algorithm does,
	but can deliver a more precise error message, namely that there is a conflict between
	what a task has specified as its predecessors or successors and in which phase it is placed.

	A precedence that is already implied by the phases is not an error, it only results in a warning.

	:param Task task: The task to check the ordering for
	:raises TaskListError: If there is a conflict between task precedence and phase precedence
	"""
	for successor in task.successors:
		# Throw an error if the phase of the task lies after the phase of a successor,
		# log a warning if it lies before (the phases already guarantee that ordering).
		if task.phase > successor.phase:
			msg = ("The task {task} is specified as running before {other}, "
			       "but its phase '{phase}' lies after the phase '{other_phase}'"
			       .format(task=task, other=successor, phase=task.phase, other_phase=successor.phase))
			raise TaskListError(msg)
		if task.phase < successor.phase:
			log.warning("The task {task} is specified as running before {other} "
			            "although its phase '{phase}' already lies before the phase '{other_phase}' "
			            "(or the task has been placed in the wrong phase)"
			            .format(task=task, other=successor, phase=task.phase, other_phase=successor.phase))
	for predecessor in task.predecessors:
		# Throw an error if the phase of the task lies before the phase of a predecessor,
		# log a warning if it lies after (the phases already guarantee that ordering).
		if task.phase < predecessor.phase:
			msg = ("The task {task} is specified as running after {other}, "
			       "but its phase '{phase}' lies before the phase '{other_phase}'"
			       .format(task=task, other=predecessor, phase=task.phase, other_phase=predecessor.phase))
			raise TaskListError(msg)
		if task.phase > predecessor.phase:
			log.warning("The task {task} is specified as running after {other} "
			            "although its phase '{phase}' already lies after the phase '{other_phase}' "
			            "(or the task has been placed in the wrong phase)"
			            .format(task=task, other=predecessor, phase=task.phase, other_phase=predecessor.phase))


def strongly_connected_components(graph):
	"""Computes the strongly connected components of a graph with Tarjan's algorithm.

	Source: http://www.logarithmic.net/pfh-files/blog/01208083168/sort.py

	:param dict graph: mapping of tasks to lists of successor tasks
	:return: List of tuples, each tuple holds the nodes of one strongly connected component
	:rtype: list
	"""
	components = []
	path = []
	lowlink = {}
	# Value assigned to the nodes of a finished component,
	# it is larger than any index handed out to a node.
	finished = len(graph)

	def explore(node):
		# Hand out the next index and put the node on the current path
		index = len(lowlink)
		lowlink[node] = index
		start = len(path)
		path.append(node)

		for successor in graph[node]:
			if successor not in lowlink:
				explore(successor)
			if lowlink[successor] < lowlink[node]:
				lowlink[node] = lowlink[successor]

		# Only the root of a component still has its own index as lowlink
		if lowlink[node] != index:
			return
		component = tuple(path[start:])
		del path[start:]
		components.append(component)
		for member in component:
			lowlink[member] = finished

	for node in graph:
		if node not in lowlink:
			explore(node)

	return components


def topological_sort(graph):
	"""Sorts the nodes of a graph so that every node precedes its successors.

	Source: http://www.logarithmic.net/pfh-files/blog/01208083168/sort.py

	:param dict graph: mapping of tasks to lists of successor tasks
	:return: A list of all tasks in the graph sorted according to their dependencies
	:rtype: list
	"""
	# Count the incoming edges of every node
	indegree = dict.fromkeys(graph, 0)
	for successors in graph.values():
		for successor in successors:
			indegree[successor] += 1

	# Nodes without incoming edges can be emitted right away
	pending = [node for node in graph if not indegree[node]]

	ordered = []
	while pending:
		current = pending.pop()
		ordered.append(current)

		# Emitting a node releases the successors that were only waiting for it
		for successor in graph[current]:
			indegree[successor] -= 1
			if not indegree[successor]:
				pending.append(successor)

	return ordered
Everything in base/ is now commented. 2014-03-23 16:04:03 +01:00			`"""The tasklist module contains the TaskList class.`
			`"""`

Properly fix imports and make bootstrapvz work like a package 2014-03-23 23:12:07 +01:00			`from bootstrapvz.common.exceptions import TaskListError`
logging 2013-06-09 20:29:54 +02:00			`import logging`
			`log = logging.getLogger(__name__)`
Basic structure up and running 2013-05-02 19:13:35 +02:00

Task dependencies, bogus implementation 2013-06-23 15:26:08 +02:00			`class TaskList(object):`
Everything in base/ is now commented. 2014-03-23 16:04:03 +01:00			`"""The tasklist class aggregates all tasks that should be run`
			`and orders them according to their dependencies.`
			`"""`
Plugin architecture working 2013-05-16 08:00:28 +02:00
Refactor tasklist for easier integration by taskoverview 2014-05-10 17:24:50 +02:00			`def __init__(self, tasks):`
			`self.tasks = tasks`
Way better rollback architecture through improvements in flexibility 2013-06-26 23:40:42 +02:00			`self.tasks_completed = []`
Task dependencies, bogus implementation 2013-06-23 15:26:08 +02:00
Introduce some awesome signal handling We can now press Ctrl+C remotely while any subprocess of the bootstrapping process is running, previously SIGINTs weren't propagated to the bootstrapping process because there was a thread in between it all. Now the bootstrapping process is in it's own process group. 2015-01-25 17:38:17 +01:00			`def run(self, info, dry_run=False):`
Everything in base/ is now commented. 2014-03-23 16:04:03 +01:00			`"""Converts the taskgraph into a list and runs all tasks in that list`

Convert param docs into parseable format. 2014-05-04 19:31:53 +02:00			`:param dict info: The bootstrap information object`
			`:param bool dry_run: Whether to actually run the tasks or simply step through them`
Everything in base/ is now commented. 2014-03-23 16:04:03 +01:00			`"""`
Fix #98. External plugin architecture implemented 2015-05-03 13:07:26 +02:00			`# Get a hold of every task we can find, so that we can topologically sort`
			`# all tasks, rather than just the subset we are going to run.`
			`from bootstrapvz.common import tasks as common_tasks`
			`modules = [common_tasks, info.manifest.modules['provider']] + info.manifest.modules['plugins']`
			`all_tasks = set(get_all_tasks(modules))`
Everything in base/ is now commented. 2014-03-23 16:04:03 +01:00			`# Create a list for us to run`
Fix #98. External plugin architecture implemented 2015-05-03 13:07:26 +02:00			`task_list = create_list(self.tasks, all_tasks)`
Everything in base/ is now commented. 2014-03-23 16:04:03 +01:00			`# Output the tasklist`
Use string concatenation instead of format() String concatenation can at times be easier to read that format(). One should choose whichever approach is more readable. 2014-05-03 22:24:13 +02:00			`log.debug('Tasklist:\n\t' + ('\n\t'.join(map(repr, task_list))))`
Cycle detection and topological sorting 2013-06-23 17:03:55 +02:00
Don't instantiate tasks In practice they are just typed functions with attributes, having a reference to an object is just confusing. So: Task.run() is now a classmethod 2014-01-05 15:57:11 +01:00			`for task in task_list:`
Everything in base/ is now commented. 2014-03-23 16:04:03 +01:00			`# Tasks are not required to have a description`
Way better rollback architecture through improvements in flexibility 2013-06-26 23:40:42 +02:00			`if hasattr(task, 'description'):`
			`log.info(task.description)`
			`else:`
Everything in base/ is now commented. 2014-03-23 16:04:03 +01:00			`# If there is no description, simply coerce the task into a string and print its name`
Use string concatenation instead of format() String concatenation can at times be easier to read that format(). One should choose whichever approach is more readable. 2014-05-03 22:24:13 +02:00			`log.info('Running ' + str(task))`
Added the dry-run option 2013-10-27 18:37:43 +01:00			`if not dry_run:`
Everything in base/ is now commented. 2014-03-23 16:04:03 +01:00			`# Run the task`
Added the dry-run option 2013-10-27 18:37:43 +01:00			`task.run(info)`
Everything in base/ is now commented. 2014-03-23 16:04:03 +01:00			`# Remember which tasks have been run for later use (e.g. when rolling back, because of an error)`
Don't instantiate tasks In practice they are just typed functions with attributes, having a reference to an object is just confusing. So: Task.run() is now a classmethod 2014-01-05 15:57:11 +01:00			`self.tasks_completed.append(task)`
Various improvements and additions. I couldn't be bothered to untangle this, so here it goes: * Log colors depending on loglevel * Simplified Filelogger * Remove description=None from basetask * create_list creates task list from argument now * Task rollback feature: If a task fails, the tasklist calls rollback() on the completed tasks in reverse order * Added TaskException to common.exceptions as a base to extend from * Added TriggerRollback task to common.tasks for development purposes * An EBS volume for bootstrapping is now created and attached to the instance (including rollback actions) * EC2 Connect task now depends on host.GetInfo 2013-06-24 23:12:39 +02:00
Refactor tasklist for easier integration by taskoverview 2014-05-10 17:24:50 +02:00
			`def load_tasks(function, manifest, *args):`
			"""Calls ``function`` on the provider and all plugins that have been loaded by the manifest.
			Any additional arguments are passed directly to ``function``.
			`The function that is called shall accept the taskset as its first argument and the manifest`
			`as its second argument.`

			`:param str function: Name of the function to call`
			`:param Manifest manifest: The manifest`
			`:param list args: Additional arguments that should be passed to the function that is called`
			`"""`
			`tasks = set()`
			`# Call 'function' on the provider`
			`getattr(manifest.modules['provider'], function)(tasks, manifest, *args)`
			`for plugin in manifest.modules['plugins']:`
			`# Plugins are not required to have whatever function we call`
			`fn = getattr(plugin, function, None)`
			`if callable(fn):`
			`fn(tasks, manifest, *args)`
			`return tasks`


Fix #98. External plugin architecture implemented 2015-05-03 13:07:26 +02:00			`def create_list(taskset, all_tasks):`
Refactor tasklist for easier integration by taskoverview 2014-05-10 17:24:50 +02:00			`"""Creates a list of all the tasks that should be run.`
			`"""`
			`from bootstrapvz.common.phases import order`
Check whether all tasks found include the ones we resolved 2015-05-03 08:04:20 +02:00			`# Make sure all_tasks is a superset of the resolved taskset`
			`if not all_tasks >= taskset:`
			`msg = ('bootstrap-vz generated a list of all available tasks. '`
			`'That list is not a superset of the tasks required for bootstrapping. '`
			`'The tasks that were not found are: {tasks} '`
			`'(This is an error in the code and not the manifest, please report this issue.)'`
			`.format(tasks=', '.join(map(str, taskset - all_tasks)))`
			`)`
			`raise TaskListError(msg)`
Refactor tasklist for easier integration by taskoverview 2014-05-10 17:24:50 +02:00			`# Create a graph over all tasks by creating a map of each tasks successors`
			`graph = {}`
Check whether all tasks found include the ones we resolved 2015-05-03 08:04:20 +02:00			`for task in all_tasks:`
Refactor tasklist for easier integration by taskoverview 2014-05-10 17:24:50 +02:00			`# Do a sanity check first`
			`check_ordering(task)`
			`successors = set()`
			`# Add all successors mentioned in the task`
			`successors.update(task.successors)`
			`# Add all tasks that mention this task as a predecessor`
Check whether all tasks found include the ones we resolved 2015-05-03 08:04:20 +02:00			`successors.update(filter(lambda succ: task in succ.predecessors, all_tasks))`
Refactor tasklist for easier integration by taskoverview 2014-05-10 17:24:50 +02:00			`# Create a list of phases that succeed the phase of this task`
			`succeeding_phases = order[order.index(task.phase) + 1:]`
			`# Add all tasks that occur in above mentioned succeeding phases`
Check whether all tasks found include the ones we resolved 2015-05-03 08:04:20 +02:00			`successors.update(filter(lambda succ: succ.phase in succeeding_phases, all_tasks))`
Refactor tasklist for easier integration by taskoverview 2014-05-10 17:24:50 +02:00			`# Map the successors to the task`
			`graph[task] = successors`

			`# Use the strongly connected components algorithm to check for cycles in our task graph`
			`components = strongly_connected_components(graph)`
			`cycles_found = 0`
			`for component in components:`
			`# Node of 1 is also a strongly connected component but hardly a cycle, so we filter them out`
			`if len(component) > 1:`
			`cycles_found += 1`
			`log.debug('Cycle: {list}\n' + (', '.join(map(repr, component))))`
			`if cycles_found > 0:`
			`msg = ('{num} cycles were found in the tasklist, '`
			`'consult the logfile for more information.'.format(num=cycles_found))`
			`raise TaskListError(msg)`

			`# Run a topological sort on the graph, returning an ordered list`
			`sorted_tasks = topological_sort(graph)`

			`# Filter out any tasks not in the tasklist`
			`# We want to maintain ordering, so we don't use set intersection`
Check whether all tasks found include the ones we resolved 2015-05-03 08:04:20 +02:00			`sorted_tasks = filter(lambda task: task in taskset, sorted_tasks)`
Refactor tasklist for easier integration by taskoverview 2014-05-10 17:24:50 +02:00			`return sorted_tasks`


Fix #98. External plugin architecture implemented 2015-05-03 13:07:26 +02:00			`def get_all_tasks(modules):`
Refactor tasklist for easier integration by taskoverview 2014-05-10 17:24:50 +02:00			`"""Gets a list of all task classes in the package`

			`:return: A list of all tasks in the package`
			`:rtype: list`
			`"""`
			`import os.path`
Fix #98. External plugin architecture implemented 2015-05-03 13:07:26 +02:00			`# Get generators that return all classes in a module`
			`generators = []`
			`for module in modules:`
			`module_path = os.path.dirname(module.__file__)`
			`module_prefix = module.__name__ + '.'`
			`generators.append(get_all_classes(module_path, module_prefix))`
			`import itertools`
			`classes = itertools.chain(*generators)`
Refactor tasklist for easier integration by taskoverview 2014-05-10 17:24:50 +02:00
			`# lambda function to check whether a class is a task (excluding the superclass Task)`
			`def is_task(obj):`
			`from task import Task`
			`return issubclass(obj, Task) and obj is not Task`
Fix #98. External plugin architecture implemented 2015-05-03 13:07:26 +02:00			`return filter(is_task, classes) # Only return classes that are tasks`
Refactor tasklist for easier integration by taskoverview 2014-05-10 17:24:50 +02:00

Fix error mentioned in #152 (Pyro4 shouldn't be a dependency) 2015-04-12 09:40:09 +02:00			`def get_all_classes(path=None, prefix='', excludes=[]):`
Refactor tasklist for easier integration by taskoverview 2014-05-10 17:24:50 +02:00			`""" Given a path to a package, this function retrieves all the classes in it`

			`:param str path: Path to the package`
			`:param str prefix: Name of the package followed by a dot`
Fix error mentioned in #152 (Pyro4 shouldn't be a dependency) 2015-04-12 09:40:09 +02:00			`:param list excludes: List of str matching module names that should be ignored`
Refactor tasklist for easier integration by taskoverview 2014-05-10 17:24:50 +02:00			`:return: A generator that yields classes`
			`:rtype: generator`
			`:raises Exception: If a module cannot be inspected.`
			`"""`
			`import pkgutil`
			`import importlib`
			`import inspect`

Fix error mentioned in #152 (Pyro4 shouldn't be a dependency) 2015-04-12 09:40:09 +02:00			`def walk_error(module_name):`
			`if not any(map(lambda excl: module_name.startswith(excl), excludes)):`
Fix #98. External plugin architecture implemented 2015-05-03 13:07:26 +02:00			`raise TaskListError('Unable to inspect module ' + module_name)`
Refactor tasklist for easier integration by taskoverview 2014-05-10 17:24:50 +02:00			`walker = pkgutil.walk_packages([path], prefix, walk_error)`
			`for _, module_name, _ in walker:`
Fix error mentioned in #152 (Pyro4 shouldn't be a dependency) 2015-04-12 09:40:09 +02:00			`if any(map(lambda excl: module_name.startswith(excl), excludes)):`
			`continue`
Refactor tasklist for easier integration by taskoverview 2014-05-10 17:24:50 +02:00			`module = importlib.import_module(module_name)`
			`classes = inspect.getmembers(module, inspect.isclass)`
			`for class_name, obj in classes:`
			`# We only want classes that are defined in the module, and not imported ones`
			`if obj.__module__ == module_name:`
			`yield obj`


			`def check_ordering(task):`
			`"""Checks the ordering of a task in relation to other tasks and their phases.`

			`This function checks for a subset of what the strongly connected components algorithm does,`
			`but can deliver a more precise error message, namely that there is a conflict between`
			`what a task has specified as its predecessors or successors and in which phase it is placed.`

			`:param Task task: The task to check the ordering for`
			`:raises TaskListError: If there is a conflict between task precedence and phase precedence`
			`"""`
			`for successor in task.successors:`
Issue warning when specifying pre/successors across phases 2015-04-08 21:52:46 +02:00			`# Run through all successors and throw an error if the phase of the task`
			`# lies before the phase of a successor, log a warning if it lies after.`
Refactor tasklist for easier integration by taskoverview 2014-05-10 17:24:50 +02:00			`if task.phase > successor.phase:`
			`msg = ("The task {task} is specified as running before {other}, "`
			`"but its phase '{phase}' lies after the phase '{other_phase}'"`
			`.format(task=task, other=successor, phase=task.phase, other_phase=successor.phase))`
			`raise TaskListError(msg)`
Issue warning when specifying pre/successors across phases 2015-04-08 21:52:46 +02:00			`if task.phase < successor.phase:`
			`log.warn("The task {task} is specified as running before {other} "`
Add a little helpful not to tasklist ordering warning 2015-04-09 18:23:08 +02:00			`"although its phase '{phase}' already lies before the phase '{other_phase}' "`
			`"(or the task has been placed in the wrong phase)"`
Issue warning when specifying pre/successors across phases 2015-04-08 21:52:46 +02:00			`.format(task=task, other=successor, phase=task.phase, other_phase=successor.phase))`
Refactor tasklist for easier integration by taskoverview 2014-05-10 17:24:50 +02:00			`for predecessor in task.predecessors:`
Issue warning when specifying pre/successors across phases 2015-04-08 21:52:46 +02:00			`# Run through all successors and throw an error if the phase of the task`
			`# lies after the phase of a predecessor, log a warning if it lies before.`
Refactor tasklist for easier integration by taskoverview 2014-05-10 17:24:50 +02:00			`if task.phase < predecessor.phase:`
			`msg = ("The task {task} is specified as running after {other}, "`
			`"but its phase '{phase}' lies before the phase '{other_phase}'"`
			`.format(task=task, other=predecessor, phase=task.phase, other_phase=predecessor.phase))`
Cycle detection and topological sorting 2013-06-23 17:03:55 +02:00			`raise TaskListError(msg)`
Issue warning when specifying pre/successors across phases 2015-04-08 21:52:46 +02:00			`if task.phase > predecessor.phase:`
			`log.warn("The task {task} is specified as running after {other} "`
Add a little helpful not to tasklist ordering warning 2015-04-09 18:23:08 +02:00			`"although its phase '{phase}' already lies after the phase '{other_phase}' "`
			`"(or the task has been placed in the wrong phase)"`
Issue warning when specifying pre/successors across phases 2015-04-08 21:52:46 +02:00			`.format(task=task, other=predecessor, phase=task.phase, other_phase=predecessor.phase))`
Cycle detection and topological sorting 2013-06-23 17:03:55 +02:00

Refactor tasklist for easier integration by taskoverview 2014-05-10 17:24:50 +02:00			`def strongly_connected_components(graph):`
			`"""Find the strongly connected components in a graph using Tarjan's algorithm.`
Cycle detection and topological sorting 2013-06-23 17:03:55 +02:00
Refactor tasklist for easier integration by taskoverview 2014-05-10 17:24:50 +02:00			`Source: http://www.logarithmic.net/pfh-files/blog/01208083168/sort.py`
Everything in base/ is now commented. 2014-03-23 16:04:03 +01:00
Refactor tasklist for easier integration by taskoverview 2014-05-10 17:24:50 +02:00			`:param dict graph: mapping of tasks to lists of successor tasks`
			`:return: List of tuples that are strongly connected comoponents`
			`:rtype: list`
			`"""`
Cycle detection and topological sorting 2013-06-23 17:03:55 +02:00
Refactor tasklist for easier integration by taskoverview 2014-05-10 17:24:50 +02:00			`result = []`
			`stack = []`
			`low = {}`
Cycle detection and topological sorting 2013-06-23 17:03:55 +02:00
Refactor tasklist for easier integration by taskoverview 2014-05-10 17:24:50 +02:00			`def visit(node):`
			`if node in low:`
			`return`
Cycle detection and topological sorting 2013-06-23 17:03:55 +02:00
Refactor tasklist for easier integration by taskoverview 2014-05-10 17:24:50 +02:00			`num = len(low)`
			`low[node] = num`
			`stack_pos = len(stack)`
			`stack.append(node)`
Cycle detection and topological sorting 2013-06-23 17:03:55 +02:00
Refactor tasklist for easier integration by taskoverview 2014-05-10 17:24:50 +02:00			`for successor in graph[node]:`
			`visit(successor)`
			`low[node] = min(low[node], low[successor])`
Cycle detection and topological sorting 2013-06-23 17:03:55 +02:00
Refactor tasklist for easier integration by taskoverview 2014-05-10 17:24:50 +02:00			`if num == low[node]:`
			`component = tuple(stack[stack_pos:])`
			`del stack[stack_pos:]`
			`result.append(component)`
			`for item in component:`
			`low[item] = len(graph)`
Cycle detection and topological sorting 2013-06-23 17:03:55 +02:00
Refactor tasklist for easier integration by taskoverview 2014-05-10 17:24:50 +02:00			`for node in graph:`
			`visit(node)`
Cycle detection and topological sorting 2013-06-23 17:03:55 +02:00
Refactor tasklist for easier integration by taskoverview 2014-05-10 17:24:50 +02:00			`return result`
Cycle detection and topological sorting 2013-06-23 17:03:55 +02:00
Everything in base/ is now commented. 2014-03-23 16:04:03 +01:00
Refactor tasklist for easier integration by taskoverview 2014-05-10 17:24:50 +02:00			`def topological_sort(graph):`
			`"""Runs a topological sort on a graph.`
Everything in base/ is now commented. 2014-03-23 16:04:03 +01:00
Refactor tasklist for easier integration by taskoverview 2014-05-10 17:24:50 +02:00			`Source: http://www.logarithmic.net/pfh-files/blog/01208083168/sort.py`

			`:param dict graph: mapping of tasks to lists of successor tasks`
			`:return: A list of all tasks in the graph sorted according to ther dependencies`
			`:rtype: list`
			`"""`
			`count = {}`
			`for node in graph:`
			`count[node] = 0`
			`for node in graph:`
			`for successor in graph[node]:`
			`count[successor] += 1`

			`ready = [node for node in graph if count[node] == 0]`

			`result = []`
			`while ready:`
			`node = ready.pop(-1)`
			`result.append(node)`

			`for successor in graph[node]:`
			`count[successor] -= 1`
			`if count[successor] == 0:`
			`ready.append(successor)`

			`return result`