PyDPOCL.py

from GPlan import GPlan, math
from Flaws import OPF, TCLF
from uuid import uuid4
import copy
from heapq import heappush, heappop
from clockdeco import clock
import time
LOG = 0
REPORT = 0
RRP = 0
from collections import Counter

def log_message(message):
	if LOG:
		print(message)


class Frontier:

	def __init__(self):
		self._frontier = []

	def __len__(self):
		return len(self._frontier)

	def __getitem__(self, position):
		return self._frontier[position]

	def pop(self):
		return heappop(self._frontier)

	def insert(self, plan):
		heappush(self._frontier, plan)

	def extend(self, itera):
		for item in itera:
			self.insert(item)

	def __repr__(self):
		k = 'frontier plans\n'
		for plan in self._frontier:
			'{}:{} c={} h={} steps:\n{}\n'.format(k, str(plan.ID), plan.cost, plan.heuristic, plan.steps)
		return k


class GPlanner:
	"""
	Plan space planner, only instantiate once per planner, starts with ground steps
	"""

	def __init__(self, gsteps):
		self.gsteps = gsteps
		self.ID = uuid4()
		self.h_step_dict = dict()
		self.h_lit_dict = dict()

		root_plan = GPlan(gsteps[-2], gsteps[-1])
		root_plan.OrderingGraph.addOrdering(root_plan.dummy.init, root_plan.dummy.final)
		for p in root_plan.dummy.final.open_preconds:
			root_plan.flaws.insert(root_plan, OPF(root_plan.dummy.final, p, 100000))

		self._frontier = Frontier()
		self.insert(root_plan)
		self._h_visited = []
		self.plan_num = 0
		self.max_height = gsteps[-3].height

	# Private Hooks #

	def __len__(self):
		return len(self._frontier)

	def __getitem__(self, position):
		return self._frontier[position]

	# Methods #

	def pop(self):
		return self._frontier.pop()

	def insert(self, plan):
		plan.heuristic = self.h_plan(plan)
		log_message('>\tadd plan to frontier: {} with cost {} and heuristic {}\n'.format(plan.name, plan.cost, plan.heuristic))
		self._frontier.insert(plan)

	# @clock
	def solve(self, k=4, cutoff=6000):
		# find k solutions to problem

		completed = []
		expanded = 0
		leaves = 0
		tclf_visits = 0
		success_message = 'solution {} found at {} nodes expanded and {} nodes visited and {} branches terminated'

		t0 = time.time()
		print('k={}'.format(str(k)))
		print('time\texpanded\tvisited\tterminated\tdepth\tcost\ttrace')
		while len(self) > 0:
			plan = self.pop()

			if not plan.isInternallyConsistent():
				# if plan.name[-3] == 'a':
				# 	print('stop')
				log_message('prune {}'.format(plan.name))
				leaves += 1
				continue

			# debugging:
			# plan_schemata = Counter(step.schema for step in plan.steps)
			# Counter(plan_schemata)
			# for item, value in plan_schemata.items():
			# 	if value > 3:
			# 		print('check here')
			# if len(plan_schemata) > len(set(plan_schemata)):
			# 	print('check here')

			log_message('Plan {} selected cost={} heuristic={}'.format(plan.name, plan.cost, plan.heuristic))
			for step in plan.OrderingGraph.topoSort():
				log_message('\t\t {}\n'.format(str(step)))


			if len(plan.flaws) == 0:
				# success
				elapsed = time.time() - t0
				delay = str('%0.8f' % elapsed)
				completed.append(plan)

				trace = math.floor(len(plan.name.split('['))/2)
				print('{}\t{}\t{}\t{}\t{}\t{}\t{}'.format(delay, expanded, len(self) + expanded, leaves, str(plan.depth), plan.cost, trace))
				if REPORT:
					print(success_message.format(plan.name, expanded, len(self)+expanded, leaves))

					for step in plan.OrderingGraph.topoSort():
						print(step)
					print('\n')

				if len(completed) == k:
					return completed
				# if len(completed) == 6:
				# 	print('check here')
				continue

			if time.time() - t0 > cutoff:
				print('timedout: {}\t{}\t{}'.format(expanded, len(self) + expanded, leaves))
				return

			# Select Flaw
			flaw = plan.flaws.next()
			plan.name += '[' + str(flaw.flaw_type)[0] + ']'
			log_message('{} selected : {}\n'.format(flaw.name, flaw))

			self.plan_num = 0

			if isinstance(flaw, TCLF):
				tclf_visits += 1
				self.resolve_threat(plan, flaw)
			else:
				# only count expanded nodes as those that resolve open conditions
				expanded += 1
				self.add_step(plan, flaw)
				self.reuse_step(plan, flaw)

		raise ValueError('FAIL: No more plans to visit with {} nodes expanded'.format(expanded))

	def add_step(self, plan, flaw):
		s_need, p = flaw.flaw
		cndts = s_need.cndt_map[p.ID]

		if len(cndts) == 0:
			return

		# need indices
		s_index = plan.index(s_need)
		p_index = s_need.preconds.index(p)
		for cndt in cndts:

			if RRP:
				# the Recursive Repair Policty: only let steps with <= height repair open conditions.
				if self.gsteps[cndt].height > flaw.level:
					continue

			# cannot add a step which is the inital step
			if not self.gsteps[cndt].instantiable:
				continue
			# clone plan and new step

			new_plan = plan.instantiate(str(self.plan_num) + '[a] ')
			self.plan_num += 1

			# use indices befoer inserting new steps
			mutable_s_need = new_plan[s_index]
			mutable_p = mutable_s_need.preconds[p_index]

			# instantiate new step
			new_step = self.gsteps[cndt].instantiate()

			# pass depth to new Added step.
			new_step.depth = mutable_s_need.depth

			# recursively insert new step and substeps into plan, adding orderings and flaws
			new_plan.insert(new_step)
			log_message('Add step {} to plan {}\n'.format(str(new_step), new_plan.name))

			# resolve s_need with the new step
			new_plan.resolve(new_step, mutable_s_need, mutable_p)

			new_plan.cost += ((self.max_height*self.max_height)+1) - (new_step.height*new_step.height)
			# new_plan.cost += self.max_height + 1 - new_step.height
			# new_plan.cost += 1
			# self.max_height + 1 - new_step.height

			# insert our new mutated plan into the frontier
			self.insert(new_plan)


	def reuse_step(self, plan, flaw):
		s_need, p = flaw.flaw

		choices = [step for step in plan.steps
		           if step.stepnum in s_need.cndt_map[p.ID]
		           and not s_need.ID == step.ID
		           and not plan.OrderingGraph.isPath(s_need, step)]
		           # and not plan.CausalLinkGraph.isPath(s_need, step)]
		           # and plan.HierarchyGraph.satisfies_hierarchy(step, p, s_need)]
		if len(choices) == 0:
			return

		# need indices
		s_index = plan.index(s_need)
		p_index = s_need.preconds.index(p)
		for choice in choices:
			# clone plan and new step
			new_plan = plan.instantiate(str(self.plan_num) + '[r] ')
			self.plan_num += 1

			# use indices before inserting new steps
			mutable_s_need = new_plan[s_index]
			mutable_p = mutable_s_need.preconds[p_index]

			# use index to find old step
			old_step = new_plan.steps[plan.index(choice)]
			log_message('Reuse step {} to plan {}\n'.format(str(old_step), new_plan.name))

			# resolve open condition with old step
			new_plan.resolve(old_step, mutable_s_need, mutable_p)

			# insert mutated plan into frontier
			self.insert(new_plan)

	def resolve_threat(self, plan, tclf):
		threat_index = plan.index(tclf.threat)
		src_index = plan.index(tclf.link.source)
		snk_index = plan.index(tclf.link.sink)

		# Promotion
		new_plan = plan.instantiate(str(self.plan_num)+ '[tp] ')
		self.plan_num += 1
		threat = new_plan[threat_index]
		sink = new_plan[snk_index]
		new_plan.OrderingGraph.addEdge(sink, threat)
		if hasattr(threat, 'sibling'):
			new_plan.OrderingGraph.addEdge(sink, threat.sibling)
		if hasattr(sink, 'sibling'):
			new_plan.OrderingGraph.addEdge(sink.sibling, threat)
		threat.update_choices(new_plan)
		self.insert(new_plan)
		log_message('promote {} in front of {} in plan {}'.format(threat, sink, new_plan.name))


		# Demotion
		new_plan = plan.instantiate(str(self.plan_num) + '[td] ')
		self.plan_num += 1
		threat = new_plan[threat_index]
		source = new_plan[src_index]
		new_plan.OrderingGraph.addEdge(threat, source)
		if hasattr(threat, 'sibling'):
			new_plan.OrderingGraph.addEdge(source, threat.sibling)
		if hasattr(source, 'sibling'):
			new_plan.OrderingGraph.addEdge(source.sibling, threat)
		threat.update_choices(new_plan)
		self.insert(new_plan)
		log_message('demotion {} behind {} in plan {}'.format(threat, source, new_plan.name))

	# Heuristic Methods #

	def h_condition(self, plan, stepnum, precond):
		if precond.is_static:
			return 0
		if precond in plan.init:
			return 0
		if precond in self.h_lit_dict.keys():
			return self.h_lit_dict[precond]
		if precond in self._h_visited:
			return 0

		self._h_visited.append(precond)

		min_so_far = float('inf')
		# if the following is true, then we have an "sub-init" step in our mist
		if len(self.gsteps[stepnum].cndts) == 0:
			stepnum += 2

		for cndt in self.gsteps[stepnum].cndt_map[precond.ID]:
			if not self.gsteps[cndt].instantiable:
				continue
			if not self.gsteps[cndt].height == 0:
				continue
			cndt_heuristic = self.h_step(plan, cndt)
			if cndt_heuristic < min_so_far:
				min_so_far = cndt_heuristic

		self.h_lit_dict[precond] = min_so_far
		return min_so_far

	def h_step(self, plan, stepnum):
		if stepnum in self.h_step_dict.keys():
			return self.h_step_dict[stepnum]
		if stepnum == plan.dummy.init.stepnum:
			return 1
		if stepnum in self._h_visited:
			return 1

		self._h_visited.append(stepnum)
		sumo = 1
		for pre in self.gsteps[stepnum].preconds:
			sumo += self.h_condition(plan, stepnum, pre)

		if self.gsteps[stepnum].height > 0:
			sumo += self.h_subplan(plan, self.gsteps[stepnum])

		self.h_step_dict[stepnum] = sumo
		return sumo

	def h_plan(self, plan):
		sumo = 0

		self._h_visited = []
		self.h_lit_dict = dict()
		# flaw_gen = plan.flaws.OC_gen()
		for flaw in plan.flaws.OC_gen():
			# num_flaws += 1
			# exists_choice = False
			# if len(flaw.s_need.choices) > 0:
			# 	exists_choice = True


			if len(flaw.s_need.choices) == 0:
				sumo += self.h_condition(plan, flaw.s_need.stepnum, flaw.p)

		return sumo

	def h_subplan(self, plan, abstract_step):
		sumo = 0
		for sub_step in abstract_step.sub_steps:
			for pre in sub_step.open_preconds:
				if pre in abstract_step.preconds or pre in plan.init:
					continue
				sumo += self.h_condition(plan, sub_step.stepnum, pre)
		for pre in abstract_step.dummy.final.open_preconds:
			if pre in abstract_step.preconds or pre in plan.init:
				continue
			sumo += self.h_condition(plan, abstract_step.dummy.final.stepnum, pre)
		return sumo

import sys
import pickle
# import Ground_Compiler_Library
from Ground_Compiler_Library import Ground, precompile
# import json
# import jsonpickle
#
# class gstep_encoder(json.JSONEncoder):
# 	def default(self, obj):
# 		if hasattr(obj, 'to_json'):
# 			return obj.to_json()
# 		return json.JSONEncoder.default(self, obj)


def upload(GL, name):
	print(name)
	with open(name, 'wb') as afile:
		pickle.dump(GL, afile)

# def just_compile_no_saving_steps(domain_file, problem_file):
# 	GL = Ground.GLib(domain_file, problem_file)
# 	ground_step_list = precompile.deelementize_ground_library(GL)

def just_compile(domain_file, problem_file, pickle_names):
	GL = Ground.GLib(domain_file, problem_file)
	with open('ground_steps.txt', 'w') as gs:
		for step in GL:
			gs.write(str(step))
			gs.write('\n\tpreconditions:')
			for pre in step.Preconditions:
				gs.write('\n\t\t' + str(pre))
			gs.write('\n\teffects:')
			for eff in step.Effects:
				gs.write('\n\t\t' + str(eff))
			gs.write('\n\n')
	ground_step_list = precompile.deelementize_ground_library(GL)
	with open('ground_steps_stripped.txt', 'w') as gs:
		# gs.write('\n\n')
		for i, step in enumerate(ground_step_list):
			gs.write('\n')
			gs.write(str(i) + '\n')
			gs.write(str(step))
			gs.write('\n\tpreconditions:')
			for pre in step.preconds:
				gs.write('\n\t\t' + str(pre))
				if step.cndt_map is not None:
					if pre.ID in step.cndt_map.keys():
						gs.write('\n\t\t\tcndts:\t{}'.format(str(step.cndt_map[pre.ID])))
				if step.threat_map is not None:
					if pre.ID in step.threat_map.keys():
						gs.write('\n\t\t\trisks:\t{}'.format(str(step.threat_map[pre.ID])))

			if step.height > 0:
				gs.write('\n\tsub_steps:')
				for sub in step.sub_steps:
					gs.write('\n\t\t{}'.format(str(sub)))
				gs.write('\n\tsub_orderings:')
				for ord in step.sub_orderings.edges:
					gs.write('\n\t\t{}'.format(str(ord.source) + ' < ' + str(ord.sink)))
				for link in step.sub_links.edges:
					gs.write('\n\t\t{}'.format(str(link)))
			gs.write('\n\n')

	for i, gstep in enumerate(ground_step_list):
		with open(pickle_names + str(i), 'wb') as ugly:
			pickle.dump(gstep, ugly)
	return ground_step_list

if __name__ == '__main__':
	num_args = len(sys.argv)
	if num_args >1:
		domain_file = sys.argv[1]
		if num_args > 2:
			problem_file = sys.argv[2]
	else:
		# domain_file = 'Ground_Compiler_Library//domains/travel_domain_primitive_only.pddl'
		domain_file = 'Ground_Compiler_Library//domains/travel_domain.pddl'
		problem_file = 'Ground_Compiler_Library//domains/travel-to-la.pddl'
		# problem_file = 'Ground_Compiler_Library//domains/travel-to-la.pddl'
	d_name = domain_file.split('/')[-1].split('.')[0]
	p_name = problem_file.split('/')[-1].split('.')[0]
	uploadable_ground_step_library_name = 'Ground_Compiler_Library//' + d_name + '.' + p_name


	RELOAD = 0
	if RELOAD:
		ground_steps = just_compile(domain_file, problem_file, uploadable_ground_step_library_name)

	PLAN = 1
	if PLAN:
		ground_steps = []
		i = 0
		while True:
			try:
				print(i)
				with open(uploadable_ground_step_library_name + str(i), 'rb') as ugly:
					ground_steps.append(pickle.load(ugly))
				i += 1
			except:
				break
		print('finished uploading')


		planner = GPlanner(ground_steps)
		planner.solve(k=1)


		# planner2 = GPlanner()
		# planner2.solve(k=1)