Source code for concepts.dm.crow.planners.regression_planning_impl.crow_regression_planner_v1

#! /usr/bin/env python3
# -*- coding: utf-8 -*-
# File   : crow_regression_planner_v1.py
# Author : Jiayuan Mao
# Email  : maojiayuan@gmail.com
# Date   : 03/21/2024
#
# This file is part of Project Concepts.
# Distributed under terms of the MIT license.

import queue
import jacinle

from typing import Optional, Union, Iterator, Sequence, Tuple, List, Dict, NamedTuple
from concepts.dsl.constraint import ConstraintSatisfactionProblem
from concepts.dsl.dsl_types import Variable
from concepts.dsl.tensor_state import StateObjectReference

from concepts.dm.crow.controller import CrowControllerApplier, CrowControllerApplicationExpression
from concepts.dm.crow.behavior import CrowBehavior, CrowAchieveExpression, CrowBindExpression, CrowRuntimeAssignmentExpression, CrowAssertExpression
from concepts.dm.crow.behavior import CrowBehaviorStatementOrdering, CrowBehaviorOrderingSuite, CrowBehaviorApplicationExpression
from concepts.dm.crow.behavior_utils import match_applicable_behaviors
from concepts.dm.crow.executors.crow_executor import CrowExecutor
from concepts.dm.crow.planners.regression_planning import ScopedCrowExpression, CrowPlanningResult, CrowRegressionPlanner
from concepts.dm.crow.planners.regression_planning_impl.crow_regression_utils import canonize_bounded_variables, split_simple_sequential, execute_object_bind, execute_behavior_effect_batch, unique_results, execute_behavior_effect


__all__ = ['CrowPlanningState', 'CrowRegressionPlannerBFSv1', 'CrowRegressionPlannerDFSv1']


[docs] class CrowPlanningState(NamedTuple): program: Optional[CrowBehaviorOrderingSuite] scopes: Dict[int, dict] latest_scope: int right_statements: List[ScopedCrowExpression] depth: int = 0 def __lt__(self, other): return len(self.right_statements) < len(other.right_statements)
LOG_BFS_GRAPH = False
[docs] class CrowRegressionPlannerBFSv1(CrowRegressionPlanner):
[docs] def main_entry(self, program: CrowBehaviorOrderingSuite) -> List[Tuple[CrowControllerApplier, ...]]: state = CrowPlanningState(program, scopes={0: dict()}, right_statements=[], latest_scope=0) candidate_plans = self.bfs(state) candidate_plans = [result.controller_actions for result in candidate_plans] return candidate_plans
[docs] def bfs(self, state: CrowPlanningState) -> Sequence[CrowPlanningResult]: q = queue.PriorityQueue() q.put(state) graph = None if LOG_BFS_GRAPH: graph = dict(nodes=dict(), edges=list()) graph['nodes'][id(state)] = state while not q.empty(): self._search_stat['nr_expanded_nodes'] += 1 if self._search_stat['nr_expanded_nodes'] > 1000000: import ipdb; ipdb.set_trace() raise RuntimeError('Too many nodes expanded.') if self._search_stat['nr_expanded_nodes'] % 1000 == 0: jacinle.log_function.print('Expanded nodes:', self._search_stat['nr_expanded_nodes']) current_state = q.get() # print('Current state:', current_state.right_statements) for left, stmt, scope_id in current_state.program.pop_right_statement(): for i, new_state in enumerate(self._bfs_expand(current_state, left, stmt, scope_id)): if LOG_BFS_GRAPH: graph['nodes'][id(new_state)] = new_state graph['edges'].append((id(current_state), id(new_state), f'{stmt}@{i}')) if new_state.program is None: if (result := self._bfs_verify(new_state)) is not None: return [result] else: # jacinle.log_function.print(' New state:', new_state.right_statements) q.put(new_state) return list()
def _bfs_expand(self, state: CrowPlanningState, left: CrowBehaviorOrderingSuite, stmt: Union[CrowAchieveExpression, CrowControllerApplicationExpression], scope_id: int) -> Iterator[CrowPlanningState]: if isinstance(stmt, CrowAchieveExpression): if left is None: yield CrowPlanningState(None, state.scopes, state.latest_scope, [ScopedCrowExpression(CrowAssertExpression(stmt.goal), scope_id)] + state.right_statements, state.depth + 1) else: yield CrowPlanningState(left, state.scopes, state.latest_scope, [ScopedCrowExpression(CrowAssertExpression(stmt.goal), scope_id)] + state.right_statements, state.depth + 1) all_matching = match_applicable_behaviors(self.executor.domain, self.state, stmt.goal, state.scopes[scope_id]) all_matching = list(all_matching) for behavior_matching in all_matching: # print('Behavior matching:', behavior_matching.behavior.name, behavior_matching.bounded_variables) # if 'hand' in behavior_matching.behavior.name: # import ipdb; ipdb.set_trace() # pass bounded_variables = behavior_matching.bounded_variables for var, value in bounded_variables.items(): if isinstance(value, Variable): bounded_variables[var] = value.clone_with_scope(scope_id) new_scope_id = state.latest_scope + 1 new_scopes = state.scopes.copy() new_scopes[new_scope_id] = bounded_variables.copy() program = behavior_matching.behavior.assign_body_program_scope(new_scope_id) complex_part, simple_part = split_simple_sequential(program.get_flatten_body(), new_scope_id) if left is None: if len(complex_part) == 0: new_program = None else: new_program = CrowBehaviorOrderingSuite(CrowBehaviorStatementOrdering.SEQUENTIAL, complex_part, variable_scope_identifier=new_scope_id) else: new_program = CrowBehaviorOrderingSuite(CrowBehaviorStatementOrdering.SEQUENTIAL, (left,) + program.get_flatten_body(), variable_scope_identifier=new_scope_id) yield CrowPlanningState(new_program, new_scopes, new_scope_id, simple_part + [ScopedCrowExpression(behavior_matching.behavior, new_scope_id)] + state.right_statements, state.depth + 1) if self.enable_reordering: promotable, sequential_body = program.split_promotable() complex_seq, simple_seq = split_simple_sequential(sequential_body, new_scope_id) if left is not None and promotable is not None: new_program = CrowBehaviorOrderingSuite(CrowBehaviorStatementOrdering.SEQUENTIAL, ( CrowBehaviorOrderingSuite(CrowBehaviorStatementOrdering.UNORDERED, ( left, CrowBehaviorOrderingSuite(CrowBehaviorStatementOrdering.SEQUENTIAL, promotable, variable_scope_identifier=new_scope_id) ), variable_scope_identifier=new_scope_id), *complex_seq ), variable_scope_identifier=new_scope_id) yield CrowPlanningState(new_program, new_scopes, new_scope_id, simple_seq + [ScopedCrowExpression(behavior_matching.behavior, new_scope_id)] + state.right_statements, state.depth + 1) elif isinstance(stmt, (CrowBindExpression, CrowRuntimeAssignmentExpression, CrowAssertExpression, CrowControllerApplicationExpression)): if left is None: yield CrowPlanningState(None, state.scopes, state.latest_scope, [ScopedCrowExpression(stmt, scope_id)] + state.right_statements, state.depth + 1) else: yield CrowPlanningState(left, state.scopes, state.latest_scope, [ScopedCrowExpression(stmt, scope_id)] + state.right_statements, state.depth + 1) else: raise ValueError(f'Unknown statement type: {stmt}') def _bfs_verify(self, state: CrowPlanningState) -> Optional[CrowPlanningResult]: init_results = [CrowPlanningResult(self.state, ConstraintSatisfactionProblem() if self.enable_csp else None, tuple(), state.scopes)] results = execute_statements(self.executor, init_results, state.right_statements) if len(results) > 0: return results[0] else: return None
[docs] class CrowRegressionPlannerDFSv1(CrowRegressionPlanner):
[docs] def main_entry(self, program: CrowBehaviorOrderingSuite) -> List[Tuple[CrowControllerApplier, ...]]: state = CrowPlanningState(program, scopes={0: dict()}, right_statements=[], latest_scope=0) candidate_plans = self.bfs(state) candidate_plans = [result.controller_actions for result in candidate_plans] return candidate_plans
[docs] @jacinle.log_function(verbose=False) def dfs(self, state: CrowPlanningState) -> Sequence[CrowPlanningResult]: jacinle.log_function.print('Program:', state.program, 'Depth:', state.depth) if state.depth >= self.max_search_depth: raise RuntimeError('Maximum search depth reached.') right_statements_str = ' '.join([f'{str(x)}@{i}' for x, i in state.right_statements]) jacinle.log_function.print(jacinle.colored(right_statements_str, 'yellow'), state.scopes) new_results = list() for left, stmt, scope_id in state.program.pop_right_statement(): new_results.extend(self._dfs_expand(state, left, stmt, scope_id)) # jacinle.log_function.print('New results:', [x.controller_appliers for x in new_results]) return unique_results(new_results)
def _dfs_expand(self, state: CrowPlanningState, left: CrowBehaviorOrderingSuite, stmt: Union[CrowAchieveExpression, CrowControllerApplicationExpression], scope_id: int) -> Sequence[CrowPlanningResult]: """Expand a statement. Args: state: the current search state. left: the left part of the program. stmt: the statement to be expanded. scope_id: the current scope id. """ # jacinle.log_function.print('Expanding:', stmt, 'with left:', left, 'and scope', state.scopes[scope_id]) new_results = list() if isinstance(stmt, CrowAchieveExpression): jacinle.log_function.print('Expanding:', stmt, 'with left:', left, 'and scope_id:', scope_id) jacinle.log_function.print('Null goal expansion', stmt.goal) # Branch 1: the goal is directly satisfied at the after expanding the left part (null production). if left is None: last_results = [CrowPlanningResult(self.state, ConstraintSatisfactionProblem() if self.enable_csp else None, tuple(), state.scopes)] else: last_results = self.dfs(CrowPlanningState(left, state.scopes, state.latest_scope, [ScopedCrowExpression(CrowAssertExpression(stmt.goal), scope_id)] + state.right_statements, state.depth + 1)) for last_result in last_results: rv = self.executor.execute(stmt.goal, state=last_result.state, bounded_variables=canonize_bounded_variables(last_result.scopes, scope_id)) jacinle.log_function.print('Last result:', last_result.controller_actions, 'Null Eval=', bool(rv.item())) if bool(rv.item()): new_results.append(last_result) if len(new_results) > 0: return new_results # Branch 2: the goal is not directly satisfied. We need to refine the goal. all_matching = match_applicable_behaviors(self.executor.domain, self.state, stmt.goal, state.scopes[scope_id]) all_matching = list(all_matching) matchings_str = [(x.behavior.name, x.bounded_variables) for x in all_matching] jacinle.log_function.print(jacinle.tabulate(matchings_str, headers=['Behavior', 'Bounded Variables'])) for behavior_matching in all_matching: bounded_variables = behavior_matching.bounded_variables for var, value in bounded_variables.items(): if isinstance(value, Variable): bounded_variables[var] = value.clone_with_scope(scope_id) # Create a new scope for this subgoal refinement. new_scope_id = state.latest_scope + 1 new_scopes = state.scopes.copy() new_scopes[new_scope_id] = bounded_variables.copy() program = behavior_matching.behavior.assign_body_program_scope(new_scope_id) # Branch 2.1: the goal will be refined by ignoring the promotable part. # Create a new program by sequencing the left part and the refinement of this behavior. if left is None: new_program = CrowBehaviorOrderingSuite(CrowBehaviorStatementOrdering.SEQUENTIAL, program.get_flatten_body(), variable_scope_identifier=new_scope_id) else: new_program = CrowBehaviorOrderingSuite(CrowBehaviorStatementOrdering.SEQUENTIAL, (left,) + program.get_flatten_body(), variable_scope_identifier=new_scope_id) # Now recursively calls the DFS to expand the new program. # import ipdb; ipdb.set_trace() this_new_results = self.dfs(CrowPlanningState(new_program, new_scopes, new_scope_id, [ScopedCrowExpression(behavior_matching.behavior, new_scope_id)] + state.right_statements, state.depth + 1)) if len(this_new_results) > 0: new_results.extend(execute_behavior_effect_batch(self.executor, this_new_results, behavior_matching.behavior, new_scope_id)) continue # Branch 2.2: If the sequential expansion fails, we try to expand the unordered part. if self.enable_reordering: promotable, sequential_body = program.split_promotable() if left is not None and promotable is not None: new_program = CrowBehaviorOrderingSuite( CrowBehaviorStatementOrdering.SEQUENTIAL, (CrowBehaviorOrderingSuite(CrowBehaviorStatementOrdering.UNORDERED, (left,) + promotable, variable_scope_identifier=new_scope_id), sequential_body), variable_scope_identifier=new_scope_id ) this_new_results = self.dfs(CrowPlanningState(new_program, new_scopes, new_scope_id, [ScopedCrowExpression(behavior_matching.behavior, new_scope_id)] + state.right_statements, state.depth + 1)) if len(this_new_results) > 0: new_results.extend(execute_behavior_effect_batch(self.executor, this_new_results, behavior_matching.behavior, new_scope_id)) return new_results elif isinstance(stmt, CrowBehaviorApplicationExpression): pass elif isinstance(stmt, (CrowBindExpression, CrowRuntimeAssignmentExpression, CrowAssertExpression, CrowControllerApplicationExpression)): # These statements are "primitive" or "atomic". Therefore, all we need to do is to expand the left branch and then apply the primitive. if left is None: last_results = [CrowPlanningResult(self.state, ConstraintSatisfactionProblem() if self.enable_csp else None, tuple(), state.scopes)] else: last_results = self.dfs(CrowPlanningState(left, state.scopes, state.latest_scope, [ScopedCrowExpression(stmt, scope_id)] + state.right_statements, state.depth + 1)) for last_result in last_results: new_results.extend(self._dfs_expand_primitive(last_result, stmt, scope_id)) return new_results else: raise ValueError(f'Unknown statement type: {stmt}') def _dfs_expand_primitive(self, last_result: CrowPlanningResult, stmt: Union[CrowBindExpression, CrowRuntimeAssignmentExpression, CrowAssertExpression, CrowControllerApplicationExpression], scope_id: int) -> Sequence[CrowPlanningResult]: """Apply a primitive statement on top of a particular planning result of the left branch.""" if isinstance(stmt, CrowControllerApplicationExpression): argument_values = [self.executor.execute(x, state=last_result.state, bounded_variables=canonize_bounded_variables(last_result.scopes, scope_id)) for x in stmt.arguments] for i, argv in enumerate(argument_values): if isinstance(argv, StateObjectReference): argument_values[i] = argv.name return [CrowPlanningResult(last_result.state, last_result.csp, last_result.controller_actions + (CrowControllerApplier(stmt.controller, argument_values),), last_result.scopes)] elif isinstance(stmt, CrowBindExpression): if stmt.is_object_bind: new_results = list() for new_scope in execute_object_bind(self.executor, stmt, last_result.state, canonize_bounded_variables(last_result.scopes, scope_id)): new_scopes = last_result.scopes.copy() new_scopes[scope_id] = new_scope new_results.append(CrowPlanningResult(last_result.state, last_result.csp, last_result.controller_actions, new_scopes)) jacinle.log_function.print(f'Object binding results for {stmt} under scope {canonize_bounded_variables(last_result.scopes, scope_id)}:', len(new_results), 'states.') return new_results else: raise NotImplementedError() elif isinstance(stmt, CrowRuntimeAssignmentExpression): raise NotImplementedError() elif isinstance(stmt, CrowAssertExpression): # TODO(Jiayuan Mao @ 2024/03/19): implement the CSP tracking. rv = self.executor.execute(stmt.bool_expr, state=last_result.state, bounded_variables=canonize_bounded_variables(last_result.scopes, scope_id)) jacinle.log_function.print(f'Assert {stmt.bool_expr} under scope {canonize_bounded_variables(last_result.scopes, scope_id)}:', bool(rv.item())) if bool(rv.item()): return [last_result] else: return [] else: raise ValueError(f'Unknown statement type: {stmt}')
[docs] def execute_statements(executor: CrowExecutor, init_results: Sequence[CrowPlanningResult], statements: Sequence[ScopedCrowExpression]) -> List[CrowPlanningResult]: # statement_str = ' '.join([f'{str(x)}@{i}' for x, i in state.right_statements]) # print(jacinle.colored(statement_str, 'yellow'), state.scopes) results = init_results for statement in statements: stmt, scope_id = statement.statement, statement.scope_id new_results = list() try: # Invalid ordering of find statement. bounded_variables = canonize_bounded_variables(results[0].scopes, scope_id) except KeyError: return list() if isinstance(stmt, CrowAssertExpression): for result in results: rv = executor.execute(stmt.bool_expr, state=result.state, bounded_variables=canonize_bounded_variables(result.scopes, scope_id)) if bool(rv.item()): new_results.append(result) elif isinstance(stmt, CrowControllerApplicationExpression): for result in results: argument_values = [executor.execute(x, state=result.state, bounded_variables=canonize_bounded_variables(result.scopes, scope_id)) for x in stmt.arguments] for i, argv in enumerate(argument_values): if isinstance(argv, StateObjectReference): argument_values[i] = argv.name new_results.append(CrowPlanningResult(result.state, result.csp, result.controller_actions + (CrowControllerApplier(stmt.controller, argument_values),), result.scopes)) elif isinstance(stmt, CrowBindExpression): for result in results: for new_scope in execute_object_bind(executor, stmt, result.state, canonize_bounded_variables(result.scopes, scope_id)): # print('!!!Object binding result:', new_scope) new_scopes = result.scopes.copy() new_scopes[scope_id] = new_scope new_results.append(CrowPlanningResult(result.state, result.csp, result.controller_actions, new_scopes)) elif isinstance(stmt, CrowBehavior): new_results = [execute_behavior_effect(executor, stmt, result.state, canonize_bounded_variables(result.scopes, scope_id)) for result in results] else: raise ValueError(f'Unknown statement type: {stmt}') results = new_results if len(results) == 0: break return results