Spaces:
Runtime error
Runtime error
Add the Reacher env; all MuJoCo envs now support the COT, SPP, SELF-REFLEXION, and EXE methods under the L1 and L3 settings.
8f842da
import numpy as np | |
import random | |
_PSEUDO_RANDOM_DESCRIPTION = "Select action randomly"


def pseudo_random_policy(state, pre_action):
    """Return a random two-component action.

    Args:
        state: Accepted for interface compatibility; not read here.
        pre_action: Accepted for interface compatibility; not read here.

    Returns:
        A list of two floats, each computed as ``2 * random.random() - 1``
        and therefore lying in ``[-1.0, 1.0)``.
    """
    # Refreshed on every call, exactly as the original implementation did,
    # so callers that relied on the per-call assignment see no change.
    pseudo_random_policy.description = _PSEUDO_RANDOM_DESCRIPTION
    return [2 * random.random() - 1 for _ in range(2)]


# Attach the description at definition time as well, so it can be read
# before the policy has ever been called (previously an AttributeError).
pseudo_random_policy.description = _PSEUDO_RANDOM_DESCRIPTION
_REAL_RANDOM_DESCRIPTION = "Select action with a random policy"


def real_random_policy(state, pre_action=1):
    """Return a random two-component action.

    Args:
        state: Accepted for interface compatibility; not read here.
        pre_action: Accepted for interface compatibility; not read here.
            Defaults to ``1``.

    Returns:
        A list of two floats, each computed as ``2 * random.random() - 1``
        and therefore lying in ``[-1.0, 1.0)``.
    """
    # Refreshed on every call, exactly as the original implementation did,
    # so callers that relied on the per-call assignment see no change.
    real_random_policy.description = _REAL_RANDOM_DESCRIPTION
    return [2 * random.random() - 1 for _ in range(2)]


# Attach the description at definition time as well, so it can be read
# before the policy has ever been called (previously an AttributeError).
real_random_policy.description = _REAL_RANDOM_DESCRIPTION