Fix: handle _action_masks buffer in single-task scenarios (#67)
This commit is contained in:
@@ -212,6 +212,7 @@ def api_model_conversion(target_state_dict, source_state_dict):
|
||||
# copy log_std_min and log_std_dif (plus _action_masks, when present) from target_state_dict to new_state_dict
|
||||
new_state_dict['log_std_min'] = target_state_dict['log_std_min']
|
||||
new_state_dict['log_std_dif'] = target_state_dict['log_std_dif']
|
||||
if '_action_masks' in target_state_dict:
|
||||
new_state_dict['_action_masks'] = target_state_dict['_action_masks']
|
||||
|
||||
# copy new_state_dict to source_state_dict
|
||||
|
||||
Reference in New Issue
Block a user