def return_range(dataset, max_episode_steps):
    """Return the minimum and maximum episode return found in ``dataset``.

    The flat sequence of transitions is split into episodes: an episode
    ends at a step whose ``terminals`` entry is truthy, or once it has
    reached ``max_episode_steps`` steps, whichever comes first. Rewards are
    summed per episode (each converted with ``float``).

    Args:
        dataset: Mapping with at least the keys ``'rewards'`` and
            ``'terminals'``; both are iterated in lockstep and
            ``len(dataset['rewards'])`` must be supported.
        max_episode_steps: Step count at which an episode is cut off even
            when no terminal flag was seen.

    Returns:
        A ``(min_return, max_return)`` tuple of floats computed over the
        completed episodes only.

    Raises:
        AssertionError: If the number of steps iterated differs from
            ``len(dataset['rewards'])`` (e.g. ``'terminals'`` is shorter
            than ``'rewards'``).
        ValueError: If the dataset contains no completed episode.
    """
    episode_returns = []
    steps_counted = 0
    ep_ret, ep_len = 0.0, 0
    for reward, terminal in zip(dataset['rewards'], dataset['terminals']):
        ep_ret += float(reward)
        ep_len += 1
        if terminal or ep_len == max_episode_steps:
            episode_returns.append(ep_ret)
            steps_counted += ep_len
            ep_ret, ep_len = 0.0, 0

    # A trailing, incomplete trajectory is deliberately left out of the
    # returns, but its steps still count toward the total checked below.
    steps_counted += ep_len
    assert steps_counted == len(dataset['rewards']), (
        "processed %d steps but dataset['rewards'] has %d entries"
        % (steps_counted, len(dataset['rewards']))
    )

    if not episode_returns:
        # min()/max() would fail on an empty list with an opaque message;
        # raise the same exception type with an explanation instead.
        raise ValueError(
            "dataset contains no completed episode: no terminal flag was set "
            "and fewer than max_episode_steps steps were provided"
        )
    return min(episode_returns), max(episode_returns)