Spaces:

ar08
/

zzz

Running

zzz / evaluation /benchmarks /miniwob /get_avg_reward.py

Upload 1040 files

246d201 verified 6 months ago

1.08 kB

	import argparse
	import json

	import browsergym.miniwob # noqa F401 register miniwob tasks as gym environments
	import gymnasium as gym

	parser = argparse.ArgumentParser(description='Calculate average reward.')
	parser.add_argument('output_path', type=str, help='path to output.jsonl')

	args = parser.parse_args()

	if __name__ == '__main__':
	env_ids = [
	id for id in gym.envs.registry.keys() if id.startswith('browsergym/miniwob')
	]
	total_num = len(env_ids)
	print('Total number of tasks: ', total_num)
	total_reward = 0
	total_cost = 0
	actual_num = 0
	with open(args.output_path, 'r') as f:
	for line in f:
	data = json.loads(line)
	actual_num += 1
	total_cost += data['metrics']['accumulated_cost']
	total_reward += data['test_result']['reward']

	avg_reward = total_reward / total_num
	print('Avg Reward: ', avg_reward)

	avg_cost = total_cost / actual_num
	print('Avg Cost: ', avg_cost)
	print('Actual number of tasks finished: ', actual_num)