       £K"	ÒöK±ØAbrain.Event:2»íÄ
ö      Œf‰	(L±ØA*ê	
ç	
Hyperparameters/text_summaryB¼	B±		trainer_type:	ppo
	hyperparameters:	
	  batch_size:	128
	  buffer_size:	2048
	  learning_rate:	0.0003
	  beta:	0.01
	  epsilon:	0.2
	  lambd:	0.95
	  num_epoch:	3
	  learning_rate_schedule:	linear
	  beta_schedule:	linear
	  epsilon_schedule:	linear
	network_settings:	
	  normalize:	False
	  hidden_units:	512
	  num_layers:	2
	  vis_encode_type:	simple
	  memory:	None
	  goal_conditioning_type:	hyper
	  deterministic:	False
	reward_signals:	
	  extrinsic:	
	    gamma:	0.99
	    strength:	1.0
	    network_settings:	
	      normalize:	False
	      hidden_units:	128
	      num_layers:	2
	      vis_encode_type:	simple
	      memory:	None
	      goal_conditioning_type:	hyper
	      deterministic:	False
	  rnd:	
	    gamma:	0.99
	    strength:	0.01
	    network_settings:	
	      normalize:	False
	      hidden_units:	64
	      num_layers:	3
	      vis_encode_type:	simple
	      memory:	None
	      goal_conditioning_type:	hyper
	      deterministic:	False
	    learning_rate:	0.0001
	    encoding_size:	None
	init_path:	None
	keep_checkpoints:	5
	checkpoint_interval:	500000
	max_steps:	3000000
	time_horizon:	128
	summary_freq:	30000
	threaded:	False
	self_play:	None
	behavioral_cloning:	NoneJ

text¹ÒÄb