Event JSON
{
"id": "6a8f08b36693c621a793338bdec8ceda0133408488ac53de6eb79322c855c96e",
"pubkey": "95ea081a627cee44e532825986ecc662139d068c4bdacbe820a8f445b9c6c06b",
"created_at": 1720260432,
"kind": 1,
"tags": [
[
"e",
"40bfb7693311ed52907a54e8d67ee374b7fcc01b8506eabf0743e2587e1fc2a6",
"",
"reply"
],
[
"p",
"95ea081a627cee44e532825986ecc662139d068c4bdacbe820a8f445b9c6c06b"
],
[
"proxy",
"https://recsys.social/@brohrer/112738987710960351",
"web"
],
[
"e",
"800ba7c73cf73dcf9bf7ebdf59e84f0664cbb253f261e0e0108fd128be4e3937",
"",
"root"
],
[
"proxy",
"https://recsys.social/users/brohrer/statuses/112738987710960351",
"activitypub"
],
[
"L",
"pink.momostr"
],
[
"l",
"pink.momostr.activitypub:https://recsys.social/users/brohrer/statuses/112738987710960351",
"pink.momostr"
],
[
"expiration",
"1722852435"
]
],
"content": "Each time step it gets a reward based on the height of the pendulum is— ranging from zero if it’s at the bottom to two if it’s at the top. \n\nBy the time it reaches a thousand episodes, it’s performing near optimally, with an average reward of 1.96, which includes spinning up from the bottom.\n\nThat represents 1 million times steps of learning at four times steps per second-about three days at 1X speed.",
"sig": "2747cd10ee55ac7905b9a390ee140e16bdc7018ada81206f0ecfa02e8fbe79e4ad588f3cae3e95babc63698117f4461254f4b328ed239d5d252d58876376cb1c"
}