{"id":440,"date":"2022-05-03T21:31:00","date_gmt":"2022-05-03T12:31:00","guid":{"rendered":"https:\/\/singularity2045.jp\/?p=440"},"modified":"2022-05-03T21:34:07","modified_gmt":"2022-05-03T12:34:07","slug":"%e3%83%a1%e3%83%a2%ef%bc%9astable-baseline3-ppo-%e5%87%ba%e5%8a%9b","status":"publish","type":"post","link":"https:\/\/singularity2045.jp\/wordpress\/?p=440","title":{"rendered":"\u30e1\u30e2\uff1aStable Baseline3 PPO \u51fa\u529b\u5185\u5bb9"},"content":{"rendered":"\n<figure class=\"wp-block-table is-style-stripes\"><table><tbody><tr><td>\u51fa\u529b\u9805\u76ee<\/td><td>\u6570\u5024\u4f8b<\/td><td>\u5185\u5bb9<\/td><\/tr><tr><td>approxkl <\/td><td>0.00013371343<\/td><td>\u65b0\u3057\u3044\u65b9\u7b56\u304b\u3089\u53e4\u3044\u65b9\u7b56\u3078\u306eKullback-Leibler divergence<\/td><\/tr><tr><td>clipfrac<\/td><td>0.0<\/td><td>\u30af\u30ea\u30c3\u30d7\u7bc4\u56f2\u30cf\u30a4\u30d1\u30fc\u30d1\u30e9\u30e1\u30fc\u30bf\u304c\u4f7f\u7528\u3055\u308c\u308b\u56de\u6570\u306e\u5272\u5408<\/td><\/tr><tr><td>explained_variance<\/td><td>-0.0241<\/td><td>\u8aa4\u5dee\u306e\u5206\u6563<\/td><\/tr><tr><td>fps<\/td><td>405<\/td><td>\uff11\u79d2\u3042\u305f\u308a\u306e\u30d5\u30ec\u30fc\u30e0\u6570<\/td><\/tr><tr><td>n_updates<\/td><td>1<\/td><td>\u66f4\u65b0\u56de\u6570<\/td><\/tr><tr><td>policy_entropy<\/td><td>1.3861077<\/td><td>\u65b9\u7b56\u306e\u30a8\u30f3\u30c8\u30ed\u30d4\u30fc<\/td><\/tr><tr><td>policy_loss<\/td><td>-0.00052567874<\/td><td>\u65b9\u7b56\u306e\u640d\u5931<\/td><\/tr><tr><td>serial_timesteps<\/td><td>128 
<\/td><td>\uff11\u3064\u306e\u74b0\u5883\u3067\u306e\u30bf\u30a4\u30e0\u30b9\u30c6\u30c3\u30d7\u6570<\/td><\/tr><tr><td>time_elapsed<\/td><td>0<\/td><td>\u7d4c\u904e\u6642\u9593<\/td><\/tr><tr><td>total_timesteps<\/td><td>128<\/td><td>\u5168\u74b0\u5883\u3067\u306e\u30bf\u30a4\u30e0\u30b9\u30c6\u30c3\u30d7\u6570<\/td><\/tr><tr><td>value_loss<\/td><td>111.95057<\/td><td>\u4fa1\u5024\u95a2\u6570\u66f4\u65b0\u6642\u306e\u5e73\u5747\u640d\u5931<\/td><\/tr><\/tbody><\/table><\/figure>\n","protected":false},"excerpt":{"rendered":"<p>\u51fa\u529b\u9805\u76ee \u6570\u5024\u4f8b \u5185\u5bb9 approxkl 0.00013371343 \u65b0\u3057\u3044\u65b9\u7b56\u304b\u3089\u53e4\u3044\u65b9\u7b56\u3078\u306eKullback-Leibler divergence clipfrac 0.0 \u30af\u30ea\u30c3\u30d7\u7bc4\u56f2\u30cf\u30a4\u30d1\u30fc\u30d1\u30e9\u30e1\u30fc\u30bf\u304c\u4f7f\u7528\u3055\u308c\u308b &hellip; <a href=\"https:\/\/singularity2045.jp\/wordpress\/?p=440\" class=\"more-link\"><span class=\"screen-reader-text\">&#8220;\u30e1\u30e2\uff1aStable Baseline3 PPO \u51fa\u529b\u5185\u5bb9&#8221; 
\u306e<\/span>\u7d9a\u304d\u3092\u8aad\u3080<\/a><\/p>\n","protected":false},"author":1,"featured_media":0,"comment_status":"open","ping_status":"closed","sticky":false,"template":"","format":"standard","meta":{"advanced_seo_description":"","jetpack_seo_html_title":"","jetpack_seo_noindex":false,"jetpack_post_was_ever_published":false,"_jetpack_newsletter_access":"","_jetpack_dont_email_post_to_subs":false,"_jetpack_newsletter_tier_id":0,"_jetpack_memberships_contains_paywalled_content":false,"_jetpack_memberships_contains_paid_content":false,"footnotes":"","jetpack_publicize_message":"","jetpack_publicize_feature_enabled":true,"jetpack_social_post_already_shared":false,"jetpack_social_options":{"image_generator_settings":{"template":"highway","enabled":false},"version":2}},"categories":[1],"tags":[],"class_list":["post-440","post","type-post","status-publish","format-standard","hentry","category-1"],"jetpack_publicize_connections":[],"jetpack_featured_media_url":"","jetpack_sharing_enabled":true,"jetpack_shortlink":"https:\/\/wp.me\/pf3Jhj-76","jetpack-related-posts":[],"jetpack_likes_enabled":true,"_links":{"self":[{"href":"https:\/\/singularity2045.jp\/wordpress\/index.php?rest_route=\/wp\/v2\/posts\/440"}],"collection":[{"href":"https:\/\/singularity2045.jp\/wordpress\/index.php?rest_route=\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/singularity2045.jp\/wordpress\/index.php?rest_route=\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/singularity2045.jp\/wordpress\/index.php?rest_route=\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/singularity2045.jp\/wordpress\/index.php?rest_route=%2Fwp%2Fv2%2Fcomments&post=440"}],"version-history":[{"count":3,"href":"https:\/\/singularity2045.jp\/wordpress\/index.php?rest_route=\/wp\/v2\/posts\/440\/revisions"}],"predecessor-version":[{"id":445,"href":"https:\/\/singularity2045.jp\/wordpress\/index.php?rest_route=\/wp\/v2\/posts\/440\/revisions\/445"}],"wp:attachment":[{"href":"ht
tps:\/\/singularity2045.jp\/wordpress\/index.php?rest_route=%2Fwp%2Fv2%2Fmedia&parent=440"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/singularity2045.jp\/wordpress\/index.php?rest_route=%2Fwp%2Fv2%2Fcategories&post=440"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/singularity2045.jp\/wordpress\/index.php?rest_route=%2Fwp%2Fv2%2Ftags&post=440"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}