12:["$","div",null,{"className":"Post-module__aBOVGG__post","style":{"display":"flex","flexDirection":"column","alignItems":"center","gap":"8px","flex":"1","width":"100%","padding":"12px"},"children":[["$","div",null,{"className":"$undefined","style":{"display":"flex","gap":"0.4rem","flexWrap":"wrap","width":"100%"},"children":[false,[["$","a","2CC4",{"href":"/2CC4","className":"Post-module__aBOVGG__fg","style":{},"children":"強化学習"}],["$","a","A52F-1D88",{"href":"/A52F-1D88","className":"Post-module__aBOVGG__fg","style":{},"children":"Policy Gradient"}]]]}],["$","article",null,{"className":"article","children":[["$","div",null,{"className":"$undefined","style":{"display":"flex","justifyContent":"space-between","flexWrap":"wrap","width":"100%"},"children":[["$","h2",null,{"style":{"margin":"0.2rem"},"children":["$","a",null,{"href":"/A52F-9A21","children":"『強化学習アルゴリズム整理 - joeの日記』"}]}],["$","div",null,{"className":"$undefined","style":{"display":"flex","justifyContent":"end","alignItems":"center","flex":"1","textAlign":"right","whiteSpace":"nowrap"},"children":["$","div",null,{"children":"2024/11/1 3:56:00"}]}]]}],["$","div",null,{"className":"article_body","dangerouslySetInnerHTML":{"__html":"

https://xuzijian629.hatenablog.com/entry/2020/01/03/212451\n

"}}]]}],["$","div",null,{"className":"$undefined","style":{"display":"flex","gap":"0.4rem","flexWrap":"wrap","width":"100%"},"children":[["$","a","",{"href":"/","className":"Post-module__aBOVGG__bg","style":{"opacity":0},"children":"あれ"}],[]]}]]}]