Matches in SemOpenAlex for { <https://semopenalex.org/work/W2890391327> ?p ?o ?g. }
- W2890391327 abstract "Reinforcement learning is a way for an artificial intelligence system to learn by trial and error. This paper presents a deterministic limit of such a learning method, in an environment that changes in time. The method is applied to three well-known learning algorithms." @default.
- W2890391327 created "2018-09-27" @default.
- W2890391327 creator A5047941384 @default.
- W2890391327 creator A5079184903 @default.
- W2890391327 creator A5085207296 @default.
- W2890391327 date "2019-04-10" @default.
- W2890391327 modified "2023-10-18" @default.
- W2890391327 title "Deterministic limit of temporal difference reinforcement learning for stochastic games" @default.
- W2890391327 cites W1192553058 @default.
- W2890391327 cites W1540547620 @default.
- W2890391327 cites W192920577 @default.
- W2890391327 cites W1995622844 @default.
- W2890391327 cites W2026069625 @default.
- W2890391327 cites W2031098375 @default.
- W2890391327 cites W2036651296 @default.
- W2890391327 cites W2039656410 @default.
- W2890391327 cites W2045817941 @default.
- W2890391327 cites W2046579047 @default.
- W2890391327 cites W2051432898 @default.
- W2890391327 cites W2057171149 @default.
- W2890391327 cites W2063129619 @default.
- W2890391327 cites W2076337359 @default.
- W2890391327 cites W2083535091 @default.
- W2890391327 cites W2096348520 @default.
- W2890391327 cites W2099618002 @default.
- W2890391327 cites W2101786389 @default.
- W2890391327 cites W2114499604 @default.
- W2890391327 cites W2128797809 @default.
- W2890391327 cites W2132979098 @default.
- W2890391327 cites W2140643197 @default.
- W2890391327 cites W2145339207 @default.
- W2890391327 cites W2158274534 @default.
- W2890391327 cites W2163569945 @default.
- W2890391327 cites W2238069175 @default.
- W2890391327 cites W2254971679 @default.
- W2890391327 cites W2263834964 @default.
- W2890391327 cites W2277784065 @default.
- W2890391327 cites W2399928304 @default.
- W2890391327 cites W2738724892 @default.
- W2890391327 cites W2741809339 @default.
- W2890391327 cites W2746179850 @default.
- W2890391327 cites W2808252900 @default.
- W2890391327 cites W2811498230 @default.
- W2890391327 cites W3101913361 @default.
- W2890391327 cites W3102551942 @default.
- W2890391327 cites W3102839078 @default.
- W2890391327 cites W3103304776 @default.
- W2890391327 cites W4232215708 @default.
- W2890391327 cites W4239900517 @default.
- W2890391327 cites W4252488326 @default.
- W2890391327 cites W4254547512 @default.
- W2890391327 doi "https://doi.org/10.1103/physreve.99.043305" @default.
- W2890391327 hasPubMedId "https://pubmed.ncbi.nlm.nih.gov/31108579" @default.
- W2890391327 hasPublicationYear "2019" @default.
- W2890391327 type Work @default.
- W2890391327 sameAs 2890391327 @default.
- W2890391327 citedByCount "29" @default.
- W2890391327 countsByYear W28903913272018 @default.
- W2890391327 countsByYear W28903913272019 @default.
- W2890391327 countsByYear W28903913272020 @default.
- W2890391327 countsByYear W28903913272021 @default.
- W2890391327 countsByYear W28903913272022 @default.
- W2890391327 countsByYear W28903913272023 @default.
- W2890391327 crossrefType "journal-article" @default.
- W2890391327 hasAuthorship W2890391327A5047941384 @default.
- W2890391327 hasAuthorship W2890391327A5079184903 @default.
- W2890391327 hasAuthorship W2890391327A5085207296 @default.
- W2890391327 hasBestOaLocation W28903913272 @default.
- W2890391327 hasConcept C126255220 @default.
- W2890391327 hasConcept C134306372 @default.
- W2890391327 hasConcept C151201525 @default.
- W2890391327 hasConcept C154945302 @default.
- W2890391327 hasConcept C15744967 @default.
- W2890391327 hasConcept C196340769 @default.
- W2890391327 hasConcept C199190896 @default.
- W2890391327 hasConcept C33923547 @default.
- W2890391327 hasConcept C41008148 @default.
- W2890391327 hasConcept C67203356 @default.
- W2890391327 hasConcept C77805123 @default.
- W2890391327 hasConcept C97541855 @default.
- W2890391327 hasConceptScore W2890391327C126255220 @default.
- W2890391327 hasConceptScore W2890391327C134306372 @default.
- W2890391327 hasConceptScore W2890391327C151201525 @default.
- W2890391327 hasConceptScore W2890391327C154945302 @default.
- W2890391327 hasConceptScore W2890391327C15744967 @default.
- W2890391327 hasConceptScore W2890391327C196340769 @default.
- W2890391327 hasConceptScore W2890391327C199190896 @default.
- W2890391327 hasConceptScore W2890391327C33923547 @default.
- W2890391327 hasConceptScore W2890391327C41008148 @default.
- W2890391327 hasConceptScore W2890391327C67203356 @default.
- W2890391327 hasConceptScore W2890391327C77805123 @default.
- W2890391327 hasConceptScore W2890391327C97541855 @default.
- W2890391327 hasFunder F4320311215 @default.
- W2890391327 hasFunder F4320327430 @default.
- W2890391327 hasFunder F4320334763 @default.
- W2890391327 hasIssue "4" @default.
- W2890391327 hasLocation W28903913271 @default.
- W2890391327 hasLocation W28903913272 @default.
- W2890391327 hasLocation W28903913273 @default.
- W2890391327 hasLocation W28903913274 @default.