Matches in SemOpenAlex for { <https://semopenalex.org/work/W3112804989> ?p ?o ?g. }
- W3112804989 endingPage "229100" @default.
- W3112804989 startingPage "229086" @default.
- W3112804989 abstract "We investigate the important problem of certifying stability of reinforcement learning policies when interconnected with nonlinear dynamical systems. We show that by regulating the partial gradients of policies, strong guarantees of robust stability can be obtained based on a proposed semidefinite programming feasibility problem. The method is able to certify a large set of stabilizing controllers by exploiting problem-specific structures; furthermore, we analyze and establish its (non)conservatism. Empirical evaluations on two decentralized control tasks, namely multi-flight formation and power system frequency regulation, demonstrate that the reinforcement learning agents can have high performance within the stability-certified parameter space and also exhibit stable learning behaviors in the long run." @default.
- W3112804989 created "2020-12-21" @default.
- W3112804989 creator A5012672471 @default.
- W3112804989 creator A5042580848 @default.
- W3112804989 date "2020-01-01" @default.
- W3112804989 modified "2023-10-16" @default.
- W3112804989 title "Stability-Certified Reinforcement Learning: A Control-Theoretic Perspective" @default.
- W3112804989 cites W1551360398 @default.
- W3112804989 cites W1568689741 @default.
- W3112804989 cites W2003658506 @default.
- W3112804989 cites W2052970196 @default.
- W3112804989 cites W2053572490 @default.
- W3112804989 cites W2063493327 @default.
- W3112804989 cites W2076199517 @default.
- W3112804989 cites W2079121704 @default.
- W3112804989 cites W2082847490 @default.
- W3112804989 cites W2097944741 @default.
- W3112804989 cites W2112594540 @default.
- W3112804989 cites W2119717200 @default.
- W3112804989 cites W2145339207 @default.
- W3112804989 cites W2160545578 @default.
- W3112804989 cites W2570533838 @default.
- W3112804989 cites W2572949971 @default.
- W3112804989 cites W2573774505 @default.
- W3112804989 cites W2809808592 @default.
- W3112804989 cites W2914316834 @default.
- W3112804989 cites W2963525569 @default.
- W3112804989 cites W2964102336 @default.
- W3112804989 cites W3210839039 @default.
- W3112804989 cites W32403112 @default.
- W3112804989 cites W4211232706 @default.
- W3112804989 cites W4253985045 @default.
- W3112804989 doi "https://doi.org/10.1109/access.2020.3045114" @default.
- W3112804989 hasPublicationYear "2020" @default.
- W3112804989 type Work @default.
- W3112804989 sameAs 3112804989 @default.
- W3112804989 citedByCount "28" @default.
- W3112804989 countsByYear W31128049892021 @default.
- W3112804989 countsByYear W31128049892022 @default.
- W3112804989 countsByYear W31128049892023 @default.
- W3112804989 crossrefType "journal-article" @default.
- W3112804989 hasAuthorship W3112804989A5012672471 @default.
- W3112804989 hasAuthorship W3112804989A5042580848 @default.
- W3112804989 hasBestOaLocation W31128049891 @default.
- W3112804989 hasConcept C101901036 @default.
- W3112804989 hasConcept C112972136 @default.
- W3112804989 hasConcept C119857082 @default.
- W3112804989 hasConcept C121332964 @default.
- W3112804989 hasConcept C126255220 @default.
- W3112804989 hasConcept C12713177 @default.
- W3112804989 hasConcept C154945302 @default.
- W3112804989 hasConcept C158622935 @default.
- W3112804989 hasConcept C177264268 @default.
- W3112804989 hasConcept C199360897 @default.
- W3112804989 hasConcept C2775924081 @default.
- W3112804989 hasConcept C33923547 @default.
- W3112804989 hasConcept C41008148 @default.
- W3112804989 hasConcept C47446073 @default.
- W3112804989 hasConcept C62520636 @default.
- W3112804989 hasConcept C97541855 @default.
- W3112804989 hasConceptScore W3112804989C101901036 @default.
- W3112804989 hasConceptScore W3112804989C112972136 @default.
- W3112804989 hasConceptScore W3112804989C119857082 @default.
- W3112804989 hasConceptScore W3112804989C121332964 @default.
- W3112804989 hasConceptScore W3112804989C126255220 @default.
- W3112804989 hasConceptScore W3112804989C12713177 @default.
- W3112804989 hasConceptScore W3112804989C154945302 @default.
- W3112804989 hasConceptScore W3112804989C158622935 @default.
- W3112804989 hasConceptScore W3112804989C177264268 @default.
- W3112804989 hasConceptScore W3112804989C199360897 @default.
- W3112804989 hasConceptScore W3112804989C2775924081 @default.
- W3112804989 hasConceptScore W3112804989C33923547 @default.
- W3112804989 hasConceptScore W3112804989C41008148 @default.
- W3112804989 hasConceptScore W3112804989C47446073 @default.
- W3112804989 hasConceptScore W3112804989C62520636 @default.
- W3112804989 hasConceptScore W3112804989C97541855 @default.
- W3112804989 hasFunder F4320306076 @default.
- W3112804989 hasFunder F4320337345 @default.
- W3112804989 hasFunder F4320338279 @default.
- W3112804989 hasFunder F4320338281 @default.
- W3112804989 hasLocation W31128049891 @default.
- W3112804989 hasLocation W31128049892 @default.
- W3112804989 hasOpenAccess W3112804989 @default.
- W3112804989 hasPrimaryLocation W31128049891 @default.
- W3112804989 hasRelatedWork W2115030441 @default.
- W3112804989 hasRelatedWork W260766989 @default.
- W3112804989 hasRelatedWork W2898291697 @default.
- W3112804989 hasRelatedWork W2959276766 @default.
- W3112804989 hasRelatedWork W3111983280 @default.
- W3112804989 hasRelatedWork W3112804989 @default.
- W3112804989 hasRelatedWork W3139193008 @default.
- W3112804989 hasRelatedWork W3164468573 @default.
- W3112804989 hasRelatedWork W4206669594 @default.
- W3112804989 hasRelatedWork W4295941380 @default.
- W3112804989 hasVolume "8" @default.
- W3112804989 isParatext "false" @default.
- W3112804989 isRetracted "false" @default.
- W3112804989 magId "3112804989" @default.