SimuRLacra/rcspysim/RcsSimEnv_8h_source.html

 /*******************************************************************************
  Copyright (c) 2020, Fabio Muratore, Honda Research Institute Europe GmbH, and
  Technical University of Darmstadt.
  All rights reserved.

  Redistribution and use in source and binary forms, with or without
  modification, are permitted provided that the following conditions are met:
  1. Redistributions of source code must retain the above copyright
     notice, this list of conditions and the following disclaimer.
  2. Redistributions in binary form must reproduce the above copyright
     notice, this list of conditions and the following disclaimer in the
     documentation and/or other materials provided with the distribution.
  3. Neither the name of Fabio Muratore, Honda Research Institute Europe GmbH,
     or Technical University of Darmstadt, nor the names of its contributors may
     be used to endorse or promote products derived from this software without
     specific prior written permission.

  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
  ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
  WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
  DISCLAIMED. IN NO EVENT SHALL FABIO MURATORE, HONDA RESEARCH INSTITUTE EUROPE GMBH,
  OR TECHNICAL UNIVERSITY OF DARMSTADT BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
  SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
  PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
  OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER
  IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
  POSSIBILITY OF SUCH DAMAGE.
 *******************************************************************************/

 #ifndef _RCSSIMENV_H_
 #define _RCSSIMENV_H_

 #include "ExperimentConfig.h"
 #include "physics/PhysicsParameterManager.h"

 #include "util/BoxSpace.h"
 #include "util/nocopy.h"

 #include <mutex>
 #include <stdexcept>
 #include <string>

 namespace Rcs
 {

 //! Forward declaration: this header only stores a pointer to it (RcsSimEnv::viewer), so no include is needed here
 class Viewer;

 //! Forward declaration: this header only stores a pointer to it (RcsSimEnv::hud), so no include is needed here
 class HUD;

 /**
  * Exception raised when the joint limits are violated after applying the action.
  *
  * It adds nothing on top of std::runtime_error; every constructor of the base class is inherited,
  * so it can be created from any message accepted by std::runtime_error.
  */
 class JointLimitException : public std::runtime_error
 {
 public:
     // Inherit all base class constructors (their accessibility is that of the base class constructors)
     using std::runtime_error::runtime_error;
 };

 /**
  * Rcs-backed machine learning simulation environment.
  * This class provides a user-driven update loop. It is started by reset(), and then updated by step().
  *
  * Instances can neither be copied nor moved (see RCSPYSIM_NOCOPY_NOMOVE in the class body).
  */
 class RcsSimEnv
 {
 public:
     /**
      * Create the environment from the given property source.
      *
      * @param propertySource configuration
      */
     explicit RcsSimEnv(PropertySource* propertySource);

     virtual ~RcsSimEnv();

     // not copy- or movable
     RCSPYSIM_NOCOPY_NOMOVE(RcsSimEnv)

     /**
      * Reset the internal state in order to start a new rollout.
      *
      * @note Default arguments of virtual functions are selected by the static type of the call expression,
      *       so an override should repeat exactly the same defaults.
      *
      * @param domainParam physics params to use for this rollout, defaults to PropertySource::empty()
      * @param initState initial state for this rollout, defaults to nullptr
      * @return observation of the initial state
      */
     virtual MatNd* reset(PropertySource* domainParam = PropertySource::empty(), const MatNd* initState = nullptr);

     /**
      * Perform one environment step.
      *
      * @note Default arguments of virtual functions are selected by the static type of the call expression,
      *       so an override should repeat exactly the same defaults.
      *
      * @param action action vector
      * @param disturbance disturbance vector, e.g. a 3-dim force, defaults to nullptr
      * @return observation after the step was processed
      * @throws JointLimitException if the joint limits were violated
      */
     virtual MatNd* step(const MatNd* action, const MatNd* disturbance = nullptr);

     /**
      * Render the current state of the simulation.
      *
      * Should be called after each step call.
      * The RcsGraphics renderer runs mostly on its own thread, so that isn't absolutely
      * necessary, but it is required to update the HUD.
      *
      * @param mode only 'human' is supported at the moment, is also the default
      * @param close true to close the render window
      */
     virtual void render(std::string mode = "human", bool close = false);

     /** Start/stop video recording. */
     void toggleVideoRecording();

     /**
      * Observation space of this environment.
      * All valid observation values fit inside this.
      */
     const BoxSpace* observationSpace();

     /**
      * Action space of this environment.
      * All valid action values fit inside this.
      * The actions provided from Python are not projected to this space, i.e. this must be done on the Python side.
      */
     const BoxSpace* actionSpace();

     /**
      * Initial state space of this environment.
      * All valid initial state values fit inside this.
      */
     const BoxSpace* initStateSpace();

     /**
      * Set the transition noise buffer.
      * In order to avoid heavy stochastic computation in every step, the transition noise values are pregenerated.
      * The buffer should have a row count equal to getInternalStateDim(). Every column is a set of noise values
      * applied in one step. In the next step, the next column is used. If the last column is reached, the next step
      * will use the first column again.
      *
      * @param tnb transition noise buffer
      */
     void setTransitionNoiseBuffer(const MatNd* tnb);

     /** Internal state dimension, required for the transition noise buffer. */
     unsigned int getInternalStateDim();

     /**
      * Configuration settings for the experiment.
      *
      * @return the stored configuration pointer; the getter itself does not modify the environment
      */
     ExperimentConfig* getConfig() const
     {
         return config;
     }

     /**
      * Physics parameter management.
      *
      * @return the stored physics manager pointer; the getter itself does not modify the environment
      */
     PhysicsParameterManager* getPhysicsManager() const
     {
         return physicsManager;
     }

     /** Observation from last step */
     MatNd* getCurrentObservation() const
     {
         return currentObservation;
     }

     /** Action from last step */
     MatNd* getCurrentAction() const
     {
         return currentAction;
     }

 private:
     //! Guards for parallel access to graph (can happen from gui)
     std::mutex graphLock;

     //! Experiment configuration
     ExperimentConfig* config;
     bool allJointsPosCtrl;

     //! Physics simulator factory
     PhysicsParameterManager* physicsManager;
     //! Physics simulator
     PhysicsBase* physicsSim;
     //! Disturbance force simulator
     ForceDisturber* disturber;

     //! Initial state setter
     InitStateSetter* initStateSetter;

     //! Temporary matrices
     MatNd* q_ctrl;
     MatNd* qd_ctrl;
     MatNd* T_ctrl;

     //! Counters
     unsigned int currentStep;
     double currentTime;

     //! Transition noise values (every column is one set of noise values for every state variable)
     MatNd* transitionNoiseBuffer;
     unsigned int tnbIndex;
     bool transitionNoiseIncludeVelocity; // false if transition noise is only applied to state

     //! Observation and action at last step
     MatNd* currentObservation;
     MatNd* currentAction;

     //! Visualization
     Viewer* viewer;
     bool usePhysicsNode; // use PhysicsNode (can not be reset) or GraphicsNode for the viewer
     HUD* hud;
 //    int adWidgetHandle;
 };

 } /* namespace Rcs */

 #endif /* _RCSSIMENV_H_ */
Rcs::PhysicsParameterManager
Definition: PhysicsParameterManager.h:52

Rcs::PropertySource
Definition: PropertySource.h:46

nocopy.h

BoxSpace.h

Rcs::RcsSimEnv::usePhysicsNode
bool usePhysicsNode
Definition: RcsSimEnv.h:205

RCSPYSIM_NOCOPY_NOMOVE
#define RCSPYSIM_NOCOPY_NOMOVE(cls)
Definition: nocopy.h:40

Rcs::RcsSimEnv::currentStep
unsigned int currentStep
Counters.
Definition: RcsSimEnv.h:191

Rcs::RcsSimEnv::viewer
Viewer * viewer
Visualization.
Definition: RcsSimEnv.h:204

Rcs::RcsSimEnv::getCurrentAction
MatNd * getCurrentAction() const
Definition: RcsSimEnv.h:162

Rcs::RcsSimEnv::allJointsPosCtrl
bool allJointsPosCtrl
Definition: RcsSimEnv.h:173

Rcs::RcsSimEnv::currentObservation
MatNd * currentObservation
Observation and action at last step.
Definition: RcsSimEnv.h:200

Rcs::RcsSimEnv::hud
HUD * hud
Definition: RcsSimEnv.h:206

Rcs::RcsSimEnv
Definition: RcsSimEnv.h:61

Rcs::InitStateSetter
Definition: InitStateSetter.h:45

Rcs::RcsSimEnv::T_ctrl
MatNd * T_ctrl
Definition: RcsSimEnv.h:188

Rcs::RcsSimEnv::physicsManager
PhysicsParameterManager * physicsManager
Physics simulator factory.
Definition: RcsSimEnv.h:176

Rcs::RcsSimEnv::qd_ctrl
MatNd * qd_ctrl
Definition: RcsSimEnv.h:187

Rcs::JointLimitException
Definition: RcsSimEnv.h:52

Rcs::RcsSimEnv::getPhysicsManager
PhysicsParameterManager * getPhysicsManager()
Definition: RcsSimEnv.h:150

ExperimentConfig.h

Rcs::PropertySource::empty
static PropertySource * empty()
Definition: PropertySource.cpp:114

Rcs::RcsSimEnv::currentAction
MatNd * currentAction
Definition: RcsSimEnv.h:201

PhysicsParameterManager.h

Rcs::RcsSimEnv::getConfig
ExperimentConfig * getConfig()
Definition: RcsSimEnv.h:144

Rcs::RcsSimEnv::tnbIndex
unsigned int tnbIndex
Definition: RcsSimEnv.h:196

Rcs::RcsSimEnv::disturber
ForceDisturber * disturber
Disturbance force simulator.
Definition: RcsSimEnv.h:180

Rcs::RcsSimEnv::physicsSim
PhysicsBase * physicsSim
Physics simulator.
Definition: RcsSimEnv.h:178

Rcs::RcsSimEnv::q_ctrl
MatNd * q_ctrl
Temporary matrices.
Definition: RcsSimEnv.h:186

Rcs::RcsSimEnv::getCurrentObservation
MatNd * getCurrentObservation() const
Definition: RcsSimEnv.h:156

Rcs::RcsSimEnv::currentTime
double currentTime
Definition: RcsSimEnv.h:192

Rcs::RcsSimEnv::transitionNoiseBuffer
MatNd * transitionNoiseBuffer
Transition noise values (every column is one set of noise values for every state variable) ...
Definition: RcsSimEnv.h:195

Rcs::ExperimentConfig
Definition: ExperimentConfig.h:72

Rcs::BoxSpace
Definition: BoxSpace.h:49

Rcs::ForceDisturber
Definition: ForceDisturber.h:45

Rcs::RcsSimEnv::transitionNoiseIncludeVelocity
bool transitionNoiseIncludeVelocity
Definition: RcsSimEnv.h:197

Rcs::RcsSimEnv::initStateSetter
InitStateSetter * initStateSetter
Initial state setter.
Definition: RcsSimEnv.h:183

Rcs::RcsSimEnv::config
ExperimentConfig * config
Experiment configuration.
Definition: RcsSimEnv.h:172

Rcs::RcsSimEnv::graphLock
std::mutex graphLock
Guards for parallel access to graph (can happen from gui)
Definition: RcsSimEnv.h:169

Rcs
Definition: ActionModel.cpp:36