/*
 * RoverPlugin.h
 * http://github.com/dusty-nv/jetson-reinforcement
 */
#ifndef __GAZEBO_ROVER_PLUGIN_H__
#define __GAZEBO_ROVER_PLUGIN_H__
#include "deepRL.h"
#include <boost/bind.hpp>
#include <gazebo/gazebo.hh>
#include <gazebo/transport/transport.hh>
#include <gazebo/msgs/msgs.hh>
#include <gazebo/physics/physics.hh>
#include <gazebo/common/common.hh>
#include <stdio.h>
#include <iostream>
#include <gazebo/transport/TransportTypes.hh>
#include <gazebo/msgs/MessageTypes.hh>
#include <gazebo/common/Time.hh>
#include <errno.h>
#include <fcntl.h>
#include <assert.h>
#include <unistd.h>
#include <pthread.h>
#include <ctype.h>
#include <stdbool.h>
#include <math.h>
#include <inttypes.h>
#include <string.h>
#include <syslog.h>
#include <time.h>
#include "devInput.h"
namespace gazebo
{

/**
 * RoverPlugin
 */
class RoverPlugin : public ModelPlugin
{
public:
	RoverPlugin();

	virtual void Load(physics::ModelPtr _parent, sdf::ElementPtr /*_sdf*/);
	virtual void OnUpdate(const common::UpdateInfo& /*_info*/);

	float resetPosition( uint32_t dof );		// center servo positions

	bool createAgent();
	bool updateAgent();

	bool configJoint( const char* name );
	bool updateJoints();

	void onCameraMsg(ConstImageStampedPtr& _msg);
	void onCollisionMsg(ConstContactsPtr& contacts);

	static const uint32_t DOF = 2;			// FWD/BACK, LEFT/RIGHT

private:
	float vel[DOF];			// joint velocity control
	float dT[3];			// IK delta theta

	enum OperatingMode			// robot operating mode
	{
		USER_MANUAL,
		/*USER_TRAIN,*/
		AGENT_LEARN,
		AGENT_RESET
		/*,AGENT_AUTO*/
	} opMode;

	rlAgent* agent;			// AI learning agent instance

	bool  newState;			// true if a new frame needs to be processed
	bool  newReward;			// true if a new reward has been issued
	bool  endEpisode;			// true if this episode is over
	float rewardHistory;		// value of the last reward issued

	Tensor* inputState;			// PyTorch input tensor passed to the agent
	void*   inputBuffer[2];		// camera image buffers, [0] for CPU and [1] for GPU
	size_t  inputBufferSize;		// size of the input buffers, in bytes
	size_t  inputRawWidth;		// width of the raw camera image, in pixels
	size_t  inputRawHeight;		// height of the raw camera image, in pixels

	float actionVelDelta;		// velocity offset applied to a joint by an action
	int   maxEpisodeLength;		// maximum number of frames to win the episode (<= 0 for unlimited)
	int   episodeFrames;		// frame counter for the current episode
	int   episodesCompleted;		// number of episodes run so far
	int   episodesWon;			// number of episodes that ended in a win

	int   lastAction;			// last action selected by the agent
	float lastGoalDistance;		// distance to the goal on the previous frame
	float avgGoalDelta;			// running average of the change in goal distance

	int  runHistoryIdx;			// current write index into runHistory
	int  runHistoryMax;			// number of valid entries in runHistory
	bool runHistory[20];		// win/loss results of recent episodes

	physics::ModelPtr model;		// the rover model this plugin is attached to
	math::Pose        originalPose;	// initial pose of the model, restored on reset
	InputDevices*     HID;		// manual user input devices (see devInput.h)

	event::ConnectionPtr updateConnection;		// world-update event connection
	std::vector<physics::JointPtr> joints;		// joints under velocity control
	physics::JointController* j2_controller;	// controller for commanding the joints

	gazebo::transport::NodePtr       cameraNode;	// transport node for camera messages
	gazebo::transport::SubscriberPtr cameraSub;	// subscription to the camera image topic
	gazebo::transport::NodePtr       collisionNode;	// transport node for contact messages
	gazebo::transport::SubscriberPtr collisionSub;	// subscription to the contact sensor topic
};

}
#endif /* __GAZEBO_ROVER_PLUGIN_H__ */
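
For reference, below is a minimal sketch of how a Gazebo ModelPlugin like this one is typically registered and wired up in its .cpp file. The real implementation lives in RoverPlugin.cpp in the repository; the Load() body and the topic strings here are illustrative assumptions based on standard Gazebo transport usage, not the repository's actual code.

// Hypothetical RoverPlugin.cpp excerpt -- a sketch only, not the repo's code.
#include "RoverPlugin.h"

namespace gazebo
{

// register the plugin with Gazebo so it can be loaded from a
// <plugin> element in the rover model's SDF
GZ_REGISTER_MODEL_PLUGIN(RoverPlugin)

void RoverPlugin::Load(physics::ModelPtr _parent, sdf::ElementPtr /*_sdf*/)
{
	model = _parent;

	// subscribe to the camera image topic over Gazebo transport
	// (topic names are assumptions -- they depend on the world/model SDF)
	cameraNode = transport::NodePtr(new transport::Node());
	cameraNode->Init();
	cameraSub  = cameraNode->Subscribe("~/camera/link/camera/image",
	                                   &RoverPlugin::onCameraMsg, this);

	// subscribe to the contact sensor topic used for collision rewards
	collisionNode = transport::NodePtr(new transport::Node());
	collisionNode->Init();
	collisionSub  = collisionNode->Subscribe("~/rover/chassis/contacts",
	                                         &RoverPlugin::onCollisionMsg, this);

	// invoke OnUpdate() at the start of every simulation iteration
	updateConnection = event::Events::ConnectWorldUpdateBegin(
			boost::bind(&RoverPlugin::OnUpdate, this, _1));
}

}

In a typical setup, the compiled plugin library (e.g. libgazeboRoverPlugin.so, name assumed) is then referenced from a <plugin> element inside the rover's model SDF, so Gazebo loads the plugin when the model is spawned into the world.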