deepQlearning: add libdeepqlearn.so, debug some issue with -Werror -fpic
This commit is contained in:
@@ -45,7 +45,7 @@ struct networks_qlearning * create_nework_qlearning(
|
||||
struct networks_qlearning *qnets = malloc(sizeof(struct networks_qlearning));
|
||||
qnets->config = config;
|
||||
|
||||
setup_networks_alloutputs_config_TYPE_FLOAT(&(qnets->main_net), config, random, minR, maxR, randomRange);
|
||||
setup_networks_alloutputs_config_TYPE_FLOAT(&(qnets->main_net), config, randomize, minR, maxR, randomRange);
|
||||
setup_networks_alloutputs_config_TYPE_FLOAT(&(qnets->target_net), config, false, minR, maxR, randomRange);
|
||||
copy_weight_in_networks_from_main_to_target(qnets);
|
||||
|
||||
@@ -283,7 +283,7 @@ int select_action(struct RL_agent * rlAgent){
|
||||
//init =false;
|
||||
//}
|
||||
//int random = xrand() % randRange;
|
||||
float proba_explor = (float) (xrand() % (1<<17 -1))/ (1<<17 -1); //frand(); //(float)(random ) / randRange;
|
||||
float proba_explor = (float) (xrand() % ((1<<17) -1))/ ((1<<17) -1); //frand(); //(float)(random ) / randRange;
|
||||
if(proba_explor > rlAgent->qlearnParams->exploration_factor ){
|
||||
action = ARG_MAX_ARRAY_TYPE_FLOAT( action_value->x, action_value->dim->rank );
|
||||
//if(action == ARG_MIN_ARRAY_TYPE_FLOAT( action_value->x, action_value->dim->rank ))
|
||||
@@ -385,7 +385,7 @@ void learn_to_drive(struct RL_agent * rlAgent){
|
||||
struct game_status * car_status = car->status;
|
||||
struct qlearning_params * qlParams = rlAgent->qlearnParams;
|
||||
struct status_qlearning * qlStatus = rlAgent->status;
|
||||
struct print_params * pprint = rlAgent->pprint;
|
||||
//struct print_params * pprint = rlAgent->pprint;
|
||||
char msg[100];
|
||||
|
||||
pthread_t threadPrint;
|
||||
|
||||
@@ -20,6 +20,7 @@ struct game_status * create_game_status(){
|
||||
status->reward = 0;
|
||||
status->cumulative_reward = 0;
|
||||
status->done = false;
|
||||
return status;
|
||||
}
|
||||
|
||||
coordinate * create_coordinate(size_t dim_size){
|
||||
@@ -423,13 +424,12 @@ float distance2_coordinate(coordinate *c0, coordinate *c1){
|
||||
v->sensor->x[position] = (float)(MIN((SUBDIVISION-1),dist))/SUBDIVISION ;\
|
||||
|
||||
|
||||
|
||||
//v->sensor->x[position] = (float)(MIN((SUBDIVISION-1),(int)dist))/SUBDIVISION ;\
|
||||
|
||||
|
||||
//v->sensor->x[position] = (MIN(49,(distance2_coordinate(diStep_sensor, v->coord)/5))) ;\
|
||||
//v->sensor->x[position] = (MIN(49,(distance2_coordinate(diStep_sensor, v->coord)))) / 50;\
|
||||
//v->sensor->x[position] = (MIN(49,(int)(distance2_coordinate(diStep_sensor, v->coord)/10))) / 50;\
|
||||
#if 0
|
||||
//v->sensor->x[position] = (float)(MIN((SUBDIVISION-1),(int)dist))/SUBDIVISION ;
|
||||
//v->sensor->x[position] = (MIN(49,(distance2_coordinate(diStep_sensor, v->coord)/5))) ;
|
||||
//v->sensor->x[position] = (MIN(49,(distance2_coordinate(diStep_sensor, v->coord)))) / 50;
|
||||
//v->sensor->x[position] = (MIN(49,(int)(distance2_coordinate(diStep_sensor, v->coord)/10))) / 50;
|
||||
#endif
|
||||
|
||||
void read_sensor(struct vehicle *v){
|
||||
copy_tensor_TYPE_FLOAT(v->old_sensor, v->sensor);
|
||||
|
||||
Reference in New Issue
Block a user