learn_to_drive: action repeated too much, increase exploration factor
This commit is contained in:
@@ -366,7 +366,7 @@ int select_action(struct RL_agent * rlAgent){
|
||||
}
|
||||
struct qlearning_params * qlParams = rlAgent->qlearnParams;
|
||||
write(1,"#",1);
|
||||
qlParams->exploration_factor = (qlParams->exploration_factor < 1 ) ? qlParams->exploration_factor / qlParams->factor_update_exploration_factor : qlParams->exploration_factor ;
|
||||
qlParams->exploration_factor = (qlParams->exploration_factor < 1 ) ? (qlParams->exploration_factor / qlParams->factor_update_exploration_factor)*5 : qlParams->exploration_factor ;
|
||||
}
|
||||
#endif
|
||||
////else write(1,".",1);
|
||||
|
||||
Reference in New Issue
Block a user