eXplainable GP-based RL Policy
A Python implementation of symbolic policies for interpretable reinforcement learning using genetic programming.
Setup
Requirements
- numpy
- deap
- qdpy
- pygraphviz (optional, for easier visualization of programs)
Installing dependencies
- clone this repo
- for the base installation (without pygraphviz), install with
python -m pip install -r requirement.txt
- if you want to visualize programs easily, install with
python -m pip install -r requirement_with_pygrphivz.txt
How to use
Core functions
Core functions and representations are in the GPRL folder.
.
├── GPRL
│   ├── containers           # Fixes a bug in qdpy's grid (0.1.2.1, the latest stable version)
│   ├── genetic_programming  # Individual definitions of linear GP and Team for DEAP
│   ├── MCTS                 # Nested Monte-Carlo code
│   ├── utils                # Various utilities and callback functions to run experiments easily
│   ├── algorithms.py        # DEAP-like algorithms using the toolbox
│   ├── factory.py           # Abstract class to make better use of the toolbox across scripts
│   └── UCB.py               # Subclass of DEAP's base Fitness to use UCB
└── ...
By combining DEAP with these functions, we can build our experiments. DEAP examples can be found at:
https://github.com/DEAP/deap/tree/master/examples
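To give an idea of how such an experiment fits together, here is a minimal sketch of a DEAP tree-GP setup for a symbolic policy. It is not the repository's actual code: the primitive set, the `evaluate_policy` helper, the hyperparameters, and the classic-gym API usage are all illustrative assumptions.

```python
# A minimal sketch of a DEAP tree-GP symbolic policy, in the spirit of GPRL.
# All names and hyperparameters below are illustrative assumptions.
import operator

import gym  # assumes the classic gym API (env.reset() returns the observation)
import numpy as np
from deap import algorithms, base, creator, gp, tools

env = gym.make("MountainCarContinuous-v0")
n_inputs = env.observation_space.shape[0]

# A small function set over the observation variables.
pset = gp.PrimitiveSet("MAIN", n_inputs)
pset.addPrimitive(operator.add, 2)
pset.addPrimitive(operator.sub, 2)
pset.addPrimitive(operator.mul, 2)
pset.addEphemeralConstant("const", lambda: np.random.uniform(-1, 1))

creator.create("FitnessMax", base.Fitness, weights=(1.0,))
creator.create("Individual", gp.PrimitiveTree, fitness=creator.FitnessMax)

toolbox = base.Toolbox()
toolbox.register("expr", gp.genHalfAndHalf, pset=pset, min_=1, max_=3)
toolbox.register("individual", tools.initIterate, creator.Individual, toolbox.expr)
toolbox.register("population", tools.initRepeat, list, toolbox.individual)
toolbox.register("compile", gp.compile, pset=pset)

def evaluate_policy(individual, n_steps=200):
    """Roll out the compiled tree as a policy and return the episode return."""
    policy = toolbox.compile(expr=individual)
    obs = env.reset()
    total = 0.0
    for _ in range(n_steps):
        action = np.clip([policy(*obs)],
                         env.action_space.low, env.action_space.high)
        obs, reward, done, _ = env.step(action)
        total += reward
        if done:
            break
    return (total,)

toolbox.register("evaluate", evaluate_policy)
toolbox.register("select", tools.selTournament, tournsize=5)
toolbox.register("mate", gp.cxOnePoint)
toolbox.register("expr_mut", gp.genFull, min_=0, max_=2)
toolbox.register("mutate", gp.mutUniform, expr=toolbox.expr_mut, pset=pset)

pop = toolbox.population(n=100)
pop, log = algorithms.eaMuPlusLambda(pop, toolbox, mu=100, lambda_=100,
                                     cxpb=0.5, mutpb=0.4, ngen=20)
```

The evolved trees can then be printed as symbolic expressions, which is where the interpretability of the policy comes from.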
Experiment scripts
Each experiment is available as a separate script using DEAP. More details can be found in the Readme.md
of the experiments folder.
Main evolve script
The evolve.py
script uses configuration files in .yml
format to launch experiments. It lets you run QD, Tree GP, and Linear GP.
Basically, you can run an experiment with this command:
python evolve.py --conf /path/to/conf.yml
By default, the results are saved in the results/
folder.
YAML configuration files
Here is a skeleton for the conf.yml
file, showing how an experiment can be set up:
algorithm:
  name: # algorithm name from DEAP (algorithms.<name>) or from GPRL (algo.<name>)
  args:
    # args of the chosen algorithm (lambda_, mu, ngen, ...)
population:
  init_size: # size of the population (int)
selection:
  name: # selection method for the evolutionary algorithm, e.g. selTournament (from deap.tools.sel*)
  args:
    # arguments for the selection method, e.g. tournsize: 5
individual: # individual representation ("Tree" or "Linear")
params:
  env: # env id of the gym/bullet env, e.g. "MountainCarContinuous-v0"
  function_set: # function set size ("small" or "extended")
  c: # exploration constant for UCB (float)
  n_episodes: # number of episodes per evaluation (int)
  n_steps: # number of steps per evaluation (int)
  gamma: # discount factor γ (float in [0,1])
  n_thread: # number of threads to use (int)
  # ... (many others depending on the individual representation (Tree or Linear); see conf/ for examples)
seed: # seed for the random number generators
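For concreteness, here is a hypothetical filled-in configuration following the skeleton above. The exact keys and values accepted by evolve.py are defined by the files in conf/, so treat this as an illustration, not a reference:

```yaml
algorithm:
  name: eaMuPlusLambda   # illustrative choice of algorithm
  args:
    mu: 100
    lambda_: 100
    ngen: 50
population:
  init_size: 100
selection:
  name: selTournament
  args:
    tournsize: 5
individual: Tree
params:
  env: "MountainCarContinuous-v0"
  function_set: small
  c: 1.414
  n_episodes: 1
  n_steps: 200
  gamma: 0.99
  n_thread: 8
seed: 42
```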
See the results
Once an experiment is finished, you can inspect the results as shown in tutorial.ipynb
. This notebook shows how to examine and run an individual from a saved population.
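As a rough illustration of this workflow, a saved population can be reloaded and its best individual printed and re-compiled. The file name below is a hypothetical example, and the serialization details depend on your experiment script; see tutorial.ipynb for the repository's actual workflow.

```python
# A minimal sketch of inspecting a saved run, assuming the population was
# pickled by the experiment. Unpickling DEAP individuals requires the
# creator classes (and primitive set) from the training setup, e.g. the
# sketch in the "Core functions" section above, to be defined first.
import pickle

from deap import gp

with open("results/population.pkl", "rb") as f:  # hypothetical file name
    population = pickle.load(f)

# Pick the best individual and print its symbolic expression.
best = max(population, key=lambda ind: ind.fitness.values[0])
print(str(best))

# Re-compile it into a callable policy, reusing the pset from training.
policy = gp.compile(expr=best, pset=pset)
```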