ml-agents/ml-agents/mlagents/trainers/curriculum.py


								import os

								import json

								import math


								from .exception import CurriculumError


								import logging


								# Module-level logger for this file, obtained under the
								# 'mlagents.trainers' logger name.
								logger = logging.getLogger('mlagents.trainers')


								class Curriculum(object):
								    """
								    Lesson schedule loaded from a JSON curriculum file.

								    The JSON document must contain the fields 'parameters', 'measure',
								    'thresholds', 'min_lesson_length' and 'signal_smoothing'. Each entry of
								    'parameters' holds one value per lesson, i.e. one more value than there
								    are thresholds, because crossing threshold ``i`` moves the curriculum
								    from lesson ``i`` to lesson ``i + 1``.
								    """

								    def __init__(self, location, default_reset_parameters):
								        """
								        Initializes a Curriculum object.
								        :param location: Path to JSON defining curriculum.
								        :param default_reset_parameters: Set of reset parameters for
								               environment.
								        :raises CurriculumError: If the file cannot be opened or decoded,
								               if a required field is missing, if a curriculum parameter is
								               not among the default reset parameters, or if a parameter
								               does not list exactly one value per lesson.
								        """
								        self.max_lesson_num = 0
								        self.measure = None
								        self._lesson_num = 0
								        # Running value used by increment_lesson when 'signal_smoothing'
								        # is enabled.
								        self.smoothing_value = 0
								        # The brain name is the part of the file's basename that precedes
								        # the first '.'.
								        self._brain_name = os.path.basename(location).split('.')[0]

								        try:
								            with open(location) as data_file:
								                self.data = json.load(data_file)
								        except IOError:
								            raise CurriculumError(
								                'The file {0} could not be found.'.format(location))
								        except UnicodeDecodeError:
								            raise CurriculumError('There was an error decoding {}'
								                                  .format(location))

								        # Fail early on incomplete curriculum files, before any field is
								        # read below.
								        for key in ['parameters', 'measure', 'thresholds',
								                    'min_lesson_length', 'signal_smoothing']:
								            if key not in self.data:
								                raise CurriculumError("{0} does not contain a "
								                                      "{1} field."
								                                      .format(location, key))

								        self.measure = self.data['measure']
								        self.min_lesson_length = self.data['min_lesson_length']
								        # Lessons are numbered 0..max_lesson_num, one more than the number
								        # of thresholds.
								        self.max_lesson_num = len(self.data['thresholds'])

								        parameters = self.data['parameters']
								        expected_values = self.max_lesson_num + 1
								        for key in parameters:
								            if key not in default_reset_parameters:
								                raise CurriculumError(
								                    'The parameter {0} in Curriculum {1} is not present in '
								                    'the Environment'.format(key, location))
								            if len(parameters[key]) != expected_values:
								                raise CurriculumError(
								                    'The parameter {0} in Curriculum {1} must have {2} values '
								                    'but {3} were found'.format(key, location,
								                                                expected_values,
								                                                len(parameters[key])))

								    @property
								    def lesson_num(self):
								        """The current lesson number."""
								        return self._lesson_num

								    @lesson_num.setter
								    def lesson_num(self, lesson_num):
								        # Clamp into the valid range [0, max_lesson_num].
								        self._lesson_num = max(0, min(lesson_num, self.max_lesson_num))

								    def increment_lesson(self, measure_val):
								        """
								        Increments the lesson number depending on the progress given.
								        :param measure_val: Measure of progress (either reward or percentage
								               steps completed). None and NaN are ignored.
								        :return: Whether the lesson was incremented.
								        """
								        # Only a missing (None) or NaN measurement is skipped. A value of
								        # exactly 0 is a real measurement and must still be compared with
								        # the threshold (which may be negative) and fed into the smoothing.
								        if (not self.data or measure_val is None
								                or math.isnan(measure_val)):
								            return False
								        if self.data['signal_smoothing']:
								            # Weighted blend of the previous smoothed value and the new
								            # measurement.
								            measure_val = self.smoothing_value * 0.25 + 0.75 * measure_val
								            self.smoothing_value = measure_val
								        if (self.lesson_num < self.max_lesson_num and
								                measure_val > self.data['thresholds'][self.lesson_num]):
								            self.lesson_num += 1
								            config = self.get_config()
								            logger.info('{0} lesson changed. Now in lesson {1}: {2}'
								                        .format(self._brain_name,
								                                self.lesson_num,
								                                ', '.join([str(x) + ' -> ' + str(config[x])
								                                           for x in config])))
								            return True
								        return False

								    def get_config(self, lesson=None):
								        """
								        Returns reset parameters which correspond to the lesson.
								        :param lesson: The lesson you want to get the config of. If None, the
								               current lesson is returned. Values outside the valid range
								               are clamped to [0, max_lesson_num].
								        :return: The configuration of the reset parameters.
								        """
								        if not self.data:
								            return {}
								        if lesson is None:
								            lesson = self.lesson_num
								        lesson = max(0, min(lesson, self.max_lesson_num))
								        parameters = self.data['parameters']
								        config = {}
								        for key in parameters:
								            config[key] = parameters[key][lesson]
								        return config