Evolife
Evolife has been developed to study Genetic algorithms, Natural evolution and behavioural ecology.
Learner.py
Go to the documentation of this file.
#!/usr/bin/env python3
""" @brief Simple trial-and-error learning mechanism.
"""

#============================================================================#
# EVOLIFE  http://evolife.telecom-paris.fr             Jean-Louis Dessalles  #
# Telecom Paris  2022-04-11                                www.dessalles.fr  #
# -------------------------------------------------------------------------- #
# License:  Creative Commons BY-NC-SA                                        #
#============================================================================#
# Documentation: https://evolife.telecom-paris.fr/Classes                    #
#============================================================================#


if __name__ == '__main__':  # for tests
    # When run as a script, make the Evolife package importable
    # from the repository root (two levels up).
    import sys
    sys.path.append('../..')
    # from Evolife.Scenarii.MyScenario import InstantiateScenario
    # InstantiateScenario('SexRatio')
26
27from random import random, randint
28from Evolife.Tools.Tools import boost, LimitedMemory, error
29
30
# Global elements
class Global:
    """ General-purpose numeric helpers: Closer, Perturbate, Limitate, Decrease.
    """
    def __init__(self):
        """ Definitions of Closer, Perturbate, Limitate, Decrease
        """
        # Closer(x, Target, Attractiveness): pulls x towards Target;
        # Attractiveness is a percentage (0 leaves x unchanged, 100 lands on Target)
        self.Closer = lambda x, Target, Attractiveness: ((100.0 - Attractiveness) * x + Attractiveness * Target) / 100
        # Perturbate(x, Amplitude): mutation, uniform in [x - Amplitude, x + Amplitude]
        self.Perturbate = lambda x, Amplitude: x + (2 * random() - 1) * Amplitude
        # Limitate(x, Min, Max): clips x into [Min, Max]
        self.Limitate = lambda x, Min, Max: min(max(x, Min), Max)
        # Decrease(x, MaxX, MinY): linear decrease from 100 (at x == 0)
        # down to MinY (reached at x == MaxX); never returns less than MinY
        self.Decrease = lambda x, MaxX, MinY: max(MinY, (100 - x * ((100.0 - MinY) / MaxX)))


Gbl = Global()  # single shared instance used throughout this module
49
# NOTE(review): the class header line was lost in extraction; reconstructed from
# the usage `LimitedMemory_(self.MemorySpan)` below and the import of
# LimitedMemory from Evolife.Tools.Tools — verify against the repository.
class LimitedMemory_(LimitedMemory):
    """ memory buffer with limited length
    """
    def __str__(self):
        """ Displays 'Signal' feature values with their scores,
            e.g. "S:12.0: 3.5 -- " per remembered record.
        """
        if not self.past: return ''  # nothing memorized yet
        # all records share the same feature keys; take them from the first one
        features = list(self.past[0][0].keys())
        Res = ''
        for b in self.past:  # b == (FeatureDict, Score)
            # only the 'Signal' feature is displayed, abbreviated to its initial
            Res += ','.join([f"{f[0]}:{b[0][f]:0.1f}" for f in features if f == 'Signal'])
            Res += f": {b[1]:0.1f} -- "
        return Res
60
class Learner:
    """ Defines trial-and-error learning capabilities.

        A Learner holds a set of numeric features (nominally in 0..100),
        remembers the performance obtained with past feature values, and
        explores new values by perturbating the best solution found so far,
        possibly after imitating neighbours.
    """
    def __init__(self, Features, MemorySpan=5, AgeMax=100, Infancy=0, Imitation=0, Speed=3,
                 JumpProbability=0, Conservatism=0, LearningSimilarity=10, toric=False, Start=-1):
        """ Features : dictionary or list of features that will be learned
            MemorySpan: size of memory
            Scores : memory of past benefits
            AgeMax: max age before resetting
            Performance : stores current performances
            Infancy : percentage of lifetime when the learner is considered a child
            Imitation : forced similarity with neighbouring values when learning continuous function
            Speed : learning speed
            JumpProbability: probability of jumping far from last value
            Conservatism: importance in % of immediate past solutions
            LearningSimilarity:
                Influence of neighbouring feature values when retrieving best past feature value.
                Between 0.1 (or so) and 100.
                Influence of NeighbVal on Val is LearningSimilarity / abs(Val - NeighbVal).
                10 means that a feature that differs by 30 contributes up to 1/3 of its value.
                0.1 or so would cancel the effect of neighbouring feature values.
            toric:
                If True, learning space is circular (toric): maximal feature values are next to smallest values.
            Start: features are created random (-1) or all-zero (0) or all-100 (1)
        """
        self.Features = Features            # dictionary (or, initially, list) of features that will be learned
        self.MemorySpan = MemorySpan
        self.Scores = LimitedMemory_(self.MemorySpan)  # memory of past benefits
        self.AgeMax = AgeMax                # max age before resetting
        self.Performance = []               # stores current performances
        self.Infancy = Infancy              # percentage of lifetime when the learner is considered a child
        self.Imitation = Imitation          # forced similarity with neighbouring values when learning continuous function
        self.Speed = Speed                  # learning speed
        self.JumpProbability = JumpProbability  # probability of jumping far from last value
        self.Conservatism = Conservatism    # importance in % of immediate past solutions
        self.LearningSimilarity = LearningSimilarity
        self.Toric = toric
        self.Start = Start
        self.Reset(Newborn=False)           # individuals are created at various ages

    def Reset(self, Newborn=True):
        """ Initializes feature values to random values (if Start == -1).
            Age set to random value if Newborn is False (useful at start).
        """
        self.Age = 0 if Newborn else randint(0, self.AgeMax)  # age is random at initialization
        Features = dict()  # rebuilt as a dict, so that self.Features may be created as a list
        for F in self.Features:
            if self.Start == -1 or Newborn: Features[F] = randint(0, 100)
            else: Features[F] = 100 * self.Start
        self.Features = Features
        self.Scores.reset()

    def adult(self):
        """ adult if age larger than AgeMax * Infancy / 100
        """
        return self.Age > self.AgeMax * self.Infancy / 100.0

    def feature(self, F, Value=None):
        """ Reads or sets a feature value.
            F == None designates the first feature; Value == None means read-only.
        """
        if F is None: F = list(self.Features.keys())[0]
        if Value is not None: self.Features[F] = Value
        return self.Features[F]

    def Limitate(self, x, Min, Max):
        """ Keeps x within [Min, Max]; wraps around instead if the space is toric. """
        if self.Toric: return (x % Max)
        else: return Gbl.Limitate(x, Min, Max)

    def imitate(self, models, Feature):
        """ The individual moves its own feature closer to its models' features
            (only adult models count; Imitation sets the attraction strength).
        """
        if models:
            TrueModels = [m for m in models if m.adult()]
            if TrueModels:
                ModelValues = list(map(lambda x: x.feature(Feature), TrueModels))
                Avg = float(sum(ModelValues)) / len(ModelValues)
                return Gbl.Closer(self.feature(Feature), Avg, self.Imitation)
        return self.feature(Feature)  # no adult model available: unchanged

    def bestRecord(self, second=False):
        """ Retrieves the best (or the second best) solution so far.
            Records are (FeatureDict, Score) pairs; returns None if memory is empty.
        """
        if len(self.Scores) == 0: Best = None
        elif len(self.Scores) == 1: Best = self.Scores.last()
        else:
            # ------ retrieve the best solution so far
            past = self.Scores.retrieve()
            Best = max(past, key=lambda x: x[1])
            if second:
                # ------ retrieve the SECOND best solution so far
                past = past[:]  # copy, to avoid mutating the memory itself
                past.remove(Best)
                Best = max(past, key=lambda x: x[1])
        return Best

    def bestFeatureRecord(self, Feature):
        """ Alternative to bestRecord that aggregates similar feature values:
            each record's score is reinforced by records with close feature values.
            Returns the feature value with the best aggregated score, or None.
        """
        if len(self.Scores) == 0: return None
        Best = dict()
        for i, (B1, Perf1) in enumerate(self.Scores.retrieve()):
            for j, (B2, Perf2) in enumerate(self.Scores.retrieve()):
                # NOTE: the pair (B1, B2) is deliberately processed in both orders
                # (a 'j >= i' symmetry cut was tried and abandoned)
                # distance between feature values, scaled by LearningSimilarity
                # (0.001 avoids division by zero when LearningSimilarity == 0)
                dist = abs(B1[Feature] - B2[Feature]) / (0.001 + self.LearningSimilarity)
                # ------ updating Perf1 through weighted sum depending on distance
                Perf1 = (Perf1 + Perf2 / (1 + dist)) * (1 + dist) / (2 + dist)
            Best[B1[Feature]] = Perf1
        return max(Best, key=Best.get)  # return key with max value

    def avgRecord(self):
        """ Average of past scores (0 if memory is empty). """
        if len(self.Scores) > 0:
            return sum([p[1] for p in self.Scores.retrieve()]) / len(self.Scores)
        else: return 0

    def loser(self):
        """ A loser has full experience and bad results. """
        return self.Scores.complete() and self.bestRecord()[1] <= 0

    def explore(self, Feature, Speed, Bottom=0, Top=100):
        """ The individual changes its feature value: a perturbation of the best
            past value, clipped to [Bottom, Top], then pulled back towards the
            current value in proportion to Conservatism.
        """
        try: Best = self.bestFeatureRecord(Feature)
        # TypeError occurs when bestFeatureRecord returns None (empty memory)
        except (TypeError, IndexError): Best = self.Features[Feature]
        Target = self.Limitate(Gbl.Perturbate(Best, Speed), Bottom, Top)
        # Target closer to old value if conservative
        return round(Gbl.Closer(Target, self.feature(Feature), self.Conservatism), 2)

    def Learns(self, neighbours=None, Speed=None, hot=False, BottomValue=0, TopValue=100):
        """ Learns by randomly changing current value.
            Starting point depends on previous success and on neighbours.
            If 'hot' is true, perturbation is larger for children.
            Returns False for a newborn (no learning yet), True otherwise.
        """
        if self.Age > self.AgeMax: self.Reset(Newborn=True)
        self.Age += 1
        # averaging performances obtained for current feature values
        Performance = 0
        if len(self.Performance): Performance = float(sum(self.Performance)) / len(self.Performance)
        self.Performance = []  # resetting performance
        self.Scores.push((self.Features.copy(), Performance))  # storing current performance
        if self.Age == 1: return False  # newborn, no learning

        # (1) imitation: get features closer to neighbours' values
        FeatureNames = list(self.Features.keys())  # safer to put 'list'
        if self.Imitation:
            for F in FeatureNames: self.feature(F, self.imitate(neighbours, F))

        # (2) exploration
        if Speed is None: Speed = self.Speed
        if hot and not self.adult():  # still a kid: exploration speed decreases with age
            LearningSpeed = Gbl.Decrease(self.Age, self.Infancy, Speed)
        else: LearningSpeed = Speed
        if randint(0, 100) < self.JumpProbability: LearningSpeed = TopValue  # max exploration from time to time
        # compromise between current value and a perturbation of past best value
        for F in FeatureNames:
            self.feature(F, self.explore(F, LearningSpeed, Bottom=BottomValue, Top=TopValue))
        return True

    def wins(self, Points):
        """ stores a benefit """
        self.Performance.append(Points)

    def __str__(self): return str(self.Features)
235
236
237
238
239
242
243if __name__ == "__main__":
244 print(__doc__)
245 print(Learner.__doc__ + '\n\n')
246 John_Doe = Learner({'F':0})
247 print("John_Doe:\n")
248 print(John_Doe)
249 raw_input('[Return]')
250
251
252__author__ = 'Dessalles'
General functions: Closer, Perturbate, Limitate, Decrease.
Definition: Learner.py:32
def __init__(self)
Definitions of Closer, Perturbate, Limitate, Decrease.
Definition: Learner.py:35
defines learning capabilities
Definition: Learner.py:61
def loser(self)
A loser has full experience and bad results.
Definition: Learner.py:179
def feature(self, F, Value=None)
reads or sets feature value
Definition: Learner.py:118
def bestFeatureRecord(self, Feature)
Alternative to bestRecord that aggregates similar feature values.
Definition: Learner.py:158
def wins(self, Points)
stores a benefit
Definition: Learner.py:229
def imitate(self, models, Feature)
The individual moves its own feature closer to its models' features.
Definition: Learner.py:130
def avgRecord(self)
Averaging past scores.
Definition: Learner.py:172
def Reset(self, Newborn=True)
Initializes Feature values to random values (if Start == -1) Age set to random value if Newborn is Fa...
Definition: Learner.py:101
def Learns(self, neighbours=None, Speed=None, hot=False, BottomValue=0, TopValue=100)
Learns by randomly changing current value.
Definition: Learner.py:194
def Limitate(self, x, Min, Max)
Definition: Learner.py:125
def bestRecord(self, second=False)
Retrieves the best (or the second best) solution so far.
Definition: Learner.py:142
def __init__(self, Features, MemorySpan=5, AgeMax=100, Infancy=0, Imitation=0, Speed=3, JumpProbability=0, Conservatism=0, LearningSimilarity=10, toric=False, Start=-1)
Features : Dictionary or list of features that will be learned MemorySpan: size of memory Scores : me...
Definition: Learner.py:65
def explore(self, Feature, Speed, Bottom=0, Top=100)
the individual changes its feature values
Definition: Learner.py:184
def adult(self)
adult if age larger than AgeMax*Infancy/100
Definition: Learner.py:113
memory buffer with limited length
Definition: Learner.py:50
memory buffer with limited length
Definition: Tools.py:201
Various functions.
Definition: Tools.py:1