Safe Haskell	None
Language	Haskell2010

AI.MEP

Contents

Genetic algorithm
Expression interpretation
Random

Description

Multiple Expression Programming

Example application: trigonometry cheating

Suppose you forgot certain trigonometric identities. For instance, you want to express cos^2(x) using sin(x). No problem: set the target function cos^2(x) in the dataset and add sin to the arithmetic set of operators {+,-,*,/}. See app/Main.hs.

After running

 $ stack build && stack exec hmep-demo

we obtain

 Average loss in the initial population 15.268705681244962
 Population 10: average loss 14.709728527360586
 Population 20: average loss 13.497114190675477
 Population 30: average loss 8.953185872653737
 Population 40: average loss 8.953185872653737
 Population 50: average loss 3.3219954564955856e-15

The average value of 3.3e-15 is close to zero, indicating that the exact expression was found!

The produced output was:

 Interpreted expression:
 v1 = sin x0
 v2 = v1 * v1
 result = 1 - v2

From here we can infer that cos^2(x) = 1 - v2 = 1 - v1 * v1 = 1 - sin^2(x).

Sweet!

Synopsis

type Chromosome a = Vector (Gene a Int)
data Gene a i
type Population a = [Chromosome a]
type Phenotype a = (Double, Chromosome a, Vector Int)
data Config a = Config {
- p'const :: Double
- p'var :: Double
- p'mutation :: Double
- p'crossover :: Double
- c'length :: Int
- c'popSize :: Int
- c'popN :: Int
- c'ops :: Vector (F a)
- c'vars :: Int
}
defaultConfig :: Config Double
type LossFunction a = (Vector a -> Vector a) -> (Vector Int, Double)
initialize :: PrimMonad m => Config Double -> RandT m (Population Double)
evaluatePopulation :: Num a => LossFunction a -> Population a -> Generation a
regressionLoss1 :: (Num result, Ord result) => (b -> b -> result) -> [(a, b)] -> (Vector a -> Vector b) -> (Vector Int, result)
avgLoss :: Generation Double -> Double
best :: Generation a -> Phenotype a
worst :: Generation a -> Phenotype a
evolve :: PrimMonad m => Config Double -> LossFunction Double -> (Chromosome Double -> RandT m (Chromosome Double)) -> (Chromosome Double -> Chromosome Double -> RandT m (Chromosome Double, Chromosome Double)) -> (Generation Double -> RandT m (Chromosome Double)) -> Generation Double -> RandT m (Generation Double)
binaryTournament :: (PrimMonad m, Ord a) => Generation a -> RandT m (Chromosome a)
crossover :: PrimMonad m => Chromosome a -> Chromosome a -> RandT m (Chromosome a, Chromosome a)
mutation3 :: PrimMonad m => Config Double -> Chromosome Double -> RandT m (Chromosome Double)
smoothMutation :: PrimMonad m => Double -> Config Double -> Chromosome Double -> RandT m (Chromosome Double)
newChromosome :: PrimMonad m => Config Double -> RandT m (Chromosome Double)
generateCode :: Phenotype Double -> String
data RandT m a :: (* -> *) -> * -> *
runRandIO :: RandT IO a -> IO a

Documentation

type Chromosome a = Vector (Gene a Int) Source

A chromosome is a vector of genes

data Gene a i Source

Either a terminal symbol or a three-address code (a function and two pointers)

Instances

(Eq a, Eq i) => Eq (Gene a i) Source

Eq instance for Gene

(Show a, Show i) => Show (Gene a i) Source

Show instance for Gene

type Population a = [Chromosome a] Source

List of chromosomes

type Phenotype a = (Double, Chromosome a, Vector Int) Source

Loss value, chromosome, and the best expression indices vector

data Config a Source

MEP configuration

Constructors

Config

Fields

p'const :: Double: Probability of constant generation
p'var :: Double: Probability of variable generation. The probability of operator generation is inferred automatically as 1 - p'const - p'var.
p'mutation :: Double: Mutation probability
p'crossover :: Double: Crossover probability
c'length :: Int: The chromosome length
c'popSize :: Int: A (sub)population size
c'popN :: Int: Number of subpopulations (1 or more) [not implemented]
c'ops :: Vector (F a): Functions pool with their symbolic representations
c'vars :: Int: The input dimensionality

defaultConfig :: Config Double Source

defaultConfig = Config
 {
 p'const = 0.1
 , p'var = 0.4
 , p'mutation = 0.1
 , p'crossover = 0.9
 , c'length = 50
 , c'popSize = 100
 , c'popN = 1
 , c'ops = V.empty -- <-- To be overridden
 , c'vars = 1
 }

type LossFunction a = (Vector a -> Vector a) -> (Vector Int, Double) Source

A function to minimize.

The argument is a vector evaluation function whose input is a vector (of length c'vars) and whose output is a vector of a different length, c'length.

The result is a vector of the best indices and a scalar loss value.