chl.go
// Copyright (c) 2019, The Emergent Authors. All rights reserved.
// Use of this source code is governed by a BSD-style
// license that can be found in the LICENSE file.

package hip

import (
    "fmt"

    "github.com/chewxy/math32"

    "github.com/dhairyyas/leabra-sleep/leabra"
)
// Contrastive Hebbian Learning (CHL) parameters
type CHLParams struct {
    On      bool    `desc:"if true, use CHL learning instead of standard XCAL learning -- allows easy exploration of CHL vs. XCAL"`
    Hebb    float32 `def:"0.001" min:"0" max:"1" desc:"amount of hebbian learning (should be relatively small, can be effective at .0001)"`
    Err     float32 `def:"0.999" min:"0" max:"1" inactive:"+" desc:"amount of error driven learning, automatically computed to be 1-Hebb"`
    MinusQ1 bool    `desc:"if true, use ActQ1 as the minus phase -- otherwise ActM"`
    SAvgCor float32 `def:"0.4:0.8" min:"0" max:"1" desc:"proportion of correction to apply to sending average activation for hebbian learning component (0=none, 1=all, .5=half, etc)"`
    SAvgThr float32 `def:"0.001" min:"0" desc:"threshold of sending average activation below which learning does not occur (prevents learning when there is no input)"`
}
// Defaults sets default CHL parameter values.
func (ch *CHLParams) Defaults() {
    ch.On = true
    ch.Hebb = 0.001
    ch.SAvgCor = 0.4
    ch.SAvgThr = 0.001
    ch.Update()
}

// Update updates derived values: Err is automatically computed as 1 - Hebb.
func (ch *CHLParams) Update() {
    ch.Err = 1 - ch.Hebb
}
// MinusAct returns the minus-phase activation to use based on settings (ActM vs. ActQ1)
func (ch *CHLParams) MinusAct(actM, actQ1 float32) float32 {
    if ch.MinusQ1 {
        return actQ1
    }
    return actM
}

// HebbDWt computes the hebbian DWt value from sending, recv acts, savgCor, and linear Wt
func (ch *CHLParams) HebbDWt(sact, ract, savgCor, linWt float32) float32 {
    return ract * (sact*(savgCor-linWt) - (1-sact)*linWt)
}

// ErrDWt computes the error-driven DWt value from sending,
// recv acts in both phases, and linear Wt, which is used
// for soft weight bounding (always applied here, separate from hebbian
// which has its own soft weight bounding dynamic).
func (ch *CHLParams) ErrDWt(sactP, sactM, ractP, ractM, linWt float32) float32 {
    err := (ractP * sactP) - (ractM * sactM)
    if err > 0 {
        err *= (1 - linWt)
    } else {
        err *= linWt
    }
    return err
}

// DWt computes the overall dwt from hebbian and error terms
func (ch *CHLParams) DWt(hebb, err float32) float32 {
    return ch.Hebb*hebb + ch.Err*err
}
////////////////////////////////////////////////////////////////////
//  CHLPrjn

// hip.CHLPrjn is a Contrastive Hebbian Learning (CHL) projection,
// based on basic rate-coded leabra.Prjn, that implements a
// pure CHL learning rule, which works better in the hippocampus.
type CHLPrjn struct {
    leabra.Prjn           // access as .Prjn
    CHL         CHLParams `view:"inline" desc:"parameters for CHL learning -- if CHL is On then WtSig.SoftBound is automatically turned off -- incompatible"`
}
// Defaults sets default parameters for the projection and its CHL params.
func (pj *CHLPrjn) Defaults() {
    pj.Prjn.Defaults()
    pj.CHL.Defaults()
    pj.Prjn.Learn.Norm.On = false     // off by default
    pj.Prjn.Learn.Momentum.On = false // off by default
    pj.Prjn.Learn.WtBal.On = false    // todo: experiment
}

// UpdateParams updates derived parameters -- if CHL is On, WtSig.SoftBound
// is turned off, as it is incompatible with CHL learning.
func (pj *CHLPrjn) UpdateParams() {
    pj.CHL.Update()
    if pj.CHL.On {
        pj.Prjn.Learn.WtSig.SoftBound = false
    }
    pj.Prjn.UpdateParams()
}
//////////////////////////////////////////////////////////////////////////////////////
//  Learn methods

// DWt computes the weight change (learning) -- on sending projections
// CHL version supported if On
func (pj *CHLPrjn) DWt() {
    if !pj.Learn.Learn {
        return
    }
    if pj.CHL.On {
        pj.DWtCHL()
    } else {
        pj.Prjn.DWt()
    }
}
// SlpDWt computes the sleep-phase weight change (DS Added).
// It requires CHL learning to be On; otherwise it only reports an error.
func (pj *CHLPrjn) SlpDWt() {
    if !pj.Learn.Learn {
        return
    }
    if pj.CHL.On {
        pj.SlpDWtCHL()
    } else {
        fmt.Println("error: CHL learning is not On for this projection -- sleep DWt will not be applied")
    }
}
// SAvgCor computes the sending average activation, corrected according to the SAvgCor
// correction factor (typically makes layer appear more sparse than it is)
func (pj *CHLPrjn) SAvgCor(slay *leabra.Layer) float32 {
    savg := .5 + pj.CHL.SAvgCor*(slay.Pools[0].ActAvg.ActPAvgEff-0.5)
    savg = math32.Max(pj.CHL.SAvgThr, savg) // keep this computed value within bounds
    return 0.5 / savg
}
// DS Added
// SlpDWtCHL computes sleep error driven learning using avg plus phase and minus phase activations
func (pj *CHLPrjn) SlpDWtCHL() {
    slay := pj.Send.(leabra.LeabraLayer).AsLeabra()
    //rlay := pj.Recv.(leabra.LeabraLayer).AsLeabra()
    //if slay.Pools[0].ActP.Avg < pj.CHL.SAvgThr { // inactive, no learn
    //	return
    //}
    for si := range slay.Neurons {
        //sn := &slay.Neurons[si]
        nc := int(pj.SConN[si])
        st := int(pj.SConIdxSt[si])
        syns := pj.Syns[st : st+nc]
        //scons := pj.SConIdx[st : st+nc]
        //snActM := pj.CHL.MinusAct(sn.ActM, sn.ActQ1)
        //savgCor := pj.SAvgCor(slay)
        for ci := range syns {
            sy := &syns[ci]
            //ri := scons[ci]
            //rn := &rlay.Neurons[ri]
            err := sy.ActPAvg - sy.ActMAvg
            sy.ActMAvg = 0
            sy.ActPAvg = 0
            if err > 0 {
                err *= (1 - sy.LWt)
            } else {
                err *= sy.LWt
            }
            dwt := err
            norm := float32(1)
            if pj.Learn.Norm.On {
                norm = pj.Learn.Norm.NormFmAbsDWt(&sy.Norm, math32.Abs(dwt))
            }
            if pj.Learn.Momentum.On {
                dwt = norm * pj.Learn.Momentum.MomentFmDWt(&sy.Moment, dwt)
            } else {
                dwt *= norm
            }
            sy.DWt += pj.Learn.Lrate * dwt
        }
        // aggregate max DWtNorm over sending synapses
        if pj.Learn.Norm.On {
            maxNorm := float32(0)
            for ci := range syns {
                sy := &syns[ci]
                if sy.Norm > maxNorm {
                    maxNorm = sy.Norm
                }
            }
            for ci := range syns {
                sy := &syns[ci]
                sy.Norm = maxNorm
            }
        }
    }
}
// DWtCHL computes the weight change (learning) for CHL
func (pj *CHLPrjn) DWtCHL() {
    slay := pj.Send.(leabra.LeabraLayer).AsLeabra()
    rlay := pj.Recv.(leabra.LeabraLayer).AsLeabra()
    if slay.Pools[0].ActP.Avg < pj.CHL.SAvgThr { // inactive, no learn
        return
    }
    for si := range slay.Neurons {
        sn := &slay.Neurons[si]
        nc := int(pj.SConN[si])
        st := int(pj.SConIdxSt[si])
        syns := pj.Syns[st : st+nc]
        scons := pj.SConIdx[st : st+nc]
        snActM := pj.CHL.MinusAct(sn.ActM, sn.ActQ1)
        savgCor := pj.SAvgCor(slay)
        for ci := range syns {
            sy := &syns[ci]
            ri := scons[ci]
            rn := &rlay.Neurons[ri]
            rnActM := pj.CHL.MinusAct(rn.ActM, rn.ActQ1)
            hebb := pj.CHL.HebbDWt(sn.ActP, rn.ActP, savgCor, sy.LWt)
            err := pj.CHL.ErrDWt(sn.ActP, snActM, rn.ActP, rnActM, sy.LWt)
            dwt := pj.CHL.DWt(hebb, err)
            norm := float32(1)
            if pj.Learn.Norm.On {
                norm = pj.Learn.Norm.NormFmAbsDWt(&sy.Norm, math32.Abs(dwt))
            }
            if pj.Learn.Momentum.On {
                dwt = norm * pj.Learn.Momentum.MomentFmDWt(&sy.Moment, dwt)
            } else {
                dwt *= norm
            }
            sy.DWt += pj.Learn.Lrate * dwt
        }
        // aggregate max DWtNorm over sending synapses
        if pj.Learn.Norm.On {
            maxNorm := float32(0)
            for ci := range syns {
                sy := &syns[ci]
                if sy.Norm > maxNorm {
                    maxNorm = sy.Norm
                }
            }
            for ci := range syns {
                sy := &syns[ci]
                sy.Norm = maxNorm
            }
        }
    }
}
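
// Usage sketch (added for illustration; assumes the standard emergent/leabra
// network API also applies to this fork -- ConnectLayersPrjn, prjn.NewFull,
// and emer.Forward are not defined in this file):
//
//   pj := net.ConnectLayersPrjn(ecin, ca1, prjn.NewFull(), emer.Forward, &hip.CHLPrjn{})
//   pj.SetClass("HippoCHL")
//
// The network's normal DWt pass then dispatches to CHLPrjn.DWt above, which
// uses DWtCHL when CHL.On is true; SlpDWt/SlpDWtCHL are the sleep-phase
// counterparts added in this fork.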