Bayesian-Net-Toolbox/bayesianNet.py at master · davidhaohanli/Bayesian-Net-Toolbox · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
#TODO COMMENT ABOUT THE TOOLBOX

import itertools
import functools
import copy
import numpy as np
from abc import abstractmethod
from matplotlib import pyplot as plt

np.random.seed(1784)

#TODO COMMENT IN DETAILS

def plot(pointsA:list,exactFactorForStepShow):
    plt.figure(figsize=(20, 5))
    plt.plot(pointsA)
    plt.plot([exactFactorForStepShow.get_val((True,))]*len(pointsA), 'r--')
    plt.xlabel('Sample Size')
    plt.ylabel('Probability for True')
    plt.legend(['Gibbs Sampling', 'Variable Elimination'])
    plt.show()

def printVal(cpd):
    print('Variables: {}\n Probability Distribution:\n{}\n'.format(cpd.scope, \
                                                                   cpd.get_all_val()))

def cleanser(theClass=tuple,posOfParam=2):
	def wrapper(func):
		def decFunc(*args,**kw):
			args=list(args)
			thisType = type(args[posOfParam-1])
			if thisType is not theClass:
				if thisType is str:
					args[posOfParam-1] = theClass([args[posOfParam-1],])
					return func(*args,**kw)
				try:
					thisType.__iter__
					args[posOfParam-1] = theClass(args[posOfParam-1])
				except:
					args[posOfParam-1] = theClass([args[posOfParam-1],])
			return func(*args,**kw)
		return decFunc
	return wrapper

class Factor(object):
    '''

    self.valDistribution is the factor value distribution on the random variable assignemnt grid
    in form as:
    {(True,True,True):0.1,(True,True,False):0.9,(True,False,True):None,...,(False,False,False):1.6}
    * None for value pending to be determined

    '''

    def __init__(self,scope:tuple,varValsDict=None,defaultVal=None):
        '''
        :param scope:  tuple of chars
        :param valsDistribution:  dict of distribution of factor values on the random variable grid
        '''
        self.scope = scope
        self.var_assignment(defaultVal); # assign values to each random variables to generate a grid
        if varValsDict:
            self.add_all_vals(varValsDict)

    def var_assignment(self,defaultVal=None):
        '''
        repeat scope size times to get the binary grid
        '''
        self.valDistribution = dict()
        for thisVarVals in itertools.product((True,False),repeat=len(self.scope)):
            self.valDistribution[thisVarVals] = defaultVal

    def add_all_vals(self,varValsDict):
        '''
        :param varValsDict: dict of [tuples,float]    e.g. {(True,True):0.9}
        '''
        for thisVarVals,val in varValsDict.items():
            self.add_val(thisVarVals,val)

    @cleanser()
    def add_val(self,varVals,val):
        '''
        :param varVals: tuples,assignment to random variables
        :param val: value of the grid point
        '''
        self.valDistribution[varVals] = val

    def get_val(self,varVals):
        '''
        :param vars: tuples,assignment to query random variables
        :return: value of the grid point, None for unassigned yet
        '''
        return self.valDistribution[varVals]

    def get_all_val(self):
        '''
        :return: self.valDistribution
        '''
        return self.valDistribution

    def val_check(self):
        '''
        :return: points on the grid with value unassigned. if all assigned, return True
        '''
        res=[]
        for thisVarVals,val in self.valDistribution.items():
            if val is None:
                res.append(thisVarVals)
        if res:
            return res
        return True

    def normalize(self):
        if self.val_check() is True:
            normalizer = sum(self.valDistribution.values())
            for thisVarVals in self.valDistribution.keys():
                self.valDistribution[thisVarVals]/=normalizer
        else:
            print ('some values unassigned\n')

class BayesianModel(object):
    '''
    self.nodes is the nodes over the graphical network, a dict of {str : list of str}   e.g. {'a':['b','c'],'b':[],'c':[],'d':['c']}
    self.factors is the factors of variables, a list of factors
    '''

    def __init__(self,edges=None):
        '''
        :param edges: in for [('a','b'),('c')] where 'a' is predecessor of 'b'
        '''
        self.nodes = dict()
        self.factors = list()
        if edges:
            self.add_edges(edges)

    @cleanser(list)
    def add_edges(self,edges):
        for edge in edges:
            self.add_edge(edge)

    @cleanser(tuple)
    def add_edge(self,edge):
        self.add_nodes(edge)
        if len(edge) > 1:
            self.nodes[edge[0]].append(edge[1])

    @cleanser(list)
    def add_nodes(self,nodes):
        for node in nodes:
            if node not in self.nodes.keys():
                self.nodes[node] = []

    @cleanser(list)
    def add_factors(self,factors):
        self.factors.extend(factors)

    def add_cpd(self,node:str, mat:'2d list', evidences:list=None)->'convert to factor':

        scope=[node]
        if evidences:
            scope+=evidences
        else:
            self.factors.append(Factor(scope,{(True,):mat[0][0],(False,):mat[1][0]}))
            return
        newFactor = Factor(tuple(scope))

        for i,nodeVal in enumerate((True,False)):
            for j,evidenceVals in enumerate(itertools.product((True,False),repeat=len(evidences))):
                thisVarValDict = dict()
                thisVarValDict[node] = nodeVal
                for ind,var in enumerate(evidences):
                    thisVarValDict[var] = evidenceVals[ind]
                newFactor.add_val(tuple([thisVarValDict[var] for var in newFactor.scope]),mat[i][j])

        self.factors.append(newFactor)

class Inference(object):
    #TODO abstract the class
    #TODO collect the common methods

    def __init__(self,model):
        '''
        :param model: A Bayesian Model
        '''
        self.model = model

    @abstractmethod
    def query(self,queries,evidences):
        raise NotImplementedError()

    def topoSort(self,vars=None):
        '''
        :param vars: variables to be ordered according to topological orders
        :return:  ordered variables (reversed)
        '''
        if vars is None:
            vars = list(self.model.nodes.keys())

        color=dict()
        for node in self.model.nodes.keys():
            color[node]='white'
        time = 0
        res = []

        def dfs(node,time):
            color[node]='grey'
            time += 1
            for adj in self.model.nodes[node]:
                if color[adj] == 'white':
                    time = dfs(adj,time)
            color[node] = 'black'
            time+=1
            if node in vars:
                res.append(node)
            return time

        for node in self.model.nodes.keys():
            if color[node] == 'white':
                time = dfs(node,time)

        return res

class VE(Inference):

    @cleanser(list)
    def query(self,queries:list,evidences:dict=dict(),printTrigger:bool=True)->Factor:
        '''
        :param queries: list of joint conditional probabilities pending to query      e.g. ['a','b']
        :param evidences: dict of evidences       e.g. {'c':True,'d':False}
        :return: a factor with value distribution on query variables only (normalized)
        '''

        factors = copy.deepcopy(self.model.factors)

        blanket_factors = self.is_markov_blanket(queries, evidences,factors)

        if not blanket_factors:
            varsToBeEliminated = set(self.model.nodes.keys())-set(queries)-set(evidences.keys())

        else:
            varsToBeEliminated = []
            factors = blanket_factors

        for i in range(len(factors)):
            factors[i] = self.giveEvidence(factors[i], evidences)

        cpd_factor = self.sum_product(factors,varsToBeEliminated)
        cpd_factor.normalize()

        if printTrigger:
            printVal(cpd_factor)

        return cpd_factor

    def is_markov_blanket(self,queries,evidences,factors):

        blanket = []

        for factor in factors:
            if set(factor.scope).intersection(queries):
                if set(factor.scope) - set(queries) - set(evidences.keys()):
                    return False
                blanket.append(factor)
        return blanket

    def sum_product(self,factors,vars)->Factor:
        '''
        :param factors: all factors
        :param vars: variables to be eliminated
        :return:
        '''
        vars = self.topoSort(vars)
        while vars:
            var = vars.pop()
            factors = self.sum_product_var(factors,var)
        return self.facs_multi(factors)

    def sum_product_var(self,factors,var)->'list of Factors':
        '''
        :param factors: all factors
        :param var:  variable to be eliminated
        :return: set of all factors after VE of this variable
        '''
        involvedFactors = []
        otherFactors = []
        for factor in factors:
            if var in factor.scope:
                involvedFactors.append(factor)
            else:
                otherFactors.append(factor)
        newFactor = self.sum_ve(self.facs_multi(involvedFactors),var)
        return otherFactors+[newFactor]

    def facs_multi(self,factors,pre=None,isReduceVersion=False)->Factor:
        '''
        :param factors: list of Factors
        :param pre: a Factor
        :param isReduceVersion: use functools.reduce or my own implementation
        :return: new Factor
        '''
        if isReduceVersion:
            return functools.reduce(self.two_facs_multi,factors)

        # my own implementation: recursively compute 2 factor multiplication
        if not pre:
            pre = factors[0]
            factors = factors[1:]
        if factors:
            pre = self.two_facs_multi(factors[0],pre)
            res = self.facs_multi(factors[1:],pre)
            return res
        return pre

    def two_facs_multi(self,a,b)->Factor:
        '''
        :param a: a Factor
        :param b: a Factor
        :return: a new Factor
        '''
        newFactor = Factor(tuple(set(a.scope+b.scope))) #newFactor scope: scope of a + scope of b - common scope

        for thisVarVals in newFactor.val_check():

            # dict form : {'a':True,'b':False,'c':True}
            thisVarValsDict = dict()
            for i,var in enumerate(newFactor.scope):
                thisVarValsDict[var] = thisVarVals[i]

            a_val = a.get_val(tuple([thisVarValsDict[var] for var in a.scope]))
            #find the random variable assignment of a scope e.g. (b,a) from the dict, and then get value
            b_val = b.get_val(tuple([thisVarValsDict[var] for var in b.scope]))
            # find the random variable assignment of b scope e.g. (c,a) from the dict, and then get value
            newFactor.add_val(thisVarVals,a_val*b_val)

        return newFactor

    @cleanser(list,3)
    def sum_ve(self,factor,vars)->Factor:
        '''
        :param factor: factor containing variables
        :param vars: variables to be eliminated
        :return: new factor
        '''

        newFactor = Factor(tuple(set(factor.scope) - set(vars)))
        for thisVarVals in newFactor.val_check():

            # dict form : {'a':True}
            thisVarValsDict = dict()
            for i, var in enumerate(newFactor.scope):
                thisVarValsDict[var] = thisVarVals[i]

            val=0
            for eliminateVarVals in itertools.product((True, False), repeat=len(vars)):
                factorVarValsDict = dict()
                for i, var in enumerate(vars):
                    factorVarValsDict[var] = eliminateVarVals[i]
                factorVarValsDict.update(thisVarValsDict)

                val += factor.get_val(tuple([factorVarValsDict[var] for var in factor.scope]))

            newFactor.add_val(thisVarVals,val)

        return newFactor

    def giveEvidence(self,factor,evidences)->Factor:
        '''
        :param factor: factor containing evidence variables
        :param evidences: dict of evidences       e.g. {'c':True,'d':False}
        :return: new factor
        '''
        newFactor = Factor(tuple(set(factor.scope)-set(evidences.keys())))
        for thisVarVals in newFactor.val_check():

            # dict form : {'a':True}
            thisVarValsDict = dict()
            for i, var in enumerate(newFactor.scope):
                thisVarValsDict[var] = thisVarVals[i]
            # merge thisVarValsDict (in newFactor) and evidences
            thisVarValsDict.update(evidences)

            newFactor.add_val(thisVarVals,factor.get_val(tuple([thisVarValsDict[var] for var in factor.scope])))

        return newFactor

class GibbsSampler(Inference):

    def __init__(self,model,step = 1000, burnInCoefficient = 0.3, thinningGap = 5):
        super().__init__(model)
        self.hyperParamSet({'step':step,'burnInCoefficient':burnInCoefficient,'thinningGap':thinningGap})
        self.initStepCollector()

    def initStepCollector(self):
        self.stepVals=[]
        self.allSamples=[]

    def hyperParamSet(self,hyperParams = {'step':1000,'burnInCoefficient':0.3,'thinningGap':5}):
        '''
        :param step: sample size
        :param burnInCoefficient: proportion of starting samples to be dropped
        :param thinningGap: selection gap for i.i.d
        '''
        if hyperParams.get('step') is not None:
            self.step = hyperParams['step']

        if hyperParams.get('step') is not None:
            self.burnInNum = self.step * hyperParams['burnInCoefficient']

        if hyperParams.get('step') is not None:
            self.thinningGap = hyperParams['thinningGap']

    @cleanser(list)
    def query(self,queries:list,evidences:dict=dict(),\
              printTrigger:bool=True,collectTrigger:bool=False,exactFactorForStepShow:Factor=None)->Factor:
        '''
        :param queries: list of joint conditional probabilities pending to query      e.g. ['a','b']
        :param evidences: dict of evidences       e.g. {'c':True,'d':False}
        :return: a probability distribution, Factor
        '''
        varsToBeSampled = self.topoSort(set(self.model.nodes.keys()) - set(evidences.keys()))[::-1]

        cpd = self.gibbs(varsToBeSampled,queries,evidences,collectTrigger)

        if exactFactorForStepShow is not None:
            plot(self.stepVals,exactFactorForStepShow)

        if printTrigger:
            print(cpd)

        return cpd

    def gibbs(self,vars:list,queries:list,evidences:dict,collectTrigger:bool=False)->Factor:
        '''
        :param factors: all factors
        :param vars: sorted vars to be sampled
        :param steps: number of sample sets needed
        :return: desired cpd factor
        '''
        samplePool = self.initSamplePool(vars)

        newFactor = Factor(tuple(queries),defaultVal=0)

        if collectTrigger is not None:
            self.initStepCollector()
            tempFactor = Factor(tuple(queries),defaultVal=0)

        for t in range(self.step):

            thisVarValDict=dict()

            for var in vars:
                samplePool = self.sample(var,samplePool,evidences)
                if var in queries:
                    thisVarValDict[var] = samplePool[var]

            thisVarVals = tuple([thisVarValDict[var] for var in newFactor.scope])

            if collectTrigger is not None:
                tempFactor.add_val(thisVarVals,tempFactor.get_val(thisVarVals) + 1)
                self.stepCollect(tempFactor,thisVarVals)

            if t >= self.burnInNum and not t % self.thinningGap:
                newFactor.add_val(thisVarVals,newFactor.get_val(thisVarVals)+1)

        newFactor.normalize()

        return newFactor

    def initSamplePool(self,vars):
        samplePool=dict()
        for var in vars:
            particle = np.random.rand()
            if particle <= 0.5:
                newSampleVal = True
            else:
                newSampleVal = False
            samplePool[var] = newSampleVal
        return samplePool

    def sample(self,var:str,samplePool:dict,evidences:dict)->dict:
        '''
        :param samplePool: dict of samples
        :param factors: all factors from model
        :param var: variable to be sampled
        :return: the updated dictionary of samples
        '''
        samplePool.pop(var,None)

        fullEvidence = {**samplePool,**evidences}

        cpd = VE(self.model).query([var],fullEvidence,False)

        particle = np.random.rand()

        if particle <= cpd.get_val((True,)):
            newSampleVal = True
        else:
            newSampleVal = False

        samplePool[var] = newSampleVal

        return samplePool

    def stepCollect(self,theFactor:Factor,thisVarVals):

        theFactor = copy.deepcopy(theFactor)

        theFactor.normalize()

        self.stepVals.append(theFactor.get_val((True,)))

        self.allSamples.append(thisVarVals)

    def get_steps(self):
        '''
        :return: all steps values
        '''
        return self.stepVals,self.allSamples

class GridSearchTuner(object):

    def __init__(self,model:GibbsSampler,**hyperParamCandidates):
        '''
        :param model: of which hyper-parameters pending to be tuned
        :param hyperParams: the candidates of hyper-parameters, concatenated in a dictionary   e.g.{}
        '''
        self.bestModel = model
        self.hyperParamCandidates = hyperParamCandidates

    def tune(self,queries:list,targets:Factor,evidences:dict=dict(),printTrigger=True,plotTrigger=False,asymptoteError=1e-5):
        '''
        :param queries: same as model.query
        :param evidences: same as model.query
        :param targets: real values for query variable probability distribution, Factor
        :return: best model
        '''

        _ = self.bestModel.query(queries,evidences,printTrigger=False,collectTrigger=True)
        stepVals,stepSamples = self.bestModel.get_steps()

        # exhaustive search for every possible combination of hyper-parameter values, recursive
        def search(hyperParamKeys:list,hyperParamVals:dict,bestHyperParamValsAndError:list)->list:

            if not hyperParamKeys:
                cpdFactor = self.tuneCPD(queries,stepSamples,hyperParamVals)
                error = abs(cpdFactor.get_val((True,))-targets.get_val((True,)))
                if error <= bestHyperParamValsAndError[1]:
                    bestHyperParamValsAndError = [hyperParamVals,error]
                    if plotTrigger:
                        self.bestCPD = cpdFactor
                return bestHyperParamValsAndError

            hyperParamKey = hyperParamKeys[0]

            for thisKeyVal in self.hyperParamCandidates[hyperParamKey]:
                bestHyperParamValsAndError = search(hyperParamKeys[1:],{**hyperParamVals,hyperParamKey:thisKeyVal},\
                                                    bestHyperParamValsAndError)
            return bestHyperParamValsAndError

        self.bestHyperParam, self.bestScore = search(list(self.hyperParamCandidates.keys()), dict(), [dict(),float('inf')])

        if printTrigger:
            print('''
The optimal hyper-parameters are:
{}, which indicates the first {} samples to be dropped, and count only every {} samples.
The corresponding error is:
{}
            '''.format(self.bestHyperParam,int(self.bestHyperParam['burnInCoefficient']*self.bestModel.step),\
                       self.bestHyperParam['thinningGap'],self.bestScore))

        if plotTrigger:
            plot(stepVals, targets)
            printVal(self.bestCPD)

        self.bestModel.hyperParamSet(self.bestHyperParam)

        return self.bestModel

    def tuneCPD(self,queries:list,stepSamples:list,hyperParamVals:dict):

        tunedCPD = Factor(tuple(queries),defaultVal=0)

        burnInNum = hyperParamVals['burnInCoefficient']*len(stepSamples)

        for sample in stepSamples[int(burnInNum)::hyperParamVals['thinningGap']]:
            tunedCPD.add_val(sample,tunedCPD.get_val(sample)+1)

        tunedCPD.normalize()

        return tunedCPD

def main_test():
    #TODO IMPLEMENT A GENERAL TEST FUNC
    pass

if __name__ == '__main__':
    main_test()