isabelle: comparison src/HOL/Tools/Sledgehammer/MaSh/src/sparseNaiveBayes.py

equal deleted inserted replaced

-:9df2f825422b
+:b958a94cf811
 #     Title:      HOL/Tools/Sledgehammer/MaSh/src/sparseNaiveBayes.py
 #     Author:     Daniel Kuehlwein, ICIS, Radboud University Nijmegen
 #     Copyright   2012
 #
-# An updatable naive Bayes classifier.
+# An updatable sparse naive Bayes classifier.
 '''
 Created on Jul 11, 2012
 @author: Daniel Kuehlwein
 self.counts[d] = [dPosCount,dFeatureCounts]
 for key in dicts.dependenciesDict.keys():
 # Add p proves p: every fact also counts as a dependency of itself
 keyDeps = [key]+dicts.dependenciesDict[key]
 for dep in keyDeps:
 self.counts[dep][0] += 1
 depFeatures = dicts.featureDict[key]
 for f,_w in depFeatures:
 if self.counts[dep][1].has_key(f):
 def predict(self,features,accessibles):
 """
 For each accessible, computes a log-scale score estimating how useful it is given the features.
 Returns a ranking of the accessibles.
 """
+posWeight = 20.0
+defVal = 15
 predictions = []
 for a in accessibles:
 posA = self.counts[a][0]
 fA = set(self.counts[a][1].keys())
 fWeightsA = self.counts[a][1]
 resultA = log(posA)
 for f,w in features:
+# DEBUG
+#w = 1
 if f in fA:
 if fWeightsA[f] == 0:
-resultA -= w*15
+resultA -= w*defVal
 else:
 assert fWeightsA[f] <= posA
-resultA += w*log(float(fWeightsA[f])/posA)
+resultA += w*log(float(posWeight*fWeightsA[f])/posA)
 else:
-resultA -= w*15
+resultA -= w*defVal
 predictions.append(resultA)
 #expPredictions = array([exp(x) for x in predictions])
 predictions = array(predictions)
 perm = (-predictions).argsort()
 #return array(accessibles)[perm],expPredictions[perm]

changeset 50619	b958a94cf811
parent 50482	d7be7ccf428b
child 50827	aba769dc82e9