Files
rdkit/Python/ML/Data/UnitTestQuantize.py
Greg Landrum 75a79b6327 initial import
2006-05-06 22:20:08 +00:00

255 lines
7.0 KiB
Python
Executable File

#
# Copyright (C) 2001 greg Landrum
#
""" unit testing code for variable quantization
"""
import unittest
import RDConfig
from ML.Data import Quantize
class TestCase(unittest.TestCase):
def setUp(self):
#print '\n%s: '%self.shortDescription(),
pass
def testOneSplit1(self):
""" simple case (clear division)
"""
d = [(1.,0),
(1.1,0),
(1.2,0),
(1.4,0),
(1.4,0),
(1.6,0),
(2.,1),
(2.1,1),
(2.2,1),
(2.3,1)]
varValues = map(lambda x:x[0],d)
resCodes = map(lambda x:x[1],d)
nPossibleRes = 2
res = Quantize.FindVarQuantBound(varValues,resCodes,nPossibleRes)
target = (1.8,0.97095)
assert map(lambda x,y:Quantize.feq(x,y,1e-4),res,target)==[1,1],\
'result comparison failed: %s != %s'%(res,target)
def testOneSplit2(self):
""" some noise
"""
d = [(1.,0),
(1.1,0),
(1.2,0),
(1.4,0),
(1.4,1),
(1.6,0),
(2.,1),
(2.1,1),
(2.2,1),
(2.3,1)]
varValues = map(lambda x:x[0],d)
resCodes = map(lambda x:x[1],d)
nPossibleRes = 2
res = Quantize.FindVarQuantBound(varValues,resCodes,nPossibleRes)
target = (1.8,0.60999)
assert map(lambda x,y:Quantize.feq(x,y,1e-4),res,target)==[1,1],\
'result comparison failed: %s != %s'%(res,target)
def testOneSplit3(self):
""" optimal division not possibe
"""
d = [(1.,0),
(1.1,0),
(1.2,0),
(1.4,2),
(1.4,2),
(1.6,2),
(2.,2),
(2.1,1),
(2.2,1),
(2.3,1)]
varValues = map(lambda x:x[0],d)
resCodes = map(lambda x:x[1],d)
nPossibleRes = 3
res = Quantize.FindVarQuantBound(varValues,resCodes,nPossibleRes)
target = (1.3,0.88129)
assert map(lambda x,y:Quantize.feq(x,y,1e-4),res,target)==[1,1],\
'result comparison failed: %s != %s'%(res,target)
def testOneSplit4(self):
""" lots of duplicates
"""
d = [(1.,0),
(1.1,0),
(1.2,0),
(1.2,1),
(1.4,0),
(1.4,0),
(1.6,0),
(2.,1),
(2.1,1),
(2.1,1),
(2.1,1),
(2.1,1),
(2.2,1),
(2.3,1)]
varValues = map(lambda x:x[0],d)
resCodes = map(lambda x:x[1],d)
nPossibleRes = 2
res = Quantize.FindVarQuantBound(varValues,resCodes,nPossibleRes)
target = (1.8,0.68939)
assert map(lambda x,y:Quantize.feq(x,y,1e-4),res,target)==[1,1],\
'result comparison failed: %s != %s'%(res,target)
def testOneSplit5(self):
""" same as testOneSplit1 data, but out of order
"""
d = [(1.,0),
(1.1,0),
(2.2,1),
(1.2,0),
(1.6,0),
(1.4,0),
(2.,1),
(2.1,1),
(1.4,0),
(2.3,1)]
varValues = map(lambda x:x[0],d)
resCodes = map(lambda x:x[1],d)
nPossibleRes = 2
res = Quantize.FindVarQuantBound(varValues,resCodes,nPossibleRes)
target = (1.8,0.97095)
assert map(lambda x,y:Quantize.feq(x,y,1e-4),res,target)==[1,1],\
'result comparison failed: %s != %s'%(res,target)
def testMultSplit1(self):
""" simple dual split
"""
d = [(1.,0),
(1.1,0),
(1.2,0),
(1.4,2),
(1.4,2),
(1.6,2),
(2.,2),
(2.1,1),
(2.1,1),
(2.1,1),
(2.2,1),
(2.3,1)]
varValues = map(lambda x:x[0],d)
resCodes = map(lambda x:x[1],d)
nPossibleRes =3
res = Quantize.FindVarMultQuantBounds(varValues,2,resCodes,nPossibleRes)
target = ([1.3, 2.05],1.55458)
assert min(map(lambda x,y:Quantize.feq(x,y,1e-4),res[0],target[0]))==1,\
'split bound comparison failed: %s != %s'%(res[0],target[0])
assert Quantize.feq(res[1],target[1],1e-4),\
'InfoGain comparison failed: %s != %s'%(res[1],target[1])
def testMultSplit2(self):
""" same test as testMultSplit1, but out of order
"""
d = [(1.,0),
(2.1,1),
(1.1,0),
(1.2,0),
(1.4,2),
(1.6,2),
(2.,2),
(1.4,2),
(2.1,1),
(2.2,1),
(2.1,1),
(2.3,1)]
varValues = map(lambda x:x[0],d)
resCodes = map(lambda x:x[1],d)
nPossibleRes =3
res = Quantize.FindVarMultQuantBounds(varValues,2,resCodes,nPossibleRes)
target = ([1.3, 2.05],1.55458)
assert Quantize.feq(res[1],target[1],1e-4),\
'InfoGain comparison failed: %s != %s'%(res[1],target[1])
assert min(map(lambda x,y:Quantize.feq(x,y,1e-4),res[0],target[0]))==1,\
'split bound comparison failed: %s != %s'%(res[0],target[0])
def testMultSplit3(self):
""" 4 possible results
"""
d = [(1.,0),
(1.1,0),
(1.2,0),
(1.4,2),
(1.4,2),
(1.6,2),
(2.,2),
(2.1,1),
(2.1,1),
(2.1,1),
(2.2,1),
(2.3,1),
(3.0,3),
(3.1,3),
(3.2,3),
(3.3,3)]
varValues = map(lambda x:x[0],d)
resCodes = map(lambda x:x[1],d)
nPossibleRes =4
res = Quantize.FindVarMultQuantBounds(varValues,3,resCodes,nPossibleRes)
target = ([1.30, 2.05, 2.65],1.97722)
assert Quantize.feq(res[1],target[1],1e-4),\
'InfoGain comparison failed: %s != %s'%(res[1],target[1])
assert min(map(lambda x,y:Quantize.feq(x,y,1e-4),res[0],target[0]))==1,\
'split bound comparison failed: %s != %s'%(res[0],target[0])
def testMultSplit4(self):
""" dual valued, with an island
"""
d = [(1.,0),
(1.1,0),
(1.2,0),
(1.4,1),
(1.4,1),
(1.6,1),
(2.,1),
(2.1,0),
(2.1,0),
(2.1,0),
(2.2,0),
(2.3,0)]
varValues = map(lambda x:x[0],d)
resCodes = map(lambda x:x[1],d)
nPossibleRes = 2
res = Quantize.FindVarMultQuantBounds(varValues,2,resCodes,nPossibleRes)
target = ( [1.3, 2.05], .91830)
assert Quantize.feq(res[1],target[1],1e-4),\
'InfoGain comparison failed: %s != %s'%(res[1],target[1])
assert min(map(lambda x,y:Quantize.feq(x,y,1e-4),res[0],target[0]))==1,\
'split bound comparison failed: %s != %s'%(res[0],target[0])
def testMultSplit5(self):
""" dual valued, with an island, a bit noisy
"""
d = [(1.,0),
(1.1,0),
(1.2,0),
(1.4,1),
(1.4,0),
(1.6,1),
(2.,1),
(2.1,0),
(2.1,0),
(2.1,0),
(2.2,1),
(2.3,0)]
varValues = map(lambda x:x[0],d)
resCodes = map(lambda x:x[1],d)
nPossibleRes = 2
res = Quantize.FindVarMultQuantBounds(varValues,2,resCodes,nPossibleRes)
target = ([1.3, 2.05],.34707 )
assert Quantize.feq(res[1],target[1],1e-4),\
'InfoGain comparison failed: %s != %s'%(res[1],target[1])
assert min(map(lambda x,y:Quantize.feq(x,y,1e-4),res[0],target[0]))==1,\
'split bound comparison failed: %s != %s'%(res[0],target[0])
if __name__ == '__main__':
unittest.main()