mirror of
https://github.com/rdkit/rdkit.git
synced 2026-06-05 22:04:27 +08:00
* extend the allowed valences of the alkali earths make it possible to have preferred and arbitrary valence states (I thought this already worked) * backup * maybe needed * copy in some swig3 files; at this point the tests all work * remove SWIG version lock * changes in response to review
287 lines
10 KiB
Java
287 lines
10 KiB
Java
/*
|
|
* $Id: AtomPairsTests.java 4395 2011-01-28 16:54:48Z landrgr1 $
|
|
*
|
|
* Copyright (c) 2010, Novartis Institutes for BioMedical Research Inc.
|
|
* All rights reserved.
|
|
*
|
|
* Redistribution and use in source and binary forms, with or without
|
|
* modification, are permitted provided that the following conditions are
|
|
* met:
|
|
*
|
|
* * Redistributions of source code must retain the above copyright
|
|
* notice, this list of conditions and the following disclaimer.
|
|
* * Redistributions in binary form must reproduce the above
|
|
* copyright notice, this list of conditions and the following
|
|
* disclaimer in the documentation and/or other materials provided
|
|
* with the distribution.
|
|
* * Neither the name of Novartis Institutes for BioMedical Research Inc.
|
|
* nor the names of its contributors may be used to endorse or promote
|
|
* products derived from this software without specific prior written permission.
|
|
*
|
|
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
|
* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
|
* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
|
|
* A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
|
|
* OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
|
|
* SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
|
|
* LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
|
|
* DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
|
|
* THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
|
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
|
|
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
*/
|
|
package org.RDKit;
|
|
|
|
import static org.junit.Assert.*;
|
|
|
|
import java.io.File;
|
|
|
|
import org.junit.*;
|
|
|
|
public class AtomPairsTests extends GraphMolTest {
|
|
|
|
@Test
|
|
public void testAtomCodes_1() {
|
|
ROMol mol = RWMol.MolFromSmiles("C=C");
|
|
Atom atom0 = mol.getAtomWithIdx(0);
|
|
Atom atom1 = mol.getAtomWithIdx(1);
|
|
assertNotNull(atom0);
|
|
assertNotNull(atom1);
|
|
assertEquals(RDKFuncs.getAtomCode(atom0), RDKFuncs.getAtomCode(atom1));
|
|
|
|
long tgt = 1 | (1 | 1 << RDKFuncs.getNumPiBits()) << RDKFuncs.getNumBranchBits();
|
|
assertEquals(tgt, RDKFuncs.getAtomCode(atom0));
|
|
tgt = 1 << RDKFuncs.getNumBranchBits() | 1 << (RDKFuncs.getNumBranchBits() + RDKFuncs.getNumPiBits());
|
|
assertEquals(tgt, RDKFuncs.getAtomCode(atom0, 1));
|
|
}
|
|
|
|
@Test
|
|
public void testAtomCodes_2() {
|
|
ROMol mol = RWMol.MolFromSmiles("C#CO");
|
|
long tgt = 1 | 2 << RDKFuncs.getNumBranchBits() | 1 << (RDKFuncs.getNumBranchBits() + RDKFuncs.getNumPiBits());
|
|
assertEquals(tgt, RDKFuncs.getAtomCode(mol.getAtomWithIdx(0)));
|
|
tgt = 2 | 2 << RDKFuncs.getNumBranchBits() | 1 << (RDKFuncs.getNumBranchBits() + RDKFuncs.getNumPiBits());
|
|
assertEquals(tgt, RDKFuncs.getAtomCode(mol.getAtomWithIdx(1)));
|
|
tgt = 1 | 0 << RDKFuncs.getNumBranchBits() | 3 << (RDKFuncs.getNumBranchBits() + RDKFuncs.getNumPiBits());
|
|
assertEquals(tgt, RDKFuncs.getAtomCode(mol.getAtomWithIdx(2)));
|
|
}
|
|
|
|
@Test
|
|
public void testAtomCodes_3() {
|
|
ROMol mol = RWMol.MolFromSmiles("CC(O)C(O)(O)C");
|
|
long tgt = 1 | 0 << RDKFuncs.getNumBranchBits() | 1 << (RDKFuncs.getNumBranchBits() + RDKFuncs.getNumPiBits());
|
|
assertEquals(tgt, RDKFuncs.getAtomCode(mol.getAtomWithIdx(1), 2));
|
|
tgt = 2 | 0 << RDKFuncs.getNumBranchBits() | 1 << (RDKFuncs.getNumBranchBits() + RDKFuncs.getNumPiBits());
|
|
assertEquals(tgt, RDKFuncs.getAtomCode(mol.getAtomWithIdx(3), 2));
|
|
|
|
}
|
|
|
|
@Test
|
|
public void testAtomCodes_4() {
|
|
ROMol mol = RWMol.MolFromSmiles("C=CC(=O)O");
|
|
long tgt = 0 | 0 << RDKFuncs.getNumBranchBits() | 3 << (RDKFuncs.getNumBranchBits() + RDKFuncs.getNumPiBits());
|
|
assertEquals(tgt, RDKFuncs.getAtomCode(mol.getAtomWithIdx(4), 1));
|
|
tgt = 3 | 1 << RDKFuncs.getNumBranchBits() | 1 << (RDKFuncs.getNumBranchBits() + RDKFuncs.getNumPiBits());
|
|
assertEquals(tgt, RDKFuncs.getAtomCode(mol.getAtomWithIdx(2)));
|
|
}
|
|
|
|
@Test
|
|
public void testAtomPairs() {
|
|
ROMol mol = RWMol.MolFromSmiles("CCCCC");
|
|
SparseIntVect32 fp;
|
|
long tgt, c1, c2, c3;
|
|
|
|
c1 = RDKFuncs.getAtomCode(mol.getAtomWithIdx(0));
|
|
c2 = RDKFuncs.getAtomCode(mol.getAtomWithIdx(1));
|
|
c3 = RDKFuncs.getAtomCode(mol.getAtomWithIdx(2));
|
|
tgt = 1 | (Math.min(c1, c2) | Math.max(c1, c2) << RDKFuncs.getCodeSize()) << RDKFuncs.getNumPathBits();
|
|
assertEquals(tgt, RDKFuncs.getAtomPairCode(c1, c2, 1));
|
|
assertEquals(tgt, RDKFuncs.getAtomPairCode(c2, c1, 1));
|
|
tgt = 2 | (Math.min(c1, c3) | Math.max(c1, c3) << RDKFuncs.getCodeSize()) << RDKFuncs.getNumPathBits();
|
|
assertEquals(tgt, RDKFuncs.getAtomPairCode(c1, c3, 2));
|
|
assertEquals(tgt, RDKFuncs.getAtomPairCode(c3, c1, 2));
|
|
|
|
mol = RWMol.MolFromSmiles("CCC");
|
|
fp = RDKFuncs.getAtomPairFingerprint(mol);
|
|
assertEquals(3, fp.getTotalVal());
|
|
assertEquals(2, fp.getNonzero().size());
|
|
|
|
c1 = RDKFuncs.getAtomCode(mol.getAtomWithIdx(0));
|
|
c2 = RDKFuncs.getAtomCode(mol.getAtomWithIdx(1));
|
|
c3 = RDKFuncs.getAtomCode(mol.getAtomWithIdx(2));
|
|
assertEquals(2, fp.getVal((int) RDKFuncs.getAtomPairCode(c1, c2, 1)));
|
|
assertEquals(1, fp.getVal((int) RDKFuncs.getAtomPairCode(c1, c3, 2)));
|
|
|
|
mol = RWMol.MolFromSmiles("CC=O.Cl");
|
|
fp = RDKFuncs.getAtomPairFingerprint(mol);
|
|
assertEquals(3, fp.getTotalVal());
|
|
assertEquals(3, fp.getNonzero().size());
|
|
|
|
c1 = RDKFuncs.getAtomCode(mol.getAtomWithIdx(0));
|
|
c2 = RDKFuncs.getAtomCode(mol.getAtomWithIdx(1));
|
|
c3 = RDKFuncs.getAtomCode(mol.getAtomWithIdx(2));
|
|
assertEquals(1, fp.getVal((int) RDKFuncs.getAtomPairCode(c1, c2, 1)));
|
|
assertEquals(1, fp.getVal((int) RDKFuncs.getAtomPairCode(c1, c2, 1)));
|
|
assertEquals(1, fp.getVal((int) RDKFuncs.getAtomPairCode(c2, c3, 1)));
|
|
}
|
|
|
|
@Test
|
|
public void testAtomPairs2() {
|
|
ROMol mol;
|
|
SparseIntVect32 fp;
|
|
|
|
mol = RWMol.MolFromSmiles("CCC");
|
|
fp = RDKFuncs.getAtomPairFingerprint(mol, 1, 2);
|
|
assertEquals(3, fp.getTotalVal());
|
|
assertEquals(2, fp.getNonzero().size());
|
|
|
|
fp = RDKFuncs.getAtomPairFingerprint(mol, 2, 2);
|
|
assertEquals(1, fp.getTotalVal());
|
|
assertEquals(1, fp.getNonzero().size());
|
|
}
|
|
|
|
@Test
|
|
public void testHashedAtomPairs() {
|
|
ROMol mol = RWMol.MolFromSmiles("c1ccccc1");
|
|
SparseIntVect32 fp1, fp2;
|
|
fp1 = RDKFuncs.getHashedAtomPairFingerprint(mol);
|
|
fp2 = RDKFuncs.getHashedAtomPairFingerprint(mol);
|
|
assertEquals(1.0, RDKFuncs.DiceSimilarity(fp1, fp2), 0.0);
|
|
assertTrue( fp1.eq(fp2) );
|
|
|
|
mol = RWMol.MolFromSmiles("c1ccccn1");
|
|
fp2 = RDKFuncs.getHashedAtomPairFingerprint(mol);
|
|
assertEquals(0.0, RDKFuncs.DiceSimilarity(fp1, fp2), 1.0);
|
|
|
|
mol = RWMol.MolFromSmiles("c1ccccc1");
|
|
fp1 = RDKFuncs.getHashedAtomPairFingerprint(mol, 2048);
|
|
fp2 = RDKFuncs.getHashedAtomPairFingerprint(mol, 2048, 1, 3);
|
|
assertEquals(1.0, RDKFuncs.DiceSimilarity(fp1, fp2), 0.0);
|
|
assertTrue( fp1.eq(fp2) );
|
|
|
|
fp2 = RDKFuncs.getHashedAtomPairFingerprint(mol, 2048, 1, 2);
|
|
assertEquals(0.0, RDKFuncs.DiceSimilarity(fp1, fp2), 1.0);
|
|
}
|
|
|
|
@Test
|
|
public void testTorsions() {
|
|
ROMol mol = RWMol.MolFromSmiles("CCCC");
|
|
SparseIntVect64 fp;
|
|
double tgt;
|
|
long c1, c2, c3, c4;
|
|
UInt_Vect codes = new UInt_Vect();
|
|
|
|
mol = RWMol.MolFromSmiles("CCCC");
|
|
c1 = RDKFuncs.getAtomCode(mol.getAtomWithIdx(0)) - 1;
|
|
c2 = RDKFuncs.getAtomCode(mol.getAtomWithIdx(1)) - 2;
|
|
c3 = RDKFuncs.getAtomCode(mol.getAtomWithIdx(2)) - 2;
|
|
c4 = RDKFuncs.getAtomCode(mol.getAtomWithIdx(3)) - 1;
|
|
tgt = c1 | (c2 | (c3 | c4 << RDKFuncs.getCodeSize()) << RDKFuncs.getCodeSize()) << RDKFuncs.getCodeSize();
|
|
|
|
codes.clear();
|
|
codes.add(c1);
|
|
codes.add(c2);
|
|
codes.add(c3);
|
|
codes.add(c4);
|
|
assertEquals(tgt, RDKFuncs.getTopologicalTorsionCode(codes).doubleValue(), 0.0);
|
|
|
|
fp = RDKFuncs.getTopologicalTorsionFingerprint(mol);
|
|
assertEquals(1, fp.getTotalVal());
|
|
assertEquals(1, fp.getNonzero().size());
|
|
|
|
mol = RWMol.MolFromSmiles("CCCCO.Cl");
|
|
fp = RDKFuncs.getTopologicalTorsionFingerprint(mol);
|
|
assertEquals(2, fp.getTotalVal());
|
|
assertEquals(2, fp.getNonzero().size());
|
|
|
|
fp = RDKFuncs.getTopologicalTorsionFingerprint(mol, 3);
|
|
assertEquals(3, fp.getTotalVal());
|
|
assertEquals(3, fp.getNonzero().size());
|
|
}
|
|
|
|
@Test
|
|
public void testHashedTorsions() {
|
|
ROMol mol = RWMol.MolFromSmiles("c1ccccc1");
|
|
SparseIntVect64 fp1, fp2;
|
|
fp1 = RDKFuncs.getHashedTopologicalTorsionFingerprint(mol);
|
|
fp2 = RDKFuncs.getHashedTopologicalTorsionFingerprint(mol);
|
|
assertEquals(1.0, RDKFuncs.DiceSimilarity(fp1, fp2), 0.0);
|
|
assertTrue( fp1.eq(fp2) );
|
|
|
|
mol = RWMol.MolFromSmiles("c1ccccn1");
|
|
fp2 = RDKFuncs.getHashedTopologicalTorsionFingerprint(mol);
|
|
assertEquals(0.0, RDKFuncs.DiceSimilarity(fp1, fp2), 1.0);
|
|
|
|
mol = RWMol.MolFromSmiles("c1ccccc1");
|
|
fp1 = RDKFuncs.getHashedTopologicalTorsionFingerprint(mol, 2048, 6);
|
|
fp2 = RDKFuncs.getHashedTopologicalTorsionFingerprint(mol, 2048, 6);
|
|
assertEquals(1.0, RDKFuncs.DiceSimilarity(fp1, fp2), 0.0);
|
|
assertTrue( fp1.eq(fp2) );
|
|
|
|
mol = RWMol.MolFromSmiles("c1ccccn1");
|
|
fp2 = RDKFuncs.getHashedTopologicalTorsionFingerprint(mol, 2048, 6);
|
|
assertEquals(0.0, RDKFuncs.DiceSimilarity(fp1, fp2), 1.0);
|
|
}
|
|
|
|
@Test
|
|
public void testBulkTorsions() {
|
|
String fName = new File(getRdBase(), "/Projects/DbCLI/testData/pubchem.200.sdf").getPath();
|
|
SDMolSupplier suppl = new SDMolSupplier(fName);
|
|
while (!suppl.atEnd()) {
|
|
ROMol mol = suppl.next();
|
|
SparseIntVect64 fp;
|
|
fp = RDKFuncs.getTopologicalTorsionFingerprint(mol);
|
|
assertTrue(fp.getTotalVal() > 1);
|
|
}
|
|
}
|
|
|
|
@Test
|
|
public void testRootedAtomPairs() {
|
|
ROMol mol = RWMol.MolFromSmiles("OCCCCC");
|
|
SparseIntVect32 fp1, fp2;
|
|
UInt_Vect roots = new UInt_Vect();
|
|
|
|
fp1 = RDKFuncs.getAtomPairFingerprint(mol);
|
|
Match_Vect nz1 = fp1.getNonzero();
|
|
assertTrue(nz1.size() > 0);
|
|
|
|
roots.add(0L);
|
|
fp2 = RDKFuncs.getAtomPairFingerprint(mol, roots);
|
|
Match_Vect nz2 = fp2.getNonzero();
|
|
assertTrue(nz2.size() > 0);
|
|
assertTrue(nz2.size() < nz1.size());
|
|
|
|
for (int i = 0; i < nz2.size(); i++) {
|
|
Int_Pair pair = nz2.get(i);
|
|
assertEquals(pair.getSecond() , fp2.getVal(pair.getFirst()));
|
|
}
|
|
}
|
|
|
|
@Test
|
|
public void testRootedTorsions() {
|
|
SparseIntVect64 fp1, fp2;
|
|
|
|
ROMol mol = RWMol.MolFromSmiles("OCCCC");
|
|
UInt_Vect roots = new UInt_Vect();
|
|
roots.add(0L);
|
|
|
|
fp1 = RDKFuncs.getTopologicalTorsionFingerprint(mol);
|
|
Long_Pair_Vect nz1 = fp1.getNonzero();
|
|
assertTrue(nz1.size() > 0);
|
|
|
|
fp2 = RDKFuncs.getTopologicalTorsionFingerprint(mol, 4, roots);
|
|
Long_Pair_Vect nz2 = fp2.getNonzero();
|
|
assertTrue(nz2.size() > 0);
|
|
assertTrue(nz2.size() < nz1.size());
|
|
|
|
for (int i = 0; i < nz2.size(); ++i) {
|
|
Long_Pair pair = nz2.get(i);
|
|
assertTrue(pair.getSecond() <= fp2.getVal(pair.getFirst()));
|
|
}
|
|
}
|
|
|
|
public static void main(String args[]) {
|
|
org.junit.runner.JUnitCore.main(AtomPairsTests.class.getName());
|
|
}
|
|
}
|