Mercurial > repos > yufei-luo > s_mart
diff commons/core/coord/test/Test_MapUtils.py @ 6:769e306b7933
Change the repository level.
author | yufei-luo |
---|---|
date | Fri, 18 Jan 2013 04:54:14 -0500 |
parents | |
children |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/commons/core/coord/test/Test_MapUtils.py Fri Jan 18 04:54:14 2013 -0500 @@ -0,0 +1,384 @@ +# Copyright INRA (Institut National de la Recherche Agronomique) +# http://www.inra.fr +# http://urgi.versailles.inra.fr +# +# This software is governed by the CeCILL license under French law and +# abiding by the rules of distribution of free software. You can use, +# modify and/ or redistribute the software under the terms of the CeCILL +# license as circulated by CEA, CNRS and INRIA at the following URL +# "http://www.cecill.info". +# +# As a counterpart to the access to the source code and rights to copy, +# modify and redistribute granted by the license, users are provided only +# with a limited warranty and the software's author, the holder of the +# economic rights, and the successive licensors have only limited +# liability. +# +# In this respect, the user's attention is drawn to the risks associated +# with loading, using, modifying and/or developing or reproducing the +# software by the user in light of its specific status of free software, +# that may mean that it is complicated to manipulate, and that also +# therefore means that it is reserved for developers and experienced +# professionals having in-depth computer knowledge. Users are therefore +# encouraged to load and test the software's suitability as regards their +# requirements in conditions enabling the security of their systems and/or +# data to be ensured and, more generally, to use and operate it in the +# same conditions as regards security. +# +# The fact that you are presently reading this means that you have had +# knowledge of the CeCILL license and that you accept its terms. + + +import unittest +import os +import sys +from commons.core.coord.MapUtils import MapUtils +from commons.core.coord.Map import Map +from commons.core.coord.Set import Set +from commons.core.utils.FileUtils import FileUtils + + +class Test_MapUtils( unittest.TestCase ): + + def test_getMapListSortedByIncreasingMinThenMax( self ): + iMap1 = Map("name1", "chr1", 1, 350) + iMap2 = Map("name2", "chr1", 1, 100) + iMap3 = Map("name3", "chr1", 50, 350) + iMap4 = Map("name4", "chr1", 5, 450) + lMaps = [ iMap1, iMap2, iMap3, iMap4 ] + + expLMaps = [ iMap2, iMap1, iMap4, iMap3 ] + + obsLMaps = MapUtils.getMapListSortedByIncreasingMinThenMax( lMaps ) + + self.assertEquals( expLMaps, obsLMaps ) + + + def test_getMapListSortedByIncreasingMinThenMax_ordered( self ): + iMap1 = Map("name1", "chr1", 1, 100) + iMap2 = Map("name2", "chr1", 1, 350) + + lMaps = [ iMap1, iMap2 ] + expLMaps = [ iMap1, iMap2 ] + + obsLMaps = MapUtils.getMapListSortedByIncreasingMinThenMax( lMaps ) + + self.assertEquals( expLMaps, obsLMaps ) + + + def test_getMapListSortedByIncreasingMinThenMax_unordered( self ): + iMap1 = Map("name1", "chr1", 1, 350) + iMap2 = Map("name2", "chr1", 1, 100) + + lMaps = [ iMap1, iMap2 ] + expLMaps = [ iMap2, iMap1 ] + + obsLMaps = MapUtils.getMapListSortedByIncreasingMinThenMax( lMaps ) + + self.assertEquals( expLMaps, obsLMaps ) + + + def test_getMapListSortedByIncreasingMinThenMax_nonOverlapping( self ): + iMap1 = Map("name1", "chr1", 1, 350) + iMap2 = Map("name2", "chr1", 400, 600) + + lMaps = [ iMap2, iMap1 ] + expLMaps = [ iMap1, iMap2 ] + + obsLMaps = MapUtils.getMapListSortedByIncreasingMinThenMax( lMaps ) + + self.assertEquals( expLMaps, obsLMaps ) + + + def test_getMapListSortedByIncreasingMinThenMax_sameMinThreeMaps( self ): + iMap1 = Map("name1", "chr1", 350, 1) + iMap2 = Map("name2", "chr1", 400, 1) + iMap3 = Map("name3", "chr1", 500, 1) + + lMaps = [ iMap2, iMap1, iMap3 ] + expLMaps = [ iMap1, iMap2, iMap3 ] + + obsLMaps = MapUtils.getMapListSortedByIncreasingMinThenMax( lMaps ) + + self.assertEquals( expLMaps, obsLMaps ) + + + def test_getMapListSortedByIncreasingMinThenMax_included( self ): + iMap1 = Map("name1", "chr1", 350, 1) + iMap2 = Map("name2", "chr1", 300, 10) + + lMaps = [ iMap2, iMap1 ] + expLMaps = [ iMap1, iMap2] + + obsLMaps = MapUtils.getMapListSortedByIncreasingMinThenMax( lMaps ) + + self.assertEquals( expLMaps, obsLMaps ) + + + def test_getMapListSortedByIncreasingMinThenMax_equal( self ): + iMap1 = Map("name1", "chr1", 350, 1) + iMap2 = Map("name2", "chr1", 350, 1) + + lMaps = [ iMap2, iMap1 ] + expLMaps = [ iMap2, iMap1 ] + notExpLMaps = [ iMap1, iMap2 ] + + obsLMaps = MapUtils.getMapListSortedByIncreasingMinThenMax( lMaps ) + + self.assertEquals( expLMaps, obsLMaps ) + self.assertNotEquals( notExpLMaps, obsLMaps ) + + + def test_getMapListSortedByIncreasingNameThenSeqnameThenMinThenMax( self ): + iMap1 = Map("name1", "chr1", 1, 350) + iMap2 = Map("name4", "chr2", 5, 450) + iMap3 = Map("name4", "chr1", 10, 450) + iMap4 = Map("name4", "chr1", 10, 500) + iMap5 = Map("name4", "chr1", 5, 450) + iMap6 = Map("name3", "chr1", 50, 350) + iMap7 = Map("name2", "chr1", 1, 100) + + lMaps = [ iMap1, iMap2, iMap3, iMap4, iMap5, iMap6, iMap7 ] + + expLMaps = [ iMap1, iMap7, iMap6, iMap5, iMap3, iMap4, iMap2 ] + + obsLMaps = MapUtils.getMapListSortedByIncreasingNameThenSeqnameThenMinThenMax( lMaps ) + + self.assertEquals( expLMaps, obsLMaps ) + + + def test_getMapListSortedByIncreasingNameThenSeqnameThenMinThenMax_ordered( self ): + iMap1 = Map("name1", "chr1", 1, 100) + iMap2 = Map("name1", "chr2", 1, 350) + + lMaps = [ iMap1, iMap2 ] + expLMaps = [ iMap1, iMap2 ] + + obsLMaps = MapUtils.getMapListSortedByIncreasingNameThenSeqnameThenMinThenMax( lMaps ) + + self.assertEquals( expLMaps, obsLMaps ) + + + def test_getMapListSortedByIncreasingNameThenSeqnameThenMinThenMax_unordered( self ): + iMap1 = Map("name1", "chr2", 1, 350) + iMap2 = Map("name1", "chr1", 1, 100) + + lMaps = [ iMap1, iMap2 ] + expLMaps = [ iMap2, iMap1 ] + + obsLMaps = MapUtils.getMapListSortedByIncreasingNameThenSeqnameThenMinThenMax( lMaps ) + + self.assertEquals( expLMaps, obsLMaps ) + + + def test_getMapListSortedByIncreasingNameThenSeqnameThenMinThenMax_nonOverlapping( self ): + iMap1 = Map("name1", "chr1", 1, 350) + iMap2 = Map("name2", "chr1", 400, 600) + + lMaps = [ iMap2, iMap1 ] + expLMaps = [ iMap1, iMap2 ] + + obsLMaps = MapUtils.getMapListSortedByIncreasingNameThenSeqnameThenMinThenMax( lMaps ) + + self.assertEquals( expLMaps, obsLMaps ) + + + def test_getMapListSortedByIncreasingNameThenSeqnameThenMinThenMax_sameMinThreeMaps( self ): + iMap1 = Map("name2", "chr1", 150, 10) + iMap2 = Map("name2", "chr1", 1, 100) + iMap3 = Map("name2", "chr1", 100, 1) + + lMaps = [ iMap1, iMap2, iMap3 ] + expLMaps = [ iMap2, iMap3, iMap1 ] + + obsLMaps = MapUtils.getMapListSortedByIncreasingNameThenSeqnameThenMinThenMax( lMaps ) + + self.assertEquals( expLMaps, obsLMaps ) + + + def test_getDictPerNameFromMapFile( self ): + iMap1 = Map( "chunk1", "chromosome1", 1, 100 ) + iMap2 = Map( "chunk2", "chromosome1", 91, 190 ) + iMap3 = Map( "chunk3", "chromosome2", 1, 100 ) + iMap4 = Map( "chunk1", "chromosome1", 1, 100 ) # redundant with iMap1 + + mapFile = "dummyFile.map" + mapFileHandler = open( mapFile, "w" ) + for iMap in [ iMap1, iMap2, iMap3, iMap4 ]: + iMap.write( mapFileHandler ) + mapFileHandler.close() + + dExp = { "chunk1": iMap1, "chunk2": iMap2, "chunk3": iMap3 } + + dObs = MapUtils.getDictPerNameFromMapFile( mapFile ) + + self.assertEquals( dExp, dObs ) + + os.remove( mapFile ) + + + def test_mapList2SetList(self): + map1 = Map( "name1", "desc1", 1, 120 ) + map2 = Map( "name2", "desc2", 1, 20 ) + lMap = [ map1, map2 ] + set1 = Set( 1, "name1", "desc1", 1, 120 ) + set2 = Set( 2, "name2", "desc2", 1, 20 ) + explMapSet = [ set1, set2 ] + obslMapSet = MapUtils.mapList2SetList( lMap ) + + self.assertEquals( explMapSet, obslMapSet ) + + + def test_mergeCoordsInFile( self ): + if sys.modules.has_key( "commons.core.checker.CheckerUtils" ): + inFile = "dummyInFile" + inFileHandler = open( inFile, "w" ) + inFileHandler.write( "TE1\tchr1\t1501\t2500\n" ) + inFileHandler.write( "TE3\tchr1\t4000\t3401\n" ) + inFileHandler.write( "TE3\tchr1\t3800\t3601\n" ) + inFileHandler.close() + expFile = "dummyExpFile" + expFileHandler = open( expFile, "w" ) + expFileHandler.write( "TE1\tchr1\t1501\t2500\n" ) + expFileHandler.write( "TE3\tchr1\t4000\t3401\n" ) + expFileHandler.close() + obsFile = "dummyObsFile" + MapUtils.mergeCoordsInFile( inFile, obsFile ) + self.assertTrue( FileUtils.are2FilesIdentical( expFile, obsFile ) ) + for f in [ inFile, expFile, obsFile ]: + os.remove( f ) + + + def test_getDictPerSeqNameFromMapFile( self ): + inFile = "dummyInFile" + inFileHandler = open( inFile, "w" ) + inFileHandler.write( "TE1\tchr1\t1\t10\n" ) + inFileHandler.write( "TE2\tchr1\t60\t41\n" ) + inFileHandler.write( "TE3\tchr2\t5\t36\n" ) + inFileHandler.close() + dExp = { "chr1": [ Map( "TE1", "chr1", 1, 10 ), Map( "TE2", "chr1", 60, 41 ) ], + "chr2": [ Map( "TE3", "chr2", 5, 36 ) ] } + dObs = MapUtils.getDictPerSeqNameFromMapFile( inFile ) + self.assertEqual( dExp, dObs ) + os.remove( inFile ) + + def test_convertMapFileIntoSetFile(self): + mapInputFile = "dummyExpFile" + mapFileHandler = open( mapInputFile, "w" ) + mapFileHandler.write( "seq31\tchr1\t151\t250\n" ) + mapFileHandler.write( "seq27\tchr2\t301\t500\n" ) + mapFileHandler.write( "seq40\tchr2\t600\t700\n" ) + mapFileHandler.write( "seq2\tchr3\t301\t500\n" ) + mapFileHandler.close() + + expSetFile = "dummyexpSetFile" + expSetFileHandler = open( expSetFile, "w" ) + expSetFileHandler.write( "1\tseq31\tchr1\t151\t250\n" ) + expSetFileHandler.write( "2\tseq27\tchr2\t301\t500\n" ) + expSetFileHandler.write( "3\tseq40\tchr2\t600\t700\n" ) + expSetFileHandler.write( "4\tseq2\tchr3\t301\t500\n" ) + expSetFileHandler.close() + + obsFile = "dummyObsFile" + + MapUtils.convertMapFileIntoSetFile( mapInputFile, obsFile ) + + self.assertTrue( FileUtils.are2FilesIdentical( expSetFile, obsFile ) ) + + for f in [ expSetFile, mapInputFile, obsFile ]: + os.remove( f ) + + def test_convertMapFileIntoSetFile_one_line(self): + mapInputFile = "dummyExpFile" + mapFileHandler = open( mapInputFile, "w" ) + mapFileHandler.write( "seq31\tchr1\t151\t250\n" ) + mapFileHandler.close() + + expSetFile = "dummyexpSetFile" + expSetFileHandler = open( expSetFile, "w" ) + expSetFileHandler.write( "1\tseq31\tchr1\t151\t250\n" ) + expSetFileHandler.close() + + obsFile = "dummyObsFile" + + MapUtils.convertMapFileIntoSetFile( mapInputFile, obsFile ) + + self.assertTrue( FileUtils.are2FilesIdentical( expSetFile, obsFile ) ) + + for f in [ expSetFile, mapInputFile, obsFile ]: + os.remove( f ) + + def test_convertMapFileIntoSetFile_empty_file(self): + mapInputFile = "dummyFile.map" + mapFileHandler = open( mapInputFile, "w" ) + mapFileHandler.close() + + expFile = "dummyExpFile.map.set" + expFileHandler = open( expFile, "w" ) + expFileHandler.close() + + obsFile = "dummyFile.map.set" + + MapUtils.convertMapFileIntoSetFile( mapInputFile ) + + self.assertTrue( FileUtils.are2FilesIdentical( expFile, obsFile ) ) + + for f in [ expFile, mapInputFile, obsFile ]: + os.remove( f ) + + def test_writeListInFile_empty_list(self): + lMaps = [ ] + expFileName = "expFileName" + fileHandle = open(expFileName, "w") + fileHandle.close() + + obsFileName = "obsFileName" + fileHandle = open(obsFileName, "w") + MapUtils.writeListInFile(lMaps, obsFileName, "w") + fileHandle.close() + + self.assertTrue( FileUtils.are2FilesIdentical( expFileName, obsFileName ) ) + + os.remove(obsFileName) + os.remove(expFileName) + + def test_writeListInFile_list_one_set(self): + lMaps = [ Map( "map1", "map1seq", 1, 10 ) ] + line = "map1\tmap1seq\t1\t10\n" + + expFileName = "expFileName" + + fileHandle = open(expFileName, "w") + fileHandle.write(line) + fileHandle.close() + + obsFileName = "obsFileName" + fileHandle = open(obsFileName, "w") + MapUtils.writeListInFile(lMaps, obsFileName, "w") + fileHandle.close() + + self.assertTrue( FileUtils.are2FilesIdentical( expFileName, obsFileName ) ) + + os.remove(obsFileName) + os.remove(expFileName) + + def test_getMinLengthOfMapFile(self): + mapFileName = "%s/Gnome_tools/Vein_v4_scaffold_00001.fa.Nstretch.map" % os.environ["REPET_DATA"] + expMinLengthofMapFile = 20 + iMap = MapUtils() + obsMinLengthofMapFile = iMap.getMinLengthOfMapFile(mapFileName) + self.assertEquals(expMinLengthofMapFile, obsMinLengthofMapFile) + + def test_getMaxLengthOfMapFile(self): + mapFileName = "%s/Gnome_tools/Vein_v4_scaffold_00001.fa.Nstretch.map" % os.environ["REPET_DATA"] + expMinLengthofMapFile = 6344 + iMap = MapUtils() + obsMinLengthofMapFile = iMap.getMaxLengthOfMapFile(mapFileName) + self.assertEquals(expMinLengthofMapFile, obsMinLengthofMapFile) + + + +test_suite = unittest.TestSuite() +test_suite.addTest( unittest.makeSuite( Test_MapUtils ) ) +if __name__ == "__main__": + unittest.TextTestRunner(verbosity=2).run( test_suite )