diff options
Diffstat (limited to 'chromium/net/tools/tld_cleanup/make_dafsa_unittest.py')
-rwxr-xr-x | chromium/net/tools/tld_cleanup/make_dafsa_unittest.py | 757 |
1 files changed, 757 insertions, 0 deletions
diff --git a/chromium/net/tools/tld_cleanup/make_dafsa_unittest.py b/chromium/net/tools/tld_cleanup/make_dafsa_unittest.py new file mode 100755 index 00000000000..5ff92e62292 --- /dev/null +++ b/chromium/net/tools/tld_cleanup/make_dafsa_unittest.py @@ -0,0 +1,757 @@ +#!/usr/bin/env python +# Copyright 2014 The Chromium Authors. All rights reserved. +# Use of this source code is governed by a BSD-style license that can be +# found in the LICENSE file. + + +import sys +import unittest +import make_dafsa + + +class ParseGperfTest(unittest.TestCase): + def testMalformedKey(self): + """Tests exception is thrown at bad format.""" + infile1 = [ '%%', '', '%%' ] + self.assertRaises(make_dafsa.InputError, make_dafsa.parse_gperf, infile1) + + infile2 = [ '%%', 'apa,1', '%%' ] + self.assertRaises(make_dafsa.InputError, make_dafsa.parse_gperf, infile2) + + infile3 = [ '%%', 'apa, 1', '%%' ] + self.assertRaises(make_dafsa.InputError, make_dafsa.parse_gperf, infile3) + + def testBadValues(self): + """Tests exception is thrown when value is out of range.""" + infile1 = [ '%%', 'a, -1', '%%' ] + self.assertRaises(make_dafsa.InputError, make_dafsa.parse_gperf, infile1) + + infile2 = [ '%%', 'a, x', '%%' ] + self.assertRaises(make_dafsa.InputError, make_dafsa.parse_gperf, infile2) + + infile3 = [ '%%', 'a, 3', '%%' ] + self.assertRaises(make_dafsa.InputError, make_dafsa.parse_gperf, infile3) + + infile4 = [ '%%', 'a, 6', '%%' ] + self.assertRaises(make_dafsa.InputError, make_dafsa.parse_gperf, infile4) + + infile5 = [ '%%', 'a, 12', '%%' ] + self.assertRaises(make_dafsa.InputError, make_dafsa.parse_gperf, infile5) + + def testValues(self): + """Tests legal values are accepted.""" + infile1 = [ '%%', 'a, 0', '%%' ] + words1 = [ 'a0' ] + self.assertEqual(make_dafsa.parse_gperf(infile1), words1) + + infile2 = [ '%%', 'a, 1', '%%' ] + words2 = [ 'a1' ] + self.assertEqual(make_dafsa.parse_gperf(infile2), words2) + + infile3 = [ '%%', 'a, 2', '%%' ] + words3 = [ 'a2' ] + self.assertEqual(make_dafsa.parse_gperf(infile3), words3) + + infile4 = [ '%%', 'a, 4', '%%' ] + words4 = [ 'a4' ] + self.assertEqual(make_dafsa.parse_gperf(infile4), words4) + + def testOneWord(self): + """Tests a single key can be parsed.""" + infile = [ '%%', 'apa, 1', '%%' ] + words = [ 'apa1' ] + self.assertEqual(make_dafsa.parse_gperf(infile), words) + + def testTwoWords(self): + """Tests a sequence of keys can be parsed.""" + infile = [ '%%', 'apa, 1', 'bepa.com, 2', '%%' ] + words = [ 'apa1', 'bepa.com2' ] + self.assertEqual(make_dafsa.parse_gperf(infile), words) + + +class ToDafsaTest(unittest.TestCase): + def testEmptyInput(self): + """Tests exception is thrown at empty input.""" + words = () + self.assertRaises(make_dafsa.InputError, make_dafsa.to_dafsa, words) + + def testNonASCII(self): + """Tests exception is thrown if illegal characters are used.""" + words1 = ( chr(0x1F) + 'a1', ) + self.assertRaises(make_dafsa.InputError, make_dafsa.to_dafsa, words1) + + words2 = ( 'a' + chr(0x1F) + '1', ) + self.assertRaises(make_dafsa.InputError, make_dafsa.to_dafsa, words2) + + words3 = ( chr(0x80) + 'a1', ) + self.assertRaises(make_dafsa.InputError, make_dafsa.to_dafsa, words3) + + words4 = ( 'a' + chr(0x80) + '1', ) + self.assertRaises(make_dafsa.InputError, make_dafsa.to_dafsa, words4) + + def testChar(self): + """Tests a DAFSA can be created from a single character domain name.""" + words = [ 'a0' ] + node2 = ( chr(0), [ None ] ) + node1 = ( 'a', [ node2 ] ) + source = [ node1 ] + self.assertEqual(make_dafsa.to_dafsa(words), source) + + def testChars(self): + """Tests a DAFSA can be created from a multi character domain name.""" + words = [ 'ab0' ] + node3 = ( chr(0), [ None ] ) + node2 = ( 'b', [ node3 ] ) + node1 = ( 'a', [ node2 ] ) + source = [ node1 ] + self.assertEqual(make_dafsa.to_dafsa(words), source) + + def testWords(self): + """Tests a DAFSA can be created from a sequence of domain names.""" + words = [ 'a0', 'b1' ] + node4 = ( chr(1), [ None ] ) + node3 = ( 'b', [ node4 ] ) + node2 = ( chr(0), [ None ] ) + node1 = ( 'a', [ node2 ] ) + source = [ node1, node3 ] + self.assertEqual(make_dafsa.to_dafsa(words), source) + + +class ToWordsTest(unittest.TestCase): + def testSink(self): + """Tests the sink is exapnded to a list with an empty string.""" + node1 = None + words = [ '' ] + self.assertEqual(make_dafsa.to_words(node1), words) + + def testSingleNode(self): + """Tests a single node is expanded to a list with the label string.""" + + # 'ab' -> [ 'ab' ] + + node1 = ( 'ab', [ None ] ) + words = [ 'ab' ] + self.assertEqual(make_dafsa.to_words(node1), words) + + def testChain(self): + """Tests a sequence of nodes are preoperly expanded.""" + + # 'ab' -> 'cd' => [ 'abcd' ] + + node2 = ( 'cd', [ None ] ) + node1 = ( 'ab', [ node2 ] ) + words = [ 'abcd' ] + self.assertEqual(make_dafsa.to_words(node1), words) + + def testInnerTerminator(self): + """Tests a sequence with an inner terminator is expanded to two strings.""" + + # 'a' -> 'b' + # \ => [ 'ab', 'a' ] + # {sink} + + node2 = ( 'b', [ None ] ) + node1 = ( 'a', [ node2, None ] ) + words = [ 'ab', 'a' ] + self.assertEqual(make_dafsa.to_words(node1), words) + + def testDiamond(self): + """Tests a diamond can be expanded to a word list.""" + + # 'cd' + # / \ + # 'ab' 'gh' + # \ / + # 'ef' + + node4 = ( 'gh', [ None ] ) + node3 = ( 'ef', [ node4 ] ) + node2 = ( 'cd', [ node4 ] ) + node1 = ( 'ab', [ node2, node3 ] ) + words = [ 'abcdgh', 'abefgh' ] + self.assertEqual(make_dafsa.to_words(node1), words) + + +class JoinLabelsTest(unittest.TestCase): + def testLabel(self): + """Tests a single label passes unchanged.""" + + # 'a' => 'a' + + node1 = ( 'a', [ None ] ) + source = [ node1 ] + self.assertEqual(make_dafsa.join_labels(source), source) + + def testInnerTerminator(self): + """Tests a sequence with an inner terminator passes unchanged.""" + + # 'a' -> 'b' 'a' -> 'b' + # \ => \ + # {sink} {sink} + + node2 = ( 'b', [ None ] ) + node1 = ( 'a', [ node2, None ] ) + source = [ node1 ] + self.assertEqual(make_dafsa.join_labels(source), source) + + def testLabels(self): + """Tests a sequence of labels can be joined.""" + + # 'a' -> 'b' => 'ab' + + node2 = ( 'b', [ None ] ) + node1 = ( 'a', [ node2 ] ) + source1 = [ node1 ] + node3 = ( 'ab', [ None ] ) + source2 = [ node3 ] + self.assertEqual(make_dafsa.join_labels(source1), source2) + + def testCompositeLabels(self): + """Tests a sequence of multi character labels can be joined.""" + + # 'ab' -> 'cd' => 'abcd' + + node2 = ( 'cd', [ None ] ) + node1 = ( 'ab', [ node2 ] ) + source1 = [ node1 ] + node3 = ( 'abcd', [ None ] ) + source2 = [ node3 ] + self.assertEqual(make_dafsa.join_labels(source1), source2) + + def testAtomicTrie(self): + """Tests a trie formed DAFSA with atomic labels passes unchanged.""" + + # 'b' 'b' + # / / + # 'a' => 'a' + # \ \ + # 'c' 'c' + + node3 = ( 'c', [ None ] ) + node2 = ( 'b', [ None ] ) + node1 = ( 'a', [ node2, node3 ] ) + source = [ node1 ] + self.assertEqual(make_dafsa.join_labels(source), source) + + def testReverseAtomicTrie(self): + """Tests a reverse trie formed DAFSA with atomic labels passes unchanged.""" + + # 'a' 'a' + # \ \ + # 'c' => 'c' + # / / + # 'b' 'b' + + node3 = ( 'c', [ None ] ) + node2 = ( 'b', [ node3 ] ) + node1 = ( 'a', [ node3 ] ) + source = [ node1, node2 ] + self.assertEqual(make_dafsa.join_labels(source), source) + + def testChainedTrie(self): + """Tests a trie formed DAFSA with chained labels can be joined.""" + + # 'c' -> 'd' 'cd' + # / / + # 'a' -> 'b' => 'ab' + # \ \ + # 'e' -> 'f' 'ef' + + node6 = ( 'f', [ None ] ) + node5 = ( 'e', [ node6 ] ) + node4 = ( 'd', [ None ] ) + node3 = ( 'c', [ node4 ] ) + node2 = ( 'b', [ node3, node5 ] ) + node1 = ( 'a', [ node2 ] ) + source1 = [ node1 ] + node9 = ( 'ef', [ None ] ) + node8 = ( 'cd', [ None ] ) + node7 = ( 'ab', [ node8, node9 ] ) + source2 = [ node7 ] + self.assertEqual(make_dafsa.join_labels(source1), source2) + + def testReverseChainedTrie(self): + """Tests a reverse trie formed DAFSA with chained labels can be joined.""" + + # 'a' -> 'b' 'ab' + # \ \ + # 'e' -> 'f' => 'ef' + # / / + # 'c' -> 'd' 'cd' + + node6 = ( 'f', [ None ] ) + node5 = ( 'e', [ node6 ] ) + node4 = ( 'd', [ node5 ] ) + node3 = ( 'c', [ node4 ] ) + node2 = ( 'b', [ node5 ] ) + node1 = ( 'a', [ node2 ] ) + source1 = [ node1, node3 ] + node9 = ( 'ef', [ None ] ) + node8 = ( 'cd', [ node9 ] ) + node7 = ( 'ab', [ node9 ] ) + source2 = [ node7, node8 ] + self.assertEqual(make_dafsa.join_labels(source1), source2) + + +class JoinSuffixesTest(unittest.TestCase): + def testSingleLabel(self): + """Tests a single label passes unchanged.""" + + # 'a' => 'a' + + node1 = ( 'a', [ None ] ) + source = [ node1 ] + self.assertEqual(make_dafsa.join_suffixes(source), source) + + def testInnerTerminator(self): + """Tests a sequence with an inner terminator passes unchanged.""" + + # 'a' -> 'b' 'a' -> 'b' + # \ => \ + # {sink} {sink} + + node2 = ( 'b', [ None ] ) + node1 = ( 'a', [ node2, None ] ) + source = [ node1 ] + self.assertEqual(make_dafsa.join_suffixes(source), source) + + def testDistinctTrie(self): + """Tests a trie formed DAFSA with distinct labels passes unchanged.""" + + # 'b' 'b' + # / / + # 'a' => 'a' + # \ \ + # 'c' 'c' + + node3 = ( 'c', [ None ] ) + node2 = ( 'b', [ None ] ) + node1 = ( 'a', [ node2, node3 ] ) + source = [ node1 ] + self.assertEqual(make_dafsa.join_suffixes(source), source) + + def testReverseDistinctTrie(self): + """Tests a reverse trie formed DAFSA with distinct labels passes unchanged. + """ + + # 'a' 'a' + # \ \ + # 'c' => 'c' + # / / + # 'b' 'b' + + node3 = ( 'c', [ None ] ) + node2 = ( 'b', [ node3 ] ) + node1 = ( 'a', [ node3 ] ) + source = [ node1, node2 ] + self.assertEqual(make_dafsa.join_suffixes(source), source) + + def testJoinTwoHeads(self): + """Tests two heads can be joined even if there is something else between.""" + + # 'a' ------'a' + # / + # 'b' => 'b' / + # / + # 'a' --- + # + # The picture above should shows that the new version should have just one + # instance of the node with label 'a'. + + node3 = ( 'a', [ None ] ) + node2 = ( 'b', [ None ] ) + node1 = ( 'a', [ None ] ) + source1 = [ node1, node2, node3 ] + source2 = make_dafsa.join_suffixes(source1) + + # Both versions should expand to the same content. + self.assertEqual(source1, source2) + # But the new version should have just one instance of 'a'. + self.assertIs(source2[0], source2[2]) + + def testJoinTails(self): + """Tests tails can be joined.""" + + # 'a' -> 'c' 'a' + # \ + # => 'c' + # / + # 'b' -> 'c' 'b' + + node4 = ( 'c', [ None ] ) + node3 = ( 'b', [ node4 ] ) + node2 = ( 'c', [ None ] ) + node1 = ( 'a', [ node2 ] ) + source1 = [ node1, node3 ] + source2 = make_dafsa.join_suffixes(source1) + + # Both versions should expand to the same content. + self.assertEqual(source1, source2) + # But the new version should have just one tail. + self.assertIs(source2[0][1][0], source2[1][1][0]) + + def testMakeRecursiveTrie(self): + """Tests recursive suffix join.""" + + # 'a' -> 'e' -> 'g' 'a' + # \ + # 'e' + # / \ + # 'b' -> 'e' -> 'g' 'b' \ + # \ + # => 'g' + # / + # 'c' -> 'f' -> 'g' 'c' / + # \ / + # 'f' + # / + # 'd' -> 'f' -> 'g' 'd' + + node7 = ( 'g', [ None ] ) + node6 = ( 'f', [ node7 ] ) + node5 = ( 'e', [ node7 ] ) + node4 = ( 'd', [ node6 ] ) + node3 = ( 'c', [ node6 ] ) + node2 = ( 'b', [ node5 ] ) + node1 = ( 'a', [ node5 ] ) + source1 = [ node1, node2, node3, node4 ] + source2 = make_dafsa.join_suffixes(source1) + + # Both versions should expand to the same content. + self.assertEqual(source1, source2) + # But the new version should have just one 'e'. + self.assertIs(source2[0][1][0], source2[1][1][0]) + # And one 'f'. + self.assertIs(source2[2][1][0], source2[3][1][0]) + # And one 'g'. + self.assertIs(source2[0][1][0][1][0], source2[2][1][0][1][0]) + + def testMakeDiamond(self): + """Test we can join suffixes of a trie.""" + + # 'b' -> 'd' 'b' + # / / \ + # 'a' => 'a' 'd' + # \ \ / + # 'c' -> 'd' 'c' + + node5 = ( 'd', [ None ] ) + node4 = ( 'c', [ node5 ] ) + node3 = ( 'd', [ None ] ) + node2 = ( 'b', [ node3 ] ) + node1 = ( 'a', [ node2, node4 ] ) + source1 = [ node1 ] + source2 = make_dafsa.join_suffixes(source1) + + # Both versions should expand to the same content. + self.assertEqual(source1, source2) + # But the new version should have just one 'd'. + self.assertIs(source2[0][1][0][1][0], source2[0][1][1][1][0]) + + def testJoinOneChild(self): + """Tests that we can join some children but not all.""" + + # 'c' ----'c' + # / / / + # 'a' 'a' / + # \ \ / + # 'd' 'd'/ + # => / + # 'c' / + # / / + # 'b' 'b' + # \ \ + # 'e' 'e' + + node6 = ( 'e', [ None ] ) + node5 = ( 'c', [ None ] ) + node4 = ( 'b', [ node5, node6 ] ) + node3 = ( 'd', [ None ] ) + node2 = ( 'c', [ None ] ) + node1 = ( 'a', [ node2, node3 ] ) + source1 = [ node1, node4 ] + source2 = make_dafsa.join_suffixes(source1) + + # Both versions should expand to the same content. + self.assertEqual(source1, source2) + # But the new version should have just one 'c'. + self.assertIs(source2[0][1][0], source2[1][1][0]) + + +class ReverseTest(unittest.TestCase): + def testAtomicLabel(self): + """Tests an atomic label passes unchanged.""" + + # 'a' => 'a' + + node1 = ( 'a', [ None ] ) + source = [ node1 ] + self.assertEqual(make_dafsa.reverse(source), source) + + def testLabel(self): + """Tests that labels are reversed.""" + + # 'ab' => 'ba' + + node1 = ( 'ab', [ None ] ) + source1 = [ node1 ] + node2 = ( 'ba', [ None ] ) + source2 = [ node2 ] + self.assertEqual(make_dafsa.reverse(source1), source2) + + def testChain(self): + """Tests that edges are reversed.""" + + # 'a' -> 'b' => 'b' -> 'a' + + node2 = ( 'b', [ None ] ) + node1 = ( 'a', [ node2 ] ) + source1 = [ node1 ] + node4 = ( 'a', [ None ] ) + node3 = ( 'b', [ node4 ] ) + source2 = [ node3 ] + self.assertEqual(make_dafsa.reverse(source1), source2) + + def testInnerTerminator(self): + """Tests a sequence with an inner terminator can be reversed.""" + + # 'a' -> 'b' 'b' -> 'a' + # \ => / + # {sink} ------ + + node2 = ( 'b', [ None ] ) + node1 = ( 'a', [ node2, None ] ) + source1 = [ node1 ] + node4 = ( 'a', [ None ] ) + node3 = ( 'b', [ node4 ] ) + source2 = [ node3, node4 ] + self.assertEqual(make_dafsa.reverse(source1), source2) + + def testAtomicTrie(self): + """Tests a trie formed DAFSA can be reversed.""" + + # 'b' 'b' + # / \ + # 'a' => 'a' + # \ / + # 'c' 'c' + + node3 = ( 'c', [ None ] ) + node2 = ( 'b', [ None ] ) + node1 = ( 'a', [ node2, node3 ] ) + source1 = [ node1 ] + node6 = ( 'a', [ None ] ) + node5 = ( 'c', [ node6 ] ) + node4 = ( 'b', [ node6 ] ) + source2 = [ node4, node5 ] + self.assertEqual(make_dafsa.reverse(source1), source2) + + def testReverseAtomicTrie(self): + """Tests a reverse trie formed DAFSA can be reversed.""" + + # 'a' 'a' + # \ / + # 'c' => 'c' + # / \ + # 'b' 'b' + + node3 = ( 'c', [ None ] ) + node2 = ( 'b', [ node3 ] ) + node1 = ( 'a', [ node3 ] ) + source1 = [ node1, node2 ] + node6 = ( 'b', [ None ] ) + node5 = ( 'a', [ None ] ) + node4 = ( 'c', [ node5, node6 ] ) + source2 = [ node4 ] + self.assertEqual(make_dafsa.reverse(source1), source2) + + def testDiamond(self): + """Tests we can reverse both edges and nodes in a diamond.""" + + # 'cd' 'dc' + # / \ / \ + # 'ab' 'gh' => 'hg' 'ba' + # \ / \ / + # 'ef' 'fe' + + node4 = ( 'gh', [ None ] ) + node3 = ( 'ef', [ node4 ] ) + node2 = ( 'cd', [ node4 ] ) + node1 = ( 'ab', [ node2, node3 ] ) + source1 = [ node1 ] + node8 = ( 'ba', [ None ] ) + node7 = ( 'fe', [ node8 ] ) + node6 = ( 'dc', [ node8 ] ) + node5 = ( 'hg', [ node6, node7 ] ) + source2 = [ node5 ] + self.assertEqual(make_dafsa.reverse(source1), source2) + + +class TopSortTest(unittest.TestCase): + def testNode(self): + """Tests a DAFSA with one node can be sorted.""" + + # 'a' => [ 'a' ] + + node1 = ( 'a', [ None ] ) + source = [ node1 ] + nodes = [ node1 ] + self.assertEqual(make_dafsa.top_sort(source), nodes) + + def testDiamond(self): + """Tests nodes in a diamond can be sorted.""" + + # 'b' + # / \ + # 'a' 'd' + # \ / + # 'c' + + node4 = ( 'd', [ None ] ) + node3 = ( 'c', [ node4 ] ) + node2 = ( 'b', [ node4 ] ) + node1 = ( 'a', [ node2, node3 ] ) + source = [ node1 ] + nodes = make_dafsa.top_sort(source) + self.assertLess(nodes.index(node1), nodes.index(node2)) + self.assertLess(nodes.index(node2), nodes.index(node4)) + self.assertLess(nodes.index(node3), nodes.index(node4)) + + +class EncodePrefixTest(unittest.TestCase): + def testChar(self): + """Tests to encode a single character prefix.""" + label = 'a' + bytes = [ ord('a') ] + self.assertEqual(make_dafsa.encode_prefix(label), bytes) + + def testChars(self): + """Tests to encode a multi character prefix.""" + label = 'ab' + bytes = [ ord('b'), ord('a') ] + self.assertEqual(make_dafsa.encode_prefix(label), bytes) + + +class EncodeLabelTest(unittest.TestCase): + def testChar(self): + """Tests to encode a single character label.""" + label = 'a' + bytes = [ ord('a') + 0x80 ] + self.assertEqual(make_dafsa.encode_label(label), bytes) + + def testChars(self): + """Tests to encode a multi character label.""" + label = 'ab' + bytes = [ ord('b') + 0x80, ord('a') ] + self.assertEqual(make_dafsa.encode_label(label), bytes) + + +class EncodeLinksTest(unittest.TestCase): + def testEndLabel(self): + """Tests to encode link to the sink.""" + children = [ None ] + offsets = {} + bytes = 0 + output = [] + self.assertEqual(make_dafsa.encode_links(children, offsets, bytes), + output) + + def testOneByteOffset(self): + """Tests to encode a single one byte offset.""" + node = ( '', [ None ] ) + children = [ node ] + offsets = { id(node) : 2 } + bytes = 5 + output = [ 132 ] + self.assertEqual(make_dafsa.encode_links(children, offsets, bytes), + output) + + def testOneByteOffsets(self): + """Tests to encode a sequence of one byte offsets.""" + node1 = ( '', [ None ] ) + node2 = ( '', [ None ] ) + children = [ node1, node2 ] + offsets = { id(node1) : 2, id(node2) : 1 } + bytes = 5 + output = [ 129, 5 ] + self.assertEqual(make_dafsa.encode_links(children, offsets, bytes), + output) + + def testTwoBytesOffset(self): + """Tests to encode a single two byte offset.""" + node = ( '', [ None ] ) + children = [ node ] + offsets = { id(node) : 2 } + bytes = 1005 + output = [ 237, 195] + self.assertEqual(make_dafsa.encode_links(children, offsets, bytes), + output) + + def testTwoBytesOffsets(self): + """Tests to encode a sequence of two byte offsets.""" + node1 = ( '', [ None ] ) + node2 = ( '', [ None ] ) + node3 = ( '', [ None ] ) + children = [ node1, node2, node3 ] + offsets = { id(node1) : 1002, id(node2) : 2, id(node3) : 2002 } + bytes = 3005 + output = [ 232, 195, 232, 67, 241, 67 ] + self.assertEqual(make_dafsa.encode_links(children, offsets, bytes), + output) + + def testThreeBytesOffset(self): + """Tests to encode a single three byte offset.""" + node = ( '', [ None ] ) + children = [ node ] + offsets = { id(node) : 2 } + bytes = 100005 + output = [ 166, 134, 225 ] + self.assertEqual(make_dafsa.encode_links(children, offsets, bytes), + output) + + def testThreeBytesOffsets(self): + """Tests to encode a sequence of three byte offsets.""" + node1 = ( '', [ None ] ) + node2 = ( '', [ None ] ) + node3 = ( '', [ None ] ) + children = [ node1, node2, node3 ] + offsets = { id(node1) : 100002, id(node2) : 2, id(node3) : 200002 } + bytes = 300005 + output = [ 160, 134, 225, 160, 134, 97, 172, 134, 97 ] + self.assertEqual(make_dafsa.encode_links(children, offsets, bytes), + output) + + def testOneTwoThreeBytesOffsets(self): + """Tests to encode offsets of different sizes.""" + node1 = ( '', [ None ] ) + node2 = ( '', [ None ] ) + node3 = ( '', [ None ] ) + children = [ node1, node2, node3 ] + offsets = { id(node1) : 10003, id(node2) : 10002, id(node3) : 100002 } + bytes = 300005 + output = [ 129, 143, 95, 97, 74, 13, 99 ] + self.assertEqual(make_dafsa.encode_links(children, offsets, bytes), + output) + + +class ExamplesTest(unittest.TestCase): + def testExample1(self): + """Tests Example 1 from make_dafsa.py.""" + infile = [ '%%', 'aa, 1', 'a, 2', '%%' ] + bytes = [ 0x81, 0xE1, 0x02, 0x81, 0x82, 0x61, 0x81 ] + outfile = make_dafsa.to_cxx(bytes) + self.assertEqual(make_dafsa.words_to_cxx(make_dafsa.parse_gperf(infile)), + outfile) + + def testExample2(self): + """Tests Example 2 from make_dafsa.py.""" + infile = [ '%%', 'aa, 1', 'bbb, 2', 'baa, 1', '%%' ] + bytes = [ 0x02, 0x83, 0xE2, 0x02, 0x83, 0x61, 0x61, 0x81, 0x62, 0x62, + 0x82 ] + outfile = make_dafsa.to_cxx(bytes) + self.assertEqual(make_dafsa.words_to_cxx(make_dafsa.parse_gperf(infile)), + outfile) + + +if __name__ == '__main__': + unittest.main() |