summaryrefslogtreecommitdiffstats
path: root/chromium/net/tools/tld_cleanup/make_dafsa_unittest.py
diff options
context:
space:
mode:
Diffstat (limited to 'chromium/net/tools/tld_cleanup/make_dafsa_unittest.py')
-rwxr-xr-xchromium/net/tools/tld_cleanup/make_dafsa_unittest.py757
1 files changed, 757 insertions, 0 deletions
diff --git a/chromium/net/tools/tld_cleanup/make_dafsa_unittest.py b/chromium/net/tools/tld_cleanup/make_dafsa_unittest.py
new file mode 100755
index 00000000000..5ff92e62292
--- /dev/null
+++ b/chromium/net/tools/tld_cleanup/make_dafsa_unittest.py
@@ -0,0 +1,757 @@
+#!/usr/bin/env python
+# Copyright 2014 The Chromium Authors. All rights reserved.
+# Use of this source code is governed by a BSD-style license that can be
+# found in the LICENSE file.
+
+
+import sys
+import unittest
+import make_dafsa
+
+
+class ParseGperfTest(unittest.TestCase):
+ def testMalformedKey(self):
+ """Tests exception is thrown at bad format."""
+ infile1 = [ '%%', '', '%%' ]
+ self.assertRaises(make_dafsa.InputError, make_dafsa.parse_gperf, infile1)
+
+ infile2 = [ '%%', 'apa,1', '%%' ]
+ self.assertRaises(make_dafsa.InputError, make_dafsa.parse_gperf, infile2)
+
+ infile3 = [ '%%', 'apa, 1', '%%' ]
+ self.assertRaises(make_dafsa.InputError, make_dafsa.parse_gperf, infile3)
+
+ def testBadValues(self):
+ """Tests exception is thrown when value is out of range."""
+ infile1 = [ '%%', 'a, -1', '%%' ]
+ self.assertRaises(make_dafsa.InputError, make_dafsa.parse_gperf, infile1)
+
+ infile2 = [ '%%', 'a, x', '%%' ]
+ self.assertRaises(make_dafsa.InputError, make_dafsa.parse_gperf, infile2)
+
+ infile3 = [ '%%', 'a, 3', '%%' ]
+ self.assertRaises(make_dafsa.InputError, make_dafsa.parse_gperf, infile3)
+
+ infile4 = [ '%%', 'a, 6', '%%' ]
+ self.assertRaises(make_dafsa.InputError, make_dafsa.parse_gperf, infile4)
+
+ infile5 = [ '%%', 'a, 12', '%%' ]
+ self.assertRaises(make_dafsa.InputError, make_dafsa.parse_gperf, infile5)
+
+ def testValues(self):
+ """Tests legal values are accepted."""
+ infile1 = [ '%%', 'a, 0', '%%' ]
+ words1 = [ 'a0' ]
+ self.assertEqual(make_dafsa.parse_gperf(infile1), words1)
+
+ infile2 = [ '%%', 'a, 1', '%%' ]
+ words2 = [ 'a1' ]
+ self.assertEqual(make_dafsa.parse_gperf(infile2), words2)
+
+ infile3 = [ '%%', 'a, 2', '%%' ]
+ words3 = [ 'a2' ]
+ self.assertEqual(make_dafsa.parse_gperf(infile3), words3)
+
+ infile4 = [ '%%', 'a, 4', '%%' ]
+ words4 = [ 'a4' ]
+ self.assertEqual(make_dafsa.parse_gperf(infile4), words4)
+
+ def testOneWord(self):
+ """Tests a single key can be parsed."""
+ infile = [ '%%', 'apa, 1', '%%' ]
+ words = [ 'apa1' ]
+ self.assertEqual(make_dafsa.parse_gperf(infile), words)
+
+ def testTwoWords(self):
+ """Tests a sequence of keys can be parsed."""
+ infile = [ '%%', 'apa, 1', 'bepa.com, 2', '%%' ]
+ words = [ 'apa1', 'bepa.com2' ]
+ self.assertEqual(make_dafsa.parse_gperf(infile), words)
+
+
+class ToDafsaTest(unittest.TestCase):
+ def testEmptyInput(self):
+ """Tests exception is thrown at empty input."""
+ words = ()
+ self.assertRaises(make_dafsa.InputError, make_dafsa.to_dafsa, words)
+
+ def testNonASCII(self):
+ """Tests exception is thrown if illegal characters are used."""
+ words1 = ( chr(0x1F) + 'a1', )
+ self.assertRaises(make_dafsa.InputError, make_dafsa.to_dafsa, words1)
+
+ words2 = ( 'a' + chr(0x1F) + '1', )
+ self.assertRaises(make_dafsa.InputError, make_dafsa.to_dafsa, words2)
+
+ words3 = ( chr(0x80) + 'a1', )
+ self.assertRaises(make_dafsa.InputError, make_dafsa.to_dafsa, words3)
+
+ words4 = ( 'a' + chr(0x80) + '1', )
+ self.assertRaises(make_dafsa.InputError, make_dafsa.to_dafsa, words4)
+
+ def testChar(self):
+ """Tests a DAFSA can be created from a single character domain name."""
+ words = [ 'a0' ]
+ node2 = ( chr(0), [ None ] )
+ node1 = ( 'a', [ node2 ] )
+ source = [ node1 ]
+ self.assertEqual(make_dafsa.to_dafsa(words), source)
+
+ def testChars(self):
+ """Tests a DAFSA can be created from a multi character domain name."""
+ words = [ 'ab0' ]
+ node3 = ( chr(0), [ None ] )
+ node2 = ( 'b', [ node3 ] )
+ node1 = ( 'a', [ node2 ] )
+ source = [ node1 ]
+ self.assertEqual(make_dafsa.to_dafsa(words), source)
+
+ def testWords(self):
+ """Tests a DAFSA can be created from a sequence of domain names."""
+ words = [ 'a0', 'b1' ]
+ node4 = ( chr(1), [ None ] )
+ node3 = ( 'b', [ node4 ] )
+ node2 = ( chr(0), [ None ] )
+ node1 = ( 'a', [ node2 ] )
+ source = [ node1, node3 ]
+ self.assertEqual(make_dafsa.to_dafsa(words), source)
+
+
+class ToWordsTest(unittest.TestCase):
+ def testSink(self):
+ """Tests the sink is exapnded to a list with an empty string."""
+ node1 = None
+ words = [ '' ]
+ self.assertEqual(make_dafsa.to_words(node1), words)
+
+ def testSingleNode(self):
+ """Tests a single node is expanded to a list with the label string."""
+
+ # 'ab' -> [ 'ab' ]
+
+ node1 = ( 'ab', [ None ] )
+ words = [ 'ab' ]
+ self.assertEqual(make_dafsa.to_words(node1), words)
+
+ def testChain(self):
+ """Tests a sequence of nodes are preoperly expanded."""
+
+ # 'ab' -> 'cd' => [ 'abcd' ]
+
+ node2 = ( 'cd', [ None ] )
+ node1 = ( 'ab', [ node2 ] )
+ words = [ 'abcd' ]
+ self.assertEqual(make_dafsa.to_words(node1), words)
+
+ def testInnerTerminator(self):
+ """Tests a sequence with an inner terminator is expanded to two strings."""
+
+ # 'a' -> 'b'
+ # \ => [ 'ab', 'a' ]
+ # {sink}
+
+ node2 = ( 'b', [ None ] )
+ node1 = ( 'a', [ node2, None ] )
+ words = [ 'ab', 'a' ]
+ self.assertEqual(make_dafsa.to_words(node1), words)
+
+ def testDiamond(self):
+ """Tests a diamond can be expanded to a word list."""
+
+ # 'cd'
+ # / \
+ # 'ab' 'gh'
+ # \ /
+ # 'ef'
+
+ node4 = ( 'gh', [ None ] )
+ node3 = ( 'ef', [ node4 ] )
+ node2 = ( 'cd', [ node4 ] )
+ node1 = ( 'ab', [ node2, node3 ] )
+ words = [ 'abcdgh', 'abefgh' ]
+ self.assertEqual(make_dafsa.to_words(node1), words)
+
+
+class JoinLabelsTest(unittest.TestCase):
+ def testLabel(self):
+ """Tests a single label passes unchanged."""
+
+ # 'a' => 'a'
+
+ node1 = ( 'a', [ None ] )
+ source = [ node1 ]
+ self.assertEqual(make_dafsa.join_labels(source), source)
+
+ def testInnerTerminator(self):
+ """Tests a sequence with an inner terminator passes unchanged."""
+
+ # 'a' -> 'b' 'a' -> 'b'
+ # \ => \
+ # {sink} {sink}
+
+ node2 = ( 'b', [ None ] )
+ node1 = ( 'a', [ node2, None ] )
+ source = [ node1 ]
+ self.assertEqual(make_dafsa.join_labels(source), source)
+
+ def testLabels(self):
+ """Tests a sequence of labels can be joined."""
+
+ # 'a' -> 'b' => 'ab'
+
+ node2 = ( 'b', [ None ] )
+ node1 = ( 'a', [ node2 ] )
+ source1 = [ node1 ]
+ node3 = ( 'ab', [ None ] )
+ source2 = [ node3 ]
+ self.assertEqual(make_dafsa.join_labels(source1), source2)
+
+ def testCompositeLabels(self):
+ """Tests a sequence of multi character labels can be joined."""
+
+ # 'ab' -> 'cd' => 'abcd'
+
+ node2 = ( 'cd', [ None ] )
+ node1 = ( 'ab', [ node2 ] )
+ source1 = [ node1 ]
+ node3 = ( 'abcd', [ None ] )
+ source2 = [ node3 ]
+ self.assertEqual(make_dafsa.join_labels(source1), source2)
+
+ def testAtomicTrie(self):
+ """Tests a trie formed DAFSA with atomic labels passes unchanged."""
+
+ # 'b' 'b'
+ # / /
+ # 'a' => 'a'
+ # \ \
+ # 'c' 'c'
+
+ node3 = ( 'c', [ None ] )
+ node2 = ( 'b', [ None ] )
+ node1 = ( 'a', [ node2, node3 ] )
+ source = [ node1 ]
+ self.assertEqual(make_dafsa.join_labels(source), source)
+
+ def testReverseAtomicTrie(self):
+ """Tests a reverse trie formed DAFSA with atomic labels passes unchanged."""
+
+ # 'a' 'a'
+ # \ \
+ # 'c' => 'c'
+ # / /
+ # 'b' 'b'
+
+ node3 = ( 'c', [ None ] )
+ node2 = ( 'b', [ node3 ] )
+ node1 = ( 'a', [ node3 ] )
+ source = [ node1, node2 ]
+ self.assertEqual(make_dafsa.join_labels(source), source)
+
+ def testChainedTrie(self):
+ """Tests a trie formed DAFSA with chained labels can be joined."""
+
+ # 'c' -> 'd' 'cd'
+ # / /
+ # 'a' -> 'b' => 'ab'
+ # \ \
+ # 'e' -> 'f' 'ef'
+
+ node6 = ( 'f', [ None ] )
+ node5 = ( 'e', [ node6 ] )
+ node4 = ( 'd', [ None ] )
+ node3 = ( 'c', [ node4 ] )
+ node2 = ( 'b', [ node3, node5 ] )
+ node1 = ( 'a', [ node2 ] )
+ source1 = [ node1 ]
+ node9 = ( 'ef', [ None ] )
+ node8 = ( 'cd', [ None ] )
+ node7 = ( 'ab', [ node8, node9 ] )
+ source2 = [ node7 ]
+ self.assertEqual(make_dafsa.join_labels(source1), source2)
+
+ def testReverseChainedTrie(self):
+ """Tests a reverse trie formed DAFSA with chained labels can be joined."""
+
+ # 'a' -> 'b' 'ab'
+ # \ \
+ # 'e' -> 'f' => 'ef'
+ # / /
+ # 'c' -> 'd' 'cd'
+
+ node6 = ( 'f', [ None ] )
+ node5 = ( 'e', [ node6 ] )
+ node4 = ( 'd', [ node5 ] )
+ node3 = ( 'c', [ node4 ] )
+ node2 = ( 'b', [ node5 ] )
+ node1 = ( 'a', [ node2 ] )
+ source1 = [ node1, node3 ]
+ node9 = ( 'ef', [ None ] )
+ node8 = ( 'cd', [ node9 ] )
+ node7 = ( 'ab', [ node9 ] )
+ source2 = [ node7, node8 ]
+ self.assertEqual(make_dafsa.join_labels(source1), source2)
+
+
+class JoinSuffixesTest(unittest.TestCase):
+ def testSingleLabel(self):
+ """Tests a single label passes unchanged."""
+
+ # 'a' => 'a'
+
+ node1 = ( 'a', [ None ] )
+ source = [ node1 ]
+ self.assertEqual(make_dafsa.join_suffixes(source), source)
+
+ def testInnerTerminator(self):
+ """Tests a sequence with an inner terminator passes unchanged."""
+
+ # 'a' -> 'b' 'a' -> 'b'
+ # \ => \
+ # {sink} {sink}
+
+ node2 = ( 'b', [ None ] )
+ node1 = ( 'a', [ node2, None ] )
+ source = [ node1 ]
+ self.assertEqual(make_dafsa.join_suffixes(source), source)
+
+ def testDistinctTrie(self):
+ """Tests a trie formed DAFSA with distinct labels passes unchanged."""
+
+ # 'b' 'b'
+ # / /
+ # 'a' => 'a'
+ # \ \
+ # 'c' 'c'
+
+ node3 = ( 'c', [ None ] )
+ node2 = ( 'b', [ None ] )
+ node1 = ( 'a', [ node2, node3 ] )
+ source = [ node1 ]
+ self.assertEqual(make_dafsa.join_suffixes(source), source)
+
+ def testReverseDistinctTrie(self):
+ """Tests a reverse trie formed DAFSA with distinct labels passes unchanged.
+ """
+
+ # 'a' 'a'
+ # \ \
+ # 'c' => 'c'
+ # / /
+ # 'b' 'b'
+
+ node3 = ( 'c', [ None ] )
+ node2 = ( 'b', [ node3 ] )
+ node1 = ( 'a', [ node3 ] )
+ source = [ node1, node2 ]
+ self.assertEqual(make_dafsa.join_suffixes(source), source)
+
+ def testJoinTwoHeads(self):
+ """Tests two heads can be joined even if there is something else between."""
+
+ # 'a' ------'a'
+ # /
+ # 'b' => 'b' /
+ # /
+ # 'a' ---
+ #
+ # The picture above should shows that the new version should have just one
+ # instance of the node with label 'a'.
+
+ node3 = ( 'a', [ None ] )
+ node2 = ( 'b', [ None ] )
+ node1 = ( 'a', [ None ] )
+ source1 = [ node1, node2, node3 ]
+ source2 = make_dafsa.join_suffixes(source1)
+
+ # Both versions should expand to the same content.
+ self.assertEqual(source1, source2)
+ # But the new version should have just one instance of 'a'.
+ self.assertIs(source2[0], source2[2])
+
+ def testJoinTails(self):
+ """Tests tails can be joined."""
+
+ # 'a' -> 'c' 'a'
+ # \
+ # => 'c'
+ # /
+ # 'b' -> 'c' 'b'
+
+ node4 = ( 'c', [ None ] )
+ node3 = ( 'b', [ node4 ] )
+ node2 = ( 'c', [ None ] )
+ node1 = ( 'a', [ node2 ] )
+ source1 = [ node1, node3 ]
+ source2 = make_dafsa.join_suffixes(source1)
+
+ # Both versions should expand to the same content.
+ self.assertEqual(source1, source2)
+ # But the new version should have just one tail.
+ self.assertIs(source2[0][1][0], source2[1][1][0])
+
+ def testMakeRecursiveTrie(self):
+ """Tests recursive suffix join."""
+
+ # 'a' -> 'e' -> 'g' 'a'
+ # \
+ # 'e'
+ # / \
+ # 'b' -> 'e' -> 'g' 'b' \
+ # \
+ # => 'g'
+ # /
+ # 'c' -> 'f' -> 'g' 'c' /
+ # \ /
+ # 'f'
+ # /
+ # 'd' -> 'f' -> 'g' 'd'
+
+ node7 = ( 'g', [ None ] )
+ node6 = ( 'f', [ node7 ] )
+ node5 = ( 'e', [ node7 ] )
+ node4 = ( 'd', [ node6 ] )
+ node3 = ( 'c', [ node6 ] )
+ node2 = ( 'b', [ node5 ] )
+ node1 = ( 'a', [ node5 ] )
+ source1 = [ node1, node2, node3, node4 ]
+ source2 = make_dafsa.join_suffixes(source1)
+
+ # Both versions should expand to the same content.
+ self.assertEqual(source1, source2)
+ # But the new version should have just one 'e'.
+ self.assertIs(source2[0][1][0], source2[1][1][0])
+ # And one 'f'.
+ self.assertIs(source2[2][1][0], source2[3][1][0])
+ # And one 'g'.
+ self.assertIs(source2[0][1][0][1][0], source2[2][1][0][1][0])
+
+ def testMakeDiamond(self):
+ """Test we can join suffixes of a trie."""
+
+ # 'b' -> 'd' 'b'
+ # / / \
+ # 'a' => 'a' 'd'
+ # \ \ /
+ # 'c' -> 'd' 'c'
+
+ node5 = ( 'd', [ None ] )
+ node4 = ( 'c', [ node5 ] )
+ node3 = ( 'd', [ None ] )
+ node2 = ( 'b', [ node3 ] )
+ node1 = ( 'a', [ node2, node4 ] )
+ source1 = [ node1 ]
+ source2 = make_dafsa.join_suffixes(source1)
+
+ # Both versions should expand to the same content.
+ self.assertEqual(source1, source2)
+ # But the new version should have just one 'd'.
+ self.assertIs(source2[0][1][0][1][0], source2[0][1][1][1][0])
+
+ def testJoinOneChild(self):
+ """Tests that we can join some children but not all."""
+
+ # 'c' ----'c'
+ # / / /
+ # 'a' 'a' /
+ # \ \ /
+ # 'd' 'd'/
+ # => /
+ # 'c' /
+ # / /
+ # 'b' 'b'
+ # \ \
+ # 'e' 'e'
+
+ node6 = ( 'e', [ None ] )
+ node5 = ( 'c', [ None ] )
+ node4 = ( 'b', [ node5, node6 ] )
+ node3 = ( 'd', [ None ] )
+ node2 = ( 'c', [ None ] )
+ node1 = ( 'a', [ node2, node3 ] )
+ source1 = [ node1, node4 ]
+ source2 = make_dafsa.join_suffixes(source1)
+
+ # Both versions should expand to the same content.
+ self.assertEqual(source1, source2)
+ # But the new version should have just one 'c'.
+ self.assertIs(source2[0][1][0], source2[1][1][0])
+
+
+class ReverseTest(unittest.TestCase):
+ def testAtomicLabel(self):
+ """Tests an atomic label passes unchanged."""
+
+ # 'a' => 'a'
+
+ node1 = ( 'a', [ None ] )
+ source = [ node1 ]
+ self.assertEqual(make_dafsa.reverse(source), source)
+
+ def testLabel(self):
+ """Tests that labels are reversed."""
+
+ # 'ab' => 'ba'
+
+ node1 = ( 'ab', [ None ] )
+ source1 = [ node1 ]
+ node2 = ( 'ba', [ None ] )
+ source2 = [ node2 ]
+ self.assertEqual(make_dafsa.reverse(source1), source2)
+
+ def testChain(self):
+ """Tests that edges are reversed."""
+
+ # 'a' -> 'b' => 'b' -> 'a'
+
+ node2 = ( 'b', [ None ] )
+ node1 = ( 'a', [ node2 ] )
+ source1 = [ node1 ]
+ node4 = ( 'a', [ None ] )
+ node3 = ( 'b', [ node4 ] )
+ source2 = [ node3 ]
+ self.assertEqual(make_dafsa.reverse(source1), source2)
+
+ def testInnerTerminator(self):
+ """Tests a sequence with an inner terminator can be reversed."""
+
+ # 'a' -> 'b' 'b' -> 'a'
+ # \ => /
+ # {sink} ------
+
+ node2 = ( 'b', [ None ] )
+ node1 = ( 'a', [ node2, None ] )
+ source1 = [ node1 ]
+ node4 = ( 'a', [ None ] )
+ node3 = ( 'b', [ node4 ] )
+ source2 = [ node3, node4 ]
+ self.assertEqual(make_dafsa.reverse(source1), source2)
+
+ def testAtomicTrie(self):
+ """Tests a trie formed DAFSA can be reversed."""
+
+ # 'b' 'b'
+ # / \
+ # 'a' => 'a'
+ # \ /
+ # 'c' 'c'
+
+ node3 = ( 'c', [ None ] )
+ node2 = ( 'b', [ None ] )
+ node1 = ( 'a', [ node2, node3 ] )
+ source1 = [ node1 ]
+ node6 = ( 'a', [ None ] )
+ node5 = ( 'c', [ node6 ] )
+ node4 = ( 'b', [ node6 ] )
+ source2 = [ node4, node5 ]
+ self.assertEqual(make_dafsa.reverse(source1), source2)
+
+ def testReverseAtomicTrie(self):
+ """Tests a reverse trie formed DAFSA can be reversed."""
+
+ # 'a' 'a'
+ # \ /
+ # 'c' => 'c'
+ # / \
+ # 'b' 'b'
+
+ node3 = ( 'c', [ None ] )
+ node2 = ( 'b', [ node3 ] )
+ node1 = ( 'a', [ node3 ] )
+ source1 = [ node1, node2 ]
+ node6 = ( 'b', [ None ] )
+ node5 = ( 'a', [ None ] )
+ node4 = ( 'c', [ node5, node6 ] )
+ source2 = [ node4 ]
+ self.assertEqual(make_dafsa.reverse(source1), source2)
+
+ def testDiamond(self):
+ """Tests we can reverse both edges and nodes in a diamond."""
+
+ # 'cd' 'dc'
+ # / \ / \
+ # 'ab' 'gh' => 'hg' 'ba'
+ # \ / \ /
+ # 'ef' 'fe'
+
+ node4 = ( 'gh', [ None ] )
+ node3 = ( 'ef', [ node4 ] )
+ node2 = ( 'cd', [ node4 ] )
+ node1 = ( 'ab', [ node2, node3 ] )
+ source1 = [ node1 ]
+ node8 = ( 'ba', [ None ] )
+ node7 = ( 'fe', [ node8 ] )
+ node6 = ( 'dc', [ node8 ] )
+ node5 = ( 'hg', [ node6, node7 ] )
+ source2 = [ node5 ]
+ self.assertEqual(make_dafsa.reverse(source1), source2)
+
+
+class TopSortTest(unittest.TestCase):
+ def testNode(self):
+ """Tests a DAFSA with one node can be sorted."""
+
+ # 'a' => [ 'a' ]
+
+ node1 = ( 'a', [ None ] )
+ source = [ node1 ]
+ nodes = [ node1 ]
+ self.assertEqual(make_dafsa.top_sort(source), nodes)
+
+ def testDiamond(self):
+ """Tests nodes in a diamond can be sorted."""
+
+ # 'b'
+ # / \
+ # 'a' 'd'
+ # \ /
+ # 'c'
+
+ node4 = ( 'd', [ None ] )
+ node3 = ( 'c', [ node4 ] )
+ node2 = ( 'b', [ node4 ] )
+ node1 = ( 'a', [ node2, node3 ] )
+ source = [ node1 ]
+ nodes = make_dafsa.top_sort(source)
+ self.assertLess(nodes.index(node1), nodes.index(node2))
+ self.assertLess(nodes.index(node2), nodes.index(node4))
+ self.assertLess(nodes.index(node3), nodes.index(node4))
+
+
+class EncodePrefixTest(unittest.TestCase):
+ def testChar(self):
+ """Tests to encode a single character prefix."""
+ label = 'a'
+ bytes = [ ord('a') ]
+ self.assertEqual(make_dafsa.encode_prefix(label), bytes)
+
+ def testChars(self):
+ """Tests to encode a multi character prefix."""
+ label = 'ab'
+ bytes = [ ord('b'), ord('a') ]
+ self.assertEqual(make_dafsa.encode_prefix(label), bytes)
+
+
+class EncodeLabelTest(unittest.TestCase):
+ def testChar(self):
+ """Tests to encode a single character label."""
+ label = 'a'
+ bytes = [ ord('a') + 0x80 ]
+ self.assertEqual(make_dafsa.encode_label(label), bytes)
+
+ def testChars(self):
+ """Tests to encode a multi character label."""
+ label = 'ab'
+ bytes = [ ord('b') + 0x80, ord('a') ]
+ self.assertEqual(make_dafsa.encode_label(label), bytes)
+
+
+class EncodeLinksTest(unittest.TestCase):
+ def testEndLabel(self):
+ """Tests to encode link to the sink."""
+ children = [ None ]
+ offsets = {}
+ bytes = 0
+ output = []
+ self.assertEqual(make_dafsa.encode_links(children, offsets, bytes),
+ output)
+
+ def testOneByteOffset(self):
+ """Tests to encode a single one byte offset."""
+ node = ( '', [ None ] )
+ children = [ node ]
+ offsets = { id(node) : 2 }
+ bytes = 5
+ output = [ 132 ]
+ self.assertEqual(make_dafsa.encode_links(children, offsets, bytes),
+ output)
+
+ def testOneByteOffsets(self):
+ """Tests to encode a sequence of one byte offsets."""
+ node1 = ( '', [ None ] )
+ node2 = ( '', [ None ] )
+ children = [ node1, node2 ]
+ offsets = { id(node1) : 2, id(node2) : 1 }
+ bytes = 5
+ output = [ 129, 5 ]
+ self.assertEqual(make_dafsa.encode_links(children, offsets, bytes),
+ output)
+
+ def testTwoBytesOffset(self):
+ """Tests to encode a single two byte offset."""
+ node = ( '', [ None ] )
+ children = [ node ]
+ offsets = { id(node) : 2 }
+ bytes = 1005
+ output = [ 237, 195]
+ self.assertEqual(make_dafsa.encode_links(children, offsets, bytes),
+ output)
+
+ def testTwoBytesOffsets(self):
+ """Tests to encode a sequence of two byte offsets."""
+ node1 = ( '', [ None ] )
+ node2 = ( '', [ None ] )
+ node3 = ( '', [ None ] )
+ children = [ node1, node2, node3 ]
+ offsets = { id(node1) : 1002, id(node2) : 2, id(node3) : 2002 }
+ bytes = 3005
+ output = [ 232, 195, 232, 67, 241, 67 ]
+ self.assertEqual(make_dafsa.encode_links(children, offsets, bytes),
+ output)
+
+ def testThreeBytesOffset(self):
+ """Tests to encode a single three byte offset."""
+ node = ( '', [ None ] )
+ children = [ node ]
+ offsets = { id(node) : 2 }
+ bytes = 100005
+ output = [ 166, 134, 225 ]
+ self.assertEqual(make_dafsa.encode_links(children, offsets, bytes),
+ output)
+
+ def testThreeBytesOffsets(self):
+ """Tests to encode a sequence of three byte offsets."""
+ node1 = ( '', [ None ] )
+ node2 = ( '', [ None ] )
+ node3 = ( '', [ None ] )
+ children = [ node1, node2, node3 ]
+ offsets = { id(node1) : 100002, id(node2) : 2, id(node3) : 200002 }
+ bytes = 300005
+ output = [ 160, 134, 225, 160, 134, 97, 172, 134, 97 ]
+ self.assertEqual(make_dafsa.encode_links(children, offsets, bytes),
+ output)
+
+ def testOneTwoThreeBytesOffsets(self):
+ """Tests to encode offsets of different sizes."""
+ node1 = ( '', [ None ] )
+ node2 = ( '', [ None ] )
+ node3 = ( '', [ None ] )
+ children = [ node1, node2, node3 ]
+ offsets = { id(node1) : 10003, id(node2) : 10002, id(node3) : 100002 }
+ bytes = 300005
+ output = [ 129, 143, 95, 97, 74, 13, 99 ]
+ self.assertEqual(make_dafsa.encode_links(children, offsets, bytes),
+ output)
+
+
+class ExamplesTest(unittest.TestCase):
+ def testExample1(self):
+ """Tests Example 1 from make_dafsa.py."""
+ infile = [ '%%', 'aa, 1', 'a, 2', '%%' ]
+ bytes = [ 0x81, 0xE1, 0x02, 0x81, 0x82, 0x61, 0x81 ]
+ outfile = make_dafsa.to_cxx(bytes)
+ self.assertEqual(make_dafsa.words_to_cxx(make_dafsa.parse_gperf(infile)),
+ outfile)
+
+ def testExample2(self):
+ """Tests Example 2 from make_dafsa.py."""
+ infile = [ '%%', 'aa, 1', 'bbb, 2', 'baa, 1', '%%' ]
+ bytes = [ 0x02, 0x83, 0xE2, 0x02, 0x83, 0x61, 0x61, 0x81, 0x62, 0x62,
+ 0x82 ]
+ outfile = make_dafsa.to_cxx(bytes)
+ self.assertEqual(make_dafsa.words_to_cxx(make_dafsa.parse_gperf(infile)),
+ outfile)
+
+
+if __name__ == '__main__':
+ unittest.main()