File size: 1,949 Bytes
d916065
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
import unittest

from nltk.metrics import (
    BigramAssocMeasures,
    QuadgramAssocMeasures,
    TrigramAssocMeasures,
)

# Tests for the likelihood ratio association measure.

# Absolute tolerance handed to ``assertAlmostEqual`` (as ``delta``) for the
# floating-point score comparisons in the tests below.
_DELTA = 1e-8


class TestLikelihoodRatio(unittest.TestCase):
    """Exercise ``likelihood_ratio`` on the bigram, trigram and quadgram measures.

    Every test follows the same three steps: compare one call against a
    pinned reference score, compare a second call against ``0.0``, and
    finally check that a third argument combination raises ``ValueError``.
    Float comparisons use the module-level ``_DELTA`` tolerance.
    """

    def test_lr_bigram(self):
        # Pinned reference score.
        score = BigramAssocMeasures.likelihood_ratio(2, (4, 4), 20)
        self.assertAlmostEqual(score, 2.4142743368419755, delta=_DELTA)

        # Case expected to score zero.
        score = BigramAssocMeasures.likelihood_ratio(1, (1, 1), 1)
        self.assertAlmostEqual(score, 0.0, delta=_DELTA)

        # Arguments the measure is expected to reject.
        with self.assertRaises(ValueError):
            BigramAssocMeasures.likelihood_ratio(0, (2, 2), 2)

    def test_lr_trigram(self):
        # Pinned reference score.
        score = TrigramAssocMeasures.likelihood_ratio(1, (1, 1, 1), (1, 1, 1), 2)
        self.assertAlmostEqual(score, 5.545177444479562, delta=_DELTA)

        # Case expected to score zero.
        score = TrigramAssocMeasures.likelihood_ratio(1, (1, 1, 1), (1, 1, 1), 1)
        self.assertAlmostEqual(score, 0.0, delta=_DELTA)

        # Arguments the measure is expected to reject.
        with self.assertRaises(ValueError):
            TrigramAssocMeasures.likelihood_ratio(1, (1, 1, 2), (1, 1, 2), 2)

    def test_lr_quadgram(self):
        # Pinned reference score.
        score = QuadgramAssocMeasures.likelihood_ratio(
            1, (1, 1, 1, 1), (1, 1, 1, 1, 1, 1), (1, 1, 1, 1), 2
        )
        self.assertAlmostEqual(score, 8.317766166719343, delta=_DELTA)

        # Case expected to score zero.
        score = QuadgramAssocMeasures.likelihood_ratio(
            1, (1, 1, 1, 1), (1, 1, 1, 1, 1, 1), (1, 1, 1, 1), 1
        )
        self.assertAlmostEqual(score, 0.0, delta=_DELTA)

        # Arguments the measure is expected to reject.
        with self.assertRaises(ValueError):
            QuadgramAssocMeasures.likelihood_ratio(
                1, (1, 1, 1, 1), (1, 1, 1, 1, 1, 2), (1, 1, 1, 1), 1
            )