-
Notifications
You must be signed in to change notification settings - Fork 113
Expand file tree
/
Copy pathxlnet_utils_test.py
More file actions
100 lines (80 loc) · 3.06 KB
/
xlnet_utils_test.py
File metadata and controls
100 lines (80 loc) · 3.06 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
# Copyright 2019 The Texar Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""
Unit tests for XLNet model utils.
"""
import unittest
import torch
from texar.torch.modules.pretrained.xlnet_utils import *
class XLNetModelUtilsTest(unittest.TestCase):
    r"""Unit tests for the XLNet model utility modules
    (:class:`PositionWiseFF`, :class:`RelativeMultiheadAttention`,
    :class:`RelativePositionalEncoding`).
    """

    def test_PositionWiseFF(self):
        r"""Checks that the feed-forward block preserves the input shape
        for default and custom hyperparameters.
        """
        # Case 1: default hyperparameters — output keeps (batch, hidden_dim).
        ffn = PositionWiseFF()
        batch = torch.rand(32, ffn._hparams.hidden_dim)
        self.assertEqual(
            ffn(batch).shape,
            torch.Size([32, ffn._hparams.hidden_dim]))

        # Case 2: custom dimensions with ReLU activation.
        custom_hparams = {
            "hidden_dim": 16,
            "ffn_inner_dim": 32,
            "dropout": 0.1,
            "activation": 'relu',
        }
        ffn = PositionWiseFF(hparams=custom_hparams)
        self.assertEqual(ffn(torch.rand(32, 16)).shape, torch.Size([32, 16]))

        # Case 3: same dimensions, GELU activation.
        custom_hparams = {
            "hidden_dim": 16,
            "ffn_inner_dim": 32,
            "dropout": 0.1,
            "activation": 'gelu',
        }
        ffn = PositionWiseFF(hparams=custom_hparams)
        self.assertEqual(ffn(torch.rand(32, 16)).shape, torch.Size([32, 16]))

    def test_RelativeMultiheadAttention(self):
        r"""Checks output shapes of the relative multi-head attention
        module when only the content stream is provided.
        """
        attn = RelativeMultiheadAttention()
        hidden = attn._hparams.hidden_dim
        content_states = torch.rand(16, 32, hidden)
        rel_pos_embed = torch.rand(24, 32, hidden)
        out_content, out_query = attn(
            states_h=content_states, pos_embed=rel_pos_embed)
        # Content-stream output mirrors the input shape; with no query
        # stream supplied, the second output is None.
        self.assertEqual(out_content.shape, torch.Size([16, 32, hidden]))
        self.assertEqual(out_query, None)

    def test_RelativePositionalEncoding(self):
        r"""Checks the positional-embedding length for bidirectional
        (default) and unidirectional attention types.
        """
        batch_size = 16
        seq_len = 8
        total_len = 32

        # Case 1: default (bidirectional) attention.
        encoder = RelativePositionalEncoding()
        embeddings = encoder(batch_size=batch_size,
                             seq_len=seq_len,
                             total_len=total_len)
        self.assertEqual(embeddings.shape,
                         torch.Size([40, 16, encoder._hparams.dim]))

        # Case 2: unidirectional attention yields a shorter position range.
        encoder = RelativePositionalEncoding()
        embeddings = encoder(batch_size=batch_size,
                             seq_len=seq_len,
                             total_len=total_len,
                             attn_type='uni')
        self.assertEqual(embeddings.shape,
                         torch.Size([33, 16, encoder._hparams.dim]))
# Run the test suite when this file is executed directly as a script.
if __name__ == "__main__":
    unittest.main()