This repository has been archived by the owner on Oct 21, 2024. It is now read-only.
-
Notifications
You must be signed in to change notification settings - Fork 4
/
Copy path: instructions_util_test.py
123 lines (103 loc) · 4.12 KB
/
instructions_util_test.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
# coding=utf-8
# Copyright 2023 The Google Research Authors.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""Test for utility library of instructions."""
from absl.testing import absltest
from absl.testing import parameterized
import instructions_util
class InstructionsUtilTest(parameterized.TestCase):
  """Unit tests for the text helpers exposed by `instructions_util`."""

  # Each word-count fixture is a (text, expected number of words) pair.
  TEST_WORD_COUNT_CASE_1 = ("word1, word2, word3, word4.", 4)

  TEST_WORD_COUNT_CASE_2 = (
      """
Bard can you tell me which is the best optimization method for the
transition from an hydro-thermal system to an hydro-renewables system""",
      24)

  # The expected total here treats the hyphenated token as two words.
  TEST_WORD_COUNT_CASE_3 = (
      """
Hyphenated-word has two word counts.
""", 6)

  def test_word_count(self):
    """Checks `count_words` on each word-count fixture in its own subtest."""
    word_count_cases = (
        self.TEST_WORD_COUNT_CASE_1,
        self.TEST_WORD_COUNT_CASE_2,
        self.TEST_WORD_COUNT_CASE_3,
    )
    for text, expected_num_words in word_count_cases:
      # The fixture text doubles as the subtest label so a failure report
      # identifies the offending input.
      with self.subTest(text):
        self.assertEqual(
            expected_num_words, instructions_util.count_words(text)
        )

  @parameterized.named_parameters(
      [
          {  # pylint: disable=g-complex-comprehension
              "testcase_name": (
                  f"_response={response}_num_sentences={num_sentences}"
              ),
              "response": response,
              "num_sentences": num_sentences,
          }
          for response, num_sentences in (
              ("xx,x. xx,x! xx/x. x{x}x? x.", 5),
              ("xx,x! xxxx. x(x)x?", 3),
              ("xxxx. xx,x! xx|x. x&x x?", 4),
              ("xx-x]xx,x! x{x}xx,x.", 2),
          )
      ]
  )
  def test_count_sentences(self, response, num_sentences):
    """Checks that `count_sentences` reports the expected sentence total.

    Args:
      response: Text handed to `count_sentences`.
      num_sentences: Number of sentences expected for `response`.
    """
    self.assertEqual(
        num_sentences, instructions_util.count_sentences(response)
    )

  # Passages fed to the sentence splitter. Continuation lines start at column
  # zero on purpose: the leading whitespace would become part of the string.
  TEST_SENTENCE_SPLIT_1 = """
Google is a technology company. It was founded in 1998 by Larry Page
and Sergey Brin. Google's mission is to organize the world's information
and make it universally accessible and useful.
"""

  TEST_SENTENCE_SPLIT_2 = """
The U.S.A has many Ph.D. students. They will often haven a .com website
sharing the research that they have done.
"""

  # Expected splitter output for the two passages above, in matching order.
  EXPECTED_SENTENCE_SPLIT_1 = [
      "Google is a technology company.",
      "It was founded in 1998 by Larry Page and Sergey Brin.",
      (
          "Google's mission is to organize the world's information and make it"
          " universally accessible and useful."
      ),
  ]

  EXPECTED_SENTENCE_SPLIT_2 = [
      "The U.S.A has many Ph.D. students.",
      (
          "They will often haven a .com website sharing the research that they"
          " have done."
      ),
  ]

  def test_sentence_splitter(self):
    """Checks `split_into_sentences` output for both sample passages."""
    # Split every passage first, then compare, so both calls run before any
    # assertion can fail.
    actual_splits = [
        instructions_util.split_into_sentences(passage)
        for passage in (self.TEST_SENTENCE_SPLIT_1, self.TEST_SENTENCE_SPLIT_2)
    ]
    self.assertEqual(self.EXPECTED_SENTENCE_SPLIT_1, actual_splits[0])
    self.assertEqual(self.EXPECTED_SENTENCE_SPLIT_2, actual_splits[1])

  def test_generate_keywords(self):
    """Checks that `generate_keywords` yields as many items as requested."""
    num_keywords = 10
    keywords = instructions_util.generate_keywords(num_keywords)
    self.assertLen(keywords, num_keywords)
# Invoke absltest.main() only when this file is executed directly as a script,
# not when it is imported as a module.
if __name__ == "__main__":
  absltest.main()