[79668b]: / tests / unit / str / test_str.py

Download this file

83 lines (65 with data), 2.8 kB

 1
 2
 3
 4
 5
 6
 7
 8
 9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
import docdeid as dd
from deduce.str import (
Acronimify,
FilterBasedOnLookupSet,
RemoveValues,
TakeLastToken,
TitleCase,
UpperCase,
UpperCaseFirstChar,
)
class TestStr:
def test_uppercase(self):
processor = UpperCase()
assert processor.process("test") == "TEST"
assert processor.process("Test") == "TEST"
assert processor.process("TEST") == "TEST"
assert processor.process("123") == "123"
assert processor.process("test_123") == "TEST_123"
def test_uppercase_first_char(self):
processor = UpperCaseFirstChar()
assert processor.process("test") == "Test"
assert processor.process("Test") == "Test"
assert processor.process("t") == "T"
assert processor.process("T") == "T"
assert processor.process("A3") == "A3"
assert processor.process("a3") == "A3"
def test_titlecase(self):
processor = TitleCase()
assert processor.process("test") == "Test"
assert processor.process("Test") == "Test"
assert processor.process("Test test") == "Test Test"
assert processor.process("t") == "T"
assert processor.process("T") == "T"
assert processor.process("T t") == "T T"
assert processor.process("A3") == "A3"
assert processor.process("a3") == "A3"
assert processor.process("a3 a4") == "A3 A4"
def test_take_last_token(self):
processor = TakeLastToken()
assert processor.process("test") == "test"
assert processor.process("dit is een test") == "test"
assert processor.process("") == ""
def test_remove_values(self):
processor = RemoveValues(filter_values=["de", "het", "een"])
assert processor.process("de boot") == "boot"
assert processor.process("debiet") == "debiet"
assert (
processor.process("van het Schip") == "vanSchip"
) # TODO Is this intended?
assert processor.process("nummer een") == "nummer"
def test_acronimify(self):
processor = Acronimify()
assert processor.process("Elizabeth Tweesteden Ziekenhuis") == "ETZ"
assert processor.process("Umcu") == "U"
assert processor.process("Universitair Medisch Centrum Utrecht") == "UMCU"
assert processor.process("universitair medisch centrum utrecht") == "umcu"
def test_filter_based_on_lookupset(self):
lookup_set = dd.ds.LookupSet()
lookup_set.add_items_from_iterable(["arts", "bakker", "slager"])
processor = FilterBasedOnLookupSet(filter_set=lookup_set)
assert processor.filter("")
assert processor.filter("visser")
assert not processor.filter("arts")
assert not processor.filter("bakker")
assert not processor.filter("slager")