-
Notifications
You must be signed in to change notification settings - Fork 0
/
VocabularyFactory.py
53 lines (39 loc) · 1.22 KB
/
VocabularyFactory.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
from abc import ABC, abstractmethod
class VocabularyFactory:
    """Create vocabulary objects from a string type code."""

    @staticmethod
    def get_vocabulary(vocabulary_type):
        """Return a new vocabulary instance for ``vocabulary_type``.

        Recognized codes:

        * ``'0'`` -> ``CaseInsensitiveAlphabetChars``
        * ``'1'`` -> ``CaseSensitiveAlphabetChars``
        * ``'2'`` -> ``IsAlphaChars``

        The codes are compared as strings, so the integer ``0`` does not
        match ``'0'``. Any unrecognized value yields ``None``.
        """
        if vocabulary_type == '0':
            vocabulary = CaseInsensitiveAlphabetChars()
        elif vocabulary_type == '1':
            vocabulary = CaseSensitiveAlphabetChars()
        elif vocabulary_type == '2':
            vocabulary = IsAlphaChars()
        else:
            # Unknown code: callers receive None rather than an exception.
            vocabulary = None
        return vocabulary
class Vocabulary(ABC):
    """Abstract interface for a set of characters.

    Concrete subclasses must implement both methods below before they can
    be instantiated.
    """

    @abstractmethod
    def is_in_vocabulary(self, char):
        """Report whether ``char`` belongs to this vocabulary."""

    @abstractmethod
    def get_size(self):
        """Return the number of characters in this vocabulary."""
class CaseInsensitiveAlphabetChars(Vocabulary):
    """Vocabulary of the 26 ASCII lowercase letters ``a``-``z``.

    NOTE(review): despite the class name, uppercase letters are rejected
    by ``is_in_vocabulary``; presumably callers lowercase their input
    before checking - confirm against the call sites.
    """

    def is_in_vocabulary(self, char):
        """Return True when ``char`` is a single character in ``a``-``z``.

        ``ord`` raises ``TypeError`` if ``char`` is not exactly one
        character long.
        """
        return ord('a') <= ord(char) <= ord('z')

    def get_size(self):
        """Return the vocabulary size, which is always 26."""
        return ord('z') - ord('a') + 1
class CaseSensitiveAlphabetChars(Vocabulary):
    """Vocabulary of the 52 ASCII letters ``A``-``Z`` and ``a``-``z``."""

    def is_in_vocabulary(self, char):
        """Return True when ``char`` is a single ASCII letter of either case.

        ``ord`` raises ``TypeError`` if ``char`` is not exactly one
        character long.
        """
        code = ord(char)
        if ord('A') <= code <= ord('Z'):
            return True
        return ord('a') <= code <= ord('z')

    def get_size(self):
        """Return the vocabulary size: 26 uppercase plus 26 lowercase."""
        return 2 * 26
class IsAlphaChars(Vocabulary):
    """Vocabulary of every character for which ``str.isalpha()`` is true."""

    # Total number of Unicode code points: 17 planes of 2**16 code points
    # each (U+0000 through U+10FFFF), i.e. every value ``chr`` accepts.
    _CODE_POINT_COUNT = 17 * 2 ** 16

    # Cached result of get_size(); stays None until the first call.
    _alpha_count = None

    def is_in_vocabulary(self, char):
        """Return ``char.isalpha()`` for the given string."""
        return char.isalpha()

    def get_size(self):
        """Return how many code points satisfy ``str.isalpha()``.

        The count requires a scan of more than a million code points and
        cannot change while the process runs, so it is computed on the
        first call only and then reused by every instance. The value
        depends on the Unicode database bundled with the interpreter.
        """
        if IsAlphaChars._alpha_count is None:
            IsAlphaChars._alpha_count = sum(
                1
                for codepoint in range(self._CODE_POINT_COUNT)
                if chr(codepoint).isalpha()
            )
        return IsAlphaChars._alpha_count