forked from TorahBibleCodes/TorahBibleCodes
-
Notifications
You must be signed in to change notification settings - Fork 0
/
mod_3BTextFileParse.py
82 lines (53 loc) · 2.51 KB
/
mod_3BTextFileParse.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
## IMPORT MODULES
import re
## FUNCTION () #3B - TEXT FILE PARSE
def fn_TextFileParse(JSONString):
    """
    ## MODULE.FUNCTION() #3B - TEXT FILE PARSE ## RETURNS TextParsedWithSpaces, TextParsedNoSpaces

    Clean a text string and return it in two forms: with and without spaces.

    Processing steps, in order:
      1. Every Hebrew maqaf (U+05BE) is replaced by a single space, so the
         two joined words stay separated in the "with spaces" result.
      2. Every "[...]" span is deleted, brackets included. The match is
         non-greedy, and "." does not match a newline, so a bracketed span
         that crosses a line break is left untouched.
      3. Every zero-width joiner (U+200D) is deleted.
      4. For the second result only, every ASCII space (U+0020) is deleted.
         Other whitespace (tabs, newlines, ...) is kept.

    Side effect: prints begin/end marker lines to stdout.

    Args:
        JSONString (str): The text to clean. Must be a str, since
            str.replace and re.sub are applied to it.

    Returns:
        tuple: (TextParsedWithSpaces, TextParsedNoSpaces), both str.
    """
    ## TEST PRINT OUTPUT
    print("\n")  ## PRINT SPACE
    print("WITHIN FUNCTION: BEGIN FUNCTION #3B TEXT FILE PARSE")

    ## BEGIN TEXT FILE PARSE

    ## REPLACE EACH MAQAF (HEBREW HYPHEN) WITH A SPACE
    TextNoHyphensWithSpaces = JSONString.replace("־", " ")

    ## REMOVE BRACKETS AND CONTENTS WITHIN BRACKETS FROM STRING
    ## RAW STRING: "\[" AND "\]" ARE INVALID ESCAPES IN A NORMAL STRING LITERAL
    TextNoBracketsWithSpaces = re.sub(r"\[.*?\]", "", TextNoHyphensWithSpaces)

    ## REMOVE ZERO-WIDTH JOINERS (U+200D) - 1ST GOOD ISSUE ON GITHUB
    TextNoBracketsWithSpaces = TextNoBracketsWithSpaces.replace("\u200D", "")

    ## REMOVE WHITE SPACES FROM STRING (ASCII SPACE ONLY)
    TextNoSpaces = TextNoBracketsWithSpaces.replace(" ", "")

    ## END TEXT FILE PARSE

    ## CHANGE VARIABLE NAMES
    TextParsedWithSpaces = TextNoBracketsWithSpaces
    TextParsedNoSpaces = TextNoSpaces

    ## TEST PRINT OUTPUT
    print("\n")  ## PRINT SPACE
    print("WITHIN FUNCTION: END FUNCTION #3B - TEXT FILE PARSE")

    ## RETURN VARIABLES TO PROGRAM - RETURNS TUPLE OF TWO STRINGS: 1.) WITH SPACES; 2.) WITH NO SPACES
    return (TextParsedWithSpaces, TextParsedNoSpaces)
## END FUNCTION () #3B - TEXT FILE PARSE