36 lines
1.1 KiB
Python
36 lines
1.1 KiB
Python
import re
|
||
|
||
inputFile = 'berean_accented.csv'
|
||
outputFile = 'berean_unaccented.csv'
|
||
|
||
f = open(inputFile,'r')
|
||
newData = f.read()
|
||
f.close()
|
||
|
||
# Greek unicode characters
|
||
|
||
searchReplace = (
|
||
('[ἀἄᾄἂἆἁἅᾅἃάᾴὰᾶᾷᾳ]', 'α'),
|
||
('[ἈἌἎἉἍἋ]', 'Α'),
|
||
('[ἐἔἑἕἓέὲ]', 'ε'),
|
||
('[ἘἜἙἝἛ]', 'Ε'),
|
||
('[ἠἤᾔἢἦᾖᾐἡἥἣἧᾗᾑήῄὴῆῇῃ]', 'η'),
|
||
('[ἨἬἪἮἩἭἫ]', 'Η'),
|
||
('[ἰἴἶἱἵἳἷίὶῖϊΐῒ]', 'ι'),
|
||
('[ἸἼἹἽ]', 'Ι'),
|
||
('[ὀὄὂὁὅὃόὸ]', 'ο'),
|
||
('[ὈὌὉὍὋ]', 'Ο'),
|
||
('[ῥ]', 'ρ'),
|
||
('[Ῥ]', 'Ρ'),
|
||
('[ὐὔὒὖὑὕὓὗύὺῦϋΰῢ]', 'υ'),
|
||
('[ὙὝὟ]', 'Υ'),
|
||
('[ὠὤὢὦᾠὡὥὧᾧώῴὼῶῷῳ]', 'ω'),
|
||
('[ὨὬὪὮὩὭὯ]', 'Ω'),
|
||
("[\-\—\,\;\:\\\?\.\·\·\'\‘\’\‹\›\“\”\«\»\(\)\[\]\{\}\⧼\⧽\〈\〉\*\‿\᾽\⇔\¦]", ""),
|
||
)
|
||
for search, replace in searchReplace:
|
||
newData = re.sub(search, replace, newData)
|
||
|
||
f = open(outputFile,'w')
|
||
f.write(newData)
|
||
f.close() |