Browse Source

Utils: latex-preprocessing twice faster, half the code

remotes/origin/split-songs
Guillaume Bouchard 15 years ago
committed by crep
parent
commit
7f155f16c4
  1. 34
      utils/latex-preprocessing.py

34
utils/latex-preprocessing.py

@ -1,21 +1,8 @@
#!/usr/bin/python #!/usr/bin/python
# -*- coding: utf-8 -*- # -*- coding: utf-8 -*-
import re
import glob import glob
import codecs
def replace_words(text, word_dic):
"""
take a text and <strong class="highlight">replace</strong> words
that match a key in a dictionary with the associated value,
return the changed text
"""
rc = re.compile('|'.join(map(re.escape, word_dic)))
def translate(match):
return word_dic[match.group(0)]
return rc.sub(translate, text)
# the dictionary has target_word:replacement_word pairs # the dictionary has target_word:replacement_word pairs
word_dic = { word_dic = {
#oe inclusion #oe inclusion
@ -51,13 +38,12 @@ word_dic = {
# Process song files # Process song files
songfiles = glob.glob('songs/*/*.sg') songfiles = glob.glob('songs/*/*.sg')
for file in songfiles: for filename in songfiles:
songfile = codecs.open(file, "r", "utf-8") with open(filename, 'r+') as songfile:
data = songfile.read().encode("utf-8") data = songfile.read()
data = replace_words(data, word_dic) for search, replace in word_dic.items():
songfile.close() data = data.replace(search, replace)
songfile = open(file, "w") songfile.seek(0)
songfile.write(data) songfile.write(data)
songfile.close() songfile.truncate()

Loading…
Cancel
Save