mirror of https://github.com/patacrep/patacrep.git
Engine for LaTeX songbooks
http://www.patacrep.com
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
181 lines
6.1 KiB
181 lines
6.1 KiB
12 years ago
|
#!/usr/bin/python
|
||
|
# -*- coding: utf-8 -*-
|
||
11 years ago
|
|
||
|
"""Manage indexes.
|
||
|
|
||
|
Generate indexes files for the songbook compilation. This is a replacement for
|
||
|
the original makeindex program written in C that produces an index file (.sbx)
|
||
|
from a file generated by the latex compilation of the songbook (.sxd).
|
||
|
"""
|
||
12 years ago
|
|
||
12 years ago
|
from unidecode import unidecode
|
||
12 years ago
|
import locale
|
||
11 years ago
|
import re
|
||
|
import sys
|
||
12 years ago
|
|
||
11 years ago
|
from songbook_core.authors import processauthors
|
||
|
from songbook_core.plastex import simpleparse
|
||
12 years ago
|
|
||
11 years ago
|
EOL = "\n"
|
||
|
|
||
12 years ago
|
# Pattern set to ignore latex command in title prefix
|
||
11 years ago
|
KEYWORD_PATTERN = re.compile(r"^%(\w+)\s?(.*)$")
|
||
|
FIRST_LETTER_PATTERN = re.compile(r"^(?:\{?\\\w+\}?)*[^\w]*(\w)")
|
||
12 years ago
|
|
||
11 years ago
|
|
||
12 years ago
|
def sortkey(value):
|
||
|
'''
|
||
|
From a title, return something usable for sorting. It handles locale (but
|
||
12 years ago
|
don't forget to call locale.setlocale(locale.LC_ALL, '')). It also handles
|
||
|
the sort with latex escape sequences.
|
||
12 years ago
|
'''
|
||
12 years ago
|
return locale.strxfrm(unidecode(simpleparse(value).replace(' ', 'A')))
|
||
12 years ago
|
|
||
11 years ago
|
|
||
11 years ago
|
def process_sxd(filename):
|
||
11 years ago
|
"""Parse sxd file.
|
||
|
|
||
11 years ago
|
Return an Index object.
|
||
11 years ago
|
"""
|
||
11 years ago
|
index_file = open(filename)
|
||
12 years ago
|
data = []
|
||
11 years ago
|
for line in index_file:
|
||
12 years ago
|
data.append(line.strip())
|
||
11 years ago
|
index_file.close()
|
||
12 years ago
|
|
||
|
i = 1
|
||
11 years ago
|
idx = Index(data[0])
|
||
12 years ago
|
|
||
11 years ago
|
while len(data) > i and data[i].startswith('%'):
|
||
11 years ago
|
keywords = KEYWORD_PATTERN.match(data[i]).groups()
|
||
11 years ago
|
idx.keyword(keywords[0], keywords[1])
|
||
11 years ago
|
i += 1
|
||
12 years ago
|
|
||
11 years ago
|
idx.compile_keywords()
|
||
11 years ago
|
for i in range(i, len(data), 3):
|
||
11 years ago
|
entry = data[i:i + 3]
|
||
11 years ago
|
idx.add(entry[0], entry[1], entry[2])
|
||
12 years ago
|
|
||
12 years ago
|
return idx
|
||
|
|
||
11 years ago
|
|
||
11 years ago
|
class Index(object):
|
||
11 years ago
|
"""Title, author or scripture Index representation."""
|
||
11 years ago
|
|
||
12 years ago
|
def __init__(self, indextype):
|
||
12 years ago
|
self.data = dict()
|
||
|
self.keywords = dict()
|
||
11 years ago
|
self.prefix_patterns = []
|
||
|
self.authwords = {"after": [], "ignore": [], "sep": []}
|
||
12 years ago
|
if indextype == "TITLE INDEX DATA FILE":
|
||
|
self.indextype = "TITLE"
|
||
|
elif indextype == "SCRIPTURE INDEX DATA FILE":
|
||
|
self.indextype = "SCRIPTURE"
|
||
|
elif indextype == "AUTHOR INDEX DATA FILE":
|
||
|
self.indextype = "AUTHOR"
|
||
|
else:
|
||
|
self.indextype = ""
|
||
12 years ago
|
|
||
11 years ago
|
@staticmethod
|
||
|
def filter(key):
|
||
|
letter = FIRST_LETTER_PATTERN.match(key).group(1)
|
||
|
if re.match(r'\d', letter):
|
||
12 years ago
|
letter = '0-9'
|
||
|
return (letter.upper(), key)
|
||
|
|
||
|
def keyword(self, key, word):
|
||
11 years ago
|
if not key in self.keywords.keys():
|
||
12 years ago
|
self.keywords[key] = []
|
||
|
self.keywords[key].append(word)
|
||
|
|
||
11 years ago
|
def compile_keywords(self):
|
||
12 years ago
|
if self.indextype == "TITLE":
|
||
|
if 'prefix' in self.keywords:
|
||
|
for prefix in self.keywords['prefix']:
|
||
11 years ago
|
self.prefix_patterns.append(re.compile(
|
||
|
r"^({prefix})(\b|\\)(\s*.*)$".format(prefix=prefix)
|
||
|
))
|
||
12 years ago
|
|
||
|
if self.indextype == "AUTHOR":
|
||
|
for key in self.keywords:
|
||
|
if key in self.authwords:
|
||
|
self.authwords[key] = self.keywords[key]
|
||
|
for word in self.authwords.keys():
|
||
|
if word in self.keywords:
|
||
|
if word == "after":
|
||
11 years ago
|
self.authwords[word] = [
|
||
|
re.compile(r"^.*{after}\b(.*)".format(after=after))
|
||
|
for after in self.keywords[word]
|
||
|
]
|
||
12 years ago
|
elif word == "sep":
|
||
11 years ago
|
self.authwords[word] = [" {sep}".format(sep=sep)
|
||
|
for sep in self.authwords[word]
|
||
|
] + [","]
|
||
|
self.authwords[word] = [
|
||
|
re.compile(r"^(.*){sep} (.*)$".format(sep=sep))
|
||
|
for sep in self.authwords[word]
|
||
|
]
|
||
12 years ago
|
else:
|
||
|
self.authwords[word] = self.keywords[word]
|
||
|
|
||
|
def _raw_add(self, key, number, link):
|
||
12 years ago
|
(first, key) = self.filter(key)
|
||
11 years ago
|
if not first in self.data.keys():
|
||
12 years ago
|
self.data[first] = dict()
|
||
11 years ago
|
if not key in self.data[first].keys():
|
||
12 years ago
|
self.data[first][key] = []
|
||
11 years ago
|
self.data[first][key].append({'num': number, 'link': link})
|
||
12 years ago
|
|
||
12 years ago
|
def add(self, key, number, link):
|
||
|
if self.indextype == "TITLE":
|
||
|
# Removing prefixes before titles
|
||
|
for pattern in self.prefix_patterns:
|
||
|
match = pattern.match(key)
|
||
|
if match:
|
||
|
self._raw_add(
|
||
11 years ago
|
"{} ({})".format(
|
||
|
match.group(2) + match.group(3),
|
||
|
match.group(1)),
|
||
|
number, link)
|
||
12 years ago
|
return
|
||
|
self._raw_add(key, number, link)
|
||
|
|
||
|
if self.indextype == "AUTHOR":
|
||
|
# Processing authors
|
||
|
for author in processauthors(
|
||
|
key,
|
||
|
**self.authwords):
|
||
|
self._raw_add(author, number, link)
|
||
|
|
||
11 years ago
|
@staticmethod
|
||
|
def ref_to_str(ref):
|
||
11 years ago
|
if sys.version_info >= (2, 6):
|
||
11 years ago
|
return r'\hyperlink{{{0[link]}}}{{{0[num]}}}'.format(ref)
|
||
12 years ago
|
else:
|
||
11 years ago
|
return r'\hyperlink{%(link)s}{%(num)s}' % ref
|
||
12 years ago
|
|
||
11 years ago
|
def entry_to_str(self, key, entry):
|
||
11 years ago
|
if sys.version_info >= (2, 6):
|
||
11 years ago
|
return unicode(r'\idxentry{{{0}}}{{{1}}}' + EOL).format(
|
||
|
key,
|
||
|
r'\\'.join([self.ref_to_str(ref) for ref in entry]),
|
||
|
)
|
||
12 years ago
|
else:
|
||
11 years ago
|
return unicode(r'\idxentry{%s}{%s}' + EOL) % (
|
||
|
key,
|
||
|
r'\\'.join([self.ref_to_str(ref) for ref in entry]),
|
||
|
)
|
||
12 years ago
|
|
||
11 years ago
|
def idxblock_to_str(self, letter, entries):
|
||
11 years ago
|
string = r'\begin{idxblock}{' + letter + '}' + EOL
|
||
12 years ago
|
for key in sorted(entries.keys(), key=sortkey):
|
||
11 years ago
|
string += self.entry_to_str(key, entries[key])
|
||
11 years ago
|
string += r'\end{idxblock}' + EOL
|
||
11 years ago
|
return string
|
||
12 years ago
|
|
||
11 years ago
|
def entries_to_str(self):
|
||
11 years ago
|
string = ""
|
||
12 years ago
|
for letter in sorted(self.data.keys()):
|
||
11 years ago
|
string += self.idxblock_to_str(letter, self.data[letter])
|
||
11 years ago
|
return string
|