Source code for ly.docinfo

# This file is part of python-ly, https://pypi.python.org/pypi/python-ly
#
# Copyright (c) 2013 - 2015 by Wilbert Berendsen
#
# This program is free software; you can redistribute it and/or
# modify it under the terms of the GNU General Public License
# as published by the Free Software Foundation; either version 2
# of the License, or (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
# See http://www.gnu.org/licenses/ for more information.

"""
Harvest information from a ly.document.DocumentBase instance.

"""

from __future__ import unicode_literals
from __future__ import absolute_import

import re
import collections
import functools
import itertools

import ly.lex.lilypond
import ly.pitch


def _cache(func):
    """Simple decorator caching the return value of a function."""
    @functools.wraps(func)
    def wrapper(self):
        try:
            return self._cache_[func]
        except AttributeError:
            self._cache_ = {}
        except KeyError:
            pass
        result = self._cache_[func] = func(self)
        return result
    return wrapper


[docs]class DocInfo(object): """Harvest information from a ly.document.DocumentBase instance. All tokens are saved in the tokens attribute as a tuple. Newline tokens are added between all lines. All corresponding classes are in the classes attribute as a tuple. This makes quick search and access possible. The tokens are requested from the document using the tokens_with_position() method, so you can always locate them back in the original document using their pos attribute. DocInfo does not update when the document changes, you should just instantiate a new one. """ def __init__(self, doc): """Initialize with ly.document.DocumentBase instance.""" self._d = doc blocks = iter(doc) for b in blocks: tokens = doc.tokens_with_position(b) self.tokens = sum(map( lambda b: ((ly.lex.Newline('\n', doc.position(b) - 1),) + doc.tokens_with_position(b)), blocks), tokens) self.classes = tuple(map(type, self.tokens)) @property def document(self): return self._d
[docs] def range(self, start=0, end=None): """Return a new instance of the DocInfo class for the selected range. Only the tokens completely contained within the range start..end are added to the new instance. This can be used to perform fast searches on a subset of a document. """ if start == 0 and end is None: return self lo = 0 hi = len(self.tokens) while lo < hi: mid = (lo + hi) // 2 if start > self.tokens[mid].pos: lo = mid + 1 else: hi = mid start = lo if end is not None: lo = 0 hi = len(self.tokens) while lo < hi: mid = (lo + hi) // 2 if end < self.tokens[mid].pos: hi = mid else: lo = mid + 1 end = lo - 1 s = slice(start, end) n = type(self).__new__(type(self)) n._d = self._d n.tokens = self.tokens[s] n.classes = self.classes[s] return n
[docs] @_cache def mode(self): """Return the mode, e.g. "lilypond".""" return self._d.initial_state().mode()
[docs] def find(self, token=None, cls=None, pos=0, endpos=-1): """Return the index of the first specified token and/or class after pos. If token is None, the cls should be specified. If cls is given, the token should be an instance of the specified class. If endpos is given, never searches beyond endpos. Returns -1 if the token is not found. """ if token is None: try: return self.classes.index(cls, pos, endpos) except ValueError: return -1 elif cls is None: try: return self.tokens.index(token, pos, endpos) except ValueError: return -1 else: while True: try: i = self.tokens.index(token, pos, endpos) except ValueError: return -1 if cls == self.classes[i]: return i pos = i + 1
[docs] def find_all(self, token=None, cls=None, pos=0, endpos=-1): """Yield all indices of the first specified token and/or class after pos. If token is None, the cls should be specified. If cls is given, the token should be an instance of the specified class. If endpos is given, never searches beyond endpos. Returns -1 if the token is not found. """ while True: i = self.find(token, cls, pos, endpos) if i == -1: break yield i pos = i + 1
[docs] @_cache def version_string(self): r"""Return the version as a string, e.g. "2.19.8". Looks for the \version LilyPond command. The string is returned without quotes. Returns None if there was no \version command found. """ i = self.find("\\version", ly.lex.lilypond.Keyword) if i != -1: tokens = iter(self.tokens[i+1:i+10]) for t in tokens: if not isinstance(t, (ly.lex.Space, ly.lex.Comment)): if t == '"': pred = lambda t: t != '"' else: pred = lambda t: not isinstance(t, (ly.lex.Space, ly.lex.Comment)) return ''.join(itertools.takewhile(pred, tokens))
[docs] @_cache def version(self): """Return the version_string() as a tuple of ints, e.g. (2, 16, 2).""" version = self.version_string() if version: return tuple(map(int, re.findall(r"\d+", version))) return ()
[docs] @_cache def include_args(self): r"""The list of \include command arguments.""" result = [] for i in self.find_all("\\include", ly.lex.lilypond.Keyword): tokens = iter(self.tokens[i+1:i+10]) for token in tokens: if not isinstance(token, (ly.lex.Space, ly.lex.Comment)): if token == '"': result.append(''.join(itertools.takewhile(lambda t: t != '"', tokens))) break return result
[docs] @_cache def scheme_load_args(self): """The list of scheme (load) command arguments.""" result = [] for i in self.find_all("load", ly.lex.scheme.Keyword): tokens = iter(self.tokens[i+1:i+10]) for token in tokens: if not isinstance(token, (ly.lex.Space, ly.lex.Comment)): if token == '"': result.append(''.join(itertools.takewhile(lambda t: t != '"', tokens))) break return result
[docs] @_cache def output_args(self): r"""The list of arguments of constructs defining the name of output documents. This looks at the \bookOutputName, \bookOutputSuffix and define output-suffix commands. Every argument is a two tuple(type, argument) where type is either "suffix" or "name". """ result = [] for arg_type, cmd, cls in ( ("suffix", "output-suffix", ly.lex.scheme.Word), ("suffix", "\\bookOutputSuffix", ly.lex.lilypond.Command), ("name", "\\bookOutputName", ly.lex.lilypond.Command), ): for i in self.find_all(cmd, cls): tokens = iter(self.tokens[i+1:i+6]) for t in tokens: if t == '"': arg = ''.join(itertools.takewhile(lambda t: t != '"', tokens)) result.append((arg_type, arg)) break elif isinstance(t, ly.lex.lilypond.Name): result.append((arg_type, format(t))) elif isinstance(t, (ly.lex.lilypond.SchemeStart, ly.lex.Space, ly.lex.Comment)): continue break return result
[docs] @_cache def definitions(self): """The list of LilyPond identifiers the document defines.""" result = [] for i in self.find_all(None, ly.lex.lilypond.Name): if i == 0 or self.tokens[i-1] == '\n': result.append(self.tokens[i]) return result
[docs] @_cache def markup_definitions(self): """The list of markup command definitions in the document.""" result = [] # find bla = \markup { .. } for i in self.find_all(None, ly.lex.lilypond.Name): if i == 0 or self.tokens[i-1] == '\n': for t in self.tokens[i+1:i+6]: if t == "\\markup": result.append(self.tokens[i]) elif t == "=" or t.isspace(): continue break # find #(define-markup-command construction for i in self.find_all('define-markup-command', ly.lex.scheme.Function): for t in self.tokens[i+1:i+6]: if isinstance(t, ly.lex.scheme.Word): result.append(t) break result.sort(key=lambda t: t.pos) return result
[docs] @_cache def language(self): """The pitch language, None if not set in the document.""" languages = ly.pitch.pitchInfo.keys() for i in self.find_all("\\language", ly.lex.lilypond.Keyword): for t in self.tokens[i+1:i+10]: if isinstance(t, ly.lex.Space): continue elif t == '"': continue if t in languages: return t for n in self.include_args(): lang = n.rsplit('.', 1)[0] if lang in languages: return lang
[docs] @_cache def global_staff_size(self): """The global-staff-size, if set, else None.""" i = self.find('set-global-staff-size', ly.lex.scheme.Function) if i != -1: try: return int(self.tokens[i+2]) except (IndexError, ValueError): pass
[docs] @_cache def token_hash(self): """Return an integer hash for all non-whitespace and non-comment tokens. This hash does not change when only comments or whitespace are changed. """ return hash(tuple(t for t in self.tokens if not isinstance(t, (ly.lex.Space, ly.lex.Comment))))
[docs] @_cache def complete(self): """Return whether the document is probably complete and could be compilable.""" return self._d.state_end(self._d[len(self._d)-1]).depth() == 1
[docs] @_cache def has_output(self): """Return True when the document probably generates output. I.e. has notes, rests, markup or other output-generating commands. """ for t, c in ( (None, ly.lex.lilypond.MarkupStart), (None, ly.lex.lilypond.Note), (None, ly.lex.lilypond.Rest), ('\\include', ly.lex.lilypond.Keyword), (None, ly.lex.lilypond.LyricMode), ): for i in self.find_all(t, c): return True return False
[docs] def count_tokens(self, cls): """Return the number of tokens that are (a subclass) of the specified class. If you only want the number of instances of the exact class (not a subclass of) you can use info.classes.count(cls), where info is a DocInfo instance. """ return sum([issubclass(c, cls) for c in self.classes], False)
[docs] def counted_tokens(self): """Return a dictionary mapping classes to the number of instances of that class.""" return collections.Counter(self.classes)