tempgen.parsers.ods

View Source

from odf import opendocument, text, teletype, element, table
from tempgen.parsers.parser import AbstractParser

class Parser(AbstractParser):
    def parse(self, path, container, parse_entry, find_matches):
        doc = opendocument.load(path)
        paragraphs = doc.getElementsByType(text.P)
        for s in map(teletype.extractText, paragraphs):
            matches = find_matches(s)
            for match in matches:
                payload = parse_entry(match, path)
                container[payload['id']] = payload ## add check here for duplicates

    def replace(self, source_path, target_path, compute_match, replacements, update_external = False):
        doc = opendocument.load(source_path)
        for cell in doc.getElementsByType(table.TableCell):
            for paragraph in cell.getElementsByType(text.P):
                s = teletype.extractText(paragraph)
                local_to_replace = compute_match(s, {}, replacements, source_path, update_external)
                for match, value in local_to_replace.items():
                    if s.find(match) != -1:
                        s = s.replace(match, value)
                        paragraph._get_firstChild().data = s
                        while len(paragraph.childNodes) > 1:
                            try:
                                paragraph.removeChild(paragraph.lastChild)
                            except:
                                pass
        doc.save(target_path)

# class Parser(tempgen.parsers.parser.AbstractParser):

View Source

class Parser(AbstractParser):
    def parse(self, path, container, parse_entry, find_matches):
        doc = opendocument.load(path)
        paragraphs = doc.getElementsByType(text.P)
        for s in map(teletype.extractText, paragraphs):
            matches = find_matches(s)
            for match in matches:
                payload = parse_entry(match, path)
                container[payload['id']] = payload ## add check here for duplicates

    def replace(self, source_path, target_path, compute_match, replacements, update_external = False):
        doc = opendocument.load(source_path)
        for cell in doc.getElementsByType(table.TableCell):
            for paragraph in cell.getElementsByType(text.P):
                s = teletype.extractText(paragraph)
                local_to_replace = compute_match(s, {}, replacements, source_path, update_external)
                for match, value in local_to_replace.items():
                    if s.find(match) != -1:
                        s = s.replace(match, value)
                        paragraph._get_firstChild().data = s
                        while len(paragraph.childNodes) > 1:
                            try:
                                paragraph.removeChild(paragraph.lastChild)
                            except:
                                pass
        doc.save(target_path)

Helper class that provides a standard way to create an ABC using inheritance.

# Parser()

# def parse(self, path, container, parse_entry, find_matches):

View Source

    def parse(self, path, container, parse_entry, find_matches):
        doc = opendocument.load(path)
        paragraphs = doc.getElementsByType(text.P)
        for s in map(teletype.extractText, paragraphs):
            matches = find_matches(s)
            for match in matches:
                payload = parse_entry(match, path)
                container[payload['id']] = payload ## add check here for duplicates

Parse file accessible via path property

A general implementation of parse method should include following steps:

Open file
Read file data and transform it's meaningful content into string or an iterable of strings
Call of find_matches function on such strings, resulting in an array of matches
For each match found one should call parse_entry, resulting in an entry dictionary
For each entry use entry "id" property as key and payload as value to populate the container provided

Parameters

path (str): Absolute path to file to be parsed
container (Dict[str, [Dict[str, Any]]]): Dictionary to be populated with parsed entries, contains key-value pairs with entry id property as key and entry payload dictionary as value
parse_entry (callable): Function that extracts entry (current implementation uses json parse) from matching string, returns entry payload dictionary
find_matches (callable): Function that searches the entry string for matches (that is, {{VALID_JSON_OBJECT}} patterns), returns array of matching substrings

# def replace( self, source_path, target_path, compute_match, replacements, update_external=False ):

View Source

    def replace(self, source_path, target_path, compute_match, replacements, update_external = False):
        doc = opendocument.load(source_path)
        for cell in doc.getElementsByType(table.TableCell):
            for paragraph in cell.getElementsByType(text.P):
                s = teletype.extractText(paragraph)
                local_to_replace = compute_match(s, {}, replacements, source_path, update_external)
                for match, value in local_to_replace.items():
                    if s.find(match) != -1:
                        s = s.replace(match, value)
                        paragraph._get_firstChild().data = s
                        while len(paragraph.childNodes) > 1:
                            try:
                                paragraph.removeChild(paragraph.lastChild)
                            except:
                                pass
        doc.save(target_path)

Replace file contents

A general implementation of replace method should include following steps:

Open file accessible via source_path in read mode
Read file data and transform it so its text content becomes available for editing
For each string in obtained text call compute_match, it results in an dictionary with {{VALID_JSON_OBJECT}} patterns as keys and computed substitutions as values
For each match, value in the dictionary, replace match with value in text
Create file at target_path and write modified text

Parameters

source_path (str): Absolute path to file to be parsed
target_path (str): Absolute path to file to be generated
compute_match (callable): Function that
1. searches the entry string for matches (that is, {{VALID_JSON_OBJECT}} patterns)
2. finds entry id in replacements dictionary
3. populates to_replace dictionary parameter with "{{VALID_JSON_OBJECT}}" as key and replacement string as value
4. if update_external is True, it updates external resources with replacement string
5. returns to_replace dictionary
replacements (Dict[str, str]): Dictionary containing pairs of "{{VALID_JSON_OBJECT}}" keys and their replacements as values
update_external (bool, optional): Boolean, indicating whether external resources should be updated