Index: Friedrich-Nietzsche-late-work-ontology.ttl
===================================================================
--- Friedrich-Nietzsche-late-work-ontology.ttl	(revision 113)
+++ Friedrich-Nietzsche-late-work-ontology.ttl	(revision 114)
@@ -1,167 +1,188 @@
 @prefix dct: <http://purl.org/dc/terms/>.
 @prefix document: <https://www.e-editiones.ch/ontology/document#>.
 @prefix homotypic: <http://www.nie.org/ontology/homotypic#>.
 @prefix stoff: <http://www.nie.org/ontology/standoff#>.
 @prefix text: <http://www.e-editiones.ch/ontology/text#>.
 @prefix owl: <http://www.w3.org/2002/07/owl#>.
 @prefix rdfs: <http://www.w3.org/2000/01/rdf-schema#>.
 @prefix rdf: <http://www.w3.org/1999/02/22-rdf-syntax-ns#> .
 @prefix skos: <http://www.w3.org/2004/02/skos/core#> .
 @prefix xsd: <http://www.w3.org/2001/XMLSchema#>.
+@prefix information-carrier: <http://e-editiones.ch/ontology/information-carrier#>.
 
 @prefix tln: <http://www.nie.org/ontology/nietzsche#>.
 
 <http://www.nie.org/ontology/nietzsche>
 	a owl:Ontology;
 	dct:license <http://creativecommons.org/licenses/by/3.0/>;
 	dct:title "An ontology about the collected late works of Friedrich Nietzsche"@en;
 	dct:description """Formal description of specific concepts in the scientific study of Friedrich Nietzsches late work."""@en;
 	dct:creator "Dominique Steinbach, tool coordinator/software developer, NIE-INE/digital edition of der späte Nietzsche, Basel University, Switzerland"@en;
 	dct:contributor "Christian Steiner, software developer, digital edition of der späte Nietzsche, University of Basel, Switzerland"@en;
    dct:publisher "Basel University, Switzerland"@en.
 
+tln:Leaf a owl:Class ;
+    rdfs:subClassOf information-carrier:Leaf ;
+    rdfs:label "leaf"@en, "Blatt"@de;
+    rdfs:comment """Sheet of a writable substance, e.g. paper, parchment, treated plant leaf."""@en ;
+    rdfs:isDefinedBy <http://www.nie.org/ontology/nietzsche> .
+
 tln:TextGenesis a owl:Class ;
     rdfs:label "identifies a genetic order of text versions"@en ;
     rdfs:comment "Identifies a genetic order of text versions, i.e. groups text units as earlier and later versions of each other."@en ;
     rdfs:isDefinedBy <http://www.nie.org/ontology/nietzsche> .
    
 tln:IdentifiedTextVersion a owl:Class ;
     rdfs:label "identifies a list of text unities as a text version"@en ;
     rdfs:comment "Identification of a list of text unities (e.g. pages or parts of pages) as a text version for which there is an earlier or later version."@en ;
     rdfs:isDefinedBy <http://www.nie.org/ontology/nietzsche> .
 
 tln:PartOfPageTextUnit a owl:Class ;
     rdfs:label "identifies a part of a page as a text unity"@en ;
     rdfs:comment "Identification of a part of page as a text unity."@en ;
     rdfs:isDefinedBy <http://www.nie.org/ontology/nietzsche> ;
     rdfs:subClassOf [ a owl:Restriction ;
             owl:cardinality "1"^^xsd:nonNegativeInteger ;
             owl:onProperty tln:belongsToPage ],
         [ a owl:Restriction ;
             owl:cardinality "1"^^xsd:nonNegativeInteger ;
             owl:onProperty tln:startLine ], 
          [ a owl:Restriction ;
             owl:cardinality "1"^^xsd:nonNegativeInteger ;
             owl:onProperty tln:endLine ] .
 
 tln:ExternalTextUnit a owl:Class ;
     rdfs:label "a list text unit that has been published external to the digital edition"@en ;
     rdfs:comment "A text unit that has been published external to the digital edition."@en ;
     rdfs:isDefinedBy <http://www.nie.org/ontology/nietzsche> ;
     rdfs:subClassOf tln:IdentifiedTextVersion .
 
 tln:Page a owl:Class ;
     rdfs:subClassOf document:Page .
 
+tln:leafHasDescription a owl:ObjectProperty ;
+    rdfs:label "relates a leaf to a manuscript description"@en ;
+    rdfs:comment "Relates a leaf to its manuscript description."@en ;
+    rdfs:isDefinedBy <http://www.nie.org/ontology/nietzsche> ;
+    rdfs:domain tln:Leaf ;
+    rdfs:range tln:ManuscriptDescription.
+
+tln:isDepictedBy a owl:ObjectProperty ;
+    rdfs:label "relates a leaf to a faksimile image"@en ;
+    rdfs:comment "Relates a leaf to the faksimile image that depicts it."@en ;
+    rdfs:isDefinedBy <http://www.nie.org/ontology/nietzsche> ;
+    rdfs:domain tln:Leaf ;
+    rdfs:range tln:FaksimileImage.
+
 tln:belongsToPage a owl:ObjectProperty ;
     rdfs:label "relates a part of a page with the page it is a part of"@en ;
     rdfs:comment "Relates a part of a page with the page it is a part of."@en ;
     rdfs:isDefinedBy <http://www.nie.org/ontology/nietzsche> ;
     rdfs:domain tln:PartOfPageTextUnit ;
     rdfs:range tln:Page.
 
 tln:startLine a owl:ObjectProperty ;
     rdfs:label "relates a part of a page with the line it starts with"@en ;
     rdfs:comment "Relates a part of a page with the line it starts with."@en ;
     rdfs:isDefinedBy <http://www.nie.org/ontology/nietzsche> ;
     rdfs:domain tln:PartOfPageTextUnit ;
     rdfs:range tln:Line.
 
 tln:endLine a owl:ObjectProperty ;
     rdfs:label "relates a part of a page with the line it ends with"@en ;
     rdfs:comment "Relates a part of a page with the line it ends with."@en ;
     rdfs:isDefinedBy <http://www.nie.org/ontology/nietzsche> ;
     rdfs:domain tln:PartOfPageTextUnit ;
     rdfs:range tln:Line.
 
 tln:identifiesAsVersion a owl:ObjectProperty ;
     rdfs:label "groups a list of text unities together as a identified text version"@en ;
     rdfs:comment "Groups a list of text unities together as a identified text version for which there is an ealier or later version."@en ;
     rdfs:isDefinedBy <http://www.nie.org/ontology/nietzsche> ;
     rdfs:domain tln:IdentifiedTextVersion ;
     rdfs:range rdf:List.
 
 tln:hasGeneticOrder a owl:ObjectProperty ;
     rdfs:label "relates a list of text versions to an identified genetic order"@en ;
     rdfs:comment "Relates a list of text versions to an identified genetic order. The position in the list determines the version of a text unit."@en ;
     rdfs:isDefinedBy <http://www.nie.org/ontology/nietzsche> ;
     rdfs:domain tln:TextGenesis ;
     rdfs:range rdf:List.
 
 tln:textUnitHasTitle a owl:ObjectProperty ;
     rdfs:label "relates a external published text unit with a title"@en ;
     rdfs:comment "Relates a external published text unit with a title by which it can be identified."@en ;
     rdfs:isDefinedBy <http://www.nie.org/ontology/nietzsche> ;
     rdfs:domain tln:ExternalTextUnit ;
     rdfs:range xsd:string .
 
 tln:textUnitHasUrl a owl:ObjectProperty ;
     rdfs:label "relates a external published text unit with a URL"@en ;
     rdfs:comment "Relates a external published text unit with a URL by which it can be visited."@en ;
     rdfs:isDefinedBy <http://www.nie.org/ontology/nietzsche> ;
     rdfs:domain tln:ExternalTextUnit ;
     rdfs:range xsd:anyURI .
 
 tln:hasImage a owl:ObjectProperty ;
     rdfs:label "relates a page to a image"@en ;
     rdfs:comment "relates a page to an image that has a textfield that specifies the area where the writing that constitutes the page can be found."@en ;
     rdfs:isDefinedBy <http://www.nie.org/ontology/nietzsche> ;
     rdfs:domain tln:Page ;
     rdfs:range tln:Image .
 
 tln:hasUrl a owl:DatatypeProperty ;
     rdfs:label "has Url"@en ;
     rdfs:domain tln:Image ;
     rdfs:isDefinedBy <http://www.nie.org/ontology/nietzsche> ;
     rdfs:range xsd:anyURI .
 
 #tln:inheritOverwritesWord a owl:ObjectProperty ;
 #   rdfs:subPropertyOf tln:overwritesWord;
 #   rdfs:label "word overwrites word (inherited from tln:wordHasCorrection)"@en ;
 #   rdfs:comment "The author has used this word in order to overwrite that word."@en ;
 #   rdfs:isDefinedBy <http://www.nie.org/ontology/nietzsche> ;
 #   owl:propertyChainAxiom  ( tln:wordHasCorrection tln:overwritesWord ).
 
 tln:hasStandoffMarkup4PartThatOverwritesWord a owl:ObjectProperty ;
     rdfs:label "word has standoff markup for the part that overwrites a word"@en ;
     rdfs:comment "word has standoff markup that highlights the part of its text that overwrites a word"@en ;
     rdfs:isDefinedBy <http://www.nie.org/ontology/nietzsche> ;
     rdfs:domain tln:Word ;
     rdfs:range stoff:StandoffMarkup .
 
 tln:lineContinuesOn a owl:ObjectProperty ;
     rdfs:label "writing from subject line continues on object line"@en ;
     rdfs:comment "the writing that ends on subject line continues on object line"@en ;
     rdfs:isDefinedBy <http://www.nie.org/ontology/nietzsche> ;
     rdfs:domain tln:Line ;
     rdfs:range tln:Line .
 
 tln:pageIsOnTextField a owl:ObjectProperty ;
     rdfs:label "page is on text field"@en ;
     rdfs:comment "the writing that is referred to as subject can be found on object"@en ;
     rdfs:isDefinedBy <http://www.nie.org/ontology/nietzsche> ;
     rdfs:domain tln:Page ;
     rdfs:range tln:TextField .
 
 tln:writingContinuesWithWord a owl:ObjectProperty ;
     rdfs:label "writing continues with next word"@en ;
     rdfs:isDefinedBy <http://www.nie.org/ontology/nietzsche> ;
     rdfs:domain tln:Word ;
     rdfs:range tln:Word .
 
 tln:selectableWordProperty a owl:ObjectProperty ;
     rdfs:label "a property of a word for which it can be selected"@en ;
     rdfs:isDefinedBy <http://www.nie.org/ontology/nietzsche> ;
     rdfs:domain tln:Word .
 
 tln:cardinalityGreaterOne a rdf:Property ;
     rdfs:label "whether a tln:selectableWordProperty can have a greater cardinality then one"@en ;
     rdfs:isDefinedBy <http://www.nie.org/ontology/nietzsche> ;
     rdfs:domain tln:selectableWordProperty ;
     rdfs:range xsd:boolean .
 
 tln:suggestedMaxCardinality a rdf:Property ;
     rdfs:label "the suggested max cardinaltiy of a tln:selectableWordProperty on a word"@en ;
     rdfs:isDefinedBy <http://www.nie.org/ontology/nietzsche> ;
     rdfs:domain tln:selectableWordProperty ;
     rdfs:range xsd:nonNegativeInteger .
Index: svgscripts/datatypes/faksimile.py
===================================================================
--- svgscripts/datatypes/faksimile.py	(revision 113)
+++ svgscripts/datatypes/faksimile.py	(revision 114)
@@ -1,209 +1,226 @@
 #!/usr/bin/env python3
 # -*- coding: utf-8 -*-
 
 """   This class can be used to represent a faksimile page.
 """
-#    Copyright (C) University of Basel 2019  {{{1
+#    Copyright (C) University of Basel 2022  {{{1
 #
 #    This program is free software: you can redistribute it and/or modify
 #    it under the terms of the GNU General Public License as published by
 #    the Free Software Foundation, either version 3 of the License, or
 #    (at your option) any later version.
 #
 #    This program is distributed in the hope that it will be useful,
 #    but WITHOUT ANY WARRANTY; without even the implied warranty of
 #    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #    GNU General Public License for more details.
 #
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <https://www.gnu.org/licenses/> 1}}}
 
 __author__ = "Christian Steiner"
 __maintainer__ = __author__
 __copyright__ = 'University of Basel'
 __email__ = "christian.steiner@unibas.ch"
 __status__ = "Development"
 __license__ = "GPL v3"
-__version__ = "0.0.1"
+__version__ = "0.0.2"
 
 import re
 from lxml import etree as ET
 from os import path
 from os.path import isdir, isfile, sep, basename
 from svgpathtools.parser import parse_path
 
 
 from .faksimile_image import FaksimileImage
 from .matrix import Matrix
 from .text_field import TextField
 from .word_position import WordPosition
 
 class FaksimilePage:
     """
     This class represents a faksimile page.
 
     Args:
         xml_target_file (str): name of the xml file to which page info will be written.
         xml_source_file (str): name of the xml file that will be instantiated.
     """
     XML_TAG = 'faksimile-page'
 
     def __init__(self, xml_source_file=None, xml_target_file=None, title=None, page_number=None, svg_source_file=None, faksimile_image=None, text_field=None):
         xml_file = xml_source_file if xml_source_file is not None else xml_target_file
         self.title = title
         self.page_number = page_number
         self.xml_file = xml_file
         if xml_file is not None and isfile(xml_file):
             parser = ET.XMLParser(remove_blank_text=True)
             self.page_tree = ET.parse(xml_file, parser)
             self.title = self.page_tree.getroot().get('title')
             self.page_number = self.page_tree.getroot().get('page-number')
             self.width = float(self.page_tree.getroot().get('width')) if bool(self.page_tree.getroot().get('width')) else 0.0
             self.height = float(self.page_tree.getroot().get('height')) if bool(self.page_tree.getroot().get('height')) else 0.0
         else:
             self.page_tree = ET.ElementTree(ET.Element(self.XML_TAG))
             if title is not None:
                 self.page_tree.getroot().set('title', title)
             if page_number is not None:
                 self.page_tree.getroot().set('page-number', str(page_number))
         if xml_target_file is not None:
             self.remove_tags_from_page_tree([WordPosition.FAKSIMILE])
         if svg_source_file is not None:
             self.page_tree.getroot().set('svg-source-file', svg_source_file)
         if faksimile_image is not None:
             faksimile_image.attach_object_to_tree(self.page_tree)
         if text_field is not None:
             text_field.attach_object_to_tree(self.page_tree)
         self.svg_source_file = self.page_tree.getroot().get('svg-source-file')
         self.faksimile_image = FaksimileImage(node=self.page_tree.getroot().find('.//' + FaksimileImage.XML_TAG))\
                 if len(self.page_tree.getroot().findall('.//' + FaksimileImage.XML_TAG)) > 0 else None
         self.text_field = TextField(node=self.page_tree.getroot().find('.//' + TextField.XML_TAG))\
                 if len(self.page_tree.getroot().findall('.//' + TextField.XML_TAG)) > 0 else None
         self.word_positions = [ WordPosition(node=node) for node in self.page_tree.getroot().findall('.//' + WordPosition.FAKSIMILE) ]\
                 if len(self.page_tree.getroot().findall('.//' + WordPosition.FAKSIMILE)) > 0 else []
 
     def append_word_position(self, word_position):
         """Appends word_position to word_positions and attaches it to page_tree.
         """
         self.word_positions.append(word_position)
         word_position.attach_object_to_tree(self.page_tree)
 
+    def attach_to_tei_facsimile(self, tei_facsimile: ET.Element, xml_id: str, page_number: str):
+        """Replace all children of tei_facsimile (facsimile element of a tei xml file) by one surface/graphic pair for this page.
+        """
+        for item in list(tei_facsimile):  # iterate over a copy, since children are removed inside the loop
+            tei_facsimile.remove(item)
+        surface = ET.SubElement(tei_facsimile, 'surface')
+        surface.set('{http://www.w3.org/XML/1998/namespace}id', xml_id)  # Clark notation, serialized as xml:id
+        surface.set('ulx', str(self.text_field.left))
+        surface.set('uly', str(self.text_field.top))
+        surface.set('lrx', str(round(self.text_field.left + self.text_field.width, 3)))
+        surface.set('lry', str(round(self.text_field.top + self.text_field.height, 3)))
+        surface.set('n', str(page_number))  # lxml only accepts string attribute values
+        graphic = ET.SubElement(surface, 'graphic')
+        graphic.set('url', self.faksimile_image.nietzsche_source_download)
+        graphic.set('width', str(self.faksimile_image.width) + 'pt')
+        graphic.set('height', str(self.faksimile_image.height) + 'pt')
+
     @classmethod
     def get_faksimile_pages(cls, svg_file, page_number='', isBlank=False) -> list:
         """Creates and returns text fields contained in a svg_file as a list.
         """
         svg_tree = ET.parse(svg_file)
         namespaces = { k if k is not None else 'ns': v for k, v in svg_tree.getroot().nsmap.items() }
         return cls.GET_FAKSIMILEPAGES(svg_tree, namespaces=namespaces, page_number=page_number, isBlank=isBlank)
 
     @staticmethod
     def GET_FAKSIMILEPAGES(svg_tree, namespaces=None, page_number='', isBlank=False) -> list:
        """Creates and returns text fields contained in a svg_tree as a list.
 
        """
        THRESHOLD_X = 10
        if namespaces is None:
             namespaces = { k if k is not None else 'ns': v for k, v in svg_tree.getroot().nsmap.items() }
        source_file_name = svg_tree.docinfo.URL
        image = FaksimileImage.CREATE_IMAGE(svg_tree.getroot().find('.//image', svg_tree.getroot().nsmap), source_file_name)
        xml_dir = '.{}xml'.format(sep)
        faksimile_pages = list()
        title_string = re.sub(r'[,_][0-9]+.*\.svg', '', basename(source_file_name))
        title = title_string.replace('-', ' ')
        if re.match(r'.*-\d+[a-z]*$', title_string):
             title_string = re.sub(r'-\d+[a-z]*$', '', title_string)
        rect_list = [ rect for rect in svg_tree.getroot().findall('.//rect', svg_tree.getroot().nsmap)\
                if rect.get('id', svg_tree.getroot().nsmap).startswith(title_string)\
                and rect.get('id', svg_tree.getroot().nsmap).endswith(str(page_number)) ]
        if isBlank:
            rect_list = [ rect for rect in svg_tree.getroot().findall('.//rect', svg_tree.getroot().nsmap) ]
        if len(rect_list) == 0 and page_number != '':
            return FaksimilePage.GET_FAKSIMILEPAGES(svg_tree, namespaces=namespaces)
        for text_field_rect in rect_list:
            tf_x = float(text_field_rect.get('x', svg_tree.getroot().nsmap)) - image.x
            tf_y = float(text_field_rect.get('y', svg_tree.getroot().nsmap)) - image.y
            tf_width = float(text_field_rect.get('width', svg_tree.getroot().nsmap))
            tf_height = float(text_field_rect.get('height', svg_tree.getroot().nsmap))
            tf_matrix = Matrix(transform_matrix_string=text_field_rect.get('transform'))\
                if bool(text_field_rect.get('transform'))\
                else None
            id = text_field_rect.get('id', svg_tree.getroot().nsmap)
            target_file_name = xml_dir + sep + id + '.xml' if isdir(xml_dir) else id + '.xml'
            page_number = re.sub(r'.*[,_-]', '', id)
            if page_number.startswith('0'):
                page_number = page_number.lstrip('0')
            text_field = TextField(id=id, width=tf_width, height=tf_height, x=tf_x, y=tf_y, matrix=tf_matrix)
            faksimile_page = FaksimilePage(xml_target_file=target_file_name, svg_source_file=source_file_name,\
                    title=title, page_number=page_number, faksimile_image=image, text_field=text_field)
            x_min = text_field.xmin + image.x
            y_min = text_field.ymin + image.y
            #rect_titles = svg_tree.getroot().xpath('//ns:rect[@x>"{0}" and @x<"{1}" and @y>"{2}" and @y<"{3}" and @id!="{4}"]/ns:title'.format(\
            #        x_min, text_field.xmax + image.x - THRESHOLD_X, y_min, text_field.ymax + image.y, text_field.id), namespaces=namespaces)
            rect_titles = get_paths_inside_rect(svg_tree, '//ns:rect/ns:title', x_min, text_field.xmax + image.x - THRESHOLD_X,\
                    y_min, text_field.ymax + image.y, text_field.id, namespaces=namespaces)
            rect_titles += get_paths_inside_rect(svg_tree, '//ns:path/ns:title', x_min, text_field.xmax + image.x - THRESHOLD_X,\
                    y_min, text_field.ymax + image.y, text_field.id, namespaces=namespaces)
            for rect_title in rect_titles:
                rect = rect_title.getparent()
                x, y, height, width = 0.0, 0.0, 0.0, 0.0
                if rect.tag.endswith('path'):
                     path = parse_path(rect.get('d'))
                     x, xmax, y, ymax = path.bbox()
                     width = xmax - x
                     height = ymax - y 
                else:
                    x = float(rect.get('x', svg_tree.getroot().nsmap))
                    y = float(rect.get('y', svg_tree.getroot().nsmap))
                    height = float(rect.get('height', svg_tree.getroot().nsmap))
                    width = width=float(rect.get('width', svg_tree.getroot().nsmap))
                matrix = None
                if bool(rect.get('transform')):
                    matrix = Matrix(transform_matrix_string=rect.get('transform'))
                text = re.sub(r'(\s(?=[-;:.,…?!’–])|(?<=[-;:.,…?!’–])\s)', '', rect_title.text)
                faksimile_page.append_word_position(\
                        WordPosition(id=rect.get('id', svg_tree.getroot().nsmap), text=text, height=height,\
                        width=width, x=x, y=y, matrix=matrix, tag=WordPosition.FAKSIMILE))
            faksimile_pages.append(faksimile_page)
        return faksimile_pages 
           
     def remove_tags_from_page_tree(self, list_of_tags_to_remove):
         """Removes the tags specified in the list from the target tree.
         """
         for xpath2remove in list_of_tags_to_remove:
             for node in self.page_tree.xpath('//' + xpath2remove):
                 node.getparent().remove(node)
 
 def get_paths_inside_rect(svg_tree, xpath, x_min, x_max, y_min, y_max, not_id, namespaces={}):
     """Returns a list of all paths selected by xpath that are inside x_min, x_max, y_min, y_max and do not have id == not_id.
     """
     paths = []
     if len(namespaces) == 0:
         namespaces = { k if k is not None else 'ns': v for k, v in svg_tree.getroot().nsmap.items() }
     for path_node in svg_tree.xpath(xpath, namespaces=namespaces):
         append_node = path_node
         if not path_node.tag.endswith('path') and not path_node.tag.endswith('rect'):
             path_node = path_node.getparent()
         x, xmax, y, ymax = -1, -1, -1, -1
         init_xy = False
         if path_node.tag.endswith('rect'):
             x = float(path_node.get('x')) if bool(path_node.get('x')) else -1
             y = float(path_node.get('y')) if bool(path_node.get('y')) else -1
             xmax = x + float(path_node.get('width')) if bool(path_node.get('width')) else -1
             ymax = y + float(path_node.get('height')) if bool(path_node.get('height')) else -1
             init_xy = True
         elif path_node.tag.endswith('path') and bool(path_node.get('d')) and path_node.get('d') != 0:
             path = parse_path(path_node.get('d'))
             x, xmax, y, ymax = path.bbox()
             init_xy = True
         if init_xy:
             if bool(path_node.get('transform')):
                 matrix = Matrix(transform_matrix_string=path_node.get('transform'))
                 x, xmax = matrix.get_new_x(x=x, y=y), matrix.get_new_x(x=xmax, y=ymax) 
                 y, ymax = matrix.get_new_y(x=x, y=y), matrix.get_new_y(x=xmax, y=ymax) 
             width = xmax - x
             height = ymax - y 
             if x > x_min and x < x_max\
                 and y > y_min and y < y_max\
                 and path_node.get('id') != not_id:
                 paths.append(append_node) 
     return paths
Index: svgscripts/datatypes/faksimile_image.py
===================================================================
--- svgscripts/datatypes/faksimile_image.py	(revision 113)
+++ svgscripts/datatypes/faksimile_image.py	(revision 114)
@@ -1,127 +1,137 @@
 #!/usr/bin/env python3
 # -*- coding: utf-8 -*-
 
 """   This class can be used to represent faksimile images.
 """
 #    Copyright (C) University of Basel 2019  {{{1
 #
 #    This program is free software: you can redistribute it and/or modify
 #    it under the terms of the GNU General Public License as published by
 #    the Free Software Foundation, either version 3 of the License, or
 #    (at your option) any later version.
 #
 #    This program is distributed in the hope that it will be useful,
 #    but WITHOUT ANY WARRANTY; without even the implied warranty of
 #    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #    GNU General Public License for more details.
 #
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <https://www.gnu.org/licenses/> 1}}}
 
 __author__ = "Christian Steiner"
 __maintainer__ = __author__
 __copyright__ = 'University of Basel'
 __email__ = "christian.steiner@unibas.ch"
 __status__ = "Development"
 __license__ = "GPL v3"
 __version__ = "0.0.1"
 
 import fnmatch
 from lxml import etree as ET
 import os
 from os.path import basename, dirname, isfile, realpath, sep
 import sys
 
 from .image import Image 
 from .matrix import Matrix
 from .text_field import TextField
 
 sys.path.append('svgscripts')
 from local_config import FAKSIMILE_LOCATION
 
 class FaksimileImage(Image):
     """
     This class represents a faksimile image.
 
     Args:
         file_name (str):            name of the image file.
         node (lxml.etree.Element)   node, containing information
         URL (str):                  URL of image file.
         height (float):             height of image
         width (float):              width of image
         x (float):                  x
         y (float):                  y
     """
     XML_TAG = 'faksimile-image'
     OLD_NIETZSCHE_SOURCES_URL = 'http://www.nietzschesource.org/DFGAapi/api/page/download/'
     NIETZSCHE_SOURCES_URL = 'https://nietzsche.philhist.unibas.ch/faksimiles/'
+    NIETZSCHE_SOURCES_ORIGINAL_URL = 'http://www.nietzschesource.org/DFGA/'
     NIETZSCHE_SOURCES_API_URL = 'http://www.nietzschesource.org/DFGAapi/api/page/'
     NIETZSCHE_SOURCES_IMAGE_API_URL = 'http://www.nietzschesource.org/DFGAapi/images/DFGA/'
+    FAKSIMILE_DIR = 'faksimiles/'
 
     def __init__(self, node=None, file_name=None, local_path=None, URL=None, height=0.0, width=0.0, x=0.0, y=0.0, matrix=None, text_field=None):
         super(FaksimileImage, self).__init__(node=node, file_name=file_name, URL=URL, local_path=local_path,\
                 height=height, width=width, matrix=matrix, text_field=text_field, tag=self.XML_TAG)
         self.x = x
         self.y = y
         self.apiURL = None 
         self.thumbURL = None 
         self.mediumURL = None 
+        self.original_thumbURL = self.nietzsche_source = self.nietzsche_source_download = None  # defaults, so the attributes exist without a file_name
         if self.file_name is not None:
             nsource_page_name = self.file_name.replace('.jpg','')
             nsource_manuscript_name = nsource_page_name.split(',')[0] 
             self.primaryURL = self.NIETZSCHE_SOURCES_URL + self.file_name
             self.thumbURL = self.NIETZSCHE_SOURCES_URL + self.file_name.replace('.jpg', '_thumb.jpg') 
+            if node is not None and bool(node.get('thumb')):  # an explicit thumb attribute overrides the derived name
+                self.thumbURL = self.NIETZSCHE_SOURCES_URL + node.get('thumb')
+            if node is not None and bool(node.get('originalThumb')):
+                self.original_thumbURL = self.NIETZSCHE_SOURCES_URL + node.get('originalThumb')
             # self.NIETZSCHE_SOURCES_IMAGE_API_URL + nsource_manuscript_name + '/mini/' + self.file_name 
             self.apiURL = self.NIETZSCHE_SOURCES_API_URL + nsource_page_name
             self.mediumURL = self.NIETZSCHE_SOURCES_IMAGE_API_URL + nsource_manuscript_name + '/medium/' + self.file_name 
+            self.nietzsche_source = self.NIETZSCHE_SOURCES_ORIGINAL_URL + self.file_name.replace('.jpg','')
+            self.nietzsche_source_download = self.OLD_NIETZSCHE_SOURCES_URL + self.file_name.replace('.jpg','')
             """
             if self.primaryURL is not None and self.primaryURL.startswith(self.NIETZSCHE_SOURCES_API_URL):
                 self.apiURL = self.primaryURL
                 self.primaryURL = self.NIETZSCHE_SOURCES_URL + basename(self.primaryURL)
             """
 
     def get_image_joined_with_text_field(self, text_field):
         """Returns a new instance of itself that has a text_field (text_field.TextField).
         """
         return FaksimileImage(file_name=self.file_name, local_path=self.local_path, URL=self.URL, height=self.height,\
                 width=self.width, x=self.x, y=self.y, text_field=text_field)
     
     @classmethod
     def get_semantic_dictionary(cls):
         """ Creates and returns a semantic dictionary as specified by SemanticClass.
         """
         dictionary = super(FaksimileImage,cls).get_semantic_dictionary()
         dictionary[cls.PROPERTIES_KEY].update(cls.create_semantic_property_dictionary('apiURL', str, subPropertyOf=cls.HAS_URL))
+        dictionary[cls.PROPERTIES_KEY].update(cls.create_semantic_property_dictionary('original_thumbURL', str, subPropertyOf=cls.HAS_URL))
         dictionary[cls.PROPERTIES_KEY].update(cls.create_semantic_property_dictionary('thumbURL', str, subPropertyOf=cls.HAS_URL))
         dictionary[cls.PROPERTIES_KEY].update(cls.create_semantic_property_dictionary('mediumURL', str, subPropertyOf=cls.HAS_URL))
         return cls.return_dictionary_after_updating_super_classes(dictionary)
 
     @staticmethod
     def CREATE_IMAGE(image_node, source_file=None):
         """Instantiates a FaksimileImage from a (lxml.etree.Element) image_node.
         """
         namespaces = image_node.nsmap
         if len(namespaces) == 0:
             namespaces = { 'xlink': '' }
         local_path = image_node.get('{%s}href' % namespaces['xlink'])
         file_name = basename(local_path)
         if file_name != local_path and source_file is not None:
             local_path = realpath(dirname(source_file)) + sep + local_path
             local_path = realpath(local_path)
         if not isfile(local_path):
             local_path = None
             for path, dirs, files in os.walk(os.path.abspath(FAKSIMILE_LOCATION)):    
                 for filename in fnmatch.filter(files, file_name):
                     local_path = os.path.join(path, filename)
                     break
         URL = FaksimileImage.NIETZSCHE_SOURCES_URL + file_name.replace('.jpg','')
         height = float(image_node.get('height')) if bool(image_node.get('height')) else 0.0
         width = float(image_node.get('width')) if bool(image_node.get('width')) else 0.0
         x = float(image_node.get('x')) if bool(image_node.get('x')) else 0.0
         y = float(image_node.get('y')) if bool(image_node.get('y')) else 0.0
         matrix = Matrix(transform_matrix_string=image_node.get('transform'))\
                if bool(image_node.get('transform'))\
                else None
         return FaksimileImage(file_name=file_name, local_path=local_path, URL=URL, height=height, width=width, x=x, y=y, matrix=matrix)
 
 
Index: svgscripts/datatypes/matrix.py
===================================================================
--- svgscripts/datatypes/matrix.py	(revision 113)
+++ svgscripts/datatypes/matrix.py	(revision 114)
@@ -1,348 +1,370 @@
 #!/usr/bin/env python3
 # -*- coding: utf-8 -*-
 
 """   This class can be used to transform a svg/text[@transform] matrix-string into a matrix representation.
 """
 #    Copyright (C) University of Basel 2019  {{{1
 #
 #    This program is free software: you can redistribute it and/or modify
 #    it under the terms of the GNU General Public License as published by
 #    the Free Software Foundation, either version 3 of the License, or
 #    (at your option) any later version.
 #
 #    This program is distributed in the hope that it will be useful,
 #    but WITHOUT ANY WARRANTY; without even the implied warranty of
 #    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #    GNU General Public License for more details.
 #
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <https://www.gnu.org/licenses/> 1}}}
 
 __author__ = "Christian Steiner"
 __maintainer__ = __author__
 __copyright__ = 'University of Basel'
 __email__ = "christian.steiner@unibas.ch"
 __status__ = "Development"
 __license__ = "GPL v3"
 __version__ = "0.0.1"
 
 import re
 import math
 
 
 class Matrix:
     """
     This class transforms a svg @transform matrix-string into a matrix representation.
 
     Args:
         transform_matrix_string (str)     string of the form 'matrix(1.0 0.0 0.0 1.0 0.0 0.0)' or 'rotate(10)'
     """
     A = 0
     B = 1
     C = 2
     D = 3
     E = 4 
     F = 5 
     XINDEX = 4
     YINDEX = 5
     MATRIX_LENGTH = 6
     DOWN = 1
     STRAIGHT = 0
     UP = -1
 
     def __init__(self, transform_matrix_string=None, transkription_field=None, matrix_list=[]):
         self.matrix = [ 0.0 for i in range(Matrix.MATRIX_LENGTH) ] if len(matrix_list) < 6 else matrix_list
         if transform_matrix_string is not None:
             m = re.search('(?<=rotate\()[-]*[0-9]+', transform_matrix_string)
             if m is not None: # transform='rotate(a)' to transform='matrix(cos(a), sin(a), -sin(a), cos(a), 0, 0)'
                 angle = float(m.group(0))
                 self.matrix[Matrix.A] = round(math.cos(math.radians(angle)), 3)
                 self.matrix[Matrix.B] = round(math.sin(math.radians(angle)), 3)
                 self.matrix[Matrix.C] = round(math.sin(math.radians(angle))*-1, 3)
                 self.matrix[Matrix.D] = round(math.cos(math.radians(angle)), 3)
                 self.matrix[Matrix.E] = 0
                 self.matrix[Matrix.F] = 0
             elif re.search(r'matrix\(\s*([-]*\d+([\.]*\d*(e-\d+)*)*[,\s][\s]*){5}[-]*\d+(\.\d+)*.*\s*\)', transform_matrix_string):
             #elif re.search(r'matrix\(\s*([-]*\d+(\.\d+(e-\d+)*)*[,\s][\s]*){5}[-]*\d+(\.\d+)*.*\s*\)', transform_matrix_string):
             #elif re.search(r'matrix\(\s*([-]*[0-9].*\s){5}[-]*[0-9].*\s*\)', transform_matrix_string): 
             # old-> does not include comma separated matrix string
                 self.matrix = [ float(i) for i in transform_matrix_string.replace('matrix(','').\
                         replace(', ', ',').replace(',', ' ').replace(')','').split(' ') ]
             else:
                 raise Exception('Error: string "{}" is not a valid transform matrix string!'.format(transform_matrix_string))
             if transkription_field is not None:
                 self.matrix[Matrix.XINDEX] -= transkription_field.xmin
                 self.matrix[Matrix.YINDEX] -= transkription_field.ymin
             if(len(self.matrix) < Matrix.MATRIX_LENGTH):
                 raise Exception('Error: string "{}" is not a valid matrix string!'.format(transform_matrix_string))
 
     def add2X(self, add_to_x=0):
         """Return x-value of matrix (float) + add_to_x.
         """
         return self.matrix[Matrix.XINDEX] + float(add_to_x)
 
     def add2Y(self, add_to_y=0):
         """Return y-value of matrix (float) + add_to_y.
         """
         return self.matrix[Matrix.YINDEX] + float(add_to_y)
 
     def getX(self):
         """Return x-value of matrix (float).
         """
         return self.matrix[Matrix.XINDEX]
 
     def getY(self):
         """Return y-value of matrix (float).
         """
         return self.matrix[Matrix.YINDEX]
 
+    def get90DegreeIndex(self) ->int:
+        """Return 0, 1 or 2 for a pure 90, 180 or 270 degree rotation, else -1.
+        """
+        a, b, c, d = self.matrix[self.A:self.D + 1]
+        def near(value, target): return abs(value - target) <= 0.001 # threshold of DO_CONVERSION_FACTORS_DIFFER
+        if near(a, 0.0) and near(d, 0.0):
+            if near(b, 1.0) and near(c, -1.0):
+                return 0
+            if near(b, -1.0) and near(c, 1.0):
+                return 2
+        elif near(a, -1.0) and near(d, -1.0) and near(b, 0.0) and near(c, 0.0):
+            return 1 # a == d == -1 is required: b == c == 0 alone also holds for scalings
+        return -1
+
+
     def is_matrix_horizontal(self):
         """Returns whether matrix is horizontal.
 
             [:return:] True/False
         """
         return self.matrix[Matrix.A] == 1 and self.matrix[Matrix.B] == 0 and self.matrix[Matrix.C] == 0 and self.matrix[Matrix.D] == 1
 
     def get_new_x(self, x=0.0, y=0.0):
         """Returns new position of x.
 
             :return: (float) x
         """
         top_left_x = x - self.matrix[self.E] if x != 0.0 else 0.0
         top_left_y = y - self.matrix[self.F] if y != 0.0 else 0.0
         return self.matrix[Matrix.A] * top_left_x + self.matrix[Matrix.C] * top_left_y + self.matrix[self.E]
 
     def get_new_y(self, x=0.0, y=0.0):
         """Returns new position of y.
 
             :return: (float) y
         """
         top_left_x = x - self.matrix[self.E] if x != 0.0 else 0.0
         top_left_y = y - self.matrix[self.F] if y != 0.0 else 0.0
         return self.matrix[Matrix.B] * top_left_x + self.matrix[Matrix.D] * top_left_y + self.matrix[self.F]
 
     def get_old_x(self, x=0.0, y=0.0):
         """Returns old position of x.
 
             :return: (float) x
         """
         old_x = (self.matrix[self.D]*x - self.matrix[Matrix.D]*self.matrix[Matrix.E] - self.matrix[Matrix.C]*y + self.matrix[Matrix.C]*self.matrix[Matrix.F])\
                 /(self.matrix[Matrix.A]*self.matrix[Matrix.D] - self.matrix[Matrix.B]*self.matrix[Matrix.C]) 
         return self.add2X(old_x)
 
     def get_transformed_positions(self, x=0.0, y=0.0, width=0.0, height=0.0):
         """Returns transformed x, y, width and height.
         """
         top_left_x = x
         top_left_y = y
         top_right_x = x + width
         top_right_y = y
         bottom_left_x = x
         bottom_left_y = y + height
         bottom_right_x = x + width
         bottom_right_y = y + height
         new_x = self.matrix[Matrix.A] * top_left_x + self.matrix[Matrix.C] * top_left_y + self.matrix[self.E]
         new_y = self.matrix[Matrix.B] * top_left_x + self.matrix[Matrix.D] * top_left_y + self.matrix[self.F]
         new_top_right_x = self.matrix[Matrix.A] * top_right_x + self.matrix[Matrix.C] * top_right_y + self.matrix[self.E]
         new_top_right_y = self.matrix[Matrix.B] * top_right_x + self.matrix[Matrix.D] * top_right_y + self.matrix[self.F]
         new_bottom_left_x = self.matrix[Matrix.A] * bottom_left_x + self.matrix[Matrix.C] * bottom_left_y + self.matrix[self.E]
         new_bottom_left_y = self.matrix[Matrix.B] * bottom_left_x + self.matrix[Matrix.D] * bottom_left_y + self.matrix[self.F]
         new_bottom_right_x = self.matrix[Matrix.A] * bottom_right_x + self.matrix[Matrix.C] * bottom_right_y + self.matrix[self.E]
         new_bottom_right_y = self.matrix[Matrix.B] * bottom_right_x + self.matrix[Matrix.D] * bottom_right_y + self.matrix[self.F]
         new_width = abs(new_top_right_x - new_x)\
                 if abs(new_top_right_x - new_x) >= abs(new_bottom_right_x - new_bottom_left_x)\
                 else abs(new_bottom_right_x - new_bottom_left_x)
         new_height = abs(new_bottom_left_y - new_y)\
                 if abs(new_bottom_left_y - new_y) >= abs(new_top_right_y - new_bottom_right_y)\
                 else abs(new_top_right_y - new_bottom_right_y)
         return new_x, new_y, new_width, new_height
 
     def clone_transformation_matrix(self):
         """Returns a matrix that contains only the transformation part.
 
             [:return:] (Matrix) a clone of this matrix
         """
         return Matrix(matrix_list=self.matrix[0:4]+[0,0])
 
     def isRotationMatrix(self):
         """Return whether matrix is a rotation matrix.
         """
         return self.matrix[Matrix.A] < 1 or self.matrix[Matrix.B] != 0 
 
     def toCSSTransformString(self):
         """Returns the CSS3 transform string: 'rotate(Xdeg)' where X is the angle.
         """
         angle = 0
         if self.isRotationMatrix():
             angle = int(round(math.degrees(math.asin(self.matrix[Matrix.B])), 0))
             if angle == 0:
                 angle = int(round(math.degrees(math.acos(self.matrix[Matrix.A])), 0))
         return 'rotate({}deg)'.format(angle)
 
     def toString(self):
         """Returns a transform_matrix_string representation of the matrix.
 
             [:returns:] (str) 'matrix(X X X X X X)'
         """
         return 'matrix(' + ' '.join([ str(round(x, 5)) for x in self.matrix ]) + ')'
 
     def get_rotation_direction(self):
         """Get rotation direction of rotation matrix.
 
             [:return:] (int) direction code Matrix.UP, Matrix.STRAIGHT, Matrix.DOWN
         """
         if not self.isRotationMatrix():
             return self.STRAIGHT
         else:
             angle = int(round(math.degrees(math.asin(self.matrix[Matrix.B])), 0))
             return self.UP if angle < 0 else self.DOWN
 
+    def updateOffset(self, height: float, width: float):
+        """Set the offsets e and f to +/- (height-width)/2, but only if b and c are both non-zero.
+        """
+        if not (self.matrix[self.B] == 0.0 or self.matrix[self.C] == 0.0):
+            difference = height-width
+            self.matrix[self.E], self.matrix[self.F] = difference/2, -1*difference/2
+
     @staticmethod
     def IS_BENEATH_TF(matrix, transkription_field): 
         """Returns true if matrix specifies a position beneath transkription_field.
         """
         if matrix.getY() < transkription_field.ymax or matrix.getY() > transkription_field.documentHeight-10:
             return False
         if transkription_field.second_field is not None\
             and matrix.getY() > transkription_field.second_field.ymin_without_title:
             return False
         return True
 
     @staticmethod
     def IS_IN_FOOTNOTE_AREA(transform_matrix_string, transkription_field, x=0.0, marginals_on_extra_page=False): 
         """Returns true if matrix specifies a position that is part of the footnote area.
 
             text_node (lxml.etree.Element)
             transkription_field (datatypes.transkription_field.TranskriptionField)
         """
         matrix = Matrix(transform_matrix_string=transform_matrix_string)
         if marginals_on_extra_page:
             return matrix.getY() < transkription_field.documentHeight-10\
                 and matrix.getY() > transkription_field.documentHeight/4\
                 and matrix.getX() + x > transkription_field.documentWidth/4\
                 and not Matrix.IS_IN_MARGIN_FIELD(transform_matrix_string, transkription_field, marginals_on_extra_page=True)
         if not Matrix.IS_BENEATH_TF(matrix, transkription_field):
             return False
         is_part = matrix.getX() + x > transkription_field.xmin\
                 if transkription_field.is_page_verso()\
                 else matrix.getX() + x > transkription_field.documentWidth/4
         return is_part
 
     @staticmethod
     def NODE_HAS_CONTENT_IN_FOOTNOTE_AREA(node, transkription_field, marginals_on_extra_page=False): 
         """Returns true if matrix specifies a position that is part of the footnote area.
 
             text_node (lxml.etree.Element)
             transkription_field (datatypes.transkription_field.TranskriptionField)
         """
         matrix = Matrix(transform_matrix_string=node.get('transform'))
         x = sorted([ float(x.get('x')) for x in node.getchildren()])[-1]\
                 if len(node.getchildren()) > 0 else 0.0
         if marginals_on_extra_page:
             return matrix.getY() < transkription_field.documentHeight-10\
                 and matrix.getY() > transkription_field.documentHeight/4\
                 and matrix.getX() + x > transkription_field.documentWidth/4\
                 and not Matrix.IS_IN_MARGIN_FIELD(node.get('transform'), transkription_field, marginals_on_extra_page=True)
         if not Matrix.IS_BENEATH_TF(matrix, transkription_field):
             return False
         is_part = matrix.getX() + x > transkription_field.xmin\
                 if transkription_field.is_page_verso()\
                 else matrix.getX() + x > transkription_field.documentWidth/4
         return is_part
 
     @staticmethod
     def IS_IN_MARGIN_FIELD(transform_matrix_string, transkription_field, marginals_on_extra_page=False):
         """Returns true if matrix specifies a position that is part of the margin field.
 
             text_node (lxml.etree.Element)
             transkription_field (datatypes.transkription_field.TranskriptionField)
         """
         line_number_area_width = 15\
                 if transkription_field.line_number_area_width == 0.0\
                 else transkription_field.line_number_area_width
         matrix = Matrix(transform_matrix_string=transform_matrix_string)
         if matrix.getY() < transkription_field.ymin or matrix.getY() > transkription_field.ymax:
             return False
         if marginals_on_extra_page:
             return matrix.getX() > transkription_field.xmax
         is_part = matrix.getX() < transkription_field.xmin - line_number_area_width\
                 if transkription_field.is_page_verso()\
                 else matrix.getX() > transkription_field.xmax + line_number_area_width
         return is_part
 
     @staticmethod
     def IS_IN_PLACE_OF_PRINTING_AREA(transform_matrix_string, transkription_field): 
         """Returns true if matrix specifies a position that is part of the area where the places of printing ('Druckorte') are printed.
 
             text_node (lxml.etree.Element)
             transkription_field (datatypes.transkription_field.TranskriptionField)
         """
         matrix = Matrix(transform_matrix_string=transform_matrix_string)
         if not Matrix.IS_BENEATH_TF(matrix, transkription_field):
             return False
         is_part = matrix.getX() < transkription_field.xmin\
                 if transkription_field.is_page_verso()\
                 else matrix.getX() < transkription_field.documentWidth/4
         return is_part
 
     @staticmethod
     def IS_PART_OF_TRANSKRIPTION_FIELD(transkription_field, text_node=None, matrix=None):
         """Returns true if matrix specifies a position that is part of transkription field.
 
             text_node (lxml.etree.Element)
             transkription_field (datatypes.transkription_field.TranskriptionField)
         """
         if matrix is None and not bool(text_node.get('transform')):
             return False
         if matrix is None:
             matrix = Matrix(transform_matrix_string=text_node.get('transform'))
         is_part = matrix.getX() > transkription_field.xmin and matrix.getX() < transkription_field.xmax\
                 and matrix.getY() > transkription_field.ymin and matrix.getY() < transkription_field.ymax
         #if not is_part and matrix.isRotationMatrix() and len([child.text for child in text_node.getchildren() if not re.match(r'^\s*$', child.text)]) > 0:
         if not is_part and len([child.text for child in text_node.getchildren() if not re.match(r'^\s*$', child.text)]) > 0:
             first_tspan_node = [ child for child in text_node.getchildren() if not re.match(r'^\s*$', child.text)][0]    
             x = matrix.add2X(float(first_tspan_node.get('x')))
             y = matrix.add2Y(float(first_tspan_node.get('y')))
             new_x = matrix.get_new_x(x=x, y=y)
             new_y = matrix.get_new_y(x=x, y=y)
             return new_x > transkription_field.xmin and new_x < transkription_field.xmax\
                     and new_y > transkription_field.ymin and new_y < transkription_field.ymax
         return is_part
 
     @staticmethod
     def IS_NEARX_TRANSKRIPTION_FIELD(transform_matrix_string, transkription_field, diffx=20.0):
         """Returns true if matrix specifies a position that is on its x axis near the transkription_field.
 
             transform_matrix_string (str): string from which to init Matrix.
             transkription_field (svgscripts.TranskriptionField)
             diffx (float): defines threshold for positions that count as near.
         """
         matrix = Matrix(transform_matrix_string=transform_matrix_string)
         MINLEFT = transkription_field.xmin - diffx
         MAXRIGHT = transkription_field.xmax + diffx
         return matrix.getY() > transkription_field.ymin and matrix.getY() < transkription_field.ymax\
                 and ((matrix.getX() > MINLEFT and matrix.getX() < transkription_field.xmin)\
                 or (matrix.getX() > transkription_field.xmax and matrix.getX() < MAXRIGHT))
 
     @staticmethod
     def DO_CONVERSION_FACTORS_DIFFER(matrix_a, matrix_b, diff_threshold=0.001):
         """Returns whether the conversion factors (a-d) differ more than diff_threshold.
         """
         if matrix_a is None or matrix_b is None:
             return not (matrix_a is None and matrix_b is None)
         return abs(matrix_a.matrix[Matrix.A] - matrix_b.matrix[Matrix.A]) > diff_threshold\
                 or abs(matrix_a.matrix[Matrix.B] - matrix_b.matrix[Matrix.B]) > diff_threshold\
                 or abs(matrix_a.matrix[Matrix.C] - matrix_b.matrix[Matrix.C]) > diff_threshold\
                 or abs(matrix_a.matrix[Matrix.D] - matrix_b.matrix[Matrix.D]) > diff_threshold
 
     def __eq__(self, other):
         """Return self.matrix == other.matrix.
         """
         if other is None:
             return False
         return self.matrix == other.matrix
 
     def __hash__(self):
         """Return hash value.
         """
         return hash((self.matrix[Matrix.E], self.matrix[Matrix.F]))
Index: svgscripts/datatypes/manuscript_description.py
===================================================================
--- svgscripts/datatypes/manuscript_description.py	(revision 0)
+++ svgscripts/datatypes/manuscript_description.py	(revision 114)
@@ -0,0 +1,74 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+
+"""   This class can be used to represent a manuscript description.
+"""
+#    Copyright (C) University of Basel 2020  {{{1
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License as published by
+#    the Free Software Foundation, either version 3 of the License, or
+#    (at your option) any later version.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <https://www.gnu.org/licenses/> 1}}}
+
+__author__ = "Christian Steiner"
+__maintainer__ = __author__
+__copyright__ = 'University of Basel'
+__email__ = "christian.steiner@unibas.ch"
+__status__ = "Development"
+__license__ = "GPL v3"
+__version__ = "0.0.1"
+
+from lxml import etree as ET
+import re
+import sys
+
+from .text import Text
+from .description import Description
+from .standoff_tag import StandoffTag
+
+class ManuscriptDescription(Description):
+    """
+    This class represents a manuscript description, i.e. the description of the folio.
+    """
+    ROOT_TAG = 'currentDescription'
+    XML_TAG = 'description'
+    ORIGINALLY_PATTERN = re.compile(r'(.*\.\s*)(Der|Als|Aus|Ursprünglich)(\s.*)')
+
+    def __init__(self, content: str, standoff_markups=None, originally=None, id=0):
+        super(ManuscriptDescription,self).__init__(content, standoff_markups=standoff_markups, id=id) 
+        self.originally = originally # (str or None) remark about the original constitution of the leaf
+
+    @classmethod
+    def get_semantic_dictionary(cls):
+        """ Creates and returns a semantic dictionary as specified by SemanticClass.
+        """
+        dictionary = super(ManuscriptDescription,cls).get_semantic_dictionary()
+        dictionary[cls.PROPERTIES_KEY].update(cls.create_semantic_property_dictionary('originally', str,\
+                  name='leafHasDescriptionAboutOriginalConstitution', label='leaf has description about original constitution',\
+                  comment='There is a description of the original constitution of the corresponding leaf.'))
+        return cls.return_dictionary_after_updating_super_classes(dictionary)
+
+    @classmethod
+    def create_cls_from_raw_text(cls, text: str):
+        """Create a cls from raw text; a part matching ORIGINALLY_PATTERN is split off as 'originally'.
+
+            [:return:] cls, its content is the remaining text with '+' replaced by 'x'
+        """
+        originally = None
+        m = re.match(cls.ORIGINALLY_PATTERN, text)
+        if m is not None:
+            # Split where the keyword was actually matched (group 2): the first occurrence
+            # of the keyword in the text may lie earlier, e.g. 'Der' at the very beginning.
+            startIndex = m.start(2)
+            originally = text[startIndex:]
+            text = text[:startIndex].replace('  ', ' ').strip()
+        return cls(text.replace('+', 'x'), originally=originally)
+
Index: teiscripts/create_tei_files.py
===================================================================
--- teiscripts/create_tei_files.py	(revision 0)
+++ teiscripts/create_tei_files.py	(revision 114)
@@ -0,0 +1,278 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+
+"""   This program can be used to create tei files
+"""
+#    Copyright (C) University of Basel 2022  {{{1
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License as published by
+#    the Free Software Foundation, either version 3 of the License, or
+#    (at your option) any later version.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <https://www.gnu.org/licenses/> 1}}}
+
+from colorama import Fore, Style
+import csv
+import getopt
+import json
+import lxml.etree as ET
+import shutil
+import subprocess
+import sys
+import os
+import wget
+import re
+from os import listdir, sep, path, setpgrp, devnull, mkdir, remove
+from os.path import exists, isfile, isdir, dirname, basename
+from progress.bar import Bar
+import warnings
+import xml.etree.ElementTree as XET
+
+sys.path.append('fixes')
+from get_text_field import get_text_field_on_image, get_text_field_on_thumb
+
+sys.path.append('svgscripts')
+from datatypes.faksimile_image import FaksimileImage
+from datatypes.faksimile import FaksimilePage
+from datatypes.archival_manuscript import ArchivalManuscriptUnity
+from datatypes.page import Page, STATUS_MERGED_OK, STATUS_POSTMERGED_OK
+from datatypes.matrix import Matrix 
+from util import back_up, back_up_svg_file, copy_faksimile_update_image_location, copy_faksimile_svg_file
+from process_files import update_svgposfile_status
+from process_words_post_merging import update_faksimile_line_positions, MERGED_DIR
+
+sys.path.append('shared_util')
+from myxmlwriter import copy_to_bak_dir, write_pretty, xml_has_type, FILE_TYPE_SVG_WORD_POSITION, FILE_TYPE_XML_MANUSCRIPT
+from main_util import create_function_dictionary
+
+
+__author__ = "Christian Steiner"
+__maintainer__ = __author__
+__copyright__ = 'University of Basel'
+__email__ = "christian.steiner@unibas.ch"
+__status__ = "Development"
+__license__ = "GPL v3"
+__version__ = "0.0.2"
+
+MAX_SVG_XY_THRESHOLD = 10
+BLANK_STATUS = 'blank'
+
+class CSVFileCreator:
+    """This class can be used in order to create tei files from a tei template and the rows of a csv file.
+    """
+    UNITTESTING = False # while True, write_tei does not write the target file
+    FOLIO = "Blatt-ID" # FOLIO, LABEL, ALIAS, URL and CONTENT are the csv column names read by process_default
+    LABEL = "Label"
+    ALIAS = "Alias"
+    URL = "Nietzschesource-URL"
+    CONTENT = "Inhalt"
+
+    def __init__(self, template, svg_dir='./svg', content_dir='./text', target_dir='./tmp'):
+        self.template = template
+        self.tei_tree = ET.parse(self.template)
+        self.namespaces = { k if k is not None else 'ns': v for k, v in self.tei_tree.getroot().nsmap.items() } # default namespace -> prefix 'ns'
+        self.namespaces.update({'xml': 'http://www.w3.org/XML/1998/namespace'})
+        self.content_dir = content_dir
+        self.svg_dir = svg_dir
+        self.target_dir = target_dir
+
+    def _add_content(self, body: ET.Element, xml_id: str, page_number: str, contentFiles=None):
+        """Replace the children of body by a div with a pb (facs: '#' + xml_id, n: page_number) and the parsed content files.
+        """
+        for item in list(body.iterchildren()): body.remove(item) # iterate over a copy while removing
+        if contentFiles is None:
+            contentFiles = []
+        div = ET.SubElement(body, 'div')
+        pb = ET.SubElement(div, 'pb')
+        pb.set('facs', '#' + xml_id)
+        pb.set('n', page_number)
+        for contentFile in contentFiles:
+            contentTree = ET.parse(contentFile) 
+            self._mark_greek_as_foreign_lang(contentTree.xpath('//hi[@class="greek"]'))
+            div.append(contentTree.getroot())
+
+    def _mark_greek_as_foreign_lang(self, greekWords: list):
+        """Turn each <hi class="greek"> element into <foreign xml:lang="grc">.
+        """
+        for greekWord in greekWords:
+            try:
+                del greekWord.attrib['class']
+            except KeyError:
+                pass
+            greekWord.tag = 'foreign'
+            greekWord.attrib[ET.QName(self.namespaces['xml'],'lang')] = 'grc' # see www.iana.org/assignments/language-subtag-registry/language-subtag-registry
+
+    def _get_faksimile_page(self, svg_file) ->FaksimilePage:
+        """Return the faksimile page of svg_file (with the highest text field if there are several) or None if there is none.
+        """
+        faksimile_pages = FaksimilePage.get_faksimile_pages(svg_file, isBlank=True)
+        if len(faksimile_pages) == 1:
+            return faksimile_pages[0]
+        elif len(faksimile_pages):
+            return sorted(faksimile_pages, key=lambda f: f.text_field.height)[-1]
+        return None
+
+    def _get_element(self, xpath: str, firstElementOnly=True) ->ET.Element:
+        """Return the first element (or all elements if not firstElementOnly) for xpath; warn and return None if there is none.
+        """
+        elements = self.tei_tree.xpath(xpath, namespaces=self.namespaces)
+        if len(elements) == 0:
+            msg = f'There are no elements for xpath {xpath}!'
+            warnings.warn(msg)
+            return None
+        if firstElementOnly:
+            return elements[0]
+        return elements
+
+    def _set_idnos(self, idnos: list, contentDict: dict):
+        """Set the text of each idno whose @type (URI, SpN, Blatt-ID) has a non-empty value in contentDict.
+        """
+        for idno in idnos:
+            if bool(contentDict.get(idno.get('type'))):
+                idno.text = contentDict[idno.get('type')]
+
+    def _write_file(self, target_file: str, faksimile_page: FaksimilePage, folioId: str, label: str, alias: str, url: str, content: str, contentFiles=None) ->int:
+        """Fill the template with the data and write it to target_file; return the status of write_tei or 2 if an element is missing or alias has no comma.
+        """
+        title = self._get_element('/ns:TEI/ns:teiHeader/ns:fileDesc/ns:titleStmt/ns:title')
+        idnos = self._get_element('/ns:TEI/ns:teiHeader/ns:fileDesc/ns:sourceDesc/ns:msDesc/ns:msIdentifier/ns:idno', firstElementOnly=False)
+        objectDesc = self._get_element('/ns:TEI/ns:teiHeader/ns:fileDesc/ns:sourceDesc/ns:msDesc/ns:physDesc/ns:objectDesc')
+        faksimile = self._get_element('/ns:TEI/ns:facsimile')
+        body = self._get_element('/ns:TEI/ns:text/ns:body')
+        if title is not None and idnos is not None and objectDesc is not None and faksimile is not None and ',' in alias and body is not None:
+            xml_id = label.replace('.jpg','')
+            page_number = alias[alias.index(',')+1:].lstrip()
+            title.text = alias 
+            objectDesc.text = content
+            self._set_idnos(idnos, { 'URI': faksimile_page.faksimile_image.nietzsche_source, 'SpN': alias, 'Blatt-ID': folioId })
+            faksimile_page.attach_to_tei_facsimile(faksimile, xml_id, page_number)
+            self._add_content(body, xml_id, page_number, contentFiles=contentFiles)
+            return write_tei(self.tei_tree, target_file, namespaces=self.namespaces)
+        return 2
+
+    def create_tei_file(self, folioId, label, alias, url, content) ->int:
+        """Create a tei file from csv input; return 0 on success, 1 if the target file already exists, else 2.
+        """
+        target_file = self.target_dir + sep + alias.replace(', ', '_page').replace(' ', '_') + '.xml'
+        if isfile(target_file):
+            return 1
+        svg_file = self.svg_dir + sep + label.replace('.jpg','.svg')
+        if not isfile(svg_file):
+            return 2
+        faksimile_page = self._get_faksimile_page(svg_file)
+        if faksimile_page is None:
+            msg = f'There is no faksimile_page in {svg_file} for {label}, {alias}!'
+            warnings.warn(msg)
+            return 2
+        contentFiles = []
+        if 'GM' in content:
+            try:
+                start = content.index('GM')
+                end = content.find(',', start) # only a comma after 'GM' ends the content id
+                contentId = (content[start:] if end < 0 else content[start:end]).replace(' ', '-')
+                if isfile(self.content_dir + sep + contentId + '.txt'):
+                    contentFiles.append(self.content_dir + sep + contentId + '.txt')
+                elif len(contentId.split('-')) > 1 and re.match(r'\d', contentId.split('-')[-2]):
+                    split = contentId.split('-')
+                    for i in range(int(split[-2]), int(split[-1])+1):
+                        contentFile = self.content_dir + sep + contentId[:contentId.index('-'+split[-2])] + '-' + str(i) + '.txt'
+                        if isfile(contentFile):
+                            contentFiles.append(contentFile)
+            except ValueError:
+                msg = f'There has been an error with content {content} of {label}, {alias}'
+                warnings.warn(msg)
+        # Pass the status of _write_file on: it is 2 if nothing could be written.
+        return self._write_file(target_file, faksimile_page, folioId, label, alias, url, content, contentFiles=contentFiles)
+
+def process_default(args) ->int:
+    """Create a tei file for each csv row that is no thumb; args: <template> <csv_file> [<svg-dir> [<target-dir> [<content-dir>]]].
+    :return: 2 if arguments are missing or a row could not be processed, else 0; raises FileNotFoundError if an input is missing.
+    """
+    if len(args) < 2:  
+        usage()
+        return 2
+    exit_status = 0
+    template, csv_file = args[0], args[1]
+    svg_dir = args[2] if len(args) > 2 else './svg'
+    target_dir = args[3] if len(args) > 3 else './tmp'
+    content_dir = args[4] if len(args) > 4 else './text'
+    if not isdir(target_dir): mkdir(target_dir)
+    if isfile(template) and isfile(csv_file) and isdir(svg_dir) and isdir(content_dir):
+        counter = 0
+        file_creater = CSVFileCreator(template, svg_dir=svg_dir, content_dir=content_dir, target_dir=target_dir)
+        with open(csv_file, newline='') as csvfile: 
+            reader = csv.DictReader(csvfile)
+            for row in (row for row in reader if '_thumb' not in row[CSVFileCreator.LABEL]):
+                status = file_creater.create_tei_file(row[CSVFileCreator.FOLIO], row[CSVFileCreator.LABEL],\
+                        row[CSVFileCreator.ALIAS],row[CSVFileCreator.URL],row[CSVFileCreator.CONTENT])
+                if status > 1:
+                    exit_status = 2
+                elif status == 0:
+                    counter += 1
+        if not CSVFileCreator.UNITTESTING: 
+            print(Style.RESET_ALL + f'[{counter} tei files created]')
+    else:
+        if not isdir(svg_dir):
+            raise FileNotFoundError(f'Directory {svg_dir} does not exist!')
+        if not isdir(content_dir):
+            raise FileNotFoundError(f'Directory {content_dir} does not exist!')
+        if not isfile(template):
+            raise FileNotFoundError(f'File {template} does not exist!')
+        raise FileNotFoundError(f'File {csv_file} does not exist!')
+    return exit_status
+
+def write_tei(tei_tree: ET.ElementTree, target_file: str, namespaces=None) ->int:
+    """Re-parse the serialized lxml tree with xml.etree and write it to target_file; always returns 0.
+    The prefixes are registered with xml.etree ('ns' as default namespace); nothing is written if CSVFileCreator.UNITTESTING.
+    """
+    if namespaces is None:
+        namespaces = { ('ns' if prefix is None else prefix): uri for prefix, uri in tei_tree.getroot().nsmap.items() }
+    for prefix, uri in namespaces.items():
+        XET.register_namespace('' if prefix == 'ns' else prefix, uri)
+    serialized_tree = ET.tostring(tei_tree,  pretty_print=True)
+    target_tree = XET.ElementTree(XET.fromstring(serialized_tree))
+    if CSVFileCreator.UNITTESTING:
+        return 0
+    target_tree.write(target_file, encoding="UTF-8", xml_declaration=True)
+    return 0
+
+def usage():
+    """Print the docstring of main, which serves as the help text of the script."""
+    help_text = main.__doc__
+    print(help_text)
+
+def main(argv):
+    """This program can be used to create tei files.
+
+    teiscripts/create_tei_files.py [OPTIONS]   <template> <csv_file> [<svg-dir> [<target-dir> [<content-dir>]]]
+
+        <template>              a tei file template.
+        <csv_file>              a csv file with faksimile information.
+        <svg-dir>               a directory containing svg files (created with fixes/create_blank_svg_files.py), default: ./svg
+        <target-dir>            the directory where the files should be saved to, default: ./tmp
+        <content-dir>           a directory containing the content files (*.txt), default: ./text
+
+        OPTIONS:
+        -h|--help               show help
+    
+        :return: exit code (int)
+    """
+    try:
+        opts, args = getopt.getopt(argv, "h", ["help"])
+    except getopt.GetoptError:
+        usage()
+        return 2
+    if any(opt in ('-h', '--help') for opt, _ in opts):
+        usage()
+        return 0
+    return process_default(args)
+
+if __name__ == "__main__":
+    sys.exit(main(sys.argv[1:]))
Index: tests_svgscripts/test_manuscript_description.py
===================================================================
--- tests_svgscripts/test_manuscript_description.py	(revision 0)
+++ tests_svgscripts/test_manuscript_description.py	(revision 114)
@@ -0,0 +1,23 @@
+import unittest
+from os import sep, path
+from os.path import dirname, basename, isfile, isdir
+import lxml.etree as ET
+import sys
+
+sys.path.append('svgscripts')
+from datatypes.page import Page
+from datatypes.standoff_tag import StandoffTag
+from datatypes.text import Text
+from datatypes.manuscript_description import ManuscriptDescription
+
+class TestManuscriptDescription(unittest.TestCase):
+    def test_semantic(self):
+        pass  # placeholder: nothing is asserted about the semantic dictionary yet
+        #print(ManuscriptDescription.get_semantic_dictionary())
+
+    def test_create(self):
+        text = "Heftblatt (restauriert), ca. 17,5+21,7, liniiert; Rißkante Rekto links.  Verso vakat.  Ursprünglich Doppelblatt einer Heftlage: Mp XVI, 64rv / Mp XVII, 118rv; ursprünglich gegenüberliegende Seiten: 124v / 118r (?)."
+        desc = ManuscriptDescription.create_cls_from_raw_text(text)  # smoke test: desc is not inspected, only an exception would fail it
+
+if __name__ == "__main__":
+    unittest.main()
Index: tests_svgscripts/test_faksimile.py
===================================================================
--- tests_svgscripts/test_faksimile.py	(revision 113)
+++ tests_svgscripts/test_faksimile.py	(revision 114)
@@ -1,98 +1,107 @@
 import unittest
 from os import sep, path
 from os.path import isdir, dirname, basename
 import lxml.etree as ET
 import sys
 import sys
 
 sys.path.append('svgscripts')
 
 from datatypes.faksimile import FaksimilePage, get_paths_inside_rect
 from datatypes.faksimile_image import FaksimileImage
 from datatypes.text_field import TextField 
 
 
 class TestFaksimilePage(unittest.TestCase):
     def setUp(self):
         DATADIR = dirname(__file__) + sep + 'test_data'
         if not isdir(DATADIR):
             DATADIR = dirname(dirname(__file__)) + sep + 'test_data'
         self.svg_file = DATADIR + sep + 'W-II-1,49et50.svg'
+        self.svg_file2 = DATADIR + sep + 'D-20b,61cv.svg'
+        self.tei_file = DATADIR + sep + 'D_20b_page001r.xml'
         self.svg_testmatrix = DATADIR + sep + 'TESTMATRIX_1.svg'
         self.faksimile_dir = DATADIR + sep + 'faksimile_svg'
         self.faksimile_file = self.faksimile_dir + sep + 'N-VII-1,5et6.svg'
         self.faksimile_rotate90 = self.faksimile_dir + sep + 'Mp-XV-2c,4.svg'
 
     def test_init(self):
         image = FaksimileImage(file_name='test.jpg', height=10, width=10)
         text_field = TextField(width=10, height=10, x=10, y=10)
         faksimile = FaksimilePage(title='test', page_number=1, faksimile_image=image, text_field=text_field)
         self.assertEqual(faksimile.page_tree.getroot().get('title'), 'test')
         self.assertEqual(faksimile.page_tree.getroot().get('page-number'), '1')
         self.assertEqual(faksimile.faksimile_image.width, 10)
         self.assertEqual(faksimile.text_field.width, 10)
 
     def test_GET_TEXTFIELDS(self):
         """
         svg_tree = ET.parse('/home/knister0/ownCloud/nietzscheDE/Bearbeitung_Faksimile/Myriam/Blank/Mp_XVI/Fertig/Mp_XVI_page52v.svg')
         pages = FaksimilePage.GET_FAKSIMILEPAGES(svg_tree, page_number='52v', isBlank=True)
         print(pages[0].text_field)
         """
         svg_tree = ET.parse('/home/knister0/ownCloud/nietzscheDE/Bearbeitung_Faksimile/Eric/Mp_XVI/Fertig/Mp-XVI-1,1.svg')
         pages = FaksimilePage.GET_FAKSIMILEPAGES(svg_tree, page_number='1r')
         self.assertEqual(len(pages), 1)
         svg_tree = ET.parse(self.svg_file)
         pages = FaksimilePage.GET_FAKSIMILEPAGES(svg_tree)
         self.assertEqual(len(pages), 2)
         text_field = pages[0].text_field
         self.assertEqual(text_field.width, 663.333)
         result_dir = '.{}xml{}'.format(sep, sep) if isdir('xml') else ''
         self.assertEqual(pages[0].xml_file, result_dir + 'W-II-1_49.xml')
         self.assertEqual(pages[0].title, 'W II 1')
         self.assertEqual(pages[0].page_number, '49')
         pages = FaksimilePage.GET_FAKSIMILEPAGES(svg_tree, page_number='49')
         self.assertEqual(len(pages), 1)
         svg_tree = ET.parse(self.svg_testmatrix)
         pages = FaksimilePage.GET_FAKSIMILEPAGES(svg_tree)
         self.assertEqual(len(pages), 1)
         self.assertEqual(len(pages[0].word_positions), 1)
         self.assertEqual(pages[0].word_positions[0].transform.toCSSTransformString(), 'rotate(45deg)')
         svg_tree = ET.parse(self.faksimile_file)
         pages = FaksimilePage.GET_FAKSIMILEPAGES(svg_tree)
         self.assertEqual(len(pages), 2)
         textfield_id = pages[1].title.replace(' ', '-') + '_' + pages[1].page_number
         #print([ position.id for position in pages[0].word_positions])
         self.assertEqual(textfield_id not in [ position.id for position in pages[0].word_positions ], True)
         self.assertEqual('path1237' in [ position.id for position in pages[0].word_positions ], True)
         self.assertEqual('Vorgangs' in [ position.text for position in pages[0].word_positions ], False)
         svg_tree = ET.parse(self.faksimile_file)
         pages = FaksimilePage.GET_FAKSIMILEPAGES(svg_tree)
         self.assertEqual(len(pages), 2)
         self.assertEqual(pages[0].page_number, '5')
         """
         svg_tree = ET.parse('/home/knister0/ownCloud/nietzscheDE/Bearbeitung_Faksimile/Eric/Kontrolle_und_Beschriftung_der_Wortrahmen/Fertig/W-II-1,141et142.svg')
         pages = FaksimilePage.GET_FAKSIMILEPAGES(svg_tree)
         self.assertEqual(len(pages), 1)
         """
         svg_tree = ET.parse(self.faksimile_rotate90)
         namespaces = { k if k is not None else 'ns': v for k, v in svg_tree.getroot().nsmap.items() }
         pages = FaksimilePage.GET_FAKSIMILEPAGES(svg_tree)
         self.assertEqual(len(pages), 1)
         self.assertEqual(len(pages[0].word_positions), len(svg_tree.xpath('//ns:rect/ns:title', namespaces=namespaces)))
 
     def test_get_paths_inside_rect(self):
         svg_tree = ET.parse(self.faksimile_file)
         paths = get_paths_inside_rect(svg_tree, '//ns:path', 360, 786, 92, 765, 'N-VII-1_5')
         self.assertEqual(len(paths), 1)
         svg_tree = ET.parse(self.svg_testmatrix)
         paths = get_paths_inside_rect(svg_tree, '//ns:rect/ns:title', 0, 2038.72, 0, 974.08002, 'TESTMATRIX_1')
         self.assertEqual(len(paths), 1)
         svg_tree = ET.parse('/home/knister0/ownCloud/nietzscheDE/Bearbeitung_Faksimile/Myriam/Mp_XIV/Kontrolle_und_Beschriftung_der_Wortrahmen/Fertig/Mp-XIV-1,419a.svg')
         namespaces = { k if k is not None else 'ns': v for k, v in svg_tree.getroot().nsmap.items() }
         paths = get_paths_inside_rect(svg_tree, '//ns:rect', 52, 800, 58, 900, 'Mp-XIV-1_419a', namespaces=namespaces)
         self.assertEqual(len([ path for path in paths if 'seinen' in path.xpath('./ns:title/text()', namespaces=namespaces)]), 1)
 
+    def test_attach_to_tei_facsimile(self):
+        """Smoke test (no assertions): attach entry 1 of get_faksimile_pages(svg_file2) to the TEI facsimile element."""
+        tei_tree = ET.parse(self.tei_file)
+        ns_map = { ('ns' if prefix is None else prefix): uri for prefix, uri in tei_tree.getroot().nsmap.items() }
+        facsimile_node = tei_tree.xpath('//ns:facsimile', namespaces=ns_map)[0]
+        page = FaksimilePage.get_faksimile_pages(self.svg_file2, isBlank=True)[1]
+        page.attach_to_tei_facsimile(facsimile_node, basename(self.svg_file2).replace('.svg',''), '61cv')
 
 
 if __name__ == "__main__":
     unittest.main()
Index: tests_svgscripts/test_data/D-20b,61cv.svg
===================================================================
--- tests_svgscripts/test_data/D-20b,61cv.svg	(revision 0)
+++ tests_svgscripts/test_data/D-20b,61cv.svg	(revision 114)
@@ -0,0 +1,72 @@
+<?xml version="1.0" encoding="UTF-8" standalone="no"?>
+<svg
+   xmlns:dc="http://purl.org/dc/elements/1.1/"
+   xmlns:cc="http://creativecommons.org/ns#"
+   xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
+   xmlns:svg="http://www.w3.org/2000/svg"
+   xmlns="http://www.w3.org/2000/svg"
+   xmlns:xlink="http://www.w3.org/1999/xlink"
+   xmlns:sodipodi="http://sodipodi.sourceforge.net/DTD/sodipodi-0.dtd"
+   xmlns:inkscape="http://www.inkscape.org/namespaces/inkscape"
+   height="856.96002"
+   id="svg2"
+   version="1.1"
+   viewBox="0 0 863.03998 856.96002"
+   width="863.03998"
+   sodipodi:docname="D-20b,61cv.svg"
+   inkscape:version="0.92.3 (2405546, 2018-03-11)">
+  <sodipodi:namedview
+     pagecolor="#ffffff"
+     bordercolor="#666666"
+     borderopacity="1"
+     objecttolerance="10"
+     gridtolerance="10"
+     guidetolerance="10"
+     inkscape:pageopacity="0"
+     inkscape:pageshadow="2"
+     inkscape:window-width="640"
+     inkscape:window-height="480"
+     id="namedview7"
+     showgrid="false"
+     inkscape:zoom="0.96244811"
+     inkscape:cx="431.51999"
+     inkscape:cy="428.48001"
+     inkscape:current-layer="svg2" />
+  <metadata
+     id="metadata8">
+    <rdf:RDF>
+      <cc:Work
+         rdf:about="">
+        <dc:format>image/svg+xml</dc:format>
+        <dc:type
+           rdf:resource="http://purl.org/dc/dcmitype/StillImage" />
+      </cc:Work>
+    </rdf:RDF>
+  </metadata>
+  <defs
+     id="defs6" />
+  <image
+     height="856.96002"
+     id="image10"
+     preserveAspectRatio="none"
+     width="863.03998"
+     x="0"
+     y="0"
+     xlink:href="file:///home/knister0/ownCloud/myNietzscheDE/Druckmanuscripte/faksimiles/D-20b,61cv.jpg" />
+  <rect
+     fill="green"
+     height="0.0"
+     id="D_20b_65v"
+     opacity="0.3"
+     style=""
+     width="0.0"
+     x="-0.2"
+     y="-0.2" />
+  <rect
+     style="opacity:0.18800001;fill:#ffffff;fill-opacity:1;stroke:#ff0000;stroke-width:0.30000001;stroke-linejoin:round;stroke-miterlimit:4;stroke-dasharray:none;stroke-dashoffset:0;stroke-opacity:1"
+     id="rect9"
+     width="496.65015"
+     height="769.91162"
+     x="59.223972"
+     y="56.916889" />
+</svg>
Index: tests_svgscripts/test_data/D_20b_page001r.xml
===================================================================
--- tests_svgscripts/test_data/D_20b_page001r.xml	(revision 0)
+++ tests_svgscripts/test_data/D_20b_page001r.xml	(revision 114)
@@ -0,0 +1,68 @@
+<?xml-stylesheet type="text/xsl" href="style.xsl"?>
+<TEI version="4.1.0" xmlns="http://www.tei-c.org/ns/1.0">
+   <teiHeader>
+      <fileDesc>
+         <titleStmt>
+          <title>D 20b, 1r</title>
+         </titleStmt>
+         <sourceDesc>
+           <msDesc>
+             <msIdentifier>
+               <settlement>Weimar</settlement>
+                <repository>Goethe- und Schiller-Archiv</repository>
+                <idno type="URI">http://www.nietzschesource.org/DFGA/D-20b,1</idno>
+                <idno type="SpN">D 20b, 1r</idno>
+                <idno type="Blatt-ID">GSA_71/27,2_001</idno>
+              </msIdentifier>
+              <physDesc>
+                <objectDesc>
+                   <p>Druckvorlage GM III 1</p>
+                </objectDesc>
+             </physDesc>
+           </msDesc>
+         </sourceDesc>
+      </fileDesc>
+   </teiHeader>
+   <facsimile>
+      <surface xml-id="D-20b,1" ulx="326.1875" uly="283" lrx="4455.625" lry="5488" n="1r">
+         <graphic url="http://www.nietzschesource.org/DFGAapi/api/page/download/D-20b,1" width="6315px" height="5724px"/>
+      </surface>
+   </facsimile>
+   <text>
+      <body>
+         <p>
+            <pb n="1r" facs="#D-20b,1"/>
+            <lb/><head place="top left">1.</head>
+            <head place="top right">Anfang der <hi rend="underline">dritten</hi> Abhandlung.</head>
+               <p>
+                  <lb/><head>1.</head>
+                  <lb/>Was bedeuten asketische Ideale? — Bei Künstlern
+                  Nichts oder zu Vielerlei; bei Philo=<lb break="no"/>sophen und Gelehrten Etwas
+                  wie Witterung und Instinkt für die günstigsten Vorbedingungen
+                  hoher Geistigkeit; bei Frauen, besten Falls, eine
+                  Liebenswürdigkeit der Verführung <hi rend="underline">mehr</hi>,
+                  ein wenig morbidezza auf
+                  schönem Fleische, die Engelhaftigkeit eines hübschen fetten
+                  Thiers; bei physiologisch Verunglückten und Verstimmten (bei
+                  der <hi rend="underline">Mehrzahl</hi> der Sterblichen) einen
+                  Versuch, sich „zu gut“ für diese Welt vorzukommen, eine
+                  heilige Form der Ausschweifung, ihr Hauptmittel im Kampf mit
+                  dem langsamen Schmerz und der Langenweile; bei Priestern den
+                  eigentlichen Priesterglauben, ihr bestes Werkzeug der Macht,
+                  auch die „allerhöchste“ Erlaubniss zur Macht; bei Heiligen
+                  endlich einen Vorwand zum Winterschlaf, ihre novissima
+                  gloriae cupido, ihre Ruhe im Nichts („Gott“), ihre Form des
+                  Irrsinns. <hi rend="underline">Dass</hi> aber überhaupt das
+                  asketische Ideal dem Menschen so viel bedeutet hat, darin
+                  drückt sich die Grundthatsache des menschlichen Willens aus,
+                  sein horror vacui: <hi rend="underline">er braucht ein Ziel</hi>,
+                  — und eher will er noch <hi rend="underline">das Nichts</hi>
+                  wollen, als <hi rend="underline">nicht</hi> wollen. — Versteht man mich?…
+                  Hat man mich verstanden?…
+                  <hi rend="underline">„Schlechterdings nicht!  mein Herr!“</hi>
+                  — Fangen wir also von vorne an.
+               </p>
+         </p>
+      </body>
+   </text>
+</TEI>
Index: tests_svgscripts/test_matrix.py
===================================================================
--- tests_svgscripts/test_matrix.py	(revision 113)
+++ tests_svgscripts/test_matrix.py	(revision 114)
@@ -1,245 +1,263 @@
 import unittest
 import lxml.etree as ET
 from os import sep, path
 from os.path import isdir, dirname
 import sys
 
 sys.path.append('svgscripts')
 
 from datatypes.matrix import Matrix
 from datatypes.transkriptionField import TranskriptionField
 
 class FakeTF:
     def __init__(self):
         self.xmin = 297.6379999999997
         self.xmax = 765.354
         self.ymin = 157.328
         self.ymax = 752.6040160033832
 
 class TestMatrix(unittest.TestCase):
     def setUp(self):
         self.x = 219.4058
         self.y = 106.4634
         self.matrix_string = 'matrix(1 0 0 1 {} {})'.format(str(self.x), str(self.y))
         self.test_data_dir = dirname(__file__) + sep + 'test_data'  
         if not isdir(self.test_data_dir):
             self.test_data_dir = dirname(dirname(__file__)) + sep + 'test_data'
         self.test_file = self.test_data_dir + sep + 'test_ai.svg' 
         self.rotation_angle = 20
         self.rotation_matrix_string = 'matrix(0.94 0.342 -0.342 0.94 0 0)'
         self.test_margin_field_file = self.test_data_dir + sep + 'W_I_8_neu_125-01.svg'
         self.test_place_printing_verso = self.test_data_dir + sep + 'N_VII_1_xp5_4_page5.svg'
         self.test_place_printing_recto = self.test_data_dir + sep + 'N_VII_1_xp5_4_page6.svg'
         self.multipage = f'{self.test_data_dir}{sep}pdfsvg{sep}csv{sep}15.svg'
         self.marginals_extra = f'{self.test_data_dir}{sep}pdfsvg{sep}csv{sep}45.svg'
         self.marginals_extra_fn = f'{self.test_data_dir}{sep}pdfsvg{sep}csv{sep}44.svg'
 
     def test_Matrix(self):
         matrix = Matrix(self.matrix_string)
         self.assertEqual(matrix.getX(), self.x)
         self.assertEqual(matrix.add2X(1), self.x + 1)
         self.assertEqual(matrix.getY(), self.y)
         matrix = Matrix('matrix(0.98966578,0.1433933,-0.0913015,0.9958233,0,0)')
         self.assertEqual(matrix.getX(), 0)
         matrix = Matrix('matrix(1 2.998719e-04 -2.998719e-04 1 415.3643 476.7988)')
 
     def test_Matrix_rotation(self):
         rotation_string = 'rotate({})'.format(self.rotation_angle)
         rotation_stringC = 'rotate(-{})'.format(self.rotation_angle)
         matrixA = Matrix(rotation_string)
         matrixB = Matrix(self.rotation_matrix_string)
         matrixC = Matrix(rotation_stringC)
         self.assertEqual(matrixA.matrix[Matrix.A], matrixB.matrix[Matrix.A])
         self.assertEqual(matrixA.matrix[Matrix.B], matrixB.matrix[Matrix.B])
         self.assertEqual(matrixA.matrix[Matrix.C], matrixB.matrix[Matrix.C])
         self.assertEqual(matrixA.matrix[Matrix.D], matrixB.matrix[Matrix.D])
         self.assertEqual(matrixA.matrix[Matrix.E], matrixB.matrix[Matrix.E])
         self.assertEqual(matrixA.matrix[Matrix.F], matrixB.matrix[Matrix.F])
         self.assertEqual(matrixA.toString(), self.rotation_matrix_string)
         self.assertEqual(matrixC.toCSSTransformString(), 'rotate(-{}deg)'.format(self.rotation_angle))
 
     def test_get_rotation_direction(self):
         rotation_string = 'rotate(-{})'.format(self.rotation_angle)
         matrixA = Matrix(rotation_string)
         matrixB = Matrix(self.rotation_matrix_string)
         matrixC = Matrix(self.matrix_string)
         self.assertEqual(matrixA.get_rotation_direction(), Matrix.UP)
         self.assertEqual(matrixB.get_rotation_direction(), Matrix.DOWN)
         self.assertEqual(matrixC.get_rotation_direction(), Matrix.STRAIGHT)
 
     def test_isRotationMatrix(self):
         rotation_string = 'rotate({})'.format(self.rotation_angle)
         matrixA = Matrix(rotation_string)
         self.assertEqual(matrixA.isRotationMatrix(), True)
         matrixB = Matrix(self.matrix_string)
         self.assertEqual(matrixB.isRotationMatrix(), False)
-    
+
+    def test_get90DegreeIndex(self):
+        """Check get90DegreeIndex() for 90, 180 and 270 degrees and for a non-multiple of 90.
+
+        This used to be a second ``test_isRotationMatrix``; the duplicate name replaced the
+        test of that name defined earlier in the class body, so that one never ran.
+        """
+        expected_indices = [
+            ('rotate(90deg)', 0),
+            ('rotate(180deg)', 1),
+            ('rotate(270deg)', 2),
+            ('rotate(70deg)', -1),
+        ]
+        for rotation_string, expected_index in expected_indices:
+            with self.subTest(rotation_string=rotation_string):
+                matrix = Matrix(rotation_string)
+                mindex = matrix.get90DegreeIndex()
+                self.assertEqual(mindex, expected_index)
+   
     def test_toCSSTransformString(self):
         rotation_string = 'rotate({})'.format(self.rotation_angle)
         matrixA = Matrix(rotation_string)
         self.assertEqual(matrixA.toCSSTransformString(), 'rotate({}deg)'.format(self.rotation_angle))
         matrixB = Matrix(self.rotation_matrix_string)
         self.assertEqual(matrixB.toCSSTransformString(), 'rotate({}deg)'.format(self.rotation_angle))
 
     def test_Matrix_Exception(self):
         with self.assertRaises(Exception):
             Matrix('matrix({})'.format(' '.join([ '0.0' for i in range(5)])))
 
     def test_Matrix_TranskriptionField(self):
         tf = TranskriptionField(self.test_file)
         matrix = Matrix(self.matrix_string, transkription_field=tf)
         self.assertEqual(round(matrix.getX(), 3) , 28.706)
         self.assertEqual(round(matrix.getY(), 3) , 31.563)
 
     def test_get_transformed_positions(self):
         # Test relies on the example from "https://developer.mozilla.org/en-US/docs/Web/SVG/Attribute/transform"
         x = 10
         y = 10
         width = 30
         height = 20
         matrix = Matrix(transform_matrix_string='matrix(3 1 -1 3 30 40)')
         new_x, new_y, new_width, new_height = matrix.get_transformed_positions(x=x, y=y, width=width, height=height)
         self.assertEqual(new_x, 50)
         self.assertEqual(new_y, 80)
         self.assertEqual(new_width, 90)
         self.assertEqual(new_height, 60)
 
     def test_is_matrix_horizontal(self):
         matrix = Matrix(transform_matrix_string='matrix(3 1 -1 3 30 40)')
         self.assertEqual(matrix.is_matrix_horizontal(), False)
         matrix = Matrix(transform_matrix_string='matrix(1 0 0 1 30 40)')
         self.assertEqual(matrix.is_matrix_horizontal(), True)
 
     def test_is_part_of_transkription_field(self):
         tf = TranskriptionField(self.test_file)
         text_node = ET.Element('text', attrib={'transform': 'matrix(1 0 0 1 244.1211 91.7134)'}) 
         self.assertEqual(Matrix.IS_PART_OF_TRANSKRIPTION_FIELD(tf, text_node=text_node), True)
         text_node = ET.Element('text', attrib={'transform': 'matrix(1 0 0 1 244.1211 51.7134)'}) 
         self.assertEqual(Matrix.IS_PART_OF_TRANSKRIPTION_FIELD(tf, text_node=text_node), False)
         text_node = ET.Element('text', attrib={'transform': 'matrix(1 0 0 1 44.1211 91.7134)'}) 
         self.assertEqual(Matrix.IS_PART_OF_TRANSKRIPTION_FIELD(tf, text_node=text_node), False)
         text_node = ET.Element('text', attrib={'transform': 'matrix(1 0 0 1 244.1211 891.7134)'}) 
         self.assertEqual(Matrix.IS_PART_OF_TRANSKRIPTION_FIELD(tf, text_node=text_node), False)
         text_node = ET.Element('text', attrib={'transform': 'matrix(1 0 0 1 844.1211 91.7134)'}) 
         self.assertEqual(Matrix.IS_PART_OF_TRANSKRIPTION_FIELD(tf, text_node=text_node), False)
         text_node = ET.Element('text', attrib={'transform': 'matrix(0.866 -0.5 0.5 0.866 356.4303 753.4836)'}) 
         tspan_node = ET.SubElement(text_node, 'tspan', attrib={'x': '41.82', 'y': '0'})
         tspan_node.text = 'De'
         fake_tf = FakeTF()
         self.assertEqual(Matrix.IS_PART_OF_TRANSKRIPTION_FIELD(fake_tf, text_node=text_node), True)
         """
         local_file = '/home/knister0/ownCloud/myNietzscheDE/KGW-IX_12/Bd_12_XIV-XVI_Druck_als_SVG/18.svg'
         tf = TranskriptionField(local_file)
         svg_tree = ET.parse(local_file)
         namespaces = { k if k is not None else 'ns': v for k, v in svg_tree.getroot().nsmap.items() }
         text_node = svg_tree.xpath('//ns:text[@transform="matrix(1 0 0 1 115.6299 719.3535)"]', namespaces=namespaces)[0]
         self.assertTrue(Matrix.IS_PART_OF_TRANSKRIPTION_FIELD(tf, text_node=text_node))
         """
 
     def test_is_nearx_tf(self):
         tf = TranskriptionField(self.test_file)
         matrix_string = 'matrix(1 0 0 1 180.8755 315.9131)'
         self.assertEqual(Matrix.IS_NEARX_TRANSKRIPTION_FIELD(matrix_string, tf), True)
         matrix_string = 'matrix(1 0 0 1 100.8755 315.9131)'
         self.assertEqual(Matrix.IS_NEARX_TRANSKRIPTION_FIELD(matrix_string, tf), False)
 
     def test_do_conversion_factors_differ(self):
         self.assertEqual(Matrix.DO_CONVERSION_FACTORS_DIFFER(None, None), False)
         matrix_a = Matrix('matrix(1 0 0 1 180.8755 315.9131)')
         self.assertEqual(Matrix.DO_CONVERSION_FACTORS_DIFFER(matrix_a, None), True)
         matrix_b = Matrix('matrix(1 0 0 1 100.8755 315.9131)')
         self.assertEqual(Matrix.DO_CONVERSION_FACTORS_DIFFER(matrix_a, matrix_b), False)
         matrix_b = Matrix('matrix(0 0 0 1 100.8755 315.9131)')
         self.assertEqual(Matrix.DO_CONVERSION_FACTORS_DIFFER(matrix_a, matrix_b), True)
         matrix_b = Matrix('matrix(1 1 0 1 100.8755 315.9131)')
         self.assertEqual(Matrix.DO_CONVERSION_FACTORS_DIFFER(matrix_a, matrix_b), True)
         matrix_b = Matrix('matrix(1 0 1 1 100.8755 315.9131)')
         self.assertEqual(Matrix.DO_CONVERSION_FACTORS_DIFFER(matrix_a, matrix_b), True)
         matrix_b = Matrix('matrix(1 0 0 0 100.8755 315.9131)')
         self.assertEqual(Matrix.DO_CONVERSION_FACTORS_DIFFER(matrix_a, matrix_b), True)
 
     def test_clone_transformation_matrix(self):
         matrix_a = Matrix(matrix_list=[ 1, 0, 0, 1, 180.8755, 315.9131 ])
         matrix_b = matrix_a.clone_transformation_matrix()
         self.assertEqual(Matrix.DO_CONVERSION_FACTORS_DIFFER(matrix_a, matrix_b), False)
         self.assertEqual(matrix_b.matrix[Matrix.E], 0)
         self.assertEqual(matrix_b.matrix[Matrix.F], 0)
 
     def test_toString(self):
         matrix_string = 'matrix(1.0 0.0 0.0 1.0 180.8755 315.9131)'
         matrix = Matrix(matrix_string)
         self.assertEqual(matrix.toString(), matrix_string)
 
     def test_get_semanticAndDataDict(self):
         matrix = Matrix('rotate(20)')
         #self.assertEqual(matrix.get_data_dictionary()['body'].get('matrix'), matrix.matrix)
 
     def test_is_in_margin_field(self):
         tf = TranskriptionField(self.test_margin_field_file)
         text_node = ET.Element('text', attrib={'transform': 'matrix(1 0 0 1 178.8916 182.0127)'}) 
         self.assertEqual(Matrix.IS_IN_MARGIN_FIELD(text_node.get('transform'), tf), True)
         text_node = ET.Element('text', attrib={'transform': 'matrix(1 0 0 1 357.7339 818.3276)'}) 
         self.assertEqual(Matrix.IS_IN_MARGIN_FIELD(text_node.get('transform'), tf), False)
         tf = TranskriptionField(self.marginals_extra)
         text_node = ET.Element('text', attrib={'transform': 'matrix(1 0 0 1 778.519 407.1094)'}) 
         self.assertEqual(Matrix.IS_IN_MARGIN_FIELD(text_node.get('transform'), tf, marginals_on_extra_page=True), True)
         text_node = ET.Element('text', attrib={'transform': 'matrix(1 0 0 1 51.8503 1056.1182)'}) 
         self.assertEqual(Matrix.IS_IN_MARGIN_FIELD(text_node.get('transform'), tf, marginals_on_extra_page=True), False)
         text_node = ET.Element('text', attrib={'transform': 'matrix(1 0 0 1 552.9165 1072.1025)'}) 
         self.assertEqual(Matrix.IS_IN_MARGIN_FIELD(text_node.get('transform'), tf, marginals_on_extra_page=True), False)
         
     def test_is_in_place_of_printing_area(self):
         tf = TranskriptionField(self.test_place_printing_verso)
         text_node = ET.Element('text', attrib={'transform': 'matrix(1 0 0 1 42.5195 575.8736)'}) 
         self.assertEqual(Matrix.IS_IN_PLACE_OF_PRINTING_AREA(text_node.get('transform'), tf), True)
         text_node = ET.Element('text', attrib={'transform': 'matrix(1 0 0 1 109.145 575.8736)'}) 
         self.assertEqual(Matrix.IS_IN_PLACE_OF_PRINTING_AREA(text_node.get('transform'), tf), True)
         text_node = ET.Element('text', attrib={'transform': 'matrix(1 0 0 1 191.0571 575.8736)'}) 
         self.assertEqual(Matrix.IS_IN_PLACE_OF_PRINTING_AREA(text_node.get('transform'), tf), False)
         tf = TranskriptionField(self.test_place_printing_recto)
         text_node = ET.Element('text', attrib={'transform': 'matrix(1 0 0 1 28.3462 575.8736)'}) 
         self.assertEqual(Matrix.IS_IN_PLACE_OF_PRINTING_AREA(text_node.get('transform'), tf), True)
         text_node = ET.Element('text', attrib={'transform': 'matrix(1 0 0 1 28.3462 583.8736)'}) 
         self.assertEqual(Matrix.IS_IN_PLACE_OF_PRINTING_AREA(text_node.get('transform'), tf), True)
         text_node = ET.Element('text', attrib={'transform': 'matrix(1 0 0 1 170.0791 575.8736)'}) 
         self.assertEqual(Matrix.IS_IN_PLACE_OF_PRINTING_AREA(text_node.get('transform'), tf), False)
 
     def test_is_in_footnote_area(self):
         tf = TranskriptionField(self.test_place_printing_verso)
         text_node = ET.Element('text', attrib={'transform': 'matrix(1 0 0 1 42.5195 575.8736)'}) 
         self.assertEqual(Matrix.IS_IN_FOOTNOTE_AREA(text_node.get('transform'), tf), False)
         text_node = ET.Element('text', attrib={'transform': 'matrix(1 0 0 1 109.145 575.8736)'}) 
         self.assertEqual(Matrix.IS_IN_FOOTNOTE_AREA(text_node.get('transform'), tf), False)
         text_node = ET.Element('text', attrib={'transform': 'matrix(1 0 0 1 191.0571 575.8736)'}) 
         self.assertEqual(Matrix.IS_IN_FOOTNOTE_AREA(text_node.get('transform'), tf), True)
         tf = TranskriptionField(self.test_place_printing_recto)
         text_node = ET.Element('text', attrib={'transform': 'matrix(1 0 0 1 28.3462 575.8736)'}) 
         self.assertEqual(Matrix.IS_IN_FOOTNOTE_AREA(text_node.get('transform'), tf), False)
         text_node = ET.Element('text', attrib={'transform': 'matrix(1 0 0 1 28.3462 583.8736)'}) 
         self.assertEqual(Matrix.IS_IN_FOOTNOTE_AREA(text_node.get('transform'), tf), False)
         text_node = ET.Element('text', attrib={'transform': 'matrix(1 0 0 1 170.0791 575.8736)'}) 
         self.assertEqual(Matrix.IS_IN_FOOTNOTE_AREA(text_node.get('transform'), tf), True)
         tf = TranskriptionField(self.multipage, multipage_index=0)
         text_node = ET.Element('text', attrib={'transform': 'matrix(1 0 0 1 395.7141 463.6953)'}) 
         self.assertEqual(Matrix.IS_IN_FOOTNOTE_AREA(text_node.get('transform'), tf), False)
         text_node = ET.Element('text', attrib={'transform': 'matrix(1 0 0 1 395.7141 453.6953)'}) 
         self.assertEqual(Matrix.IS_IN_FOOTNOTE_AREA(text_node.get('transform'), tf), True)
         tf = TranskriptionField(self.marginals_extra)
         text_node = ET.Element('text', attrib={'transform': 'matrix(1 0 0 1 552.9165 1072.1025)'}) 
         self.assertEqual(Matrix.IS_IN_FOOTNOTE_AREA(text_node.get('transform'), tf, marginals_on_extra_page=True), True)
         text_node = ET.Element('text', attrib={'transform': 'matrix(1 0 0 1 51.8503 1056.1182)'}) 
         self.assertEqual(Matrix.IS_IN_FOOTNOTE_AREA(text_node.get('transform'), tf, x=5.352, marginals_on_extra_page=True), False)
         text_node = ET.Element('text', attrib={'transform': 'matrix(1 0 0 1 215.5483 1056.1182)'}) 
         self.assertTrue(Matrix.IS_IN_FOOTNOTE_AREA(text_node.get('transform'), tf, x=24.732, marginals_on_extra_page=True))
         svg_tree = ET.parse(self.marginals_extra_fn)
         tf = TranskriptionField(self.marginals_extra)
         namespaces = { k if k is not None else 'ns': v for k, v in svg_tree.getroot().nsmap.items() }
         node = svg_tree.xpath('//ns:text[@transform="matrix(1 0 0 1.0101 698.1499 85.3594)"]', namespaces=namespaces)[0]
         self.assertFalse(Matrix.NODE_HAS_CONTENT_IN_FOOTNOTE_AREA(node, tf, marginals_on_extra_page=True))
         self.assertFalse(Matrix.IS_IN_FOOTNOTE_AREA(node.get('transform'), tf, marginals_on_extra_page=True))
         node = svg_tree.xpath('//ns:text[@transform="matrix(1 0 0 1 215.5483 1056.1182)"]', namespaces=namespaces)[0]
         self.assertTrue(Matrix.NODE_HAS_CONTENT_IN_FOOTNOTE_AREA(node, tf, marginals_on_extra_page=True))
         
 
 if __name__ == "__main__":
     unittest.main()
Index: tests_teiscripts/test_create_tei_files.py
===================================================================
--- tests_teiscripts/test_create_tei_files.py	(revision 0)
+++ tests_teiscripts/test_create_tei_files.py	(revision 114)
@@ -0,0 +1,29 @@
+import lxml.etree as ET
+from os import sep, path, remove
+from os.path import isdir, isfile, dirname, basename
+import shutil
+import sys
+import tempfile
+import unittest
+import warnings
+
+sys.path.append('teiscripts')
+from create_tei_files import CSVFileCreator, process_default 
+
+
+sys.path.append('shared_util')
+from myxmlwriter import copy_to_bak_dir
+
+
+class TestCreateTEI(unittest.TestCase):
+    def setUp(self):
+        CSVFileCreator.UNITTESTING = True  # class-level flag, never reset afterwards; write_tei() writes no file while it is set
+
+    # NOTE(review): depends on cwd-relative 'Druckmanuscripte/...' files and on absolute /home/knister0 paths - confirm availability
+    def test_process_default(self):
+        csv_file = 'Druckmanuscripte/D_20.csv'
+        process_default(['Druckmanuscripte/D_20b_page001r.xml', csv_file, '/home/knister0/ownCloud/myNietzscheDE/Druckmanuscripte/svg', '/home/knister0/ownCloud/myNietzscheDE/Druckmanuscripte/tei','/home/knister0/ownCloud/myNietzscheDE/Druckmanuscripte/text'])
+
+
+if __name__ == "__main__":
+    unittest.main()
Index: fixes/test_get_text_field.py
===================================================================
--- fixes/test_get_text_field.py	(revision 113)
+++ fixes/test_get_text_field.py	(revision 114)
@@ -1,25 +1,31 @@
 import lxml.etree as ET
 from os import sep, path, remove
 from os.path import isdir, isfile, dirname, basename
 import shutil
 import sys
 import tempfile
 import unittest
 import warnings
 
 import get_text_field
 
 
 
 
 class TestGETIMAGEINFO(unittest.TestCase):
     def setUp(self):
         DATADIR = path.dirname(__file__) + sep + 'test_data'  
         self.xml_file = DATADIR + sep + 'N_VII_1_page138.xml'
         self.fix_transkription_positions = DATADIR + sep + 'Mp_XIV_page419a.xml'
 
     def test_main(self):
         get_text_field.main(['/home/knister0/ownCloud/nietzscheDE/Bearbeitung_Faksimile/Mp_XVI/Mp-XVI-4,13.jpg','1260.3199','1339.36'])
+        get_text_field.main(['/home/knister0/ownCloud/myNietzscheDE/Druckmanuscripte/faksimiles/D-20a,1.jpg','1221.28','1446.08'])
+
+    def test_get_text_field_on_thumb(self):
+        pass  # placeholder: the call below is disabled and points at a developer-local thumbnail
+        #tf, width, height = get_text_field.get_text_field_on_thumb('/home/knister0/ownCloud/Der_spaete_Nietzsche/DATA/faksimiles/Mp-XVII,243_thumb.jpg')
+        #print(tf, width, height)
 
 if __name__ == "__main__":
     unittest.main()
Index: fixes/get_text_field.py
===================================================================
--- fixes/get_text_field.py	(revision 113)
+++ fixes/get_text_field.py	(revision 114)
@@ -1,144 +1,184 @@
 #!/usr/bin/env python3
 # -*- coding: utf-8 -*-
 
 """   This program can be used to create svg files with a rect for the text_field.
 """
 #    Copyright (C) University of Basel 2019  {{{1
 #
 #    This program is free software: you can redistribute it and/or modify
 #    it under the terms of the GNU General Public License as published by
 #    the Free Software Foundation, either version 3 of the License, or
 #    (at your option) any later version.
 #
 #    This program is distributed in the hope that it will be useful,
 #    but WITHOUT ANY WARRANTY; without even the implied warranty of
 #    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #    GNU General Public License for more details.
 #
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <https://www.gnu.org/licenses/> 1}}}
 
 from colorama import Fore, Style
 import getopt
 import json
 import lxml.etree as ET
 import shutil
 import subprocess
 import sys
 import os
 import wget
 import cv2
 import matplotlib.pyplot as plt
 import numpy as np
 from os import listdir, sep, path, setpgrp, devnull, mkdir, remove
 from os.path import exists, isfile, isdir, dirname, basename
 from progress.bar import Bar
 import warnings
 
 if dirname(__file__) not in sys.path:
     sys.path.append(dirname(__file__))
 from fix_old_data import save_page
 
 sys.path.append('svgscripts')
 from datatypes.faksimile_image import FaksimileImage
 from datatypes.faksimile import FaksimilePage
 from datatypes.archival_manuscript import ArchivalManuscriptUnity
 from datatypes.page import Page, STATUS_MERGED_OK, STATUS_POSTMERGED_OK
 from datatypes.text_field import TextField 
 from util import back_up, back_up_svg_file, copy_faksimile_update_image_location, copy_faksimile_svg_file
 from process_files import update_svgposfile_status
 from process_words_post_merging import update_faksimile_line_positions, MERGED_DIR
 
 sys.path.append('shared_util')
 from myxmlwriter import write_pretty, xml_has_type, FILE_TYPE_SVG_WORD_POSITION, FILE_TYPE_XML_MANUSCRIPT
 from main_util import create_function_dictionary
 
 
 __author__ = "Christian Steiner"
 __maintainer__ = __author__
 __copyright__ = 'University of Basel'
 __email__ = "christian.steiner@unibas.ch"
 __status__ = "Development"
 __license__ = "GPL v3"
 __version__ = "0.0.1"
 
 THRESHOLD = 60
+GRAY_THRESHOLD = 200
 BLANK_STATUS = 'blank'
 
-def get_text_field_on_image(image_file: str, image_width: float, image_height: float, id=0) ->TextField:
+def get_text_field_on_thumb(image_file: str, id=0) ->(TextField, float, float):  # returns a tuple: (text field, image width, image height)
     """Find the area of of the faksimile image where a manuscript page is displayed
         and return it as a TextField.
     """
     image = cv2.imread(image_file)
     blur = cv2.GaussianBlur(image, (3,3), 0)
     #blur = cv2.bilateralFilter(image,9,75,75)
     gray = cv2.cvtColor(blur, cv2.COLOR_BGR2GRAY)
     thresh = cv2.threshold(gray, 220, 255, cv2.THRESH_BINARY_INV)[1]
     original_height, original_width, channel = image.shape
+    top, bottom = get_start_and_end_index(thresh)  # scan the rows of thresh
+    height = bottom-top
+    left, right = get_start_and_end_index(thresh.T)  # transposed: scan the columns of thresh
+    width = right-left
+    return (TextField(id=id, x=left, y=top, width=width, height=height), original_width, original_height)  # pixel units of the image as read, no scaling
+
+def lessThan(x):  # predicate: is the gray value x darker than GRAY_THRESHOLD?
+    return GRAY_THRESHOLD > x
+
+def get_text_field_on_image(image_file: str, image_width: float, image_height: float, id=0) ->TextField:
+    """Find the area of the faksimile image where a manuscript page is displayed and return it as a
+        TextField in units of image_width/image_height. Raise a FileNotFoundError if image_file does not exist.
+    """
+    if not isfile(image_file):
+        raise FileNotFoundError(f'file {image_file} not found!')
+    image = cv2.imread(image_file)
+    blur = cv2.GaussianBlur(image, (3,3), 0)
+    gray = cv2.cvtColor(blur, cv2.COLOR_BGR2GRAY)
+    # Line THRESHOLD of gray decides the polarity of the binary image: if all of its pixels are darker
+    # than GRAY_THRESHOLD dark pixels become 0, else light pixels become 0 (lines that sum to 0 are searched below).
+    thresh = cv2.threshold(gray, 220, 255, cv2.THRESH_BINARY_INV)[1]\
+        if np.any(gray[THRESHOLD] >= GRAY_THRESHOLD)\
+        else cv2.threshold(gray, GRAY_THRESHOLD, 255, cv2.THRESH_BINARY)[1]
+    original_height, original_width, channel = image.shape
     startLine, lastLine = get_start_and_end_index(thresh)
     top = round(startLine*image_height/original_height, 1)
     bottom = round(lastLine*image_height/original_height, 1)
     height = bottom-top
     startLine, lastLine = get_start_and_end_index(thresh.T)
     left = round(startLine*image_width/original_width, 1)
     right = round(lastLine*image_width/original_width, 1)
     width = right-left
     return TextField(id=id, x=left, y=top, width=width, height=height)
 
+def get_start_and_end_index_gray(image, thresholdSum) ->(int, int):
+    """Return the indices of the first two successive lines with a sum below thresholdSum that are at
+        least THRESHOLD lines apart; the search starts from a virtual line -1, so the first index can be -1.
+        If there is no such pair, return -1 and the index of the last line with a sum below
+        thresholdSum (or -1 if there is none).
+    """
+    previousLine = -1
+    for index, row in enumerate(image):
+        if not np.sum(row) < thresholdSum:
+            continue
+        if index-previousLine >= THRESHOLD:
+            return previousLine, index
+        previousLine = index
+    return -1, previousLine
+
 def get_start_and_end_index(thresh) ->(int, int):
     """    
     """
     startLine = -1
     lastLine = -1
     for id, line in enumerate(thresh):
         if startLine == -1 and np.sum(line) == 0: 
             if id-lastLine < THRESHOLD:
                 lastLine = id
             else:
                 startLine = lastLine
                 lastLine = id
                 break
     return startLine, lastLine
 
 def usage():
     """prints information on how to use the script
     """
     print(main.__doc__)
 
 def main(argv):
     """This program can be used to create svg files with a rect for the text_field.
 
     fixes/get_text_field.py  [OPTIONS] <faksimile-image> width height
 
         <faksimile-image>            the directory where the files should be saved to
 
         OPTIONS:
         -h|--help                       show help
     
         :return: exit code (int)
     """
     try:
         opts, args = getopt.getopt(argv, "h", ["help"])
     except getopt.GetoptError:
         usage()
         return 2
     for opt, arg in opts:
         if opt in ('-h', '--help'):
             usage()
             return 0
     if len(args) < 3:  
         usage()
         return 2
     exit_status = 0
     image_file = args[0]
     image_width = float(args[1])
     image_height = float(args[2])
     if isfile(image_file):
         textfield = get_text_field_on_image(image_file, image_width, image_height)
         print(textfield)
     else:
         raise FileNotFoundError(f'File {image_file} does not exist!')
     return exit_status
 
 if __name__ == "__main__":
     sys.exit(main(sys.argv[1:]))
Index: fixes/create_folio_name.py
===================================================================
--- fixes/create_folio_name.py	(revision 0)
+++ fixes/create_folio_name.py	(revision 114)
@@ -0,0 +1,202 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+
+"""This program can be used to add a name for a folio.
+"""
+#    Copyright (C) University of Basel 2021  {{{1
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License as published by
+#    the Free Software Foundation, either version 3 of the License, or
+#    (at your option) any later version.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <https://www.gnu.org/licenses/> 1}}}
+
+from colorama import Fore, Style
+import csv
+import getopt
+import json
+import lxml.etree as ET
+import shutil
+import subprocess
+import sys
+import os
+import wget
+from os import listdir, sep, path, setpgrp, devnull, mkdir, remove
+from os.path import exists, isfile, isdir, dirname, basename
+from progress.bar import Bar
+import re
+import warnings
+
+from fix_old_data import save_page
+from get_text_field import get_text_field_on_image
+
+sys.path.append('svgscripts')
+from datatypes.faksimile_image import FaksimileImage
+from datatypes.faksimile import FaksimilePage
+from datatypes.matrix import Matrix
+from datatypes.archival_manuscript import ArchivalManuscriptUnity
+from datatypes.page import Page, STATUS_MERGED_OK, STATUS_POSTMERGED_OK
+from util import back_up, back_up_svg_file, copy_faksimile_update_image_location, copy_faksimile_svg_file
+from process_files import update_svgposfile_status
+from process_words_post_merging import update_faksimile_line_positions, MERGED_DIR
+
+sys.path.append('shared_util')
+from myxmlwriter import copy_to_bak_dir, write_pretty, xml_has_type, FILE_TYPE_SVG_WORD_POSITION, FILE_TYPE_XML_MANUSCRIPT
+from main_util import create_function_dictionary
+
+
+__author__ = "Christian Steiner"
+__maintainer__ = __author__
+__copyright__ = 'University of Basel'
+__email__ = "christian.steiner@unibas.ch"
+__status__ = "Development"
+__license__ = "GPL v3"
+__version__ = "0.0.1"
+
+UNITTESTING = False
+NAME = 'folio-name'
+DESCRIPTION_KEY = 'description'
+ALIAS = 'alias'
+LABEL = 'label'
+URL = 'nietzschesource-url'
+
+def _create_name(current_title, tmp_items, includeTitle=True) ->str:
+    """Return the '_'-joined aliases (stripped of title, commas and spaces) of all rows without 'thumb' in
+        their label, prefixed by the title (spaces replaced by '-') and a comma if includeTitle is set.
+    """
+    aliases = '_'.join(item[ALIAS].replace(current_title, '').replace(',','').replace(' ', '') for item in tmp_items if 'thumb' not in item[LABEL])
+    return current_title.replace(' ','-') + ',' + aliases if includeTitle else aliases
+
+def _update_old_name(current_title, name_dictionary, last_description, tmp_items, items):
+    """Name the rows of tmp_items and append them to items; a name that is already registered for the same
+        title and description is extended and the rows in items that carry it are renamed as well."""
+    key = current_title + last_description
+    previous_name = name_dictionary.get(key)
+    folio_name = previous_name + '_' + _create_name(current_title, tmp_items, includeTitle=False)\
+        if previous_name else _create_name(current_title, tmp_items)
+    for row in tmp_items + [ old_row for old_row in items if previous_name and old_row[NAME] == previous_name ]:
+        row[NAME] = folio_name
+    name_dictionary[key] = folio_name
+    items.extend(tmp_items)
+
+def process_csv_file(csv_file_name):
+    """Create folio names for the rows of a csv file and write the result to 'updated_<csv-file>'.
+        Successive rows with the same title (the part of 'alias' before the first comma) and the same
+        description are named together by _update_old_name.
+        NOTE(review): a row without description that does not start a new title is not written to
+        the output file -- confirm that this is intended.
+        :return: exit code (int): 0 on success, 2 if the csv file has no description column.
+    """
+    items = []
+    tmp_items = []
+    name_dictionary = {}
+    current_title = None
+    last_description = None
+    with open(csv_file_name, newline='') as csvfile:
+        reader = csv.DictReader(csvfile)
+        fieldnames = list(reader.fieldnames or [])
+        if not any(DESCRIPTION_KEY in key for key in fieldnames):
+            return 2
+        for row in reader:
+            title = row[ALIAS][:row[ALIAS].index(',')]
+            description = row[DESCRIPTION_KEY]
+            if title != current_title or (bool(description) and description != last_description):
+                # a new folio starts here: name the rows collected so far
+                if len(tmp_items) > 0:
+                    _update_old_name(current_title, name_dictionary, last_description, tmp_items, items)
+                current_title, last_description, tmp_items = title, description, [ row ]
+            elif bool(description):
+                tmp_items.append(row)
+    if len(tmp_items) > 0:
+        _update_old_name(current_title, name_dictionary, last_description, tmp_items, items)
+    if NAME not in fieldnames:
+        # csv.DictWriter raises a ValueError for row keys that are missing in fieldnames
+        fieldnames.append(NAME)
+    # prefix the file name only: csv_file_name may contain a directory part
+    target_csv_file = path.join(dirname(csv_file_name), 'updated_' + basename(csv_file_name))
+    with open(target_csv_file, 'w', newline='') as csvfile:
+        writer = csv.DictWriter(csvfile, fieldnames=fieldnames)
+        writer.writeheader()
+        writer.writerows(items)
+    return 0
+
+def process_fix_url(csv_file_name):
+    """Fix the nietzschesource urls of a csv file and write the result to 'url_fixed_<csv-file>': image rows get the
+        download url of their label, thumb rows pointing to the download url get the url of the 'mini' image. Return 0.
+    """
+    NIETZSCHE_SOURCES_URL = 'http://www.nietzschesource.org/DFGAapi/api/page/download/'
+    THUMB_URL_PREFIX = 'http://www.nietzschesource.org/DFGAapi/images/DFGA/'
+    items = []
+    with open(csv_file_name, newline='') as csvfile:
+        reader = csv.DictReader(csvfile)
+        fieldnames = reader.fieldnames
+        for row in reader:
+            if '_thumb' not in row[LABEL] and not row[URL].endswith(row[LABEL].replace('.jpg','')):
+                row[URL] = NIETZSCHE_SOURCES_URL + row[LABEL].replace('.jpg','')
+            elif '_thumb' in row[LABEL] and row[URL].startswith(NIETZSCHE_SOURCES_URL):
+                title = row[LABEL][:row[LABEL].index(',')]
+                row[URL] = THUMB_URL_PREFIX + title + '/mini/' + row[LABEL].replace('_thumb','')
+            items.append(row)
+    # prefix the file name only: csv_file_name may contain a directory part
+    target_csv_file = path.join(dirname(csv_file_name), 'url_fixed_' + basename(csv_file_name))
+    with open(target_csv_file, 'w', newline='') as csvfile:
+        writer = csv.DictWriter(csvfile, fieldnames=fieldnames)
+        writer.writeheader()
+        writer.writerows(items)
+    return 0
+                           
+
+
+def usage():
+    """Print information on how to use the script, i.e. the docstring of main.
+    """
+    print(main.__doc__)
+
+def main(argv):
+    """This program can be used to add a name for a folio or to fix the image urls in a csv file.
+
+    fixes/create_folio_name.py [OPTIONS]   <csv-file>
+
+        <csv-file>              a csv-file containing folio descriptions; the result is written to
+                                'updated_<csv-file>' or, with --fix-url, to 'url_fixed_<csv-file>'.
+
+        OPTIONS:
+        -h|--help      show help
+        -f|--fix-url   fix image url
+
+        :return: exit code (int)
+    """
+    fix_url = False
+    try:
+        opts, args = getopt.getopt(argv, "hf", ["help", "fix-url"])
+    except getopt.GetoptError:
+        usage()
+        return 2
+    for opt, arg in opts:
+        if opt in ('-h', '--help'):
+            usage()
+            return 0
+        elif opt in ('-f', '--fix-url'):
+            fix_url = True
+    if len(args) < 1:
+        usage()
+        return 2
+    csv_file = args[0]
+    if not isfile(csv_file):
+        # f-string: without the prefix the placeholder itself was printed instead of the file name
+        raise FileNotFoundError(f'File {csv_file} does not exist!')
+    # Pass the exit code of the processing function on to the caller instead of always returning 0,
+    # so that e.g. a csv file without description column (exit code 2) is not reported as success.
+    if fix_url:
+        return process_fix_url(csv_file)
+    return process_csv_file(csv_file)
+
+if __name__ == "__main__":
+    sys.exit(main(sys.argv[1:]))
Index: fixes/checker_handler.py
===================================================================
--- fixes/checker_handler.py	(revision 113)
+++ fixes/checker_handler.py	(revision 114)
@@ -1,79 +1,79 @@
 #!/usr/bin/env python3
 # -*- coding: utf-8 -*-
 
 """   This program can be used to handle the manual check status of xml files.
 """
 #    Copyright (C) University of Basel 2021  {{{1
 #
 #    This program is free software: you can redistribute it and/or modify
 #    it under the terms of the GNU General Public License as published by
 #    the Free Software Foundation, either version 3 of the License, or
 #    (at your option) any later version.
 #
 #    This program is distributed in the hope that it will be useful,
 #    but WITHOUT ANY WARRANTY; without even the implied warranty of
 #    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #    GNU General Public License for more details.
 #
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <https://www.gnu.org/licenses/> 1}}}
 
 from datetime import datetime
 import lxml.etree as ET
 import sys
 
 
 sys.path.append('svgscripts')
 from datatypes.page import Page
 
 __author__ = "Christian Steiner"
 __maintainer__ = __author__
 __copyright__ = 'University of Basel'
 __email__ = "christian.steiner@unibas.ch"
 __status__ = "Development"
 __license__ = "GPL v3"
 __version__ = "0.0.1"
 
 UNITTESTING = False
 
 class CheckerHandler:
     """This class can be used to handle  the manual check status of xml files.
     """
     XML_TAG = 'manual-checks'
-    CHECKS = [ 'transkription positions', 'hyphenation', 'boxes/correction history',\
-               'mark foreign hands', 'line assignement', 'deletion paths', 'faksimile/transkription word correspondance' ]
+    CHECKS = [ 'transkription positions','line assignement', 'hyphenation', 'boxes/correction history',\
+               'mark foreign hands',  'deletion paths', 'faksimile/transkription word correspondance' ]
 
 
     def __init__(self, page: Page):
         self.page = page
 
     def get_todos(self) ->list:
         """Return todos as a list
         """
         todos = self.page.page_tree.xpath(f'//metadata/{self.XML_TAG}/todo/text()')
         if len(todos) > 0\
         or len(self.page.page_tree.xpath(f'//metadata/{self.XML_TAG}/done/text()')) == len(self.CHECKS):
             return todos
         return self.CHECKS
 
     def set_task_done(self, task: str):
         """Set task as done.
         """
         date = datetime.now().strftime('%Y-%m-%d %H:%M:%S')
         checks = self.page.page_tree.xpath(f'//metadata/{self.XML_TAG}')[0]\
             if len(self.page.page_tree.xpath(f'//metadata/{self.XML_TAG}')) > 0\
             else ET.SubElement(self.page.page_tree.xpath('//metadata')[0], self.XML_TAG)
         if len(checks.xpath('./todo')) == 0:
             for todo in self.CHECKS:
                 if todo != task:
                     ET.SubElement(checks, 'todo').text = todo
                 else:
                     ET.SubElement(checks, 'done', attrib={'date': date}).text = task
         elif len(checks.xpath(f'./todo[text()="{task}"]')) > 0:
             done = checks.xpath(f'./todo[text()="{task}"]')[0]
             done.tag = 'done'
             done.set('date', date)
         else:
             ET.SubElement(checks, 'done', attrib={'date': date}).text = task
 
 
Index: fixes/crop_rotate_thumbs.py
===================================================================
--- fixes/crop_rotate_thumbs.py	(revision 0)
+++ fixes/crop_rotate_thumbs.py	(revision 114)
@@ -0,0 +1,224 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+
+"""   This program can be used to crop and/or rotate thumb images.
+"""
+#    Copyright (C) University of Basel 2019  {{{1
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License as published by
+#    the Free Software Foundation, either version 3 of the License, or
+#    (at your option) any later version.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <https://www.gnu.org/licenses/> 1}}}
+
+from colorama import Fore, Style
+import cv2
+import getopt
+import json
+import lxml.etree as ET
+from numpy import ndarray
+import shutil
+import subprocess
+import sys
+import os
+import wget
+from os import listdir, sep, path, setpgrp, devnull, mkdir, remove
+from os.path import exists, isfile, isdir, dirname, basename
+from progress.bar import Bar
+import warnings
+
+from fix_old_data import save_page
+from get_text_field import get_text_field_on_image, get_text_field_on_thumb
+
+sys.path.append('svgscripts')
+from datatypes.faksimile_image import FaksimileImage
+from datatypes.faksimile import FaksimilePage
+from datatypes.archival_manuscript import ArchivalManuscriptUnity
+from datatypes.page import Page, STATUS_MERGED_OK, STATUS_POSTMERGED_OK
+from datatypes.matrix import Matrix 
+from util import back_up, back_up_svg_file, copy_faksimile_update_image_location, copy_faksimile_svg_file
+from process_files import update_svgposfile_status
+from process_words_post_merging import update_faksimile_line_positions, MERGED_DIR
+
+sys.path.append('shared_util')
+from myxmlwriter import copy_to_bak_dir, write_pretty, xml_has_type, FILE_TYPE_SVG_WORD_POSITION, FILE_TYPE_XML_MANUSCRIPT
+from main_util import create_function_dictionary
+
+
+__author__ = "Christian Steiner"
+__maintainer__ = __author__
+__copyright__ = 'University of Basel'
+__email__ = "christian.steiner@unibas.ch"
+__status__ = "Development"
+__license__ = "GPL v3"
+__version__ = "0.0.1"
+
+MAX_SVG_XY_THRESHOLD = 10
+BLANK_STATUS = 'blank'
+
+
+class ImageManipulator:
+    """This class can be used in order to crop and/or rotate the thumb images of pages.
+    """
+    UNITTESTING = False  # if True, main does not print its progress messages
+
+    def __init__(self, faksimile_dir=None, fix_doubles=False):
+        self.faksimile_dir = faksimile_dir
+        self.fix_doubles = fix_doubles 
+
+    def _crop_image(self, image: ndarray, image_width: float, image_height: float, x: float, y: float, height: float, width: float) ->ndarray:
+        """Crop image to the rect x, y, width, height that is given in units of image_width/image_height. Return cropped image.
+        """
+        original_height, original_width, channel = image.shape
+        image_x = round(x*original_width/image_width)
+        image_w = round(width*original_width/image_width)
+        image_y = round(y*original_height/image_height)
+        image_h = round(height*original_height/image_height)
+        return image[image_y:image_y+image_h,image_x:image_x+image_w]
+
+    def crop_according2svg(self, image: ndarray, thumb_svg: str) -> ndarray:
+        """Crop image to the viewBox of the svg file thumb_svg and return it. Return image unchanged if the svg
+            file lacks a viewBox or an image node with width and height (scaling would divide by zero).
+        """
+        svg_tree = ET.parse(thumb_svg) 
+        namespaces = { k if k is not None else 'ns': v for k, v in svg_tree.getroot().nsmap.items() }
+        images = svg_tree.xpath('//ns:image', namespaces=namespaces)
+        viewBox = svg_tree.getroot().get('viewBox')
+        if len(images) == 0 or not bool(viewBox) or not bool(images[0].get('width')) or not bool(images[0].get('height')):
+            return image
+        image_width, image_height = float(images[0].get('width')), float(images[0].get('height'))
+        # the numbers of a viewBox may be separated by whitespace and/or commas
+        x, y, width, height = [ float(i) for i in viewBox.replace(',', ' ').split() ]
+        return self._crop_image(image, image_width, image_height, x, y, height, width)
+
+    def rotate_according2transform(self, image, transform) ->ndarray:
+        """Rotate image with the cv2 rotation flag selected by Matrix.get90DegreeIndex; return image unchanged if that index is -1.
+        """
+        rotation_flags = [ cv2.ROTATE_90_CLOCKWISE, cv2.ROTATE_180, cv2.ROTATE_90_COUNTERCLOCKWISE ]
+        matrix = Matrix(transform)
+        mindex = matrix.get90DegreeIndex()
+        if mindex != -1:
+            return cv2.rotate(image, rotation_flags[mindex])
+        return image
+
+    def process_thumb_of_page(self, page_file: str) -> int:
+        """Crop (according to its svg file) and/or rotate (according to its transform) the thumb image of a page.
+            [return] exit_status: 0 thumb written and page saved, 1 nothing to do or thumb image missing, 2 no faksimile-image
+        """
+        page = Page.create_cls(page_file)
+        faksimile_nodes = page.page_tree.xpath('//faksimile-image')
+        if len(faksimile_nodes) > 0:
+            transform = faksimile_nodes[0].get('transform')
+            thumb_image = self.faksimile_dir + sep + faksimile_nodes[0].get('file-name').replace('.jpg', '_thumb.jpg')
+            thumb_svg = thumb_image.replace('.jpg', '.svg')
+            if bool(faksimile_nodes[0].get('thumb')):
+                thumb_svg = self.faksimile_dir + sep + faksimile_nodes[0].get('thumb')
+                if thumb_svg.endswith('jpg'):
+                    thumb_svg = thumb_image.replace('.jpg', '.svg')
+            if self.fix_doubles and 'et' in basename(thumb_svg):
+                base_thumb_svg = basename(thumb_svg)
+                thumb_svg = self.faksimile_dir + sep + base_thumb_svg[:base_thumb_svg.index('et')] + '_thumb.svg'
+            # cv2.imread returns None instead of raising if the thumb image cannot be read
+            if isfile(thumb_image) and (isfile(thumb_svg) or bool(transform)):
+                target_extension = ''
+                image = cv2.imread(thumb_image)
+                if isfile(thumb_svg):
+                    image = self.crop_according2svg(image, thumb_svg)
+                    target_extension = '_cropped'
+                if bool(transform):
+                    image = self.rotate_according2transform(image, transform)
+                    target_extension = target_extension + '_rotated'
+                target_file = thumb_image.replace('_thumb', target_extension + '_thumb')
+                if 'et' in basename(thumb_image):
+                    base_thumb_image = basename(thumb_image)
+                    if page.faksimile_image.text_field.left < (page.faksimile_image.width-page.faksimile_image.text_field.left)/2:
+                        target_file = self.faksimile_dir + sep + base_thumb_image[:base_thumb_image.index('et')] + target_extension + '_thumb.jpg'
+                    else:
+                        target_file = self.faksimile_dir + sep \
+                                + base_thumb_image[:base_thumb_image.index('et')-2]\
+                                + base_thumb_image[base_thumb_image.index('et')+2:].replace('_thumb', target_extension + '_thumb')
+                cv2.imwrite(target_file, image)
+                faksimile_nodes[0].set('thumb', basename(target_file))
+                save_page(page, backup=True) 
+                return 0
+            return 1
+        else:
+            print(page_file)
+        return 2
+
+def usage():
+    """Print information on how to use the script, i.e. the docstring of main.
+    """
+    print(main.__doc__)
+
+def main(argv):
+    """This program can be used to crop and/or rotate thumb images. 
+
+    fixes/crop_rotate_thumbs.py [OPTIONS]   <xmlManuscriptFile|svg_pos_file> <faksimile-dir>
+
+        <xmlManuscriptFile>     a xml file about a manuscript, containing information about its pages.
+        <svg_pos_file>          a xml file about a page, containing information about svg word positions.
+        <faksimile-dir>         a directory containing faksimile images
+
+        OPTIONS:
+        -h|--help               show help
+        -d|--fix-doubles        fix double pages
+    
+        :return: exit code (int)
+    """
+    try:
+        opts, args = getopt.getopt(argv, "hd", ["help", "fix-doubles"])
+    except getopt.GetoptError:
+        usage()
+        return 2
+    fix_doubles = False
+    for option, _ in opts:
+        if option in ('-h', '--help'):
+            usage()
+            return 0
+        if option in ('-d', '--fix-doubles'):
+            fix_doubles = True
+    if len(args) < 2:
+        usage()
+        return 2
+    xml_file, faksimile_dir = args[0], args[1]
+    # a missing directory is reported before a missing file
+    if not isdir(faksimile_dir):
+        raise FileNotFoundError(f'Directory {faksimile_dir} does not exist!')
+    if not isfile(xml_file):
+        raise FileNotFoundError('File {} does not exist!'.format(xml_file))
+    name_parts = xml_file.split('_')
+    if len(name_parts) > 2:
+        # svg_pos_file: its first two '_'-separated parts name the manuscript file,
+        # only the page(s) of the manuscript that refer to xml_file are processed
+        manuscript_file = '_'.join(name_parts[0:2]) + '.xml'
+        if not isfile(manuscript_file):
+            raise FileNotFoundError(f'There is no manuscript file {manuscript_file} for svg_pos_file {xml_file}!')
+        xpath = f'//page[contains(@output,"{xml_file}")]'
+    else:
+        # manuscript file: all of its pages are processed
+        manuscript_file = xml_file
+        xpath = '//page'
+    source_tree = ET.parse(manuscript_file)
+    image_manipulator = ImageManipulator(faksimile_dir, fix_doubles=fix_doubles)
+    title = basename(manuscript_file).replace('.xml','').replace('_',' ')
+    counter = 0
+    for page in source_tree.xpath(xpath):
+        if not ImageManipulator.UNITTESTING:
+            number = page.get('number')
+            print(Fore.CYAN + f'Processing thumb image of {title}, {number}  ...' + Style.RESET_ALL)
+        if image_manipulator.process_thumb_of_page(page.get('output')) == 0:
+            counter += 1
+    if not ImageManipulator.UNITTESTING:
+        print(Style.RESET_ALL + f'[{counter} images changed]')
+    return 0
+
+if __name__ == "__main__":
+    sys.exit(main(sys.argv[1:]))
Index: fixes/test_create_blank_svg_files.py
===================================================================
--- fixes/test_create_blank_svg_files.py	(revision 113)
+++ fixes/test_create_blank_svg_files.py	(revision 114)
@@ -1,38 +1,45 @@
 import lxml.etree as ET
 from os import sep, path, remove
 from os.path import isdir, isfile, dirname, basename
 import shutil
 import sys
 import tempfile
 import unittest
 import warnings
 
-from create_blank_svg_files import SVGFileCreator, OldSVGFileCreator
+from create_blank_svg_files import SVGFileCreator, OldSVGFileCreator, CSVSVGFileCreator, process_csv
 
 
 sys.path.append('shared_util')
 from myxmlwriter import copy_to_bak_dir
 
 
-
 class TestCreateSVGFILES(unittest.TestCase):
     def setUp(self):
         SVGFileCreator.UNITTESTING = True
         DATADIR = path.dirname(__file__) + sep + 'test_data'  
         self.xml_file = DATADIR + sep + 'N_VII_1_page138.xml'
         self.fix_transkription_positions = DATADIR + sep + 'Mp_XIV_page419a.xml'
 
     def test_init(self):
         svg_creator = OldSVGFileCreator('Mp XVI', '/home/knister0/ownCloud/nietzscheDE/Bearbeitung_Faksimile/Mp_XVI')
         self.assertTrue(svg_creator.avg_left != -1)
         self.assertTrue(svg_creator.avg_top != -1)
         #print(svg_creator.avg_left, svg_creator.avg_top, svg_creator.avg_width, svg_creator.avg_height)
 
     def test_update_svg_file(self):
+        pass
+        """
         svg_file = '/home/knister0/ownCloud/nietzscheDE/Bearbeitung_Faksimile/Myriam/Blank/Mp_XVI/Mp_XVI_page81v.svg'
         copy_to_bak_dir(svg_file)
         exit_status = SVGFileCreator.UPDATE_TEXTFIELD_OF_SVG_FILE(svg_file)
         self.assertTrue(exit_status == 0)
+        """
+    
+    def test_process_csv(self):
+        csv_file = 'Druckmanuscripte/D_20.csv'
+        process_csv(csv_file, '/home/knister0/ownCloud/myNietzscheDE/Druckmanuscripte/faksimiles', '/home/knister0/ownCloud/myNietzscheDE/Druckmanuscripte/svg')
+
 
 if __name__ == "__main__":
     unittest.main()
Index: fixes/create_blank_svg_files.py
===================================================================
--- fixes/create_blank_svg_files.py	(revision 113)
+++ fixes/create_blank_svg_files.py	(revision 114)
@@ -1,349 +1,554 @@
 #!/usr/bin/env python3
 # -*- coding: utf-8 -*-
 
 """   This program can be used to create svg files with a rect for the text_field.
 """
 #    Copyright (C) University of Basel 2019  {{{1
 #
 #    This program is free software: you can redistribute it and/or modify
 #    it under the terms of the GNU General Public License as published by
 #    the Free Software Foundation, either version 3 of the License, or
 #    (at your option) any later version.
 #
 #    This program is distributed in the hope that it will be useful,
 #    but WITHOUT ANY WARRANTY; without even the implied warranty of
 #    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #    GNU General Public License for more details.
 #
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <https://www.gnu.org/licenses/> 1}}}
 
 from colorama import Fore, Style
+import csv
 import getopt
 import json
 import lxml.etree as ET
 import shutil
 import subprocess
 import sys
 import os
 import wget
 from os import listdir, sep, path, setpgrp, devnull, mkdir, remove
 from os.path import exists, isfile, isdir, dirname, basename
 from progress.bar import Bar
 import warnings
 
 from fix_old_data import save_page
-from get_text_field import get_text_field_on_image
+from get_text_field import get_text_field_on_image, get_text_field_on_thumb
 
 sys.path.append('svgscripts')
 from datatypes.faksimile_image import FaksimileImage
 from datatypes.faksimile import FaksimilePage
 from datatypes.archival_manuscript import ArchivalManuscriptUnity
 from datatypes.page import Page, STATUS_MERGED_OK, STATUS_POSTMERGED_OK
+from datatypes.matrix import Matrix 
 from util import back_up, back_up_svg_file, copy_faksimile_update_image_location, copy_faksimile_svg_file
 from process_files import update_svgposfile_status
 from process_words_post_merging import update_faksimile_line_positions, MERGED_DIR
 
 sys.path.append('shared_util')
 from myxmlwriter import copy_to_bak_dir, write_pretty, xml_has_type, FILE_TYPE_SVG_WORD_POSITION, FILE_TYPE_XML_MANUSCRIPT
 from main_util import create_function_dictionary
 
 
 __author__ = "Christian Steiner"
 __maintainer__ = __author__
 __copyright__ = 'University of Basel'
 __email__ = "christian.steiner@unibas.ch"
 __status__ = "Development"
 __license__ = "GPL v3"
 __version__ = "0.0.1"
 
 MAX_SVG_XY_THRESHOLD = 10
 BLANK_STATUS = 'blank'
 
 class SPARQLQuery:
     HEADER_OPTION = '--header'
     HEADER_VALUE = 'Accept: application/sparql-results+json,*/*;q=0.9'
     ENDPOINT = 'https://nietzsche.fuseki.services.dasch.swiss/nietzsche'
     QUERY = 'query=PREFIX+tln%3A+%3Chttp%3A%2F%2Fwww.nie.org%2Fontology%2Fnietzsche%23%3E%0ASELECT+(AVG(%3Fleft)+as+%3Favg_left)+(AVG(%3Ftop)+as+%3Favg_top)+(AVG(%3Fwidth)+as+%3Favg_width)+(AVG(%3Fheight)+as+%3Favg_height)+WHERE+%7B%0A+%3Fimage+a+tln%3AFaksimileImage%3B+tln%3AhasTextField+%3Ftextfield.%0A+%3Ftextfield+tln%3AhasLeft+%3Fleft%3B+tln%3AhasTop+%3Ftop%3B+tln%3AhasWidth+%3Fwidth%3B+tln%3AhasHeight+%3Fheight.%7D+'
     REQUEST_OPTION = '--request'
     REQUEST_VALUE = 'POST'
 class OldSVGFileCreator:
     """This class can be used in order to create svg files with textfield rects.
     """
     UNITTESTING = False
     RESPONSE = 'response.json'
 
     def __init__(self, title, faksimile_dir, endpoint=SPARQLQuery.ENDPOINT, target_dir='./tmp'):
         self.avg_left = -1
         self.avg_top = -1
         self.avg_height = -1
         self.avg_width = -1
         self.endpoint = endpoint
         self.faksimile_dir = faksimile_dir
         self.target_dir = target_dir
         self.title = title
         self.curl = self._get_ext_program_path('curl')
         self.inkscape = self._get_ext_program_path('inkscape')
         self.namespaces = None
         self._init_averages()
 
     def _init_averages(self):
         """Initialize average dimension of textfield based on the data from the endpoint
         """
         if not isfile(self.RESPONSE):
             subprocess.run([self.curl, self.endpoint,\
                 SPARQLQuery.REQUEST_OPTION, SPARQLQuery.REQUEST_VALUE, '--data', SPARQLQuery.QUERY, SPARQLQuery.HEADER_OPTION, SPARQLQuery.HEADER_VALUE, '-o', self.RESPONSE ], check=True)
         with open(self.RESPONSE) as json_file:
             data = json.load(json_file)
             keys = data['head']['vars']
             for key in keys:
                 for item in data['results']['bindings']:
                     self.__dict__[key] = float(item[key]['value'])
 
     def _get_ext_program_path(self, program_name) ->str:
         """Return path to external program
         """    
         program_path = None
         error_msg = f'External command "{program_name}" not found!\nPlease install "{program_name}", check the output of "which {program_name}" and retry.'
         try:
             cp = subprocess.run(["which", program_name], stdout=subprocess.PIPE, check=True)
             program_path = cp.stdout.decode().strip()
             if not bool(program_path) or not isfile(program_path):
                 raise FileNotFoundError(error_msg)
         except subprocess.CalledProcessError:
             print(error_msg)
             raise
         return program_path
 
     def create_svg_file(self, page: ET.Element) -> int:
         """ Create a svg file.
             [return] exit_status
         """
         number = page.get('number')
         page_file = page.get('output')
         faksimile_file = self.faksimile_dir + sep + page.get('alias') + '.jpg'\
                 if page.get('alias') is not None\
                 else None
         page_id = self.title.replace(' ', '_') + '_' + number
         if bool(page.get('alias')) and not isfile(faksimile_file):
             wget.download(FaksimileImage.NIETZSCHE_SOURCES_URL + page.get('alias'), out=faksimile_file)
         if bool(page.get('alias')) and isfile(faksimile_file) and page_file is not None and isfile(page_file):
             target_file = basename(page_file).replace('.xml', '.svg')
             if not isfile(self.target_dir + sep + target_file):
                 prog_list = [self.inkscape, '-z', '-l', target_file, faksimile_file]
                 subprocess.run(prog_list, check=True)
                 svg_tree = ET.parse(target_file)
                 namespaces = { k if k is not None else 'ns': v for k, v in svg_tree.getroot().nsmap.items() }
                 images = svg_tree.xpath('//ns:image', namespaces=namespaces)
                 if len(images) > 0:
                     image_file = dirname(target_file) + sep + images[0].get('{%s}href' % namespaces['xlink'])
                     image_width = float(images[0].get('width')) if bool(images[0].get('width')) else 0
                     image_height = float(images[0].get('height')) if bool(images[0].get('height')) else 0
                     text_filed = get_text_field_on_image(image_file, image_width, image_height, id=page_id)
                     text_filed.attach_as_rect(svg_tree.getroot())
                     copy_faksimile_update_image_location(faksimile_tree=svg_tree, target_directory=self.target_dir)
                     remove(target_file)
                 else:
                     print(f'There has been an error: could not find an image in {target_file}!')
                     return 2
             return 0
         else:
             print(faksimile_file, page_file)
         return 2
+
     def update_textfield_of_svg_file(self, svg_file: str) -> int:
         """ Update the textfield of the svg file by using image analysis. 
             [return] exit_status
         """
         svg_tree = ET.parse(target_file)
         namespaces = { k if k is not None else 'ns': v for k, v in svg_tree.getroot().nsmap.items() }
         rects = svg_tree.xpath('//ns:rect[not(contains(@id, "rect"))]', namespaces=namespaces)
         images = svg_tree.xpath('//ns:image', namespaces=namespaces)
         if len(rects) > 0 and len(images) > 0:
             image_file = dirname(svg_file) + sep + images[0].get('{%s}href' % namespaces['xlink'])
             image_width = float(images[0].get('width')) if bool(images[0].get('width')) else 0
             image_height = float(images[0].get('height')) if bool(images[0].get('height')) else 0
             text_filed = get_text_field_on_image(image_file, image_width, image_height)
             text_filed.attach_as_rect(rects[0])
             copy_faksimile_svg_file(target_file=svg_file, faksimile_tree=svg_tree)
             return 0
         else:
             print(f'There has been an error: could not find a rect and an image in {svg_file}!')
             return 2
         return 2
 
 class SVGFileCreator:
     """This class can be used in order to create svg files with textfield rects.
     """
     UNITTESTING = False
 
-    def __init__(self, title, faksimile_dir, target_dir='./tmp'):
+    def __init__(self, title=None, faksimile_dir=None, target_dir='./tmp'):
         self.faksimile_dir = faksimile_dir
         self.target_dir = target_dir
         self.title = title
         self.inkscape = self._get_ext_program_path('inkscape')
         self.namespaces = None
 
     def _get_ext_program_path(self, program_name) ->str:
         """Return path to external program
         """    
         program_path = None
         error_msg = f'External command "{program_name}" not found!\nPlease install "{program_name}", check the output of "which {program_name}" and retry.'
         try:
             cp = subprocess.run(["which", program_name], stdout=subprocess.PIPE, check=True)
             program_path = cp.stdout.decode().strip()
             if not bool(program_path) or not isfile(program_path):
                 raise FileNotFoundError(error_msg)
         except subprocess.CalledProcessError:
             print(error_msg)
             raise
         return program_path
 
     def create_svg_file(self, page: ET.Element) -> int:
         """ Create a svg file.
             [return] exit_status
         """
         number = page.get('number')
         page_file = page.get('output')
         faksimile_file = self.faksimile_dir + sep + page.get('alias') + '.jpg'\
                 if page.get('alias') is not None\
                 else None
         page_id = self.title.replace(' ', '_') + '_' + number
         if bool(page.get('alias')) and not isfile(faksimile_file):
             wget.download(FaksimileImage.NIETZSCHE_SOURCES_URL + page.get('alias'), out=faksimile_file)
         if bool(page.get('alias')) and isfile(faksimile_file) and page_file is not None and isfile(page_file):
             target_file = basename(page_file).replace('.xml', '.svg')
-            if not isfile(self.target_dir + sep + target_file):
+            return self._create_svg_file(target_file, faksimile_file, page_id)    
+        else:
+            print(faksimile_file, page_file)
+        return 2
+
+    def _create_svg_file(self, target_file, faksimile_file, page_id=0) ->int:
+        """ Create a svg file.
+        [return] exit_status
+        """
+        if not isfile(self.target_dir + sep + target_file):
+            prog_list = [self.inkscape, '-z', '-l', target_file, faksimile_file]
+            subprocess.run(prog_list, check=True)
+            svg_tree = ET.parse(target_file)
+            namespaces = { k if k is not None else 'ns': v for k, v in svg_tree.getroot().nsmap.items() }
+            images = svg_tree.xpath('//ns:image', namespaces=namespaces)
+            if len(images) > 0:
+                image_file = dirname(target_file) + sep + images[0].get('{%s}href' % namespaces['xlink']).replace('file://', '')
+                image_width = float(images[0].get('width')) if bool(images[0].get('width')) else 0
+                image_height = float(images[0].get('height')) if bool(images[0].get('height')) else 0
+                print(image_file, image_width, image_height)
+                text_field = get_text_field_on_image(image_file, image_width, image_height, id=page_id)
+                text_field.attach_as_rect(svg_tree.getroot())
+                copy_faksimile_update_image_location(faksimile_tree=svg_tree, target_directory=self.target_dir)
+                remove(target_file)
+            else:
+                print(f'There has been an error: could not find an image in {target_file}!')
+                return 2
+        return 0
+
+    def create_rotation_svg_file(self, page_file: str) -> int:
+        """ Set the transform of the page's faksimile-image on the root of its thumb svg file (created with inkscape if missing).
+            [return] exit_status (0 on success, 2 if the thumb svg/jpg or the image element of the svg cannot be found)
+        """
+        page_tree = ET.parse(page_file)
+        transform = page_tree.xpath('//faksimile-image/@transform')[0] 
+        thumb = page_tree.xpath('//faksimile-image/@file-name')[0].replace('.jpg', '_thumb.svg')
+        if len(page_tree.xpath('//faksimile-image/@thumb')) > 0:
+            thumb = page_tree.xpath('//faksimile-image/@thumb')[0]
+        thumb_file = self.faksimile_dir + sep + thumb
+        faksimile_file = thumb_file.replace('.svg', '.jpg')
+        if not isfile(thumb_file) and isfile(faksimile_file):
+            # the thumb svg is missing: let inkscape create it from the jpg so that it can be parsed below
+            prog_list = [self.inkscape, '-z', '-l', thumb_file, faksimile_file]
+            subprocess.run(prog_list, check=True)
+        elif not isfile(thumb_file) and not isfile(faksimile_file):
+            print(f'There has been an error: could not find the faksimile_file {faksimile_file}!')
+            return 2
+        if isfile(thumb_file):
+            svg_tree = ET.parse(thumb_file)
+            namespaces = { k if k is not None else 'ns': v for k, v in svg_tree.getroot().nsmap.items() }
+            images = svg_tree.xpath('//ns:image', namespaces=namespaces)
+            if len(images) > 0:
+                matrix = Matrix(transform)
+                if matrix.matrix[matrix.B] != 0.0 and matrix.matrix[matrix.C] != 0.0:
+                    width = float(svg_tree.getroot().get('width'))
+                    height = float(svg_tree.getroot().get('height'))
+                    matrix.updateOffset(height, width)
+                images[0].set('{%s}href' % namespaces['xlink'], basename(faksimile_file))
+                svg_tree.getroot().set('transform', matrix.toString())
+                copy_faksimile_svg_file(target_file=thumb_file, faksimile_tree=svg_tree)
+            else:
+                print(f'There has been an error: could not find an image in {thumb_file}!')
+                return 2
+            return 0
+        else:
+            print(thumb_file, page_file)
+        return 2
+
+    def create_svg_thumb_file(self, faksimile_file: str) -> int:
+        """ Create a svg thumb file.
+            [return] exit_status
+        """
+        if isfile(faksimile_file):
+            target_file = faksimile_file.replace('.jpg', '.svg')
+            if not isfile(target_file):
                 prog_list = [self.inkscape, '-z', '-l', target_file, faksimile_file]
                 subprocess.run(prog_list, check=True)
                 svg_tree = ET.parse(target_file)
                 namespaces = { k if k is not None else 'ns': v for k, v in svg_tree.getroot().nsmap.items() }
                 images = svg_tree.xpath('//ns:image', namespaces=namespaces)
                 if len(images) > 0:
-                    image_file = dirname(target_file) + sep + images[0].get('{%s}href' % namespaces['xlink']).replace('file://', '')
-                    image_width = float(images[0].get('width')) if bool(images[0].get('width')) else 0
-                    image_height = float(images[0].get('height')) if bool(images[0].get('height')) else 0
-                    print(image_file)
-                    text_filed = get_text_field_on_image(image_file, image_width, image_height, id=page_id)
-                    text_filed.attach_as_rect(svg_tree.getroot())
-                    copy_faksimile_update_image_location(faksimile_tree=svg_tree, target_directory=self.target_dir)
-                    remove(target_file)
+                    text_field, width, height = get_text_field_on_thumb(faksimile_file)
+                    images[0].set('width', str(width))
+                    images[0].set('height', str(height))
+                    images[0].set('{%s}href' % namespaces['xlink'], basename(faksimile_file))
+                    svg_tree.getroot().set('width', str(text_field.width))
+                    svg_tree.getroot().set('height', str(text_field.height))
+                    svg_tree.getroot().set('viewBox', f'{text_field.left} {text_field.top} {text_field.width} {text_field.height}')
+                    copy_faksimile_svg_file(target_file=target_file, faksimile_tree=svg_tree)
                 else:
                     print(f'There has been an error: could not find an image in {target_file}!')
                     return 2
             return 0
         else:
             print(faksimile_file, page_file)
         return 2
 
     @staticmethod
     def UPDATE_TEXTFIELD_OF_SVG_FILE(svg_file: str) -> int:
         """ Update the textfield of the svg file by using image analysis. 
             [return] exit_status
         """
         svg_tree = ET.parse(svg_file)
         namespaces = { k if k is not None else 'ns': v for k, v in svg_tree.getroot().nsmap.items() }
         rects = svg_tree.xpath('//ns:rect[not(contains(@id, "rect"))]', namespaces=namespaces)
         images = svg_tree.xpath('//ns:image', namespaces=namespaces)
         if len(rects) > 0 and len(images) > 0:
             image_file = dirname(svg_file) + sep + images[0].get('{%s}href' % namespaces['xlink'])
             image_width = float(images[0].get('width')) if bool(images[0].get('width')) else 0
             image_height = float(images[0].get('height')) if bool(images[0].get('height')) else 0
-            text_filed = get_text_field_on_image(image_file, image_width, image_height)
-            text_filed.update_rect(rects[0])
+            text_field = get_text_field_on_image(image_file, image_width, image_height)
+            text_field.update_rect(rects[0])
             copy_faksimile_svg_file(target_file=svg_file, faksimile_tree=svg_tree)
             return 0
         else:
             print(f'There has been an error: could not find a rect and an image in {svg_file}!')
             return 2
         return 2
 
-def usage():
-    """prints information on how to use the script
+class CSVSVGFileCreator(SVGFileCreator):
+    """This class can be used in order to create svg files with textfield rects from a csv file.
     """
-    print(main.__doc__)
-
-def main(argv):
-    """This program can be used to create svg files with a rect for the text_field.
+    FOLIO = "Blatt-ID"
+    LABEL = "Label"
+    ALIAS = "Alias"
+    URL = "Nietzschesource-URL"
+    CONTENT = "Inhalt"
+
+    def __init__(self, title=None, faksimile_dir=None, target_dir='./tmp'):
+        super(CSVSVGFileCreator,self).__init__(title=title, faksimile_dir=faksimile_dir, target_dir=target_dir)
+  
+    def create_svg_file_from_csv_input(self, faksimile_file, page_id) ->int:
+        """Create a svg file from csv input.
+        """
+        target_file = basename(faksimile_file).replace('.jpg', '.svg')
+        return self._create_svg_file(target_file, faksimile_file, page_id)
 
-    fixes/create_blank_svg_files.py [OPTIONS]   <xmlManuscriptFile|svg_pos_file> <faksimile-dir> <target-dir>
-    fixes/create_blank_svg_files.py -u|--update <svg-dir>
+def process_update(args) ->int:
+    """ Process option update: back up and update the textfield of each svg file in directory args[0]; return 2 if args is empty.
+    """
+    if len(args) == 0:  # a "< 0" test can never be true and would let a missing <svg-dir> fail with an IndexError below
+        usage()
+        return 2
+    svg_dir = args[0]
+    if not isdir(svg_dir):
+        raise FileNotFoundError(f'Directory {svg_dir} does not exist!')
+    counter = 0
+    for svg_file in [ svg_dir + sep + svg_file for svg_file in listdir(svg_dir) if isfile(svg_dir + sep + svg_file) and svg_file.endswith('.svg') ]:
+        if not SVGFileCreator.UNITTESTING: 
+            print(Fore.CYAN + f'Updating svg file  {svg_file}  ...' + Style.RESET_ALL)
+        copy_to_bak_dir(svg_file)
+        if SVGFileCreator.UPDATE_TEXTFIELD_OF_SVG_FILE(svg_file) == 0:
+            counter += 1
+    if not SVGFileCreator.UNITTESTING: 
+        print(Style.RESET_ALL + f'[{counter} pages created]')
+    return 0
 
-        <xmlManuscriptFile>     a xml file about a manuscript, containing information about its pages.
-        <svg_pos_file>          a xml file about a page, containing information about svg word positions.
-        <faksimile-dir>         a directory containing faksimile images
-        <target-dir>            the directory where the files should be saved to
+def process_rotate(args) ->int:
+    """ Process option rotate: args are <xml-file> <faksimile-dir>; handles each page whose output file has a faksimile-image transform.
+    """
+    if len(args) < 2:
+        usage()
+        return 2
+    xml_file = args[0]
+    faksimile_dir = args[1]
+    if not isdir(faksimile_dir):
+        raise FileNotFoundError(f'Directory {faksimile_dir} does not exist!')
+    xpath = '//page'
+    source_tree = ET.parse(xml_file)
+    if len(xml_file.split('_')) > 2: # svg_pos_file
+        manuscript_file = '_'.join(xml_file.split('_')[0:2]) + '.xml'    
+        if isfile(manuscript_file):
+            source_tree = ET.parse(manuscript_file)
+            xpath = f'//page[contains(@output,"{xml_file}")]'
+        else:
+            raise FileNotFoundError(f'There is no manuscript file {manuscript_file} for svg_pos_file {xml_file}!')
+    counter = 0
+    svg_creator = SVGFileCreator('', faksimile_dir)
+    for page in [ page for page in source_tree.xpath(xpath) if len(ET.parse(page.get('output')).xpath('//faksimile-image/@transform')) > 0 ]:
+        if not SVGFileCreator.UNITTESTING: 
+            number = page.get('number')
+            print(Fore.CYAN + f'Rotating svg file for page {number}  ...' + Style.RESET_ALL)
+        if svg_creator.create_rotation_svg_file(page.get('output')) == 0:  # the creator parses a page file path, not the <page> element
+            counter += 1
+    if not SVGFileCreator.UNITTESTING: 
+        print(Style.RESET_ALL + f'[{counter} pages created]')
+    return 0
 
-        OPTIONS:
-        -h|--help               show help
-        -u|--update             update svg_files: use image analysis in order to update the textfield of the svg_files
-    
-        :return: exit code (int)
+def process_thumb(args) ->int:
+    """ Process option thumb 
     """
-    update = False
-    try:
-        opts, args = getopt.getopt(argv, "hu", ["help","update"])
-    except getopt.GetoptError:
+    if len(args) == 0:
         usage()
         return 2
-    for opt, arg in opts:
-        if opt in ('-h', '--help'):
-            usage()
-            return 0
-        elif opt in ('-u', '--update'):
-            update = True
-    exit_status = 0
-    if update:
-        if len(args) == 0:
-            usage()
-            return 2
-        svg_dir = args[0]
-        if not isdir(svg_dir):
-            raise FileNotFoundError(f'Directory {svg_dir} does not exist!')
-        counter = 0
-        for svg_file in [ svg_dir + sep + svg_file for svg_file in listdir(svg_dir) if isfile(svg_dir + sep + svg_file) and svg_file.endswith('.svg') ]:
-            if not SVGFileCreator.UNITTESTING: 
-                print(Fore.CYAN + f'Updating svg file  {svg_file}  ...' + Style.RESET_ALL)
-            copy_to_bak_dir(svg_file)
-            if SVGFileCreator.UPDATE_TEXTFIELD_OF_SVG_FILE(svg_file) == 0:
-                counter += 1
+    faksimile_dir = args[0]
+    title = args[1]\
+            if len(args) > 1\
+            else ''
+    svg_creator = SVGFileCreator('', faksimile_dir)
+    print(faksimile_dir, title)
+    if not isdir(faksimile_dir):
+        raise FileNotFoundError(f'Directory {faksimile_dir} does not exist!')
+    counter = 0
+    for faksimile_file in [ faksimile_dir + sep + faksimile_file for faksimile_file in listdir(faksimile_dir)\
+                            if isfile(faksimile_dir + sep + faksimile_file)\
+                            and basename(faksimile_file).startswith(title)\
+                            and faksimile_file.endswith('_thumb.jpg') ]:
         if not SVGFileCreator.UNITTESTING: 
-            print(Style.RESET_ALL + f'[{counter} pages created]')
-        return exit_status
+            print(Fore.CYAN + f'Creating a svg for faksimile file  {faksimile_file}  ...' + Style.RESET_ALL)
+        if svg_creator.create_svg_thumb_file(faksimile_file) == 0:
+            counter += 1
+    if not SVGFileCreator.UNITTESTING: 
+        print(Style.RESET_ALL + f'[{counter} thumb svg files created]')
+    return 0
 
+def process_csv(csv_file_name, faksimile_dir, target_dir, downloadOnly=False) ->int:
+    """ Process a csv file: download each missing non-thumb faksimile and, unless downloadOnly, create a svg file for it; return 0 or 2.
+    """
+    title = basename(csv_file_name).replace('.csv','').replace('_', ' ')
+    file_creator = CSVSVGFileCreator(title, faksimile_dir, target_dir)
+    exit_status = 0
+    with open(csv_file_name, newline='') as csvfile: 
+        reader = csv.DictReader(csvfile)
+        for row in reader:
+            faksimile_name = row[CSVSVGFileCreator.LABEL]
+            if '_thumb' not in faksimile_name:
+                faksimile_url = row[CSVSVGFileCreator.URL]
+                page_id = row[CSVSVGFileCreator.ALIAS].replace(',', '').replace(' ', '_')
+                faksimile_file = faksimile_dir + sep + faksimile_name
+                if not isfile(faksimile_file):
+                    wget.download(faksimile_url, out=faksimile_file)
+                if not downloadOnly:
+                    if isfile(faksimile_file):
+                        print(f'processing {faksimile_file} ...')
+                        if file_creator.create_svg_file_from_csv_input(faksimile_file, page_id) > 0:
+                            exit_status = 2
+                    else:
+                        exit_status = 2
+                        print(f'There has been an error on downloading {faksimile_url}!')  # no exception object is in scope here
+    return exit_status
+
+def process_default(args) ->int:
+    """ Default process 
+    """
     if len(args) < 3:  
         usage()
         return 2
-    xml_file = args[0]
     faksimile_dir = args[1]
     target_dir = args[2]
     not isdir(target_dir) and mkdir(target_dir)
+    if args[0].endswith('.csv'):
+        return process_csv(args[0], faksimile_dir, target_dir)
+    xml_file = args[0]
     if isfile(xml_file) and isdir(faksimile_dir):
         counter = 0
         xpath = f'//page[contains(@status, "{BLANK_STATUS}")]'
         if len(xml_file.split('_')) > 2: # svg_pos_file
             manuscript_file = '_'.join(xml_file.split('_')[0:2]) + '.xml'    
             if isfile(manuscript_file):
                 source_tree = ET.parse(manuscript_file)
                 xpath = f'//page[contains(@output,"{xml_file}")]'
             else:
                 raise FileNotFoundError(f'There is no manuscript file {manuscript_file} for svg_pos_file {xml_file}!')
         else:
             source_tree = ET.parse(xml_file)
         title = source_tree.getroot().get('title')
         svg_creator = SVGFileCreator(title, faksimile_dir, target_dir=target_dir)
         for page in source_tree.xpath(xpath):
             if not SVGFileCreator.UNITTESTING: 
                 number = page.get('number')
                 print(Fore.CYAN + f'Creating a svg file for  {title}, {number}  ...' + Style.RESET_ALL)
             if svg_creator.create_svg_file(page) == 0:
                 counter += 1
         if not SVGFileCreator.UNITTESTING: 
             print(Style.RESET_ALL + f'[{counter} pages created]')
     else:
         if not isdir(faksimile_dir):
             raise FileNotFoundError(f'Directory {faksimile_dir} does not exist!')
         raise FileNotFoundError('File {} does not exist!'.format(xml_file))
-    return exit_status
+    return 0
+
+
+def usage():
+    """prints information on how to use the script
+    """
+    print(main.__doc__)
+
+def main(argv):
+    """This program can be used to create svg files with a rect for the text_field.
+
+    fixes/create_blank_svg_files.py [OPTIONS]   <xmlManuscriptFile|svg_pos_file|csv_file> <faksimile-dir> <target-dir>
+    fixes/create_blank_svg_files.py -r|--rotate-thumb <xmlManuscriptFile|svg_pos_file> <faksimile-dir>
+    fixes/create_blank_svg_files.py -u|--update <svg-dir>
+    fixes/create_blank_svg_files.py -t|--thumb <faksimile-dir> [<title>]
+
+        <xmlManuscriptFile>     a xml file about a manuscript, containing information about its pages.
+        <svg_pos_file>          a xml file about a page, containing information about svg word positions.
+        <csv_file>              a csv file with faksimile information.
+        <faksimile-dir>         a directory containing faksimile images
+        <target-dir>            the directory where the files should be saved to
+
+        OPTIONS:
+        -h|--help               show help
+        -r|--rotate-thumb       use image analysis in order to create a svg file for the thumb faksimile files that need rotation. 
+        -u|--update             update svg_files: use image analysis in order to update the textfield of the svg_files
+        -t|--thumb              use image analysis in order to create a svg file for the thumb faksimile files that need cropping. 
+    
+        :return: exit code (int)
+    """
+    update = False
+    thumb = False
+    rotate = False  # off unless -r is given; if it were on by default, --thumb and the default mode could never be reached
+    try:
+        opts, args = getopt.getopt(argv, "hrut", ["help","rotate-thumb","update", "thumb"])
+    except getopt.GetoptError:
+        usage()
+        return 2
+    for opt, arg in opts:
+        if opt in ('-h', '--help'):
+            usage()
+            return 0
+        elif opt in ('-r', '--rotate-thumb'):
+            rotate = True
+        elif opt in ('-u', '--update'):
+            update = True
+        elif opt in ('-t', '--thumb'):
+            thumb = True
+    if update:
+        return process_update(args)
+    elif rotate:
+        return process_rotate(args)
+    elif thumb:
+        return process_thumb(args)
+    return process_default(args)
 
 if __name__ == "__main__":
     sys.exit(main(sys.argv[1:]))
Index: fixes/test_add_faksimile_image.py
===================================================================
--- fixes/test_add_faksimile_image.py	(revision 113)
+++ fixes/test_add_faksimile_image.py	(revision 114)
@@ -1,32 +1,41 @@
 import lxml.etree as ET
 from os import sep, path, remove
 from os.path import isdir, isfile, dirname, basename
 import shutil
 import sys
 import tempfile
 import unittest
 import warnings
 
 import add_faksimile_image
 
 
 sys.path.append('shared_util')
 from myxmlwriter import copy_to_bak_dir
 
 
 sys.path.append('svgscripts')
 from datatypes.page import Page
 
 class TestAddFaksimileImage(unittest.TestCase):
+    def setUp(self):
+        add_faksimile_image.UNITTESTING = True
+        self.csv_file = 'tests_svgscripts/test_data/bd_12_Layout.csv'
 
     def testAdd(self):
         add_faksimile_image.UNITTESTING = True
         page = Page.create_cls('xml/Mp_XVI_page52v.xml')
         faksimile_dir = '/home/knister0/ownCloud/nietzscheDE/Bearbeitung_Faksimile/Myriam/Blank/Mp_XVI/Fertig'
         exit_status = add_faksimile_image.add_faksimile_image(page, faksimile_dir)
         self.assertEqual(exit_status, 0)
         #print(ET.dump(page.page_tree.xpath('//faksimile-image')[0]))
 
+    def testCSV(self):
+        #csv_handler = add_faksimile_image.FlippedSidesCSVHandler(self.csv_file, 'Mp XVI')
+        csv_handler = add_faksimile_image.FlippedSidesCSVHandler('/home/knister0/ownCloud/myNietzscheDE/KGW-IX_13/bd_13.csv', 'Mp XVIII')
+        print(csv_handler.page_dictionary)        
+        page = Page.create_cls('xml/Mp_XVIII_page12v.xml')
+        self.assertEqual(add_faksimile_image.update_faksimile_image(page, csv_handler), 0)
 
 if __name__ == "__main__":
     unittest.main()
Index: fixes/add_faksimile_image.py
===================================================================
--- fixes/add_faksimile_image.py	(revision 113)
+++ fixes/add_faksimile_image.py	(revision 114)
@@ -1,134 +1,205 @@
 #!/usr/bin/env python3
 # -*- coding: utf-8 -*-
 
 """This program can be used to add a faksimile image to a page xml file.
 """
 #    Copyright (C) University of Basel 2021  {{{1
 #
 #    This program is free software: you can redistribute it and/or modify
 #    it under the terms of the GNU General Public License as published by
 #    the Free Software Foundation, either version 3 of the License, or
 #    (at your option) any later version.
 #
 #    This program is distributed in the hope that it will be useful,
 #    but WITHOUT ANY WARRANTY; without even the implied warranty of
 #    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #    GNU General Public License for more details.
 #
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <https://www.gnu.org/licenses/> 1}}}
 
 from colorama import Fore, Style
+import csv
 import getopt
 import json
 import lxml.etree as ET
 import shutil
 import subprocess
 import sys
 import os
 import wget
 from os import listdir, sep, path, setpgrp, devnull, mkdir, remove
 from os.path import exists, isfile, isdir, dirname, basename
 from progress.bar import Bar
+import re
 import warnings
 
 from fix_old_data import save_page
 from get_text_field import get_text_field_on_image
 
 sys.path.append('svgscripts')
 from datatypes.faksimile_image import FaksimileImage
 from datatypes.faksimile import FaksimilePage
+from datatypes.matrix import Matrix
 from datatypes.archival_manuscript import ArchivalManuscriptUnity
 from datatypes.page import Page, STATUS_MERGED_OK, STATUS_POSTMERGED_OK
 from util import back_up, back_up_svg_file, copy_faksimile_update_image_location, copy_faksimile_svg_file
 from process_files import update_svgposfile_status
 from process_words_post_merging import update_faksimile_line_positions, MERGED_DIR
 
 sys.path.append('shared_util')
 from myxmlwriter import copy_to_bak_dir, write_pretty, xml_has_type, FILE_TYPE_SVG_WORD_POSITION, FILE_TYPE_XML_MANUSCRIPT
 from main_util import create_function_dictionary
 
 
 __author__ = "Christian Steiner"
 __maintainer__ = __author__
 __copyright__ = 'University of Basel'
 __email__ = "christian.steiner@unibas.ch"
 __status__ = "Development"
 __license__ = "GPL v3"
 __version__ = "0.0.1"
 
 MAX_SVG_XY_THRESHOLD = 10
 BLANK_STATUS = 'blank'
 UNITTESTING = False
 
+class FlippedSidesCSVHandler:
+    """This class can be used to handle csv files that list flipped (rotated) pages in a 'Gedrehte Seiten' column:
+    page_dictionary maps the page number (str) of each flipped page of the manuscript 'title' to its rotation (str).
+    """
+    ENTRY_KEY_PAGE = 'pdf_page_number'
+    ENTRY_KEY_FILE = 'svg_source_file'
+    ENTRY_KEY_TITLE = 'manuscript_title'
+    ENTRY_KEY_PAGE_NAMES = 'page_names'
+    ENTRY_KEY_MARG_PAGE = 'marginals_page_entry'
+    MANUSCRIPT_AE_REMOVAL = re.compile('[a-e]')
+    MANUSCRIPT_KEY = 'Ms'
+    MANUSCRIPT_PATTERN = re.compile(r'(\d+)(>\s)(.*)')
+    MANUSCRIPT_TITLE_EXTENSION = 'Mp'
+    MANUSCRIPT_TITLE_PARTS = re.compile(r'([I-X]+[a-e]*)(\s)(\d+\w*)(/\d+\w*)*')
+    MARGINALS_PAGE = re.compile(r'([I-X]+[a-e]*)(\s)(\d+\w*)(\s)(Marg)')
+    REMOVE_NONNUMERIC = re.compile(r'\D')  # raw string: '\D' is an invalid escape sequence in a plain string
+
+    def __init__(self, csv_file_name: str, title: str):
+        self.page_dictionary = {}  # page number -> rotation
+        self.title = title
+        self._init_csv_entries(csv_file_name)
+
+    def _init_csv_entries(self, csv_file_name):
+        """Init page_dictionary by reading the csv_file: only rows whose 'Ms' entry belongs to self.title are used.
+        """
+        with open(csv_file_name, newline='') as csvfile:
+            reader = csv.DictReader(csvfile)
+            flipped_keys = [ key for key in (reader.fieldnames or []) if 'Gedrehte Seiten' in key ]  # fieldnames is None for an empty file
+            if len(flipped_keys) > 0:
+                flipped_key = flipped_keys[0]
+                for row in reader:
+                    if bool(row[flipped_key]):
+                        ms_string = row[self.MANUSCRIPT_KEY] or ''  # a short row yields None for missing columns
+                        manuscript_match = re.match(self.MANUSCRIPT_PATTERN, ms_string)
+                        for flipped_line in row[flipped_key].split('\n'):
+                            flipped_msg = re.split(r'(\s*Drehung\s*|\s*\(.*)', flipped_line)
+                            if len(flipped_msg) > 2 and manuscript_match is not None:
+                                page_number = flipped_msg[0]
+                                rotation = flipped_msg[2]
+                                title_parts = re.match(self.MANUSCRIPT_TITLE_PARTS, manuscript_match.group(3))
+                                if title_parts is not None\
+                                    and self.MANUSCRIPT_TITLE_EXTENSION + ' ' + self.MANUSCRIPT_AE_REMOVAL.sub('', title_parts.group(1)) == self.title:
+                                    self.page_dictionary.update({page_number: rotation})
+
 
 def add_faksimile_image(page: Page, faksimile_dir: str) ->int:
     """Add faksimile image to page.
         [:return:] exit_code
     """
     svg_file = faksimile_dir + sep + basename(page.page_tree.docinfo.URL).replace('.xml','.svg') 
     if isfile(svg_file):
         fp = FaksimilePage.get_faksimile_pages(svg_file, page_number=page.number, isBlank=True)  
         if len(fp) > 0 and fp[0].faksimile_image is not None:
             fp[0].faksimile_image.text_field = fp[0].text_field
             fp[0].faksimile_image.attach_object_to_tree(page.page_tree)
             if not UNITTESTING:
                 save_page(page)
             return 0
     return 2
 
+def update_faksimile_image(page: Page, csv_handler: FlippedSidesCSVHandler) ->int:
+    """Update faksimile image of page: add the rotation matrix that csv_handler lists for page.number.
+        [:return:] exit_code (0: image updated, 2: no rotation listed for the page or page has no faksimile image)
+    """
+    rotation = csv_handler.page_dictionary.get(page.number)
+    if rotation is None:
+        return 2
+    if page.faksimile_image is None:
+        warnings.warn(f'Page {page.number} should be rotated by {rotation}, but it has no faksimile image!')
+        return 2
+    page.faksimile_image.transform = Matrix(f'rotate({rotation})')
+    page.faksimile_image.attach_object_to_tree(page.page_tree)
+    if not UNITTESTING:
+        save_page(page)
+    return 0
+
 def usage():
     """prints information on how to use the script
     """
     print(main.__doc__)
 
 def main(argv):
-    """This program can be used to add a faksimile image to a page xml file.
+    """This program can be used to add or update a faksimile image to a page xml file.
 
-    fixes/add_faksimile_image.py [OPTIONS]   <xmlManuscriptFile|svg_pos_file> <faksimile-dir> 
+    fixes/add_faksimile_image.py [OPTIONS]   <xmlManuscriptFile|svg_pos_file> <faksimile-dir|csv-file> 
 
         <xmlManuscriptFile>     a xml file about a manuscript, containing information about its pages.
         <svg_pos_file>          a xml file about a page, containing information about svg word positions.
         <faksimile-dir>         a directory containing the blank faksimile svg files
+        <csv-file>              a csv-file containing a column about the rotation of the transkription.
 
         OPTIONS:
         -h|--help               show help
     
         :return: exit code (int)
     """
     try:
         opts, args = getopt.getopt(argv, "h", ["help"])
     except getopt.GetoptError:
         usage()
         return 2
     for opt, arg in opts:
         if opt in ('-h', '--help'):
             usage()
             return 0
     exit_status = 0
     if len(args) < 2:  
         usage()
         return 2
     xml_file = args[0]
     manuscript_file = xml_file\
         if len(xml_file.split('_')) < 3\
         else '_'.join(xml_file.split('_')[0:2]) + '.xml'
-    faksimile_dir = args[1]
-    if isfile(xml_file) and isdir(faksimile_dir):
+    task = add_faksimile_image
+    argument = args[1]
+    if argument.endswith('.csv'):
+        if isfile(argument):
+            argument = FlippedSidesCSVHandler(argument, basename(manuscript_file).replace('_', ' ').replace('.xml',''))
+            task = update_faksimile_image
+        else:
+            raise FileNotFoundError(f'File {argument} does not exist!')
+    elif not isdir(argument):
+        raise FileNotFoundError(f'Directory {argument} does not exist!')
+    if isfile(xml_file):
         counter = 0
         for page in Page.get_pages_from_xml_file(xml_file, status_contains=BLANK_STATUS):
             if not UNITTESTING: 
-                print(Fore.CYAN + f'Adding a faksimile image to  {page.title}, {page.number}  ...' + Style.RESET_ALL)
+                print(Fore.CYAN + f'{task.__name__}:  {page.title}, {page.number}  ...' + Style.RESET_ALL)
                 back_up(page, page.xml_file)
-            if add_faksimile_image(page, faksimile_dir) == 0:
+            if task(page, argument) == 0:
                 counter += 1
         if not UNITTESTING: 
-            print(Style.RESET_ALL + f'[{counter} pages created]')
+            print(Style.RESET_ALL + f'[{counter} pages processed]')
     else:
-        if not isdir(faksimile_dir):
-            raise FileNotFoundError(f'Directory {faksimile_dir} does not exist!')
         raise FileNotFoundError('File {} does not exist!'.format(xml_file))
     return exit_status
 
 if __name__ == "__main__":
     sys.exit(main(sys.argv[1:]))
Index: py2ttl/data_handler.py
===================================================================
--- py2ttl/data_handler.py	(revision 113)
+++ py2ttl/data_handler.py	(revision 114)
@@ -1,197 +1,294 @@
 #!/usr/bin/env python3
 # -*- coding: utf-8 -*-
 
 """   This class can be used to add data to a rdf graph.
 """
 #    Copyright (C) University of Basel 2019  {{{1
 #
 #    This program is free software: you can redistribute it and/or modify
 #    it under the terms of the GNU General Public License as published by
 #    the Free Software Foundation, either version 3 of the License, or
 #    (at your option) any later version.
 #
 #    This program is distributed in the hope that it will be useful,
 #    but WITHOUT ANY WARRANTY; without even the implied warranty of
 #    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #    GNU General Public License for more details.
 #
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <https://www.gnu.org/licenses/> 1}}}
 
 __author__ = "Christian Steiner"
 __maintainer__ = __author__
 __copyright__ = 'University of Basel'
 __email__ = "christian.steiner@unibas.ch"
 __status__ = "Development"
 __license__ = "GPL v3"
 __version__ = "0.0.1"
 
 from rdflib import Graph, URIRef, Literal, BNode, OWL, RDF, RDFS, XSD
 from rdflib import RDF as ns_rdf
 from os.path import isfile
 import random
 import warnings
 
 from class_spec import SemanticClass
 from config import DATA_URL
 
 class RDFDataHandler:
     """
     This class can be used to add data to a rdf graph.
     """
     UNITTESTING = False
     SIMPLE_DATA_TYPE_MAPPING = { int: XSD.integer, float: XSD.float, str: XSD.string, bool: XSD.boolean, list: RDF.List }
     
     def __init__(self, target_file, mapping_dictionary):
         self.target_file = target_file
         self.mapping_dictionary = mapping_dictionary
         self.ontology_graph = Graph()
         self.data_graph = Graph()
         self.data_identifier_mapping = {}
         if bool(self.mapping_dictionary.get('ontology')):
             self.project_name = self.mapping_dictionary['ontology'].get('project_name')
             self.project_uri = URIRef(self.mapping_dictionary['ontology'].get('project_uri'))
             ontology_file = self.mapping_dictionary['ontology'].get('ontology_file')
             if bool(ontology_file) and isfile(ontology_file):
                 self.ontology_graph.parse(ontology_file, format="turtle")
             self.ns = { uriref: ns for ns, uriref in self.data_graph.namespace_manager.namespaces() }
             self.data_graph.bind(self.project_name, self.project_uri)
             self.data_graph.bind('data', DATA_URL + '#')
         else:
             raise Exception('Error: mapping_dictionary does not contain key "ontology"!')
 
     def add_data(self, data_instance, identifier_prefix, parent_data_instance=None, skip_data_instance_list=None):
         """Add a data rdf instance of data_instance to the data_graph.
 
             :return: (rdflib.URIRef) subject_uri of data instance
         """
         skip_data_instance_list = [] if skip_data_instance_list is None else skip_data_instance_list
         identifier_uri = self.create_identifier_uri(data_instance, identifier_prefix)
         if type(data_instance).__name__ not in skip_data_instance_list and bool(self.mapping_dictionary['classes'].get(type(data_instance).__name__)):
             class_uri = self.mapping_dictionary['classes'][type(data_instance).__name__]['class_uri']
             self.data_identifier_mapping.update({data_instance: identifier_uri})
             self.data_graph_add((identifier_uri, RDF.type, class_uri))
             semantic_dict = data_instance.get_semantic_dictionary()
             for key, content in semantic_dict['properties'].items():
                 if bool(self.mapping_dictionary['classes'][type(data_instance).__name__]['properties'].get(key)):
                     datatype = content.get('class')
                     cardinality = content.get('cardinality')\
                             if bool(content.get('cardinality')) else 0
                     if data_instance.__dict__.get(key) is not None\
                             and (type(data_instance.__dict__.get(key)) != int or data_instance.__dict__.get(key) != -1):
                         predicate_uri = self.mapping_dictionary['classes'][type(data_instance).__name__]['properties'][key]
                         child_data_instance = data_instance.__dict__.get(key)
                         new_identifier_prefix = identifier_uri[identifier_uri.index('#')+1:]
                         if datatype is list:
                             self.add_ordered_list(child_data_instance, identifier_uri, predicate_uri,\
                                         new_identifier_prefix, data_instance, skip_data_instance_list=skip_data_instance_list)
                         elif issubclass(datatype, SemanticClass):
                             if type(child_data_instance) is not list:
                                 if type(child_data_instance) != datatype\
                                         and not issubclass(type(child_data_instance), datatype):
                                     child_id = child_data_instance
                                     child_data_instance = parent_data_instance.get_object_from_list_with_id(datatype,\
                                             child_id)
                                     if child_data_instance is None:
                                         print(key, content)# parent_data_instance.number, child_id, type(child_id), datatype)
                                         msg = 'No child_data_instance found for data_instance {0}: looking for {1} with id {2}'.format(\
                                                 type(parent_data_instance), datatype, child_id)
                                         raise Exception(msg)
                                     else:
                                         new_list_name = 'list_of_' + datatype.__name__ + 's'
                                         if new_list_name in data_instance.__dict__.keys():
                                             data_instance.__dict__[new_list_name].append(child_data_instance)
                                         else:
                                             data_instance.__dict__.update({ new_list_name: [ child_data_instance ]})
                                 if child_data_instance not in self.data_identifier_mapping.keys():
                                     child_identifier_uri = self.add_data(child_data_instance, new_identifier_prefix,\
                                         parent_data_instance=data_instance, skip_data_instance_list=skip_data_instance_list)
                                 else:
                                     child_identifier_uri = self.data_identifier_mapping[child_data_instance]
                                 self.data_graph_add((identifier_uri, predicate_uri, child_identifier_uri))
                             else:
                                 for child_item in child_data_instance:
                                     if child_item not in self.data_identifier_mapping.keys():
                                         child_identifier_uri = self.add_data(child_item, new_identifier_prefix,\
                                                                             parent_data_instance=data_instance, skip_data_instance_list=skip_data_instance_list)
                                     else:
                                         child_identifier_uri = self.data_identifier_mapping[child_item]
                                     self.data_graph_add((identifier_uri, predicate_uri, child_identifier_uri))
 
                         else:
                             literal_datatype = RDFDataHandler.SIMPLE_DATA_TYPE_MAPPING[datatype]
                             ontology_datatypes = [ o for o in self.ontology_graph.objects(subject=predicate_uri, predicate=RDFS.range) ] 
                             if len(ontology_datatypes) > 0:
                                 literal_datatype = ontology_datatypes[0]
                             if type(child_data_instance) is list:
                                 for child_item in child_data_instance:
                                     object_literal = Literal(str(child_item), datatype=literal_datatype)
                                     self.data_graph_add((identifier_uri, predicate_uri, object_literal))
                             else:
                                 object_literal = Literal(str(child_data_instance), datatype=literal_datatype)
                                 self.data_graph_add((identifier_uri, predicate_uri, object_literal))
                 else:
                     msg = 'Mapping dictionary for {0} does not contain a entry for {1}!'.format(type(data_instance).__name__, key)
                     raise Exception(msg)
         elif type(data_instance).__name__ not in skip_data_instance_list:
             msg = 'Mapping dictionary does not contain a entry for {}!'.format(type(data_instance).__name__)
             raise Exception(msg)
         return identifier_uri
 
+    def add_data_instance2parent_uri(self, parent_uri, predicate, data_instance):
+        """Add a data rdf instance of data_instance to the data_graph and link it: (parent_uri, project_uri + predicate, instance).
+
+            :return: (rdflib.URIRef) subject_uri of data instance, or None if parent_uri already has a value for predicate
+        """
+        predicate_uri = URIRef(self.project_uri + predicate)
+        if (parent_uri, predicate_uri, None) not in self.data_graph:  # nothing is added if parent_uri already has this predicate
+            identifier_prefix = parent_uri[parent_uri.index('#')+1:]
+            identifier_uri = self.create_identifier_uri(data_instance, identifier_prefix)
+            if bool(self.mapping_dictionary['classes'].get(type(data_instance).__name__)):  # unmapped classes add no triples, the uri is returned anyway
+                class_uri = self.mapping_dictionary['classes'][type(data_instance).__name__]['class_uri']
+                self.data_identifier_mapping.update({data_instance: identifier_uri})
+                self.data_graph_add((identifier_uri, RDF.type, class_uri))
+                self.data_graph_add((parent_uri, predicate_uri, identifier_uri))
+                semantic_dict = data_instance.get_semantic_dictionary()
+                for key, content in semantic_dict['properties'].items():
+                    if bool(self.mapping_dictionary['classes'][type(data_instance).__name__]['properties'].get(key)):
+                        datatype = content.get('class')
+                        cardinality = content.get('cardinality')\
+                                if bool(content.get('cardinality')) else 0  # NOTE(review): cardinality is not read in this method
+                        if data_instance.__dict__.get(key) is not None\
+                                and (type(data_instance.__dict__.get(key)) != int or data_instance.__dict__.get(key) != -1):
+                            predicate_uri = self.mapping_dictionary['classes'][type(data_instance).__name__]['properties'][key]
+                            child_data_instance = data_instance.__dict__.get(key)
+                            new_identifier_prefix = identifier_uri[identifier_uri.index('#')+1:]
+                            if datatype is list:
+                                self.add_ordered_list(child_data_instance, identifier_uri, predicate_uri, new_identifier_prefix, data_instance)
+                            elif issubclass(datatype, SemanticClass):
+                                if type(child_data_instance) is not list:
+                                    if type(child_data_instance) != datatype\
+                                            and not issubclass(type(child_data_instance), datatype):
+                                        child_id = child_data_instance  # the attribute holds an id instead of the object itself
+                                        child_data_instance = data_instance.get_object_from_list_with_id(datatype, child_id)
+                                        if child_data_instance is None:
+                                            print(key, content)# parent_data_instance.number, child_id, type(child_id), datatype)
+                                            msg = 'No child_data_instance found for data_instance {0}: looking for {1} with id {2}'.format(\
+                                                    type(data_instance), datatype, child_id)
+                                            raise Exception(msg)
+                                        else:
+                                            new_list_name = 'list_of_' + datatype.__name__ + 's'
+                                            if new_list_name in data_instance.__dict__.keys():
+                                                data_instance.__dict__[new_list_name].append(child_data_instance)
+                                            else:
+                                                data_instance.__dict__.update({ new_list_name: [ child_data_instance ]})
+                                    if child_data_instance not in self.data_identifier_mapping.keys():
+                                        child_identifier_uri = self.add_data(child_data_instance, new_identifier_prefix,\
+                                            parent_data_instance=data_instance)
+                                    else:
+                                        child_identifier_uri = self.data_identifier_mapping[child_data_instance]
+                                    self.data_graph_add((identifier_uri, predicate_uri, child_identifier_uri))
+                                else:
+                                    for child_item in child_data_instance:
+                                        if child_item not in self.data_identifier_mapping.keys():
+                                            child_identifier_uri = self.add_data(child_item, new_identifier_prefix, parent_data_instance=data_instance)
+                                        else:
+                                            child_identifier_uri = self.data_identifier_mapping[child_item]
+                                        self.data_graph_add((identifier_uri, predicate_uri, child_identifier_uri))
+                            else:
+                                literal_datatype = RDFDataHandler.SIMPLE_DATA_TYPE_MAPPING[datatype]
+                                ontology_datatypes = [ o for o in self.ontology_graph.objects(subject=predicate_uri, predicate=RDFS.range) ] 
+                                if len(ontology_datatypes) > 0:  # a rdfs:range found in the ontology replaces the python type mapping
+                                    literal_datatype = ontology_datatypes[0]
+                                if type(child_data_instance) is list:
+                                    for child_item in child_data_instance:
+                                        object_literal = Literal(str(child_item), datatype=literal_datatype)
+                                        self.data_graph_add((identifier_uri, predicate_uri, object_literal))
+                                else:
+                                    object_literal = Literal(str(child_data_instance), datatype=literal_datatype)
+                                    self.data_graph_add((identifier_uri, predicate_uri, object_literal))
+                    else:
+                        msg = 'Mapping dictionary for {0} does not contain a entry for {1}!'.format(type(data_instance).__name__, key)
+                        raise Exception(msg)
+            return identifier_uri
+
     def add_ordered_list(self, data_instance_list, identifier_uri, predicate_uri, identifier_prefix, data_instance, skip_data_instance_list=None):
         """Add a data rdf instance of data_instance to the data_graph.
         """
         if len(data_instance_list) > 0:
             child_identifiers = []
             for item in data_instance_list:
                 if item not in self.data_identifier_mapping.keys():
                     child_identifiers.append(self.add_data(item, identifier_prefix, data_instance, skip_data_instance_list=skip_data_instance_list))
                 else:
                     child_identifiers.append(self.data_identifier_mapping[item])
             list_node = self.generate_RDF_collection(child_identifiers)
             self.data_graph_add((identifier_uri, predicate_uri, list_node))
 
+    def add_external_class_item(self, data_type, identifier_prefix, id) ->URIRef:
+        """Add an item of type data_type (class uri: project_uri + data_type) to the data_graph.
+            :return: (rdflib.URIRef) subject_uri of the item
+        """
+        item_uri = self.create_simple_identifier_uri(data_type, identifier_prefix, id)
+        self.data_graph_add((item_uri, RDF.type, URIRef(self.project_uri  + data_type)))
+        return item_uri
+
+    def add_external_property(self, identifier_uri, predicate, list_of_uris):
+        """Add a triple (identifier_uri, project_uri + predicate, data uri) for each uri of list_of_uris:
+        double quotes are removed and the part after '#' of each uri is appended to DATA_URL + '#'."""
+        predicate_uri = URIRef(self.project_uri  + predicate)
+        for uri in [ uri.replace('"', '') for uri in list_of_uris ]:
+            self.data_graph_add((identifier_uri, predicate_uri, URIRef(DATA_URL + '#' + uri[uri.index('#')+1:])))
+
+    def create_simple_identifier_uri(self, data_type, identifier_prefix, id):
+        """Build a data identifier uri from identifier_prefix, data_type and id.
+
+            No check is made whether the uri is already a subject of the data_graph.
+            :return: (rdflib.URIRef) subject_uri of data instance
+        """
+        return URIRef(DATA_URL + '#' + identifier_prefix + '_' + data_type + str(id))
+
     def create_identifier_uri(self, data_instance, identifier_prefix):
         """Return a data identifier uri.
 
             :return: (rdflib.URIRef) subject_uri of data instance
         """
         data_type, id = data_instance.get_name_and_id()
         identifier_uri = URIRef(DATA_URL + '#' + identifier_prefix + '_' + data_type + str(id))
         randombit_length = 5
         while (identifier_uri, None, None) in self.data_graph:
             identifier_uri = URIRef(DATA_URL + '#' + identifier_prefix + '_' + data_type + str(random.getrandbits(randombit_length)))
             randombit_length += 1
         return identifier_uri
 
     def data_graph_add(self, rdf_triple):
         """Add a triple to the graph.
         """
         #not RDFDataHandler.UNITTESTING and print(rdf_triple)
         self.data_graph.add(rdf_triple)
 
     def generate_RDF_collection(self, vals ) -> BNode:
         """
 	Generate an RDF List from vals, returns the head of the list
         @URL: <https://github.com/MKLab-ITI/prophet/blob/master/rdflib/plugins/parsers/pyMicrodata/utils.py>
         @organization: U{World Wide Web Consortium<http://www.w3.org>}
         @author: U{Ivan Herman<a href="http://www.w3.org/People/Ivan/">}
         @license: 
         U{W3C® SOFTWARE NOTICE AND LICENSE<href="http://www.w3.org/Consortium/Legal/2002/copyright-software-20021231">}
 	@param graph: RDF graph
 	@type graph: RDFLib Graph
 	@param vals: array of RDF Resources
 	@return: head of the List (an RDF Resource)
 	"""
         heads = [ BNode() for r in vals ] + [ ns_rdf["nil"] ]
         for i in range(0, len(vals)) :
             self.data_graph_add( (heads[i], ns_rdf["first"], vals[i]) )
             self.data_graph_add( (heads[i], ns_rdf["rest"],  heads[i+1]) )
         return heads[0]
 
     def write(self, output_format="turtle"):
         """Write graph.
         """
         f = open(self.target_file, 'wb+')
         f.write(self.data_graph.serialize(format=output_format))
         f.close()
Index: py2ttl/create_manuscript_description.py
===================================================================
--- py2ttl/create_manuscript_description.py	(revision 0)
+++ py2ttl/create_manuscript_description.py	(revision 114)
@@ -0,0 +1,186 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+
+"""   This program can be used to create a manuscript description in turtle format.
+"""
+#    Copyright (C) University of Basel 2019  {{{1
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License as published by
+#    the Free Software Foundation, either version 3 of the License, or
+#    (at your option) any later version.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <https://www.gnu.org/licenses/> 1}}}
+
+from colorama import Fore, Style
+import csv
+import getopt
+import lxml.etree as ET
+from os import sep, path, listdir
+from os.path import isfile, isdir, dirname, basename
+from progress.bar import Bar
+import re
+import sys
+
+sys.path.append('svgscripts')
+from datatypes.manuscript_description import ManuscriptDescription
+
+if dirname(__file__) not in sys.path:
+    sys.path.append(dirname(__file__))
+
+from class_spec import SemanticClass
+from config import check_config_files_exist, get_datatypes_dir, PROJECT_NAME, PROJECT_ONTOLOGY_FILE, PROJECT_URL
+from py2ttl_data import Py2TTLDataConverter
+from py2ttl_ontology import Py2TTLOntologyConverter
+from data_handler import RDFDataHandler
+
+
+sys.path.append('shared_util')
+from myxmlwriter import xml2dict
+from main_util import get_manuscript_files_and_include_status
+
+__author__ = "Christian Steiner"
+__maintainer__ = __author__
+__copyright__ = 'University of Basel'
+__email__ = "christian.steiner@unibas.ch"
+__status__ = "Development"
+__license__ = "GPL v3"
+__version__ = "0.0.1"
+
+FILE_TYPE_XML_PROJECT = "xmlProjectFile"
+
+class Py2TTLCSVManuscriptDescriptionConverter:
+    """This class can be used to convert manuscript descriptions to rdf data in turtle format.
+    """
+    UNITTESTING = False
+    NAME = 'folio-name'
+    DESCRIPTION_KEY = 'description'
+    ALIAS = 'alias'
+    LABEL = 'label'
+    URL = 'nietzschesource-url'
+
+    def __init__(self, csv_file: str, faksimile_mapping: str, mapping_dictionary: str):
+        """Store the input paths and load the faksimile mapping.
+        :param csv_file: path of the csv file with the manuscript descriptions.
+        :param faksimile_mapping: path of the csv file read by _init_mapping.
+        :param mapping_dictionary: handed unchanged to RDFDataHandler in convert.
+        """
+        self.mapping_dictionary = mapping_dictionary
+        self.csv_file = csv_file
+        self.faksimile_mapping_dict = self._init_mapping(faksimile_mapping)
+
+    def _init_mapping(self, faksimile_mapping) ->dict:
+        """Init faksimile_mapping dictionary from the csv file at path faksimile_mapping.
+        :return: dict mapping each second-column value to the list of first-column values of its rows.
+        """
+        faksimile_mapping_dict = {}
+        with open(faksimile_mapping, newline='') as csvfile:
+            reader = csv.DictReader(csvfile)
+            fieldnames = reader.fieldnames
+            for row in reader:
+                faksimile_mapping_dict.setdefault(row[fieldnames[1]], []).append(row[fieldnames[0]])
+        return faksimile_mapping_dict
+
+    def _add_leaf(self, data_handler, leaf_id, images, description):
+        """Add one leaf, the images depicting it and its description to data_handler."""
+        identifier_uri = data_handler.add_external_class_item('Leaf', '', leaf_id)
+        data_handler.add_external_property(identifier_uri, 'isDepictedBy', images)
+        manuscript_description = ManuscriptDescription.create_cls_from_raw_text(description)
+        data_handler.add_data_instance2parent_uri(identifier_uri, 'leafHasDescription', manuscript_description)
+
+    def convert(self, target_data_file):
+        """Convert manuscript descriptions from csv_file to rdf data and write to target_data_file.
+        Rows whose label contains '_thumb' are skipped. Consecutive rows with the same
+        folio name form one leaf; its description comes from the first row of the group
+        and its images are looked up by row label in the faksimile mapping.
+        """
+        verbose = not Py2TTLCSVManuscriptDescriptionConverter.UNITTESTING
+        if verbose:
+            print(Fore.CYAN + 'initializing python objects with file "{}" ...'.format(self.csv_file))
+        data_handler = RDFDataHandler(target_data_file, self.mapping_dictionary)
+        leaf_id, description, images, counter = '', '', [], 0
+        with open(self.csv_file, newline='') as csvfile:
+            for row in (r for r in csv.DictReader(csvfile) if '_thumb' not in r[self.LABEL]):
+                if row[self.NAME] != leaf_id:
+                    if leaf_id != '':
+                        counter += 1
+                        self._add_leaf(data_handler, leaf_id, images, description)
+                    leaf_id, description, images = row[self.NAME], row[self.DESCRIPTION_KEY], []
+                images.extend(self.faksimile_mapping_dict.get(row[self.LABEL], []))
+        # Flush the pending leaf even when no image was mapped to it, exactly like the
+        # in-loop flush does; testing images alone would silently drop such a last leaf.
+        if leaf_id != '' or images:
+            counter += 1
+            self._add_leaf(data_handler, leaf_id, images, description)
+        if verbose:
+            print(Fore.GREEN + f'[{counter} leafs added]')
+            print(Fore.CYAN + 'adding triples to rdf graph ... ')
+            print(Fore.GREEN + '[{} statements added]'.format(str(len(data_handler.data_graph))))
+            print(Fore.CYAN + 'writing graph to file "{}" ...'.format(target_data_file))
+        data_handler.write()
+        if verbose:
+            print(Fore.GREEN + '[OK]')
+            print(Style.RESET_ALL)
+
+def usage():
+    """Print the usage text of this script, i.e. the docstring of main."""
+    help_text = main.__doc__
+    print(help_text)
+
+def main(argv):
+    """This program can be used to convert py objects to a owl:Ontology and rdf data in turtle format.
+
+    py2ttl/create_manuscript_description.py [OPTIONS] <csv-file> <mapping-csv> 
+
+        <csv-file>            csv file that contains the description of the manuscript.
+        <mapping-csv>         a image to faksimile iri mapping csv file
+
+        OPTIONS:
+        -h|--help:          show help
+        -o|--output=FILE    specify output file
+
+        :return: exit code (int)
+    """
+    check_config_files_exist()
+    datatypes_dir = get_datatypes_dir()
+    source_ontology_file = PROJECT_ONTOLOGY_FILE
+    target_ontology_file = '.{0}{1}-ontology_autogenerated.ttl'.format(sep, PROJECT_NAME)
+    output_file = './include-ttl/descriptions.ttl'
+    try:
+        opts, args = getopt.getopt(argv, "ho:", ["help", "output="])
+    except getopt.GetoptError:
+        usage()
+        return 2
+    for opt, arg in opts:
+        if opt in ('-h', '--help'):
+            usage()
+            return 0
+        elif opt in ('-o', '--output'):  # getopt reports the short option as '-o' (letter o)
+            output_file = arg
+    if len(args) < 2:
+        usage()
+        return 2
+    csv_file = args[0]
+    mapping_csv_file = args[1]
+    ontology_converter = Py2TTLOntologyConverter(project_ontology_file=source_ontology_file)
+    print(Fore.CYAN + 'Create ontology  ...')
+    if ontology_converter.create_ontology(datatypes_dir, target_ontology_file) == 0:
+        print(Fore.GREEN + '[Ontology file {0} created]'.format(target_ontology_file))
+    else:
+        return 2
+    print(Fore.CYAN + f'Create data from  "{csv_file}" with  ...')
+    data_converter = Py2TTLCSVManuscriptDescriptionConverter(csv_file, mapping_csv_file, mapping_dictionary=ontology_converter.uri_mapping4cls_and_properties)
+    # convert() has no return statement, so map its None result to exit code 0
+    # in order to honour the documented int return value.
+    output = data_converter.convert(output_file)
+    return 0 if output is None else output
+
+
+if __name__ == "__main__":
+    sys.exit(main(sys.argv[1:]))
Index: tests_py2ttl/test_data/mapping_dict.xml
===================================================================
--- tests_py2ttl/test_data/mapping_dict.xml	(revision 113)
+++ tests_py2ttl/test_data/mapping_dict.xml	(revision 114)
@@ -1,417 +1,421 @@
 <?xml version="1.0" encoding="utf-8"?>
 <root>
 	<dict>
 		<ontology>
 			<project_name type="str">tln</project_name>
 			<project_uri type="URIRef">http://www.nie.org/ontology/nietzsche#</project_uri>
 			<ontology_file type="str">./tln-ontology_autogenerated.ttl</ontology_file>
 		</ontology>
 		<classes>
 			<ManuscriptUnity>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#ManuscriptUnity</class_uri>
 				<properties>
 					<title type="URIRef">http://www.nie.org/ontology/nietzsche#hasTitle</title>
 					<manuscript_type type="URIRef">http://www.nie.org/ontology/nietzsche#hasManuscriptType</manuscript_type>
 					<pages type="URIRef">http://www.nie.org/ontology/nietzsche#hasPages</pages>
 					<description type="URIRef">http://www.nie.org/ontology/nietzsche#hasDescription</description>
 				</properties>
 			</ManuscriptUnity>
 			<ArchivalManuscriptUnity>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#ArchivalManuscriptUnity</class_uri>
 				<properties>
 					<title type="URIRef">http://www.nie.org/ontology/nietzsche#hasTitle</title>
 					<manuscript_type type="URIRef">http://www.nie.org/ontology/nietzsche#hasManuscriptType</manuscript_type>
 					<pages type="URIRef">http://www.nie.org/ontology/nietzsche#hasPages</pages>
+					<status type="URIRef">http://www.nie.org/ontology/nietzsche#archivalManuscriptUnityHasDataProcessingStatus</status>
 					<styles type="URIRef">http://www.nie.org/ontology/nietzsche#hasStyles</styles>
 					<gsa_signature type="URIRef">http://www.nie.org/ontology/nietzsche#hasGsaSignature</gsa_signature>
 					<description type="URIRef">http://www.nie.org/ontology/nietzsche#hasDescription</description>
 					<reconstructed_konvoluts type="URIRef">http://www.nie.org/ontology/nietzsche#partsBelongToReconstructedKonvolut</reconstructed_konvoluts>
 					<earlier_descriptions type="URIRef">http://www.nie.org/ontology/nietzsche#hasEarlierDescriptions</earlier_descriptions>
 				</properties>
 			</ArchivalManuscriptUnity>
 			<EditorComment>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#EditorComment</class_uri>
 				<properties>
 					<is_uncertain type="URIRef">http://www.nie.org/ontology/nietzsche#isUncertain</is_uncertain>
 					<comment type="URIRef">http://www.nie.org/ontology/nietzsche#hasComment</comment>
 					<text type="URIRef">http://www.nie.org/ontology/nietzsche#commentHasText</text>
 				</properties>
 			</EditorComment>
 			<AtypicalWriting>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#AtypicalWriting</class_uri>
 				<properties>
 					<is_uncertain type="URIRef">http://www.nie.org/ontology/nietzsche#isUncertain</is_uncertain>
 					<comment type="URIRef">http://www.nie.org/ontology/nietzsche#hasComment</comment>
 					<text type="URIRef">http://www.nie.org/ontology/nietzsche#commentHasText</text>
 				</properties>
 			</AtypicalWriting>
 			<Path>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#Path</class_uri>
 				<properties>
 					<d_attribute type="URIRef">http://www.nie.org/ontology/nietzsche#hasDAttribute</d_attribute>
 				</properties>
 			</Path>
 			<Box>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#Box</class_uri>
 				<properties>
 					<d_attribute type="URIRef">http://www.nie.org/ontology/nietzsche#hasDAttribute</d_attribute>
 					<earlier_text type="URIRef">http://www.nie.org/ontology/nietzsche#hasEarlierText</earlier_text>
 				</properties>
 			</Box>
 			<Clarification>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#Clarification</class_uri>
 				<properties>
 					<is_uncertain type="URIRef">http://www.nie.org/ontology/nietzsche#isUncertain</is_uncertain>
 					<comment type="URIRef">http://www.nie.org/ontology/nietzsche#hasComment</comment>
 					<text type="URIRef">http://www.nie.org/ontology/nietzsche#commentHasText</text>
 				</properties>
 			</Clarification>
 			<Color>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#Color</class_uri>
 				<properties>
 					<name type="URIRef">http://www.nie.org/ontology/nietzsche#colorHasName</name>
 					<hex_color type="URIRef">http://www.nie.org/ontology/nietzsche#hasHexadecimalValue</hex_color>
 				</properties>
 			</Color>
 			<Text>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#Text</class_uri>
 				<properties>
 					<content type="URIRef">http://www.nie.org/ontology/nietzsche#textHasContent</content>
 					<standoff_markups type="URIRef">http://www.nie.org/ontology/nietzsche#textHasMarkup</standoff_markups>
 				</properties>
 			</Text>
 			<Description>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#Description</class_uri>
 				<properties>
 					<content type="URIRef">http://www.nie.org/ontology/nietzsche#textHasContent</content>
 					<standoff_markups type="URIRef">http://www.nie.org/ontology/nietzsche#textHasMarkup</standoff_markups>
 				</properties>
 			</Description>
 			<EarlierDescription>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#EarlierDescription</class_uri>
 				<properties>
 					<content type="URIRef">http://www.nie.org/ontology/nietzsche#textHasContent</content>
 					<author type="URIRef">http://www.nie.org/ontology/nietzsche#hasAuthor</author>
 					<citation type="URIRef">http://www.nie.org/ontology/nietzsche#hasCitation</citation>
 					<standoff_markups type="URIRef">http://www.nie.org/ontology/nietzsche#textHasMarkup</standoff_markups>
 				</properties>
 			</EarlierDescription>
 			<EditorCorrection>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#EditorCorrection</class_uri>
 				<properties>
 					<is_uncertain type="URIRef">http://www.nie.org/ontology/nietzsche#isUncertain</is_uncertain>
 					<comment type="URIRef">http://www.nie.org/ontology/nietzsche#hasComment</comment>
 					<correction_text type="URIRef">http://www.nie.org/ontology/nietzsche#hasCorrectionText</correction_text>
 					<text type="URIRef">http://www.nie.org/ontology/nietzsche#commentHasText</text>
 				</properties>
 			</EditorCorrection>
 			<Image>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#Image</class_uri>
 				<properties>
 					<height type="URIRef">http://www.nie.org/ontology/nietzsche#hasHeight</height>
 					<width type="URIRef">http://www.nie.org/ontology/nietzsche#hasWidth</width>
 					<file_name type="URIRef">http://www.nie.org/ontology/nietzsche#hasFileName</file_name>
 					<transform_string type="URIRef">http://www.nie.org/ontology/nietzsche#hasTransform</transform_string>
 					<primaryURL type="URIRef">http://www.nie.org/ontology/nietzsche#hasPrimaryurl</primaryURL>
 					<secondaryURL type="URIRef">http://www.nie.org/ontology/nietzsche#hasSecondaryurl</secondaryURL>
 					<text_field type="URIRef">http://www.nie.org/ontology/nietzsche#hasTextField</text_field>
 				</properties>
 			</Image>
 			<FaksimileImage>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#FaksimileImage</class_uri>
 				<properties>
 					<height type="URIRef">http://www.nie.org/ontology/nietzsche#hasHeight</height>
 					<width type="URIRef">http://www.nie.org/ontology/nietzsche#hasWidth</width>
 					<file_name type="URIRef">http://www.nie.org/ontology/nietzsche#hasFileName</file_name>
 					<transform_string type="URIRef">http://www.nie.org/ontology/nietzsche#hasTransform</transform_string>
 					<primaryURL type="URIRef">http://www.nie.org/ontology/nietzsche#hasPrimaryurl</primaryURL>
 					<secondaryURL type="URIRef">http://www.nie.org/ontology/nietzsche#hasSecondaryurl</secondaryURL>
 					<apiURL type="URIRef">http://www.nie.org/ontology/nietzsche#hasApiurl</apiURL>
 					<thumbURL type="URIRef">http://www.nie.org/ontology/nietzsche#hasThumburl</thumbURL>
 					<mediumURL type="URIRef">http://www.nie.org/ontology/nietzsche#hasMediumurl</mediumURL>
 					<text_field type="URIRef">http://www.nie.org/ontology/nietzsche#hasTextField</text_field>
 				</properties>
 			</FaksimileImage>
 			<PositionalObject>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#PositionalObject</class_uri>
 				<properties>
 					<height type="URIRef">http://www.nie.org/ontology/nietzsche#hasHeight</height>
 					<width type="URIRef">http://www.nie.org/ontology/nietzsche#hasWidth</width>
 					<left type="URIRef">http://www.nie.org/ontology/nietzsche#hasLeft</left>
 					<top type="URIRef">http://www.nie.org/ontology/nietzsche#hasTop</top>
 					<bottom type="URIRef">http://www.nie.org/ontology/nietzsche#hasBottom</bottom>
 					<transform_string type="URIRef">http://www.nie.org/ontology/nietzsche#hasTransform</transform_string>
 				</properties>
 			</PositionalObject>
 			<WordPosition>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#WordPosition</class_uri>
 				<properties>
 					<height type="URIRef">http://www.nie.org/ontology/nietzsche#hasHeight</height>
 					<width type="URIRef">http://www.nie.org/ontology/nietzsche#hasWidth</width>
 					<left type="URIRef">http://www.nie.org/ontology/nietzsche#hasLeft</left>
 					<top type="URIRef">http://www.nie.org/ontology/nietzsche#hasTop</top>
 					<bottom type="URIRef">http://www.nie.org/ontology/nietzsche#hasBottom</bottom>
 					<transform_string type="URIRef">http://www.nie.org/ontology/nietzsche#hasTransform</transform_string>
 				</properties>
 			</WordPosition>
 			<FaksimilePosition>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#FaksimilePosition</class_uri>
 				<properties>
 					<height type="URIRef">http://www.nie.org/ontology/nietzsche#hasHeight</height>
 					<width type="URIRef">http://www.nie.org/ontology/nietzsche#hasWidth</width>
 					<left type="URIRef">http://www.nie.org/ontology/nietzsche#hasLeft</left>
 					<top type="URIRef">http://www.nie.org/ontology/nietzsche#hasTop</top>
 					<bottom type="URIRef">http://www.nie.org/ontology/nietzsche#hasBottom</bottom>
 					<transform_string type="URIRef">http://www.nie.org/ontology/nietzsche#hasTransform</transform_string>
 				</properties>
 			</FaksimilePosition>
 			<Imprint>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#Imprint</class_uri>
 				<properties>
 					<reference type="URIRef">http://www.nie.org/ontology/nietzsche#imprintHasReference</reference>
 					<lines type="URIRef">http://www.nie.org/ontology/nietzsche#imprintRefersToLines</lines>
 				</properties>
 			</Imprint>
 			<Line>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#Line</class_uri>
 				<properties>
 					<id type="URIRef">http://www.nie.org/ontology/nietzsche#lineHasNumber</id>
 					<bottom type="URIRef">http://www.nie.org/ontology/nietzsche#lineHasBottomValueOnTranskription</bottom>
 					<top type="URIRef">http://www.nie.org/ontology/nietzsche#lineHasTopValueOnTranskription</top>
 					<faksimile_inner_bottom type="URIRef">http://www.nie.org/ontology/nietzsche#lineHasInnerBottomValueOnFaksimile</faksimile_inner_bottom>
 					<faksimile_inner_top type="URIRef">http://www.nie.org/ontology/nietzsche#lineHasInnerTopValueOnFaksimile</faksimile_inner_top>
 					<faksimile_outer_bottom type="URIRef">http://www.nie.org/ontology/nietzsche#lineHasOuterBottomValueOnFaksimile</faksimile_outer_bottom>
 					<faksimile_outer_top type="URIRef">http://www.nie.org/ontology/nietzsche#lineHasOuterTopValueOnFaksimile</faksimile_outer_top>
 					<is_even type="URIRef">http://www.nie.org/ontology/nietzsche#isMainLine</is_even>
 					<editor_comments type="URIRef">http://www.nie.org/ontology/nietzsche#lineHasEditorComment</editor_comments>
 				</properties>
 			</Line>
 			<LineContinuation>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#LineContinuation</class_uri>
 				<properties>
 					<is_uncertain type="URIRef">http://www.nie.org/ontology/nietzsche#isUncertain</is_uncertain>
 					<comment type="URIRef">http://www.nie.org/ontology/nietzsche#hasComment</comment>
 					<to_reference type="URIRef">http://www.nie.org/ontology/nietzsche#isLineAContinuationTo</to_reference>
 					<text type="URIRef">http://www.nie.org/ontology/nietzsche#commentHasText</text>
 					<reference type="URIRef">http://www.nie.org/ontology/nietzsche#lineContinuationHasReference</reference>
 				</properties>
 			</LineContinuation>
 			<SimpleWord>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#SimpleWord</class_uri>
 				<properties>
 					<text type="URIRef">http://www.nie.org/ontology/nietzsche#hasText</text>
 					<clean_text type="URIRef">http://www.nie.org/ontology/nietzsche#hasCleanText</clean_text>
 					<lines type="URIRef">http://www.nie.org/ontology/nietzsche#wordBelongsToLine</lines>
 					<transkription_positions type="URIRef">http://www.nie.org/ontology/nietzsche#hasTranskriptionPosition</transkription_positions>
 					<faksimile_positions type="URIRef">http://www.nie.org/ontology/nietzsche#hasFaksimilePosition</faksimile_positions>
 				</properties>
 			</SimpleWord>
 			<SpecialWord>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#SpecialWord</class_uri>
 				<properties>
 					<text type="URIRef">http://www.nie.org/ontology/nietzsche#hasText</text>
 					<clean_text type="URIRef">http://www.nie.org/ontology/nietzsche#hasCleanText</clean_text>
 					<lines type="URIRef">http://www.nie.org/ontology/nietzsche#wordBelongsToLine</lines>
 					<transkription_positions type="URIRef">http://www.nie.org/ontology/nietzsche#hasTranskriptionPosition</transkription_positions>
 					<faksimile_positions type="URIRef">http://www.nie.org/ontology/nietzsche#hasFaksimilePosition</faksimile_positions>
 				</properties>
 			</SpecialWord>
 			<MarkForeignHands>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#MarkForeignHands</class_uri>
 				<properties>
 					<text type="URIRef">http://www.nie.org/ontology/nietzsche#hasText</text>
 					<clean_text type="URIRef">http://www.nie.org/ontology/nietzsche#hasCleanText</clean_text>
 					<pen type="URIRef">http://www.nie.org/ontology/nietzsche#penOfForeignHands</pen>
 					<resolution type="URIRef">http://www.nie.org/ontology/nietzsche#resolutionOfAbbreviation</resolution>
 					<comment type="URIRef">http://www.nie.org/ontology/nietzsche#foreignHandHasCommentByEditors</comment>
 					<lines type="URIRef">http://www.nie.org/ontology/nietzsche#wordBelongsToLine</lines>
 					<transkription_positions type="URIRef">http://www.nie.org/ontology/nietzsche#hasTranskriptionPosition</transkription_positions>
 					<faksimile_positions type="URIRef">http://www.nie.org/ontology/nietzsche#hasFaksimilePosition</faksimile_positions>
 					<foreign_hands_text type="URIRef">http://www.nie.org/ontology/nietzsche#textOfForeignHands</foreign_hands_text>
+					<overwrites_mark type="URIRef">http://www.nie.org/ontology/nietzsche#foreignHandOverwritesForeignHand</overwrites_mark>
 				</properties>
 			</MarkForeignHands>
 			<Page>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#Page</class_uri>
 				<properties>
 					<number type="URIRef">http://www.nie.org/ontology/nietzsche#hasNumber</number>
+					<status type="URIRef">http://www.nie.org/ontology/nietzsche#pageHasDataProcessingStatus</status>
 					<orientation type="URIRef">http://www.nie.org/ontology/nietzsche#hasOrientation</orientation>
 					<lines type="URIRef">http://www.nie.org/ontology/nietzsche#hasLines</lines>
 					<imprints type="URIRef">http://www.nie.org/ontology/nietzsche#hasImprints</imprints>
 					<mark_foreign_hands type="URIRef">http://www.nie.org/ontology/nietzsche#hasMarkForeignHands</mark_foreign_hands>
 					<words type="URIRef">http://www.nie.org/ontology/nietzsche#hasWords</words>
 					<word_deletion_paths type="URIRef">http://www.nie.org/ontology/nietzsche#hasWordDeletionPaths</word_deletion_paths>
 					<word_insertion_marks type="URIRef">http://www.nie.org/ontology/nietzsche#hasWordInsertionMarks</word_insertion_marks>
 					<editor_comments type="URIRef">http://www.nie.org/ontology/nietzsche#hasEditorComments</editor_comments>
 					<faksimile_image type="URIRef">http://www.nie.org/ontology/nietzsche#hasFaksimileImage</faksimile_image>
 					<svg_text_field type="URIRef">http://www.nie.org/ontology/nietzsche#pageIsOnSVGTextField</svg_text_field>
 					<faksimile_text_field type="URIRef">http://www.nie.org/ontology/nietzsche#pageIsOnFaksimileTextField</faksimile_text_field>
 					<svg_image type="URIRef">http://www.nie.org/ontology/nietzsche#hasSvgImage</svg_image>
 				</properties>
 			</Page>
 			<NonExistentPage>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#NonExistentPage</class_uri>
 				<properties>
 					<number type="URIRef">http://www.nie.org/ontology/nietzsche#hasNumber</number>
+					<status type="URIRef">http://www.nie.org/ontology/nietzsche#pageHasDataProcessingStatus</status>
 					<orientation type="URIRef">http://www.nie.org/ontology/nietzsche#hasOrientation</orientation>
 					<lines type="URIRef">http://www.nie.org/ontology/nietzsche#hasLines</lines>
 					<imprints type="URIRef">http://www.nie.org/ontology/nietzsche#hasImprints</imprints>
 					<mark_foreign_hands type="URIRef">http://www.nie.org/ontology/nietzsche#hasMarkForeignHands</mark_foreign_hands>
 					<words type="URIRef">http://www.nie.org/ontology/nietzsche#hasWords</words>
 					<word_deletion_paths type="URIRef">http://www.nie.org/ontology/nietzsche#hasWordDeletionPaths</word_deletion_paths>
 					<word_insertion_marks type="URIRef">http://www.nie.org/ontology/nietzsche#hasWordInsertionMarks</word_insertion_marks>
 					<editor_comments type="URIRef">http://www.nie.org/ontology/nietzsche#hasEditorComments</editor_comments>
-					<status type="URIRef">http://www.nie.org/ontology/nietzsche#hasStatus</status>
 					<faksimile_image type="URIRef">http://www.nie.org/ontology/nietzsche#hasFaksimileImage</faksimile_image>
 					<svg_text_field type="URIRef">http://www.nie.org/ontology/nietzsche#pageIsOnSVGTextField</svg_text_field>
 					<faksimile_text_field type="URIRef">http://www.nie.org/ontology/nietzsche#pageIsOnFaksimileTextField</faksimile_text_field>
 					<svg_image type="URIRef">http://www.nie.org/ontology/nietzsche#hasSvgImage</svg_image>
 				</properties>
 			</NonExistentPage>
 			<ReconstructedKonvolut>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#ReconstructedKonvolut</class_uri>
 				<properties>
 					<title type="URIRef">http://www.nie.org/ontology/nietzsche#hasTitle</title>
 					<manuscript_type type="URIRef">http://www.nie.org/ontology/nietzsche#hasManuscriptType</manuscript_type>
 					<pages type="URIRef">http://www.nie.org/ontology/nietzsche#hasPages</pages>
 					<description type="URIRef">http://www.nie.org/ontology/nietzsche#hasDescription</description>
 				</properties>
 			</ReconstructedKonvolut>
 			<Reference>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#Reference</class_uri>
 				<properties>
 					<first_line type="URIRef">http://www.nie.org/ontology/nietzsche#firstLineOfReference</first_line>
 					<last_line type="URIRef">http://www.nie.org/ontology/nietzsche#lastLineOfReference</last_line>
 					<word_reference type="URIRef">http://www.nie.org/ontology/nietzsche#wordReference</word_reference>
 					<is_uncertain type="URIRef">http://www.nie.org/ontology/nietzsche#IsUncertain</is_uncertain>
 					<title type="URIRef">http://www.nie.org/ontology/nietzsche#hasTitle</title>
 					<page_number type="URIRef">http://www.nie.org/ontology/nietzsche#hasPageNumber</page_number>
 				</properties>
 			</Reference>
 			<SVGImage>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#SVGImage</class_uri>
 				<properties>
 					<height type="URIRef">http://www.nie.org/ontology/nietzsche#hasHeight</height>
 					<width type="URIRef">http://www.nie.org/ontology/nietzsche#hasWidth</width>
 					<file_name type="URIRef">http://www.nie.org/ontology/nietzsche#hasFileName</file_name>
 					<transform_string type="URIRef">http://www.nie.org/ontology/nietzsche#hasTransform</transform_string>
 					<primaryURL type="URIRef">http://www.nie.org/ontology/nietzsche#hasPrimaryurl</primaryURL>
 					<secondaryURL type="URIRef">http://www.nie.org/ontology/nietzsche#hasSecondaryurl</secondaryURL>
 					<text_field type="URIRef">http://www.nie.org/ontology/nietzsche#hasTextField</text_field>
 				</properties>
 			</SVGImage>
 			<StandoffTag>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#StandoffTag</class_uri>
 				<properties>
 					<startIndex type="URIRef">http://www.nie.org/ontology/nietzsche#standoffTagHasStartIndex</startIndex>
 					<endIndex type="URIRef">http://www.nie.org/ontology/nietzsche#standoffTagHasEndIndex</endIndex>
 					<css_string type="URIRef">http://www.nie.org/ontology/nietzsche#standoffTagHasCSS</css_string>
 				</properties>
 			</StandoffTag>
 			<Style>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#Style</class_uri>
 				<properties>
 					<font type="URIRef">http://www.nie.org/ontology/nietzsche#styleHasFont</font>
 					<writing_instrument type="URIRef">http://www.nie.org/ontology/nietzsche#styleHasWritingInstrument</writing_instrument>
 					<css_string type="URIRef">http://www.nie.org/ontology/nietzsche#styleHasCSS</css_string>
 					<color type="URIRef">http://www.nie.org/ontology/nietzsche#styleHasColor</color>
 				</properties>
 			</Style>
 			<TextConnectionMark>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#TextConnectionMark</class_uri>
 				<properties>
 					<text type="URIRef">http://www.nie.org/ontology/nietzsche#hasText</text>
 					<clean_text type="URIRef">http://www.nie.org/ontology/nietzsche#hasCleanText</clean_text>
 					<lines type="URIRef">http://www.nie.org/ontology/nietzsche#wordBelongsToLine</lines>
 					<transkription_positions type="URIRef">http://www.nie.org/ontology/nietzsche#hasTranskriptionPosition</transkription_positions>
 					<faksimile_positions type="URIRef">http://www.nie.org/ontology/nietzsche#hasFaksimilePosition</faksimile_positions>
 					<text_source type="URIRef">http://www.nie.org/ontology/nietzsche#textConnectionMarkHasTextSource</text_source>
 				</properties>
 			</TextConnectionMark>
 			<TextField>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#TextField</class_uri>
 				<properties>
 					<height type="URIRef">http://www.nie.org/ontology/nietzsche#hasHeight</height>
 					<width type="URIRef">http://www.nie.org/ontology/nietzsche#hasWidth</width>
 					<left type="URIRef">http://www.nie.org/ontology/nietzsche#hasLeft</left>
 					<top type="URIRef">http://www.nie.org/ontology/nietzsche#hasTop</top>
 					<bottom type="URIRef">http://www.nie.org/ontology/nietzsche#hasBottom</bottom>
 					<transform_string type="URIRef">http://www.nie.org/ontology/nietzsche#hasTransform</transform_string>
 				</properties>
 			</TextField>
 			<TranskriptionPosition>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#TranskriptionPosition</class_uri>
 				<properties>
 					<height type="URIRef">http://www.nie.org/ontology/nietzsche#hasHeight</height>
 					<width type="URIRef">http://www.nie.org/ontology/nietzsche#hasWidth</width>
 					<left type="URIRef">http://www.nie.org/ontology/nietzsche#hasLeft</left>
 					<top type="URIRef">http://www.nie.org/ontology/nietzsche#hasTop</top>
 					<bottom type="URIRef">http://www.nie.org/ontology/nietzsche#hasBottom</bottom>
 					<transform_string type="URIRef">http://www.nie.org/ontology/nietzsche#hasTransform</transform_string>
 				</properties>
 			</TranskriptionPosition>
 			<UncertainDecipherment>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#UncertainDecipherment</class_uri>
 				<properties>
 					<is_uncertain type="URIRef">http://www.nie.org/ontology/nietzsche#isUncertain</is_uncertain>
 					<comment type="URIRef">http://www.nie.org/ontology/nietzsche#hasComment</comment>
 					<text type="URIRef">http://www.nie.org/ontology/nietzsche#commentHasText</text>
 				</properties>
 			</UncertainDecipherment>
 			<Word>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#Word</class_uri>
 				<properties>
 					<text type="URIRef">http://www.nie.org/ontology/nietzsche#hasText</text>
 					<clean_text type="URIRef">http://www.nie.org/ontology/nietzsche#hasCleanText</clean_text>
 					<edited_text type="URIRef">http://www.nie.org/ontology/nietzsche#hasEditedText</edited_text>
 					<clean_edited_text type="URIRef">http://www.nie.org/ontology/nietzsche#hasCleanEditedText</clean_edited_text>
 					<word_parts type="URIRef">http://www.nie.org/ontology/nietzsche#wordHasWordParts</word_parts>
 					<lines type="URIRef">http://www.nie.org/ontology/nietzsche#wordBelongsToLine</lines>
 					<transkription_positions type="URIRef">http://www.nie.org/ontology/nietzsche#hasTranskriptionPosition</transkription_positions>
 					<faksimile_positions type="URIRef">http://www.nie.org/ontology/nietzsche#hasFaksimilePosition</faksimile_positions>
 					<styles type="URIRef">http://www.nie.org/ontology/nietzsche#wordHasStyle</styles>
 					<overwrites_word type="URIRef">http://www.nie.org/ontology/nietzsche#overwritesWord</overwrites_word>
+					<undosCorrectionOfWord type="URIRef">http://www.nie.org/ontology/nietzsche#undosCorrectionOfWord</undosCorrectionOfWord>
 					<isTransformationOfWord type="URIRef">http://www.nie.org/ontology/nietzsche#isTransformationOfWord</isTransformationOfWord>
 					<isExtensionOfWord type="URIRef">http://www.nie.org/ontology/nietzsche#isExtensionOfWord</isExtensionOfWord>
 					<isDeletionOfWord type="URIRef">http://www.nie.org/ontology/nietzsche#isDeletionOfWord</isDeletionOfWord>
 					<isClarificationOfWord type="URIRef">http://www.nie.org/ontology/nietzsche#isClarificationOfWord</isClarificationOfWord>
 					<earlier_version type="URIRef">http://www.nie.org/ontology/nietzsche#wordHasEarlierVersion</earlier_version>
 					<corrections type="URIRef">http://www.nie.org/ontology/nietzsche#wordHasCorrection</corrections>
 					<undeleted_from_deletion_paths type="URIRef">http://www.nie.org/ontology/nietzsche#wordIsUndeletedFromPath</undeleted_from_deletion_paths>
 					<deletion_paths type="URIRef">http://www.nie.org/ontology/nietzsche#wordIsDeletedByPath</deletion_paths>
 					<editor_comments type="URIRef">http://www.nie.org/ontology/nietzsche#wordHasEditorComment</editor_comments>
 					<markup4partThatOverwritesWord type="URIRef">http://www.nie.org/ontology/nietzsche#hasStandoffMarkup4PartThatOverwritesWord</markup4partThatOverwritesWord>
 				</properties>
 			</Word>
 			<WordDeletionPath>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#WordDeletionPath</class_uri>
 				<properties>
 					<d_attribute type="URIRef">http://www.nie.org/ontology/nietzsche#hasDAttribute</d_attribute>
 					<style type="URIRef">http://www.nie.org/ontology/nietzsche#hasStyle</style>
 				</properties>
 			</WordDeletionPath>
 			<WordInsertionMark>
 				<class_uri type="URIRef">http://www.nie.org/ontology/nietzsche#WordInsertionMark</class_uri>
 				<properties>
 					<height type="URIRef">http://www.nie.org/ontology/nietzsche#hasHeight</height>
 					<width type="URIRef">http://www.nie.org/ontology/nietzsche#hasWidth</width>
 					<left type="URIRef">http://www.nie.org/ontology/nietzsche#hasLeft</left>
 					<top type="URIRef">http://www.nie.org/ontology/nietzsche#hasTop</top>
 					<bottom type="URIRef">http://www.nie.org/ontology/nietzsche#hasBottom</bottom>
 					<transform_string type="URIRef">http://www.nie.org/ontology/nietzsche#hasTransform</transform_string>
 					<mark_type type="URIRef">http://www.nie.org/ontology/nietzsche#hasMarkType</mark_type>
 					<symbol_id type="URIRef">http://www.nie.org/ontology/nietzsche#hasSymbolId</symbol_id>
 					<next_word_id type="URIRef">http://www.nie.org/ontology/nietzsche#hasNextWord</next_word_id>
 					<previous_word_id type="URIRef">http://www.nie.org/ontology/nietzsche#hasPreviousWord</previous_word_id>
 					<line type="URIRef">http://www.nie.org/ontology/nietzsche#wordInsertionMarkBelongsToLine</line>
 				</properties>
 			</WordInsertionMark>
 		</classes>
 	</dict>
 	<metadata>
 		<type>xml-dictionary</type>
 		<createdBy>
 			<script>dict2xml</script>
-			<date>2021-09-30 15:34:35</date>
+			<date>2021-12-14 11:26:46</date>
 		</createdBy>
 	</metadata>
 </root>
Index: tests_py2ttl/test_data/descriptions.csv
===================================================================
--- tests_py2ttl/test_data/descriptions.csv	(revision 0)
+++ tests_py2ttl/test_data/descriptions.csv	(revision 114)
@@ -0,0 +1,10 @@
+folio-name,label,alias,nietzschesource-url,license,description
+"Mp-XIV,416_417","Mp-XIV-1,416.jpg","Mp XIV, 416","http://www.nietzschesource.org/DFGAapi/api/page/download/Mp-XIV-1,416",CC BY-NC-ND 4.0,"Heftblatt, 17,4x22, liniiert; Rekto links beschnitten. Ursprünglich gegenüberliegende Seiten: 418 / 416, 417 / Mp XVI, 21ar."
+"Mp-XIV,416_417","Mp-XIV-1,416_thumb.jpg","Mp XIV, 416","http://www.nietzschesource.org/DFGAapi/images/DFGA/Mp-XIV-1/mini/Mp-XIV-1,416.jpg",CC BY-NC-ND 4.0,"Heftblatt, 17,4x22, liniiert; Rekto links beschnitten. Ursprünglich gegenüberliegende Seiten: 418 / 416, 417 / Mp XVI, 21ar."
+"Mp-XIV,416_417","Mp-XIV-1,417.jpg","Mp XIV, 417","http://www.nietzschesource.org/DFGAapi/api/page/download/Mp-XIV-1,417",CC BY-NC-ND 4.0,"Heftblatt, 17,4x22, liniiert; Rekto links beschnitten. Ursprünglich gegenüberliegende Seiten: 418 / 416, 417 / Mp XVI, 21ar."
+"Mp-XIV,416_417","Mp-XIV-1,417_thumb.jpg","Mp XIV, 417","http://www.nietzschesource.org/DFGAapi/images/DFGA/Mp-XIV-1/mini/Mp-XIV-1,417.jpg",CC BY-NC-ND 4.0,"Heftblatt, 17,4x22, liniiert; Rekto links beschnitten. Ursprünglich gegenüberliegende Seiten: 418 / 416, 417 / Mp XVI, 21ar."
+"Mp-XIV,418_419","Mp-XIV-1,418.jpg","Mp XIV, 418","http://www.nietzschesource.org/DFGAapi/api/page/download/Mp-XIV-1,418",CC BY-NC-ND 4.0,"Heftblatt, 17,4x22, liniiert; Rekto rechts beschnitten. Ursprünglich gegenüberliegende Seiten: 418 / 416, 419a / 419."
+"Mp-XIV,418_419","Mp-XIV-1,418_thumb.jpg","Mp XIV, 418","http://www.nietzschesource.org/DFGAapi/images/DFGA/Mp-XIV-1/mini/Mp-XIV-1,418.jpg",CC BY-NC-ND 4.0,"Heftblatt, 17,4x22, liniiert; Rekto rechts beschnitten. Ursprünglich gegenüberliegende Seiten: 418 / 416, 419a / 419."
+"Mp-XIV,419a_419b","Mp-XIV-1,419a.jpg","Mp XIV, 419a","http://www.nietzschesource.org/DFGAapi/api/page/download/Mp-XIV-1,419a",CC BY-NC-ND 4.0,"Heftblatt, 17,4x22, liniiert; Rekto rechts beschnitten. Ursprünglich gegenüberliegende Seiten: 419a / 419."
+"Mp-XIV,419a_419b","Mp-XIV-1,419a_thumb.jpg","Mp XIV, 419a","http://www.nietzschesource.org/DFGAapi/images/DFGA/Mp-XIV-1/mini/Mp-XIV-1,419a.jpg",CC BY-NC-ND 4.0,"Heftblatt, 17,4x22, liniiert; Rekto rechts beschnitten. Ursprünglich gegenüberliegende Seiten: 419a / 419."
+"Mp-XIV,419a_419b","Mp-XIV-1,419b.jpg","Mp XIV, 419b","http://www.nietzschesource.org/DFGAapi/api/page/download/Mp-XIV-1,419b",CC BY-NC-ND 4.0,"Heftblatt, 17,4x22, liniiert; Rekto rechts beschnitten. Ursprünglich gegenüberliegende Seiten: 419a / 419."
Index: tests_py2ttl/test_data_handler.py
===================================================================
--- tests_py2ttl/test_data_handler.py	(revision 113)
+++ tests_py2ttl/test_data_handler.py	(revision 114)
@@ -1,55 +1,64 @@
 import unittest
 from os import sep, path
 from os.path import dirname, isfile
 import inspect
 from rdflib import Graph, URIRef, Literal, BNode, OWL, RDF, RDFS, XSD
 import rdflib
 import sys
 
 sys.path.append('shared_util')
 from myxmlwriter import xml2dict
 sys.path.append('svgscripts')
 from datatypes.image import Image
 from datatypes.page import Page
 from datatypes.archival_manuscript import ArchivalManuscriptUnity
 from datatypes.text_field import TextField
 sys.path.append('py2ttl')
 from data_handler import RDFDataHandler
 
     
 class TestRDFDataHandler(unittest.TestCase):
+    """Unit tests for RDFDataHandler."""
     def setUp(self):
+        """Set RDFDataHandler.UNITTESTING and build the fixture paths under test_data."""
         RDFDataHandler.UNITTESTING = True
         DATADIR = dirname(__file__) + sep + 'test_data'
         self.mapping_dictionary = xml2dict(DATADIR + sep + 'mapping_dict.xml')
         self.xml_file = DATADIR + sep + 'N_VII_1_page001.xml'
         self.manuscript_file = DATADIR + sep + 'N_VII_1.xml'
 
     def test_add_data(self):
+        """Smoke test: call add_data on a Page twice; nothing is asserted."""
         data_handler = RDFDataHandler('test.ttl', self.mapping_dictionary)
         page = Page(self.xml_file)
         data_handler.add_data(page, page.title.replace(' ', '_'))
         manuscript = ArchivalManuscriptUnity.create_cls(self.manuscript_file)
+        # NOTE(review): `manuscript` is never used; the call below passes `page` again.
+        # Confirm whether `manuscript` was intended here.
         data_handler.add_data(page, '', skip_data_instance_list=['Page'])
         #print(data_handler.data_graph.serialize(format="turtle"))
         #data_handler.write()
+        #manuscript = ArchivalManuscriptUnity.create_cls('xml/Mp_XVIII.xml')
+        #data_handler.add_data(manuscript, '')
 
     def test_init(self):
+        """RDFDataHandler(None, {}) raises; a minimal mapping sets project_name."""
         with self.assertRaises(Exception):
             RDFDataHandler(None, {})
         mapping_dictionary = { 'ontology': { 'project_name': 'test', 'project_uri': 'test' }}
         data_handler = RDFDataHandler('test.ttl', mapping_dictionary)
         self.assertEqual(data_handler.project_name, 'test')
 
     def test_create_identifier_uri(self):
+        """Once the first URI is in the graph, the same request yields a different URI."""
         tf = TextField()
         mapping_dictionary = { 'ontology': { 'project_name': 'test', 'project_uri': 'test' }}
         data_handler = RDFDataHandler('test.ttl', mapping_dictionary)
         identifier_uri = data_handler.create_identifier_uri(tf, 'asdf')
         data_handler.data_graph.add((identifier_uri, RDF.type, OWL.Class))
         next_identifier_uri = data_handler.create_identifier_uri(tf, 'asdf')
-        self.assertEqual(identifier_uri != next_identifier_uri, True)
+        self.assertNotEqual(identifier_uri, next_identifier_uri)
 
 
 if __name__ == "__main__":
     unittest.main()
Index: tests_py2ttl/test_create_manuscript_description.py
===================================================================
--- tests_py2ttl/test_create_manuscript_description.py	(revision 0)
+++ tests_py2ttl/test_create_manuscript_description.py	(revision 114)
@@ -0,0 +1,44 @@
+import unittest
+from os import sep, path
+import lxml.etree as ET
+import sys
+
+sys.path.append('py2ttl')
+import config
+
+# NOTE(review): this file is named test_create_manuscript_description.py but only
+# exercises `config`; confirm it is not a stray copy of the config tests.
+class TestConfig(unittest.TestCase):
+    """Tests for helpers of the `config` module imported from py2ttl."""
+
+    def test_check_config_files_exist(self):
+        """check_config_files_exist returns 0, and raises for the bad ONTOLOGY_DIR values below."""
+        self.assertEqual(config.check_config_files_exist(), 0)
+        dir_saved = config.__dict__.get('ONTOLOGY_DIR')
+        try:
+            # __file__ is a regular file, so it must be rejected as a directory.
+            config.__dict__['ONTOLOGY_DIR'] = __file__
+            with self.assertRaises(NotADirectoryError):
+                config.check_config_files_exist()
+            # 'asf' is expected not to exist relative to the working directory.
+            config.__dict__['ONTOLOGY_DIR'] = 'asf'
+            with self.assertRaises(FileNotFoundError):
+                config.check_config_files_exist()
+        finally:
+            # Restore even if an assertion fails, so later tests see the saved value.
+            config.__dict__['ONTOLOGY_DIR'] = dir_saved
+
+    def test_get_datatypes_dir(self):
+        """get_datatypes_dir equals DATATYPES_DIR without './', or None when it is unset."""
+        self.assertEqual(config.get_datatypes_dir(), config.DATATYPES_DIR.replace('./', ''))
+        dir_saved = config.__dict__.get('DATATYPES_DIR')
+        del config.__dict__['DATATYPES_DIR']
+        try:
+            self.assertIsNone(config.get_datatypes_dir())
+        finally:
+            # Restore even if the assertion fails, so later tests see the saved value.
+            config.__dict__['DATATYPES_DIR'] = dir_saved
+
+
+if __name__ == "__main__":
+    unittest.main()