Index: shared_util/main_util.py
===================================================================
--- shared_util/main_util.py (revision 102)
+++ shared_util/main_util.py (revision 103)
@@ -1,8 +1,23 @@
+import lxml.etree as ET
+from os.path import isfile, isdir, dirname, basename
+
+FILE_TYPE_XML_PROJECT = "xmlProjectFile"
+
def create_function_dictionary(list_of_keys, target_function, function_dictionary=None) -> dict:
"""Create a function_dictionary
"""
if function_dictionary is None:
function_dictionary = {}
for key in list_of_keys:
function_dictionary.update({key: target_function})
return function_dictionary
+
+def get_manuscript_files(args: list) -> list:
+    """Return a list of manuscript files. If the first argument is an xml file whose
+       metadata/type is FILE_TYPE_XML_PROJECT, read the project file and return the
+       file names of all manuscripts whose status contains "OK".
+    """
+    if len(args) == 1 and args[0].endswith('.xml'):
+        xml_tree = ET.parse(args[0])
+        type_node = xml_tree.getroot().find('metadata/type')
+        if type_node is not None and type_node.text == FILE_TYPE_XML_PROJECT:
+            return xml_tree.xpath('//manuscript[contains(@status, "OK")]/@file')
+    return args
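
A minimal usage sketch of the function above (project.xml and its layout are hypothetical, inferred from the XPath in the diff; shared_util is assumed to be importable):

    from shared_util.main_util import get_manuscript_files

    # Given a hypothetical project.xml like:
    #   <project>
    #     <metadata><type>xmlProjectFile</type></metadata>
    #     <manuscript file="xml/page001.xml" status="OK"/>
    #     <manuscript file="xml/page002.xml" status="OK blank"/>
    #     <manuscript file="xml/page003.xml" status="faulty"/>
    #   </project>
    # a single project-file argument expands to all manuscripts whose status
    # contains "OK" (note that contains() also matches "OK blank"):
    print(get_manuscript_files(['project.xml']))
    # -> ['xml/page001.xml', 'xml/page002.xml']

    # anything else passes through unchanged:
    print(get_manuscript_files(['page001.svg', 'page002.svg']))
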
Index: Friedrich-Nietzsche-late-work-ontology.ttl
===================================================================
--- Friedrich-Nietzsche-late-work-ontology.ttl (revision 102)
+++ Friedrich-Nietzsche-late-work-ontology.ttl (revision 103)
@@ -1,41 +1,57 @@
@prefix dct: <http://purl.org/dc/terms/> .
@prefix document: .
@prefix homotypic: .
@prefix stoff: .
@prefix text: .
@prefix owl: <http://www.w3.org/2002/07/owl#> .
@prefix rdfs: <http://www.w3.org/2000/01/rdf-schema#> .
@prefix xsd: <http://www.w3.org/2001/XMLSchema#> .
@prefix tln: .
a owl:Ontology;
dct:license ;
dct:title "An ontology about the collected late works of Friedrich Nietzsche"@en;
dct:description """Formal description of specific concepts in the scientific study of Friedrich Nietzsches late work."""@en;
dct:creator "Dominique Steinbach, tool coordinator/software developer, NIE-INE/digital edition of der späte Nietzsche, Basel University, Switzerland"@en;
dct:contributor "Christian Steiner, software developer, digital edition of der späte Nietzsche, University of Basel, Switzerland"@en;
dct:publisher "Basel University, Switzerland"@en.
+
+tln:Page a owl:Class ;
+ rdfs:subClassOf document:Page .
+
+tln:hasImage a owl:ObjectProperty ;
+    rdfs:label "relates a page to an image"@en ;
+    rdfs:comment "relates a page to an image that has a text field specifying the area where the writing that constitutes the page can be found."@en ;
+ rdfs:isDefinedBy ;
+ rdfs:domain tln:Page ;
+ rdfs:range tln:Image .
+
tln:inheritOverwritesWord a owl:ObjectProperty ;
rdfs:subPropertyOf tln:overwritesWord;
rdfs:label "word overwrites word (inherited from tln:wordHasCorrection)"@en ;
rdfs:comment "The author has used this word in order to overwrite that word."@en ;
rdfs:isDefinedBy ;
owl:propertyChainAxiom ( tln:wordHasCorrection tln:overwritesWord ).
-tln:Page a owl:Class ;
- rdfs:subClassOf document:Page .
+tln:lineContinuesOn a owl:ObjectProperty ;
+ rdfs:label "writing from subject line continues on object line"@en ;
+ rdfs:comment "the writing that ends on subject line continues on object line"@en ;
+ rdfs:isDefinedBy ;
+ rdfs:domain tln:Line ;
+ rdfs:range tln:Line .
+
+tln:pageIsOnTextField a owl:ObjectProperty ;
+ rdfs:label "page is on text field"@en ;
+ rdfs:comment "the writing that is referred to as subject can be found on object"@en ;
+ rdfs:isDefinedBy ;
+ rdfs:domain tln:Page ;
+ rdfs:range tln:TextField .
tln:writingContinuesWithWord a owl:ObjectProperty ;
rdfs:label "writing continues with next word"@en ;
rdfs:isDefinedBy ;
rdfs:domain tln:Word ;
rdfs:range tln:Word .
-
-tln:lineContinuesOn a owl:ObjectProperty ;
- rdfs:label "writing from subject line continues with object line"@en ;
- rdfs:isDefinedBy ;
- rdfs:domain tln:Line ;
- rdfs:range tln:Line .
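
A short sketch (assuming rdflib is installed) that loads the ontology and prints the domain and range of the object properties added in this revision; the tln namespace IRI is read from the file's own @prefix binding rather than hard-coded here:

    from rdflib import Graph, RDFS, URIRef

    g = Graph()
    g.parse('Friedrich-Nietzsche-late-work-ontology.ttl', format='turtle')
    tln = dict(g.namespaces())['tln']  # prefix binding taken from the file itself
    for name in ('hasImage', 'lineContinuesOn', 'pageIsOnTextField'):
        prop = URIRef(tln + name)
        print(name, g.value(prop, RDFS.domain), g.value(prop, RDFS.range))
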
Index: svgscripts/extractWordPosition.py
===================================================================
--- svgscripts/extractWordPosition.py (revision 102)
+++ svgscripts/extractWordPosition.py (revision 103)
@@ -1,550 +1,550 @@
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
""" This program can be used to extract the position of the words in a svg file and write them to a xml file.
"""
# Copyright (C) University of Basel 2019 {{{1
#
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program. If not, see 1}}}
import inspect
import getopt
from lxml import etree as ET
from os import sep, listdir, mkdir, path
from os.path import exists, isfile, isdir
from progress.bar import Bar
import re
import sys
import warnings
from datatypes.lineNumber import LineNumber
from datatypes.matrix import Matrix
from datatypes.page_creator import PageCreator, FILE_TYPE_SVG_WORD_POSITION, FILE_TYPE_XML_MANUSCRIPT
from datatypes.pdf import PDFText
from datatypes.transkriptionField import TranskriptionField
from datatypes.transkription_position import TranskriptionPosition
from datatypes.word import Word
from datatypes.word_insertion_mark import WordInsertionMark
from util import process_warnings4status, reset_tp_with_matrix
sys.path.append('shared_util')
from myxmlwriter import write_pretty
__author__ = "Christian Steiner"
__maintainer__ = __author__
__copyright__ = 'University of Basel'
__email__ = "christian.steiner@unibas.ch"
__status__ = "Development"
__license__ = "GPL v3"
__version__ = "0.0.1"
class Extractor:
"""
    This class can be used to extract the word positions in an svg file and write them to an xml file.
Args:
[xml_dir (str): target directory]
[title (str): title of document]
    [manuscript_file (str): xml file containing information about the archival unit to which the current page belongs]
"""
UNITTESTING = False
SONDERZEICHEN_LIST = [ 'A', 'B', '{', '}' ]
SET_POSITIONS_TO_TEXTFIELD_0_0 = False
def __init__(self, xml_dir=None, title=None, manuscript_file=None, compare2pdf=False):
if bool(xml_dir):
self.xml_dir = xml_dir
not isdir(self.xml_dir) and mkdir(self.xml_dir)
else:
self.xml_dir = 'xml' if(isdir('xml')) else ''
self.latest_status = None
self.compare2pdf = compare2pdf
self.xml_dir = self.xml_dir + sep if(bool(self.xml_dir)) else ''
self.title = title
self.manuscript_file = manuscript_file
self.manuscript_tree = None
if not bool(self.title) and bool(self.manuscript_file) and isfile(self.manuscript_file):
self.manuscript_tree = ET.parse(self.manuscript_file)
self.title = self.manuscript_tree.getroot().get('title')
elif bool(self.manuscript_file):
raise FileNotFoundError('File "{}" does not exist!'.format(self.manuscript_file))
elif bool(self.title):
self.update_title_and_manuscript(self.title, False)
def add_word(self, page, index, word_part_objs, endSign, endX, matrix=None, debug_msg=None, transkription_field=None) ->int:
"""Creates transkription_positions and a new word from word_part_objs (i.e. a list of dictionaries about parts of this word).
If word contains a Sonderzeichen as specified by self.SONDERZEICHEN_LIST, word_part_objs will be split and several words are created.
:returns: the new word counter (int)
"""
break_points = []
if(len(page.sonderzeichen_list) > 0): # check for Sonderzeichen and special chars -> mark for word insertion, create break points
for Sonderzeichen in self.SONDERZEICHEN_LIST:
contains_Sonderzeichen = [ dict['text'] == Sonderzeichen and any(sz in dict['class'] for sz in page.sonderzeichen_list) for dict in word_part_objs ]
if True in contains_Sonderzeichen:
break_points += [ (endPoint, endPoint + 1) for endPoint in [i for i, e in enumerate(contains_Sonderzeichen) if e == True ]]
for sz_point in [i for i, e in break_points]:
wim_index = len(page.word_insertion_marks)
x = float(word_part_objs[sz_point]['x'])
y = float(word_part_objs[sz_point]['y'])
if page.svg_file is not None and isfile(page.svg_file)\
and (not self.SET_POSITIONS_TO_TEXTFIELD_0_0 or transkription_field is not None):
svg_path_tree = ET.parse(page.svg_file)
namespaces = { k if k is not None else 'ns': v for k, v in svg_path_tree.getroot().nsmap.items() }
xmin = 0 if not self.SET_POSITIONS_TO_TEXTFIELD_0_0 else transkription_field.xmin
ymin = 0 if not self.SET_POSITIONS_TO_TEXTFIELD_0_0 else transkription_field.ymin
wim = WordInsertionMark.CREATE_WORD_INSERTION_MARK(svg_path_tree, namespaces, id=wim_index, x=x, y=y, xmin=xmin, ymin=ymin,\
line_number=page.get_line_number(y-1), mark_type=Sonderzeichen)
page.word_insertion_marks.append(wim)
if(bool(re.search(r'\d[A-Za-z]', self.get_word_from_part_obj(word_part_objs)))): # case: digits from line number and chars from words -> create break points
THRESHOLDX = 20 # Threshold between line number and text
last_x = -1
for i, x in enumerate([float(dict['x']) for dict in word_part_objs]):
if(last_x > -1 and (x - last_x > THRESHOLDX)):
break_points.append((i, i))
last_x = x
if(len(break_points) > 0): # if there are break points -> split word_part_obj and add the corresponding words
from_index = 0
for end_point, next_from_index in break_points:
new_word_part_objs = word_part_objs[from_index:end_point]
new_endX = word_part_objs[end_point]['x']
from_index = next_from_index
index = self.add_word(page, index, new_word_part_objs, None, new_endX, matrix=matrix, debug_msg=debug_msg, transkription_field=transkription_field)
if from_index > 0 and from_index < len(word_part_objs):
new_word_part_objs = word_part_objs[from_index:]
index = self.add_word(page, index, new_word_part_objs, endSign, endX, matrix=matrix, debug_msg=debug_msg, transkription_field=transkription_field)
return index
else:
if len(word_part_objs) > 0:
provide_tf = None if not self.SET_POSITIONS_TO_TEXTFIELD_0_0 else transkription_field
transkription_positions = TranskriptionPosition.CREATE_TRANSKRIPTION_POSITION_LIST(page, word_part_objs, matrix=matrix,\
debug_msg_string=debug_msg, transkription_field=provide_tf)
text = self.get_word_from_part_obj(word_part_objs)
line_number = page.get_line_number((transkription_positions[0].bottom+transkription_positions[0].top)/2)
if line_number == -1:
if transkription_positions[0].transform is not None:
line_number = page.get_line_number(transkription_positions[0].transform.getY())
if line_number == -1 and len(page.words) > 0:
lastWord = page.words[-1]
lastWord_lastTP = lastWord.transkription_positions[-1]
lastTP = transkription_positions[-1]
if transkription_positions[0].left > lastWord_lastTP.left\
and abs(lastWord_lastTP.bottom-lastTP.bottom) < lastTP.height/2:
line_number = lastWord.line_number
else:
line_number = lastWord.line_number+1
- reset_tp_with_matrix(page, transkription_positions)
+ #reset_tp_with_matrix(transkription_positions)
newWord = Word(id=index, text=text, line_number=line_number, transkription_positions=transkription_positions)
page.words.append(newWord)
return int(index) + 1
else:
return int(index)
def extractAndWriteInformation(self, file_name, page_number=None, xml_target_file=None, svg_file=None, pdfFile=None, record_warnings=False, warning_filter='default', multipage_index=-1, marginals_page=None):
"""Extracts information about positions of text elements and writes them to a xml file.
"""
if isfile(file_name):
if not bool(xml_target_file):
xml_target_file = self.get_file_name(file_name, page_number)
if bool(self.xml_dir) and not bool(path.dirname(xml_target_file)):
xml_target_file = path.dirname(self.xml_dir) + sep + xml_target_file
exit_status = 0
with warnings.catch_warnings(record=record_warnings) as w:
warnings.simplefilter(warning_filter)
page = self.extract_information(file_name, page_number=page_number, xml_target_file=xml_target_file, svg_file=svg_file, pdfFile=pdfFile,\
multipage_index=multipage_index, marginals_page=marginals_page)
status_message = process_warnings4status(w, [ PageCreator.WARNING_MISSING_USE_NODE4PWP, PageCreator.WARNING_MISSING_GLYPH_ID4WIM ],\
'', 'OK', 'with warnings')
if status_message != 'OK':
self.latest_status = status_message
exit_status = 1
else:
self.latest_status = None
page.page_tree.getroot().set('status', status_message)
write_pretty(xml_element_tree=page.page_tree, file_name=xml_target_file, script_name=__file__, file_type=FILE_TYPE_SVG_WORD_POSITION)
return exit_status
else:
raise FileNotFoundError('\"{}\" is not an existing file!'.format(file_name))
def extract_information(self, file_name, page_number=None, xml_target_file=None, svg_file=None, pdfFile=None, multipage_index=-1, marginals_page=None) -> PageCreator:
"""Extracts information about positions of text elements.
"""
if isfile(file_name):
if not bool(xml_target_file):
xml_target_file = self.get_file_name(file_name, page_number)
if bool(self.xml_dir) and not bool(path.dirname(xml_target_file)):
xml_target_file = path.dirname(self.xml_dir) + sep + xml_target_file
transkription_field = TranskriptionField(file_name, multipage_index=multipage_index)
text_field = transkription_field.convert_to_text_field()
svg_tree = ET.parse(file_name)
page = PageCreator(xml_target_file, title=self.title, multipage_index=multipage_index,\
page_number=page_number, pdfFile=pdfFile, svg_file=svg_file,\
svg_text_field=text_field, source=file_name, marginals_source=marginals_page)
sonderzeichen_list, letterspacing_list, style_dict = self.get_style(svg_tree.getroot())
page.add_style(sonderzeichen_list=sonderzeichen_list, letterspacing_list=letterspacing_list, style_dict=style_dict)
page.init_line_numbers(LineNumber.extract_line_numbers(svg_tree, transkription_field, set_to_text_field_zero=self.SET_POSITIONS_TO_TEXTFIELD_0_0),\
transkription_field.ymax)
self.extract_word_position(svg_tree, page, transkription_field=transkription_field)
page.create_writing_processes_and_attach2tree()
page.update_and_attach_words2tree()
for word_insertion_mark in page.word_insertion_marks:
# it is not clear if we really need to know this alternative word ordering. See 'TODO.md'
#word_insertion_mark.inserted_words = self.find_inserted_words(page.page_tree, word_insertion_mark)
word_insertion_mark.attach_object_to_tree(page.page_tree)
return page
else:
raise FileNotFoundError('\"{}\" is not an existing file!'.format(file_name))
def extract_word_position(self, svg_tree, page, transkription_field=None):
"""Extracts word positions.
"""
counter = 0
word_part_obj = []
endSign = '%'
last_matrix = None
MAXBOTTOMDIFF = 5
MAXXDIFF = 6
if not Extractor.UNITTESTING:
bar = Bar('extracting word positions from text_item', max=len([*self.get_text_items(svg_tree.getroot(), transkription_field=transkription_field)]))
for text_item in self.get_text_items(svg_tree.getroot(), transkription_field=transkription_field):
provide_tf = None if not self.SET_POSITIONS_TO_TEXTFIELD_0_0 else transkription_field
current_matrix = Matrix(text_item.get('transform'), transkription_field=provide_tf)
# check for line breaks
if (last_matrix is not None and len(word_part_obj) > 0 and (\
Matrix.DO_CONVERSION_FACTORS_DIFFER(last_matrix, current_matrix) or\
(abs(current_matrix.getY() - last_matrix.getY()) > MAXBOTTOMDIFF) or\
(abs(current_matrix.getX() - word_part_obj[len(word_part_obj)-1]['x']) > MAXXDIFF)))\
or (len(word_part_obj) > 0 and self.get_word_object_multi_char_x(word_part_obj[0]) > current_matrix.getX()):
endSign = '%'
if(self.get_word_from_part_obj(word_part_obj) != ''):
debug_msg = 'check for line breaks, diffx: {}, diffy: {}, diff_conversion_matrix: {}'.format(\
round(abs(current_matrix.getX() - word_part_obj[len(word_part_obj)-1]['x']), 3), round(abs(current_matrix.getY() - last_matrix.getY()), 3),\
str(Matrix.DO_CONVERSION_FACTORS_DIFFER(last_matrix, current_matrix)))
counter = self.add_word(page, counter, word_part_obj, endSign, endX, matrix=last_matrix, debug_msg=debug_msg, transkription_field=transkription_field)
word_part_obj = []
endX = current_matrix.getX()
if(len(text_item.findall(".//tspan", svg_tree.getroot().nsmap)) < 1): # case: TEXT
if(bool(text_item.text) and not bool(re.search(r'^\s*$', text_item.text))):
word_part_obj.append( { "text": text_item.text, "x": current_matrix.getX(), "y": current_matrix.getY(), "class": text_item.get('class'), "matrix": current_matrix} )
else:
endSign = text_item.text
if(self.get_word_from_part_obj(word_part_obj) != ''):
counter = self.add_word(page, counter, word_part_obj, endSign, endX, matrix=last_matrix, debug_msg='svg/text/\s', transkription_field=transkription_field)
word_part_obj = []
endSign = '%'
            for tspan_item in text_item.findall(".//tspan", svg_tree.getroot().nsmap): # case: TSPAN
endX = current_matrix.add2X(tspan_item.get('x'))
if(tspan_item.text != None and tspan_item.text != '' and not bool(re.search(r'^\s*$', tspan_item.text))):
y = current_matrix.add2Y(tspan_item.get('y'))
word_part_obj.append( { "text": tspan_item.text, "x": endX, "y": y, "class": tspan_item.get('class'), "matrix": current_matrix })
if len(set(page.letterspacing_list) & set(tspan_item.get('class').split(' '))) > 0:
"""text_item has letterspacing class
(set s & set t = new set with elements common to s and t)
"""
endSign = '%'
if(self.get_word_from_part_obj(word_part_obj) != ''):
counter = self.add_word(page, counter, word_part_obj, endSign, endX, matrix=current_matrix,\
debug_msg='tspan with letterspacing', transkription_field=transkription_field)
word_part_obj = []
else:
endSign = tspan_item.text
if(self.get_word_from_part_obj(word_part_obj) != ''):
counter = self.add_word(page, counter, word_part_obj, endSign, endX, matrix=current_matrix,\
debug_msg='svg/text/tspan/\s', transkription_field=transkription_field)
word_part_obj = []
endSign = '%'
last_matrix = current_matrix
not bool(Extractor.UNITTESTING) and bar.next()
if(self.get_word_from_part_obj(word_part_obj) != ''):
counter = self.add_word(page, counter, word_part_obj, endSign, endX, matrix=current_matrix, debug_msg='end of loop',\
transkription_field=transkription_field)
word_part_obj = []
endSign = '%'
not bool(Extractor.UNITTESTING) and bar.finish()
def find_inserted_words_by_position(self, target_tree, x, y):
"""Returns an Array with the words that are inserted above the x, y position or [] if not found.
"""
warnings.warn('Function "find_inserted_words_by_position" does not work and it is not clear whether we need this.')
MINY = 31.0
MAXY = 10.0
DIFFX = 9.0
if(len(target_tree.getroot().xpath('//word[@id]')) > 0):
result_list = []
minus2left = 20.0
minus2top = 19.0
while len(result_list) == 0 and minus2top < MINY and minus2left > DIFFX :
result_list = [ Word.CREATE_WORD(item) for item in target_tree.getroot().xpath(\
'//word[@top>{0} and @top<{1} and @left>{2} and @left<{3}]'.format(y - minus2top, y - MAXY, x - minus2left, x + DIFFX)) ]
minus2left -= 1
minus2top += 1
if len(result_list) > 0:
result_bottom = result_list[len(result_list)-1].bottom
result_left_min = result_list[len(result_list)-1].left + result_list[len(result_list)-1].width
for item in target_tree.getroot().xpath('//word[@bottom={0} and @left>{1}]'.format(result_bottom, result_left_min)):
result_left_min = result_list[len(result_list)-1].left + result_list[len(result_list)-1].width
result_left_max = result_left_min + DIFFX
if float(item.get('left')) - result_left_max < DIFFX:
result_list.append(Word.CREATE_WORD(item))
else:
break
return result_list
else:
return []
def find_inserted_words(self, target_tree, word_insertion_mark):
"""Returns an Array with the words that are inserted above/underneath the word_insertion_mark.
"""
warnings.warn('Function "find_inserted_words" does not work and it is not clear whether we need this.')
if word_insertion_mark.line_number < 2 or word_insertion_mark.line_number % 2 == 1:
return self.find_inserted_words_by_position(target_tree, word_insertion_mark.x, word_insertion_mark.y)
if(len(target_tree.getroot().xpath('//word[@id]')) > 0):
MINY = 31.0
MAXY = 10.0
DIFFX = 9.0
result_list = []
x = word_insertion_mark.x
y = word_insertion_mark.y
if word_insertion_mark.mark_type != 'B': # all insertions that are above the current line
line_number = word_insertion_mark.line_number - 1
words_on_line = [ Word.CREATE_WORD(item) for item in target_tree.getroot().xpath(\
'//word[@line-number={0}]'.format(line_number)) ]
if len(words_on_line) > 0:
minus2top = 1.0
while len(result_list) == 0 and minus2top < MINY:
for word in words_on_line:
for transkription_position in word.transkription_positions:
if transkription_position.top > y - minus2top\
and transkription_position.left > x - DIFFX\
and transkription_position.left < x + DIFFX:
result_list.append(word)
break
minus2top += 1
elif word_insertion_mark.mark_type == 'B': # B means insertion is underneath the current line
line_number = word_insertion_mark.line_number + 1
words_on_line = [ Word.CREATE_WORD(item) for item in target_tree.getroot().xpath(\
'//word[@line-number={0}]'.format(line_number)) ]
if len(words_on_line) > 0:
plus2top = 1.0
while len(result_list) == 0 and plus2top < MINY :
for word in words_on_line:
for transkription_position in word.transkription_positions:
if transkription_position.top > y + plus2top\
and transkription_position.left > x - DIFFX\
and transkription_position.left < x + DIFFX:
result_list.append(word)
break
plus2top += 1
if len(result_list) > 0: # now, collect more words that are right of already collected words
result_bottom = result_list[len(result_list)-1].transkription_positions[0].bottom
result_left_min = result_list[len(result_list)-1].transkription_positions[0].left\
+ result_list[len(result_list)-1].transkription_positions[0].width
for item in target_tree.getroot().xpath(\
'//word[@line-number={0} and @bottom>{1} and @bottom<{2} and @left>{3}]'.format(line_number, result_bottom-5, result_bottom+5, result_left_min)):
result_left_min = result_list[len(result_list)-1].transkription_positions[0].left\
+ result_list[len(result_list)-1].transkription_positions[0].width
result_left_max = result_left_min + DIFFX
if float(item.get('left')) - result_left_max < DIFFX:
result_list.append(Word.CREATE_WORD(item))
else:
break
return result_list
else:
return []
def get_file_name(self, file_name, page_number=None):
"""Returns the file_name of the target xml file.
"""
dir_name = path.dirname(self.xml_dir) + sep if(bool(self.xml_dir)) else ''
if bool(self.title):
return dir_name + self.title.replace(' ', '_') + '_page' + self.get_page_number(file_name, page_number=page_number) + '.xml'
else:
return '{}{}'.format(dir_name, path.basename(file_name).replace('.svg', '.xml'))
def get_page_number(self, file_name, page_number=None):
""" Returns page number as a string (with leading zero(s) if len(page_number) < 3).
"""
if not bool(page_number) and bool(re.search(r'\d', file_name)):
"""if page_number=None and filename contains digits,
then split filename into its parts that contain only digits, remove empty strings
and return the last part containing only digits.
"""
page_number = list(filter(lambda x: x != '', re.split(r'\D+', file_name))).pop()
if bool(page_number):
leading_zeros = '00' if(len(page_number) == 1) else '0' if(len(page_number) == 2) else ''
return leading_zeros + str(page_number)
else:
return ''
def get_style(self, etree_root):
"""Returns the style specification as a dictionary.
        :returns:
            sonderzeichen_list: list of keys for classes that are 'Sonderzeichen'
            letterspacing_list: list of keys for classes that specify 'letter-spacing'
            style_dict: dictionary: key = class name (str), value = style specification (dictionary)
"""
style_dict = {}
sonderzeichen_list = []
letterspacing_list = []
style = etree_root.find('style', etree_root.nsmap)
if style is not None:
for style_item in list(filter(lambda x: x != '', style.text.split("\n\t"))):
style_key = style_item.split('{')[0].replace('.', '')
style_value_dict = { item.split(':')[0]: item.split(':')[1].replace('\'','') \
for item in list(filter(lambda x: x!= '', style_item.split('{')[1].replace('}', '').replace('\n','').split(';')))}
style_dict[style_key] = style_value_dict
if bool(style_value_dict.get('font-family')) and 'Sonderzeichen' in style_value_dict.get('font-family'):
sonderzeichen_list.append(style_key)
if bool(style_value_dict.get('letter-spacing')):
letterspacing_list.append(style_key)
return sonderzeichen_list, letterspacing_list, style_dict
def get_text_items(self, tree_root, transkription_field=None):
"""Returns all text elements with a matrix or (if transkription_field is specified)
all text elements that are located inside the transkription field.
"""
if transkription_field is not None:
return filter(lambda x: Matrix.IS_PART_OF_TRANSKRIPTION_FIELD(transkription_field, text_node=x),\
tree_root.iterfind(".//text", tree_root.nsmap))
else:
return tree_root.iterfind(".//text", tree_root.nsmap)
def get_word_from_part_obj(self, word_part_obj):
"""Extracts all 'text' from a list of dicitonaries and concats it to a string.
"""
return ''.join([ dict['text'] for dict in word_part_obj])
def get_word_object_multi_char_x(self, word_part_obj_dict):
"""Returns the x of the last char of word_part_object.
TODO: get real widths from svg_file!!!
"""
WIDTHFACTOR = 2.6
return word_part_obj_dict['x'] if len(word_part_obj_dict['text']) < 2 else word_part_obj_dict['x'] + len(word_part_obj_dict['text']) * WIDTHFACTOR
def update_title_and_manuscript(self, title, update_manuscript=True):
"""Updates title and manuscript.
"""
self.title = title
if update_manuscript or not bool(self.manuscript_file):
self.manuscript_file = self.xml_dir + self.title.replace(' ', '_') + '.xml'
if not isfile(self.manuscript_file):
self.manuscript_tree = ET.ElementTree(ET.Element('manuscript', attrib={"title": self.title}))
write_pretty(xml_element_tree=self.manuscript_tree, file_name=self.manuscript_file, script_name=__file__, file_type='xmlManuscriptFile')
def usage():
"""prints information on how to use the script
"""
print(main.__doc__)
def main(argv):
"""This program can be used to extract the position of the words in a svg file and write them to a xml file.
svgscripts/extractWordPosition.py [OPTIONS]
svg file OR xml target file containing file name of svg file as "/page/@source".
directory containing svg files
OPTIONS:
-h|--help: show help
-c|--compare-to-pdf compare words to pdf and autocorrect
-d|--xml-dir=xmlDir: target directory for the xml output file(s)
-m|--manuscript-file: xml file containing information about the archival order to which the current page(s) belong(s)
-p|--page=pageNumber: page number of the current page. For use with _one_ file only.
-P|--PDF=pdfFile: pdf file - used for word correction
-s|--svg=svgFile: svg web file
-t|--title=title: title of the manuscript to which the current page(s) belong(s)
-x|--xml-target-file=xmlOutputFile: xml target file
:return: exit code (int)
"""
    compare2pdf = False
manuscript_file = None
page_number = None
pdfFile = None
svg_file = None
title = None
xml_target_file = None
xml_dir = ".{}xml".format(sep)
try:
opts, args = getopt.getopt(argv, "hcd:m:t:p:s:x:P:", ["help", "compare-to-pdf", "xml-dir=", "manuscript-file=", "title=", "page=", "svg=", "xml-target-file=", "PDF="])
except getopt.GetoptError:
usage()
return 2
for opt, arg in opts:
if opt in ('-h', '--help') or not args:
usage()
return 0
elif opt in ('-c', '--compare-to-pdf'):
compare2pdf = True
elif opt in ('-d', '--xml-dir'):
xml_dir = arg
elif opt in ('-m', '--manuscript-file'):
manuscript_file = arg
elif opt in ('-t', '--title'):
title = arg
elif opt in ('-p', '--page'):
page_number = str(arg)
elif opt in ('-s', '--svg'):
svg_file = arg
elif opt in ('-P', '--PDF'):
pdfFile = arg
elif opt in ('-x', '--xml-target-file'):
xml_target_file = str(arg)
files_to_process = list()
for arg in args:
if isfile(arg):
files_to_process.append(arg)
elif isdir(arg):
files_to_process = files_to_process + list(filter(lambda file: '.svg' in file, listdir(arg)))
else:
print("'{}' does not exist!".format(arg))
return 2
if len(files_to_process) < 1 or args[0].endswith('xml'):
if xml_target_file is None:
xml_target_file = args[0] if len(args) > 0 else None
if xml_target_file is not None and isfile(xml_target_file):
target_file_tree = ET.parse(xml_target_file)
file_name = target_file_tree.getroot().get('source')
title = target_file_tree.getroot().get('title') if title is None else title
page_number = target_file_tree.getroot().get('number') if page_number is None else page_number
if svg_file is None:
if len(target_file_tree.xpath('//svg-image')) > 0:
svg_file = target_file_tree.xpath('.//svg-image/@file-name')[0]\
if len(target_file_tree.xpath('.//svg-image/@file-name')) > 0 else None
else:
svg_file = target_file_tree.xpath('.//svg/@file')[0]\
if len(target_file_tree.xpath('.//svg/@file')) > 0 else None
files_to_process.insert(0, file_name)
if xml_target_file in files_to_process:
files_to_process.remove(xml_target_file)
else:
usage()
return 2
if len(files_to_process) > 1 and (bool(page_number) or bool(xml_target_file) or bool(pdfFile) or bool(svg_file)):
print("ERROR: too many input files: options --PDF, --page, --svg and --xml-target-file presuppose only one input file!")
usage()
return 2
extractor = Extractor(xml_dir=xml_dir, title=title, manuscript_file=manuscript_file, compare2pdf=compare2pdf)
for file in files_to_process:
extractor.extractAndWriteInformation(file, page_number=page_number, xml_target_file=xml_target_file, pdfFile=pdfFile, svg_file=svg_file)
return 0
if __name__ == "__main__":
sys.exit(main(sys.argv[1:]))
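
A usage sketch of the Extractor class defined above (run from the svgscripts directory; the title and the svg path are illustrative placeholders, not files from the repository):

    from extractWordPosition import Extractor

    extractor = Extractor(xml_dir='xml', title='Mp XIV')
    # writes xml/Mp_XIV_page001.xml; returns 0 on success, 1 if warnings were recorded
    exit_status = extractor.extractAndWriteInformation('svg/Mp_XIV_page001.svg', page_number='1')
    print(exit_status, extractor.latest_status or 'OK')
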
Index: svgscripts/datatypes/positional_object.py
===================================================================
--- svgscripts/datatypes/positional_object.py (revision 102)
+++ svgscripts/datatypes/positional_object.py (revision 103)
@@ -1,145 +1,148 @@
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
""" This class can be used to represent an object with positional information.
"""
# Copyright (C) University of Basel 2019 {{{1
#
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program. If not, see 1}}}
__author__ = "Christian Steiner"
__maintainer__ = __author__
__copyright__ = 'University of Basel'
__email__ = "christian.steiner@unibas.ch"
__status__ = "Development"
__license__ = "GPL v3"
__version__ = "0.0.1"
from lxml import etree as ET
import sys
from .matrix import Matrix
from .attachable_object import AttachableObject
sys.path.append('py2ttl')
from class_spec import SemanticClass
class PositionalObject(AttachableObject,SemanticClass):
"""
This (super) class represents an object with positional information.
Args:
id (int): object id
matrix (datatypes.Matrix): matrix containing information about conversion.
        height (float): height of object
width (float): width of object
x (float): x position of object
y (float): y position of object
"""
XML_TAG = 'positional-object'
floatKeys = [ 'height', 'width', 'left', 'top', 'bottom']
intKeys = [ ]
stringKeys = [ ]
def __init__(self, node=None, id=0, height=0.0, width=0.0, x=0.0, y=0.0, matrix=None, tag=XML_TAG):
self.floatKeys = []
self.floatKeys += PositionalObject.floatKeys
self.intKeys = []
self.intKeys += PositionalObject.intKeys
self.stringKeys = [ 'id' ]
self.stringKeys += PositionalObject.stringKeys
self.attachable_objects = []
if node is not None:
self.id = str(node.get('id'))
if id > 0 and str(id) != self.id:
self.id = str(id)
self.height = float(node.get('height'))
self.width = float(node.get('width'))
self.left = float(node.get('left'))
self.top = float(node.get('top'))
self.bottom = float(node.get('bottom'))
self.transform = Matrix(node.get('transform')) if bool(node.get('transform')) and 'matrix(' in node.get('transform') else None
self.tag = node.tag
else:
self.id = str(id)
self.height = round(height, 3)
self.width = round(width, 3)
self.left = round(x, 3)
self.top = round(y, 3)
self.bottom = round(y + height, 3)
self.transform = matrix
self.tag = tag
+ self.transform_string = self.transform.toString()\
+ if self.transform is not None\
+ else None
def attach_object_to_tree(self, target_tree):
"""Attach object to tree.
"""
if target_tree.__class__.__name__ == '_ElementTree':
target_tree = target_tree.getroot()
obj_node = target_tree.xpath('.//' + self.tag + '[@id="%s"]' % self.id)[0] \
if(len(target_tree.xpath('.//' + self.tag + '[@id="%s"]' % self.id)) > 0) \
else ET.SubElement(target_tree, self.tag)
for key in self.floatKeys:
if self.__dict__[key] is not None:
obj_node.set(key.replace('_','-'), str(round(self.__dict__[key], 3)))
for key in self.intKeys + self.stringKeys:
if self.__dict__[key] is not None:
obj_node.set(key.replace('_','-'), str(self.__dict__[key]))
if self.transform is not None and self.transform.isRotationMatrix():
obj_node.set('transform', self.transform.toString())
for attachable_object in self.attachable_objects:
attachable_object.attach_object_to_tree(obj_node)
@classmethod
def get_semantic_dictionary(cls):
""" Creates a semantic dictionary as specified by SemanticClass.
"""
dictionary = {}
class_dict = cls.get_class_dictionary()
properties = {}
for intKey in cls.intKeys:
properties.update(cls.create_semantic_property_dictionary(intKey, int))
for floatKey in cls.floatKeys:
properties.update(cls.create_semantic_property_dictionary(floatKey, float, cardinality=1))
for stringKey in cls.stringKeys:
properties.update(cls.create_semantic_property_dictionary(stringKey, str, cardinality=1))
- properties.update(cls.create_semantic_property_dictionary('transform', str))
+ properties.update(cls.create_semantic_property_dictionary('transform_string', str, name='hasTransform'))
dictionary.update({cls.CLASS_KEY: class_dict})
dictionary.update({cls.PROPERTIES_KEY: properties})
return cls.return_dictionary_after_updating_super_classes(dictionary)
@staticmethod
def POSITIONS_OVERLAP_HORIZONTALLY(position_a, position_b):
"""Returns whether position a and b overlap horizontally.
"""
return (position_a.left < position_b.left+position_b.width)\
and (position_a.left+position_a.width > position_b.left)
@staticmethod
def POSITIONS_OVERLAP_VERTICALLY(position_a, position_b):
"""Returns whether position a and b overlap vertically.
"""
return (position_a.top < position_b.bottom)\
and (position_a.bottom > position_b.top)
@staticmethod
def POSITIONS_ARE_STACKED(position_a, position_b):
"""Returns whether position a and b are stacked, i.e. are above each other.
"""
return PositionalObject.POSITIONS_OVERLAP_HORIZONTALLY(position_a, position_b)\
and (not PositionalObject.POSITIONS_OVERLAP_VERTICALLY(position_a, position_b)\
or abs(position_a.top-position_b.top) > (position_a.height/4 + position_b.height/4))
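
A small worked example of the three predicates above; SimpleNamespace stands in for any object with left/top/bottom/width/height attributes (run from the svgscripts directory so that datatypes is importable):

    from types import SimpleNamespace
    from datatypes.positional_object import PositionalObject

    a = SimpleNamespace(left=10.0, top=20.0, bottom=30.0, width=40.0, height=10.0)
    b = SimpleNamespace(left=15.0, top=34.0, bottom=44.0, width=40.0, height=10.0)
    print(PositionalObject.POSITIONS_OVERLAP_HORIZONTALLY(a, b)) # True: the x ranges intersect
    print(PositionalObject.POSITIONS_OVERLAP_VERTICALLY(a, b))   # False: a ends above b
    print(PositionalObject.POSITIONS_ARE_STACKED(a, b))          # True: horizontal overlap, no vertical overlap
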
Index: svgscripts/datatypes/positional_word_part.py
===================================================================
--- svgscripts/datatypes/positional_word_part.py (revision 102)
+++ svgscripts/datatypes/positional_word_part.py (revision 103)
@@ -1,180 +1,184 @@
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
""" This class can be used to represent a positional word part, i.e. part of a word that has a position on the transkription.
"""
# Copyright (C) University of Basel 2019 {{{1
#
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program. If not, see 1}}}
__author__ = "Christian Steiner"
__maintainer__ = __author__
__copyright__ = 'University of Basel'
__email__ = "christian.steiner@unibas.ch"
__status__ = "Development"
__license__ = "GPL v3"
__version__ = "0.0.1"
from lxml import etree as ET
from svgpathtools.parser import parse_path
import sys
import warnings
from .positional_object import PositionalObject
sys.path.append('py2ttl')
from class_spec import UnSemanticClass
class PositionalWordPart(PositionalObject,UnSemanticClass):
"""
This class represents a positional word part, i.e. a part of a word that has a position on the transkription.
Args:
id (int): object id
text (str): text
symbol_id (str): id of corresponding symbol
style_class (str) style class id
matrix (datatypes.Matrix): matrix containing information about conversion.
        height (float): height of object
width (float): width of object
x (float): x position of object
y (float): y position of object
"""
WARN_NO_USE_NODE_FOUND = 'No use_node found'
XML_TAG = 'word-part'
extraStringKeys = [ 'text', 'symbol_id', 'style_class' ]
def __init__(self, node=None, id=0, height=0.0, width=0.0, x=0.0, y=0.0, matrix=None, text=None, symbol_id=None, style_class=None):
super(PositionalWordPart, self).__init__(id=id, node=node, height=height, width=width, x=x, y=y, matrix=matrix, tag=PositionalWordPart.XML_TAG)
self.stringKeys += [ 'text', 'symbol_id', 'style_class' ]
self.text = text
self.symbol_id = symbol_id
self.style_class = style_class
if node is not None:
self.text = node.get('text')
self.symbol_id = node.get('symbol-id')
self.style_class = node.get('style-class')
@classmethod
def get_semantic_dictionary(cls):
""" Creates a semantic dictionary as specified by SemanticClass.
"""
dictionary = super(cls,cls).get_semantic_dictionary()
for extraStringKey in cls.extraStringKeys:
dictionary[cls.PROPERTIES_KEY].update(cls.create_semantic_property_dictionary(extraStringKey, str, cardinality=1))
return cls.return_dictionary_after_updating_super_classes(dictionary)
@staticmethod
def CREATE_POSITIONAL_WORD_PART(text, use_node, namespaces, start_id=0, xmin=0.0, ymin=0.0, matrix=None, style_class=None, original_x=0.0, original_y=0.0):
"""Creates a PositionalWordPart.
[:return:] a PositionalWordPart
"""
symbol_id = use_node.get('{%s}href' % namespaces['xlink']).replace('#', '')
x = float(use_node.get('x')) - xmin if bool(use_node.get('x')) else 0.0
y = float(use_node.get('y')) - ymin if bool(use_node.get('y')) else 0.0
if matrix is not None and matrix.isRotationMatrix():
- x = matrix.get_old_x(x=x, y=y)
+            old_x = matrix.get_old_x(x=x, y=y)
+            x = old_x if matrix.getX() != old_x else 0
#print('origin_x {} -> x {}'.format(original_x, x))
y = original_y if original_y != 0 else y
+ if y > 0 and y == matrix.getY():
+ y = 0
d_strings = use_node.xpath('//ns:symbol[@id="{0}"]/ns:path/@d'.format(symbol_id), namespaces=namespaces)
if len(d_strings) > 0 and d_strings[0] != '':
path = parse_path(d_strings[0])
xmin, xmax, ymin, ymax = path.bbox()
width = xmax - xmin
height = ymax - ymin if ymax - ymin > 3 else 3
if ymin < 0 and ymax < 0:
y += ymin
return PositionalWordPart(id=start_id, text=text, height=height, width=width, x=x, y=y-height,\
matrix=matrix, symbol_id=symbol_id, style_class=style_class)
else:
return PositionalWordPart(id=start_id, text=text, x=x, y=y, matrix=matrix, symbol_id=symbol_id, style_class=style_class)
@staticmethod
def CREATE_POSITIONAL_WORD_PART_LIST(word_part_obj, svg_path_tree, namespaces, page=None, start_id=0, xmin=0.0, ymin=0.0, threshold=0.4, throw_error_if_not_found=False):
"""Creates a list of PositionalWordPart from a word_part_obj (a dictionary with the keys: text, x, y, matrix, class),
using a (lxml.ElementTree) svg_path_tree and the corresponding namespaces.
[:return:] a list of PositionalWordPart
"""
word_part_list = []
original_x, original_y = 0.0, 0.0
x = float(word_part_obj['x']) if bool(word_part_obj.get('x')) else 0.0
y = float(word_part_obj['y']) if bool(word_part_obj.get('y')) else 0.0
text = word_part_obj.get('text')
matrix = word_part_obj.get('matrix')
style_class = word_part_obj.get('class')
if matrix is not None and matrix.isRotationMatrix():
original_x, original_y = x, y
x = matrix.get_new_x(x=original_x, y=original_y)
y = matrix.get_new_y(x=original_x, y=original_y)
if text is not None and text != '':
svg_x = x + xmin
svg_y = y + ymin
use_nodes = svg_path_tree.xpath('//ns:use[@x>="{0}" and @x<="{1}" and @y>="{2}" and @y<="{3}"]'\
.format(svg_x-threshold, svg_x+threshold,svg_y-threshold, svg_y+threshold), namespaces=namespaces)
if len(use_nodes) > 0:
current_use_node = use_nodes[0]
index = 0
word_part_list.append(PositionalWordPart.CREATE_POSITIONAL_WORD_PART(text[index], current_use_node, namespaces,\
start_id=start_id, xmin=xmin, ymin=ymin, matrix=matrix, style_class=style_class, original_x=original_x, original_y=original_y))
index, start_id = index + 1, start_id + 1
while index < len(text) and current_use_node.getnext() is not None:
current_use_node = current_use_node.getnext()
word_part_list.append(PositionalWordPart.CREATE_POSITIONAL_WORD_PART(text[index], current_use_node, namespaces,\
start_id=start_id, xmin=xmin, ymin=ymin, matrix=matrix, style_class=style_class, original_x=original_x, original_y=original_y))
index, start_id = index+1, start_id+1
if index < len(text) and current_use_node.getnext() is None:
last_pwp = word_part_list[len(word_part_list)-1]
new_word_part_obj = word_part_obj.copy()
new_word_part_obj['x'] = last_pwp.left + last_pwp.width + 0.5
new_word_part_obj['y'] = last_pwp.bottom
new_word_part_obj['text'] = word_part_obj['text'][index:]
word_part_list += PositionalWordPart.CREATE_POSITIONAL_WORD_PART_LIST(new_word_part_obj,\
svg_path_tree, namespaces, page, start_id=start_id, xmin=xmin, ymin=ymin)
return word_part_list
elif page is None or throw_error_if_not_found:
raise Exception('{} for text {} svg_x {}, svg_y {}'.format(PositionalWordPart.WARN_NO_USE_NODE_FOUND, text, svg_x, svg_y))
else:
warnings.warn('{} for text {} svg_x {}, svg_y {}'.format(PositionalWordPart.WARN_NO_USE_NODE_FOUND, text, svg_x, svg_y))
return PositionalWordPart.CREATE_SIMPLE_POSITIONAL_WORD_PART_LIST(page, [word_part_obj])
else:
return [ ]
@staticmethod
def CREATE_SIMPLE_POSITIONAL_WORD_PART_LIST(page, word_part_objs):
"""Creates a list of PositionalWordPart from word_part_objs (i.e. a list of dictionaries
with the keys: text, x, y, matrix, class).
[:return:] a list of (datatypes.positional_word_part) PositionalWordPart
"""
positional_word_parts = []
HEIGHT_FACTOR = 1.1 # factor that multiplies font_size -> height
FONTWIDTHFACTOR = 0.7 # factor that multiplies lastCharFontSize
SPACING = 0.2
for index, part_obj in enumerate(word_part_objs):
text = part_obj.get('text')
matrix = part_obj.get('matrix')
style_class = part_obj.get('class')
x = float(part_obj['x']) if bool(part_obj.get('x')) else 0.0
y = float(part_obj['y']) if bool(part_obj.get('y')) else 0.0
font_size = page.get_biggest_fontSize4styles(style_set=set(style_class.split(' ')))
height = round(font_size * HEIGHT_FACTOR + HEIGHT_FACTOR / font_size, 3)
width = round(font_size * FONTWIDTHFACTOR, 3)
if index+1 < len(word_part_objs) and bool(word_part_objs[index+1].get('x')):
width = float(word_part_objs[index+1]['x']) - x - SPACING
positional_word_parts.append(PositionalWordPart(id=index, text=text, height=height, width=width, x=x, y=y, matrix=matrix, style_class=style_class))
return positional_word_parts
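
A worked example of the fallback geometry in CREATE_SIMPLE_POSITIONAL_WORD_PART_LIST above, with the page font-size lookup replaced by a fixed value for illustration:

    HEIGHT_FACTOR, FONTWIDTHFACTOR, SPACING = 1.1, 0.7, 0.2  # constants from the method above
    font_size = 10.0  # stand-in for page.get_biggest_fontSize4styles(...)
    height = round(font_size * HEIGHT_FACTOR + HEIGHT_FACTOR / font_size, 3)
    width = round(font_size * FONTWIDTHFACTOR, 3)
    print(height, width)  # -> 11.11 7.0
    # if the next part starts at x=20.0 and this part at x=14.0, the width is
    # trimmed to the actual gap instead: 20.0 - 14.0 - SPACING == 5.8
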
Index: svgscripts/datatypes/simple_word.py
===================================================================
--- svgscripts/datatypes/simple_word.py (revision 102)
+++ svgscripts/datatypes/simple_word.py (revision 103)
@@ -1,127 +1,127 @@
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
""" This super class can be used to represent a simple word.
"""
# Copyright (C) University of Basel 2019 {{{1
#
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program. If not, see 1}}}
__author__ = "Christian Steiner"
__maintainer__ = __author__
__copyright__ = 'University of Basel'
__email__ = "christian.steiner@unibas.ch"
__status__ = "Development"
__license__ = "GPL v3"
__version__ = "0.0.1"
import abc
from lxml import etree as ET
import sys
from .line import Line
from .faksimile_position import FaksimilePosition
from .transkription_position import TranskriptionPosition
from .word_position import WordPosition
sys.path.append('py2ttl')
from class_spec import SemanticClass
class SimpleWord(SemanticClass, metaclass=abc.ABCMeta):
"""
This class represents a simple word.
"""
XML_TAG = 'simple-word'
XML_SUB_TAG = 'content'
def __init__(self, id=0, line_number=-1, line=None, text='', deleted=False, transkription_positions=None, faksimile_positions=None):
self.id = id
self.text = text
self.line_number = line_number
self.lines = []
if line is not None:
self.lines.append(line)
self.transkription_positions = transkription_positions if transkription_positions is not None else []
self.faksimile_positions = faksimile_positions if faksimile_positions is not None else []
def attach_word_to_tree(self, target_tree):
"""Attaches word to tree target_tree.
"""
if target_tree.__class__.__name__ == '_ElementTree':
target_tree = target_tree.getroot()
if len(target_tree.xpath('.//' + self.XML_TAG + '[@id="%s"]' % self.id)) > 0:
word_node = target_tree.xpath('.//' + self.XML_TAG + '[@id="%s"]' % self.id)[0]
word_node.getparent().remove(word_node)
word_node = ET.SubElement(target_tree, self.XML_TAG, attrib={'id': str(self.id)})
word_node.set('text', self.text)
if self.line_number > -1:
word_node.set('line-number', str(self.line_number))
for id, transkription_position in enumerate(self.transkription_positions):
transkription_position.id = id
transkription_position.attach_object_to_tree(word_node)
for faksimile_position in self.faksimile_positions:
faksimile_position.attach_object_to_tree(word_node)
return word_node
@classmethod
def create_cls(cls, word_node):
"""Creates a cls from a (lxml.Element) node.
[:return:] cls
"""
if word_node is not None: # init word from xml node
id = int(word_node.get('id'))
line_number = int(word_node.get('line-number')) if bool(word_node.get('line-number')) else -1
text = word_node.get('text')
transkription_positions = [ TranskriptionPosition(id=id, node=node) for id, node in enumerate(word_node.findall('./' + WordPosition.TRANSKRIPTION)) ]
faksimile_positions = [ WordPosition(node=node) for node in word_node.findall('./' + WordPosition.FAKSIMILE) ]
return cls(id=id, text=text, line_number=line_number, transkription_positions=transkription_positions,\
faksimile_positions=faksimile_positions)
else:
error_msg = 'word_node has not been defined'
raise Exception('Error: {}'.format(error_msg))
@classmethod
def get_semantic_dictionary(cls):
""" Creates and returns a semantic dictionary as specified by SemanticClass.
"""
dictionary = {}
class_dict = cls.get_class_dictionary()
properties = { 'lines': {cls.CLASS_KEY: Line,\
cls.CARDINALITY: 1,\
cls.CARDINALITY_RESTRICTION: 'minCardinality',\
cls.PROPERTY_NAME: 'wordBelongsToLine',\
cls.PROPERTY_LABEL: 'word belongs to a line',\
cls.PROPERTY_COMMENT: 'Relating a word to a line.'}}
properties.update(cls.create_semantic_property_dictionary('transkription_positions', TranskriptionPosition,\
name='hasTranskriptionPosition', cardinality=1, cardinality_restriction='minCardinality'))
properties.update(cls.create_semantic_property_dictionary('faksimile_positions', FaksimilePosition,\
- name='hasFaksimilePosition')) #, cardinality=1, cardinality_restriction='minCardinality'))
+ name='hasFaksimilePosition', cardinality=1, cardinality_restriction='minCardinality'))
properties.update(cls.create_semantic_property_dictionary('text', str, cardinality=1,\
subPropertyOf=cls.HOMOTYPIC_HAS_TEXT_URL_STRING))
dictionary.update({cls.CLASS_KEY: class_dict})
dictionary.update({cls.PROPERTIES_KEY: properties})
return cls.return_dictionary_after_updating_super_classes(dictionary)
def init_word(self, page):
"""Initialize word with objects from page.
"""
#for transkription_position in self.transkription_positions:
# transkription_position.svg_image = page.svg_image
#self.faksimile_positions = FaksimilePosition.create_list_of_cls(self.faksimile_positions, page.faksimile_image, page.text_field)
if self.line_number > -1:
self.lines += [ line for line in page.lines if line.id == self.line_number ]
elif 'word_parts' in self.__dict__.keys() and len(self.word_parts) > 0:
self.lines += [ line for line in page.lines if line.id in [ wp.line_number for wp in self.word_parts ] ]
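
A self-contained sketch of the xml layout that attach_word_to_tree produces, using lxml directly; the tag and attribute names come from the class above, and transkription/faksimile position children are omitted for brevity:

    from lxml import etree as ET

    tree = ET.ElementTree(ET.Element('page'))
    word_node = ET.SubElement(tree.getroot(), 'simple-word', attrib={'id': '0'})
    word_node.set('text', 'Nietzsche')
    word_node.set('line-number', '2')
    print(ET.tostring(tree.getroot(), pretty_print=True).decode())
    # <page>
    #   <simple-word id="0" text="Nietzsche" line-number="2"/>
    # </page>
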
Index: svgscripts/util.py
===================================================================
--- svgscripts/util.py (revision 102)
+++ svgscripts/util.py (revision 103)
@@ -1,522 +1,525 @@
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
""" This program can be used to copy a faksimile svg file with the option of highlighting some word boxes.
"""
# Copyright (C) University of Basel 2019 {{{1
#
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program. If not, see 1}}}
from colorama import Fore, Style
from datetime import datetime
from functools import cmp_to_key
import getopt
import inspect
import itertools
import lxml.etree as ET
import re
import shutil
import signal
import string
import subprocess
from svgpathtools import svg_to_paths
import sys
import tempfile
import os
from os import listdir, sep, path, setpgrp, devnull, makedirs
from os.path import basename, commonpath, dirname, exists, isfile, isdir, realpath, splitext
import warnings
import wget
import xml.etree.ElementTree as XET
if dirname(__file__) not in sys.path:
sys.path.append(dirname(__file__))
from datatypes.faksimile import FaksimilePage, get_paths_inside_rect
from datatypes.faksimile_image import FaksimileImage
from datatypes.lineNumber import LineNumber
from datatypes.mark_foreign_hands import MarkForeignHands
+from datatypes.matrix import Matrix
from datatypes.page import Page
from datatypes.page_creator import PageCreator
from datatypes.transkriptionField import TranskriptionField
from datatypes.transkription_position import TranskriptionPosition
from datatypes.word import Word, update_transkription_position_ids
from local_config import FAKSIMILE_LOCATION, PDF_READER, SVG_EDITOR, USER_ROOT_LOCATION_DICT
sys.path.append('shared_util')
from myxmlwriter import write_pretty, FILE_TYPE_SVG_WORD_POSITION, FILE_TYPE_XML_MANUSCRIPT
__author__ = "Christian Steiner"
__maintainer__ = __author__
__copyright__ = 'University of Basel'
__email__ = "christian.steiner@unibas.ch"
__status__ = "Development"
__license__ = "GPL v3"
__version__ = "0.0.1"
UNITTESTING = False
HIGHLIGHT_COLOR = 'red'
OPACITY = '0.5'
class ExternalViewer:
"""This class can be used to show files with external viewers.
"""
file_format_viewer_dict = { '.pdf': PDF_READER, '.svg': SVG_EDITOR }
@classmethod
    def show_files(cls, single_file=None, list_of_files=None):
        """Opens file(s) with corresponding external viewer(s).
        """
        DEVNULL = None
        if list_of_files is None: # avoid sharing a mutable default list between calls
            list_of_files = []
        if type(single_file) == list:
            list_of_files = single_file
        elif single_file is not None:
            list_of_files.append(single_file)
if len(list_of_files) > 1:
DEVNULL = open(devnull, 'wb')
process_list = []
list_of_files.reverse()
while len(list_of_files) > 0:
file2open = list_of_files.pop()
viewer = cls.file_format_viewer_dict.get(splitext(file2open)[1])
if viewer is not None:
if len(list_of_files) > 0:
process_list.append(\
subprocess.Popen([viewer, file2open], stdout=DEVNULL, stderr=DEVNULL, preexec_fn=os.setsid))
else:
subprocess.run([viewer, file2open])
for process in process_list:
os.killpg(os.getpgid(process.pid), signal.SIGTERM)
if DEVNULL is not None:
DEVNULL.close()
def back_up(page: Page, reference_file, bak_dir='./bak') -> str:
"""Back up a xml_source_file.
:return: target_file_name
"""
date_string = datetime.now().strftime('%Y-%m-%d_%H:%M:%S')
makedirs(bak_dir, exist_ok=True)
page.bak_file = bak_dir + sep + basename(page.page_tree.docinfo.URL) + '_' + date_string
write_pretty(xml_element_tree=page.page_tree, file_name=page.bak_file,\
script_name=__file__ + '({0},{1})'.format(inspect.currentframe().f_code.co_name, reference_file),\
file_type=FILE_TYPE_SVG_WORD_POSITION)
return page.bak_file
def back_up_svg_file(svg_tree: ET.ElementTree, namespaces=None, bak_dir='./bak') -> str:
"""Back up a xml_source_file.
:return: target_file_name
"""
if namespaces is None:
namespaces = { k if k is not None else 'ns': v for k, v in svg_tree.getroot().nsmap.items() }
date_string = datetime.now().strftime('%Y-%m-%d_%H:%M:%S')
makedirs(bak_dir, exist_ok=True)
bak_file = bak_dir + sep + date_string + '_' + basename(svg_tree.docinfo.URL)
copy_faksimile_svg_file(target_file=bak_file, faksimile_tree=svg_tree, namespaces=namespaces)
return bak_file
def copy_faksimile_svg_file(target_file=None, faksimile_source_file=None, faksimile_tree=None, target_directory=None, abs_image_path=None, local_image_path=None, namespaces=None):
"""Copy a faksimile_svg_file to target_file.
"""
if faksimile_source_file is None and faksimile_tree is not None:
faksimile_source_file = faksimile_tree.docinfo.URL
elif faksimile_source_file is None:
raise Exception('copy_faksimile_svg_file needs either a faksimile_tree (lxml.etree.ElementTree) or a faksimile_source_file')
if target_file is not None and target_directory is not None:
target_file = target_directory + sep + target_file
elif target_file is None and target_directory is not None:
target_file = target_directory + sep + basename(faksimile_source_file)
elif target_file is None:
raise Exception('copy_faksimile_svg_file needs either a target_file or a target_directory')
paths, attributes, svg_attributes = svg_to_paths.svg2paths(faksimile_source_file, return_svg_attributes=True)
for key in [ key for key in svg_attributes.keys() if key.startswith('xmlns:') ]:
try:
XET.register_namespace(key.replace('xmlns:', ''), svg_attributes[key])
except ValueError: pass
XET.register_namespace('', 'http://www.w3.org/2000/svg')
if namespaces is None:
namespaces = { 'ns': svg_attributes['xmlns'], 'xlink': svg_attributes['xmlns:xlink'],\
'sodipodi': svg_attributes['xmlns:sodipodi'] }
if faksimile_tree is not None:
element = XET.fromstring(ET.tostring(faksimile_tree))\
if type(faksimile_tree) == ET._ElementTree\
else XET.fromstring(XET.tostring(faksimile_tree.getroot()))
target_tree = XET.ElementTree(element)
else:
target_tree = XET.parse(faksimile_source_file)
if (local_image_path is not None or abs_image_path is not None)\
and len(target_tree.findall('.//ns:image', namespaces=namespaces)) > 0:
image_node = target_tree.findall('.//ns:image', namespaces=namespaces)[0]
if local_image_path is not None:
image_node.set('{%s}href' % namespaces['xlink'], local_image_path)
if abs_image_path is not None:
image_node.set('{%s}absref' % namespaces['sodipodi'], abs_image_path)
target_tree.write(target_file)
def copy_faksimile_update_image_location(faksimile_source_file=None, faksimile_tree=None, target_file=None, target_directory=None, overwrite=False):
"""Copy a faksimile_svg_file to target_file and update image location.
"""
if faksimile_source_file is None and faksimile_tree is not None:
faksimile_source_file = faksimile_tree.docinfo.URL
elif faksimile_source_file is None:
raise Exception('copy_faksimile_svg_file needs either a faksimile_tree (lxml.etree.ElementTree) or a faksimile_source_file')
if target_file is not None and target_directory is not None:
target_file = target_directory + sep + target_file
elif target_file is None and target_directory is not None:
target_file = target_directory + sep + basename(faksimile_source_file)
elif target_directory is None and target_file is not None:
target_directory = dirname(target_file)
elif target_file is None:
raise Exception('copy_faksimile_svg_file needs either a target_file or a target_directory')
source_tree = ET.parse(faksimile_source_file) if faksimile_tree is None else faksimile_tree
namespaces = { k if k is not None else 'ns': v for k, v in source_tree.getroot().nsmap.items() }
image_nodes = source_tree.xpath('//ns:image', namespaces=namespaces)
local_image_path = None
abs_image_path = None
user_abs_image_path = None
if len(image_nodes) > 0:
image = FaksimileImage.CREATE_IMAGE(image_nodes[0], source_file=faksimile_source_file)
abs_image_path = image.local_path
for user_name in USER_ROOT_LOCATION_DICT.keys():
if user_name in target_directory:
user_abs_image_path = abs_image_path.replace(FAKSIMILE_LOCATION, USER_ROOT_LOCATION_DICT[user_name]).replace('//','/')
break
# if target_directory is subdir of FAKSIMILE_LOCATION
if realpath(target_directory).startswith(realpath(FAKSIMILE_LOCATION)):
common_path = commonpath([ realpath(target_directory), realpath(dirname(image.local_path)) ])
relative_directory = '/'.join(\
[ '..' for d in realpath(target_directory).replace(common_path + '/', '').split('/') ])
local_image_path = relative_directory + realpath(image.local_path).replace(common_path, '')
if not isfile(target_directory + sep + local_image_path):
local_image_path = None
elif abs_image_path is not None:
local_image_path = abs_image_path
if abs_image_path is not None and not isfile(abs_image_path):
wget.download(image.URL, out=dirname(abs_image_path))
if not isfile(target_file) or overwrite:
abs_image_path = user_abs_image_path if user_abs_image_path is not None else abs_image_path
copy_faksimile_svg_file(target_file=target_file, faksimile_source_file=faksimile_source_file,\
faksimile_tree=faksimile_tree, abs_image_path=abs_image_path,\
local_image_path=local_image_path, namespaces=namespaces)
else:
msg = 'File {0} not copied to directory {1}, it already contains a file {2}.'.format(faksimile_source_file, target_directory, target_file)
warnings.warn(msg)
def copy_xml_file_word_pos_only(xml_source_file, target_directory):
"""Copy word positions of a xml file to target directory.
:return: (str) xml_target_file
"""
xml_target_file = target_directory + sep + basename(xml_source_file)
source_page = Page(xml_source_file)
target_page = PageCreator(xml_target_file, title=source_page.title, page_number=source_page.number, orientation=source_page.orientation)
target_page.words = source_page.words
target_page.update_and_attach_words2tree()
write_pretty(xml_element_tree=target_page.page_tree, file_name=xml_target_file,\
script_name=__file__ + '({})'.format(inspect.currentframe().f_code.co_name), file_type=FILE_TYPE_SVG_WORD_POSITION)
return xml_target_file
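# Usage sketch (mirrors tests_svgscripts/test_util.py): the copy contains the words but no line numbers:
#     >>> xml_target_file = copy_xml_file_word_pos_only('xml/N_VII_1_page005.xml', '/tmp')
#     >>> len(Page(xml_target_file).line_numbers)
#     0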
def create_highlighted_svg_file(faksimile_tree, node_ids, nodes_color_dict=None, target_file=None, target_directory=None, local_image_path=None, namespaces=None, highlight_color=HIGHLIGHT_COLOR, opacity=OPACITY):
"""Highlights the nodes of a faksimile_tree that are specified by the list of node_ids and writes the tree to a file.
"""
if namespaces is None:
namespaces = { k if k is not None else 'ns': v for k, v in faksimile_tree.getroot().nsmap.items() }
for node in itertools.chain(*[\
faksimile_tree.xpath('//ns:rect[@id="{0}"]|//ns:path[@id="{0}"]'.format(node_id), namespaces=namespaces)\
for node_id in node_ids\
]):
node.set('fill', highlight_color)
node.set('opacity', opacity)
node.set('style', '')
copy_faksimile_update_image_location(target_file=target_file, faksimile_tree=faksimile_tree, target_directory=target_directory)
def get_empty_node_ids(faksimile_tree, x_min=0.0, x_max=0.0, y_min=0.0, y_max=0.0, text_field_id=None, faksimile_page=None, namespaces={}):
"""Returns a list of ids of rect and path nodes that do not have a title element.
"""
THRESHOLD_X = 10
if faksimile_page is not None:
x_min = faksimile_page.text_field.xmin + faksimile_page.faksimile_image.x
x_max = faksimile_page.text_field.xmax + faksimile_page.faksimile_image.x - THRESHOLD_X
y_min = faksimile_page.text_field.ymin + faksimile_page.faksimile_image.y
y_max = faksimile_page.text_field.ymax + faksimile_page.faksimile_image.y
text_field_id = faksimile_page.text_field.id
if len(namespaces) == 0:
namespaces = { k if k is not None else 'ns': v for k, v in faksimile_tree.getroot().nsmap.items() }
    empty_node_ids = []
nodes_without_title = faksimile_tree.xpath('//ns:rect[@x>"{0}" and @x<"{1}" and @y>"{2}" and @y<"{3}" and @id!="{4}" and not(./ns:title)]'.format(\
x_min, x_max, y_min, y_max, text_field_id), namespaces=namespaces)
nodes_without_title += get_paths_inside_rect(faksimile_tree, '//ns:path[not(./ns:title)]', x_min, x_max, y_min, y_max, text_field_id, namespaces=namespaces)
    for node_without_title in nodes_without_title:
        empty_node_ids.append(node_without_title.get('id'))
    return empty_node_ids
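# Usage sketch (mirrors tests_svgscripts/test_util.py; FaksimilePage is defined in datatypes.faksimile):
#     >>> faksimile_tree = ET.parse('faksimile_svg/N-VII-1,5et6.svg')
#     >>> faksimile_page = FaksimilePage.GET_FAKSIMILEPAGES(faksimile_tree)[0]
#     >>> 'rect1085' in get_empty_node_ids(faksimile_tree, faksimile_page=faksimile_page)
#     True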
def get_mismatching_ids(words, faksimile_positions):
""" Return the list of mismatching words and the list of mismatching faksimile_positions
as a 2-tuple.
"""
mismatching_words = []
mismatching_faksimile_positions = []
faksimile_positions, unique_faksimile_words = replace_chars(words, faksimile_positions)
word_texts = [ word.text for word in words if word.text != '.' ]
for word_text in set(word_texts):
if word_text not in unique_faksimile_words:
mismatching_words += [ word for word in words if word.text == word_text ]
for faksimile_position_text in unique_faksimile_words:
if faksimile_position_text not in set(word_texts):
mismatching_faksimile_positions += [ faksimile_position for faksimile_position in faksimile_positions\
if faksimile_position.text == faksimile_position_text ]
return mismatching_words, mismatching_faksimile_positions
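# Usage sketch (illustrative): after replace_chars has normalized the texts, the words and
# faksimile positions that still have no counterpart on the other side are returned:
#     >>> mismatching_words, mismatching_fps = get_mismatching_ids(page.words, faksimile_page.word_positions)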
def process_warnings4status(warnings, warning_messages, current_status, ok_status, status_prefix='') -> str:
"""Process potential warnings and return actual status.
"""
    if warnings is not None and len(warnings) > 0:
        status = status_prefix
        for warning_message in warning_messages:
            if any(str(warn.message).startswith(warning_message) for warn in warnings):
                status += f':{warning_message}:'
        if status != status_prefix:
            return status
    return f'{current_status}:{ok_status}:'
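# Usage sketch (mirrors tests_svgscripts/test_util.py):
#     >>> with warnings.catch_warnings(record=True) as w:
#     ...     warnings.simplefilter('default')
#     ...     warnings.warn('Test1: asdf')
#     ...     status = process_warnings4status(w, ['Test1'], 'asdf', 'OK', status_prefix='with warnings')
#     >>> 'Test1' in status.split(':')
#     True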
def record_changes(original_svg_file, changed_svg_file, node_ids, namespaces={}):
"""Copy changes made to changed_svg_file to original_svg_file.
"""
old_tree = ET.parse(original_svg_file)
new_tree = ET.parse(changed_svg_file)
if len(namespaces) == 0:
namespaces = { k if k is not None else 'ns': v for k, v in new_tree.getroot().nsmap.items() }
for node_id in node_ids:
new_titles = new_tree.xpath('//ns:rect[@id="{0}"]/ns:title|//ns:path[@id="{0}"]/ns:title'.format(node_id), namespaces=namespaces)
old_nodes = old_tree.xpath('//ns:rect[@id="{0}"]|//ns:path[@id="{0}"]'.format(node_id), namespaces=namespaces)
if len(new_titles) > 0 and len(old_nodes) > 0:
if old_nodes[0].find('ns:title', namespaces=namespaces) is not None:
old_nodes[0].find('ns:title', namespaces=namespaces).text = new_titles[0].text
else:
old_title_id_string = new_titles[0].get('id')
old_title = ET.SubElement(old_nodes[0], 'title', attrib={ 'id': old_title_id_string })
old_title.text = new_titles[0].text
elif len(old_nodes) > 0:
for old_node in old_nodes:
old_node.getparent().remove(old_node)
copy_faksimile_svg_file(target_file=original_svg_file, faksimile_tree=old_tree)
def record_changes_on_svg_file_to_page(xml_source_file, svg_file, word_ids=None):
"""Copy changes made to svg_file to xml_source_file.
:return: datatypes.page.Page
"""
svg_tree = ET.parse(svg_file)
namespaces = { k if k is not None else 'ns': v for k, v in svg_tree.getroot().nsmap.items() }
transkription_field = TranskriptionField(svg_file)
page = Page(xml_source_file)
words = [ word for word in page.words if word.id in word_ids ]\
if word_ids is not None else page.words
new_page_words = []
for word in words:
word_id = 'word_' + str(word.id) + '_'
recorded_ids = []
for transkription_position in word.transkription_positions:
transkription_position_id = word_id + str(transkription_position.id)
tp_nodes = svg_tree.xpath('//ns:g[@id="Transkription"]/ns:rect[@id="{0}"]'.format(transkription_position_id), namespaces=namespaces)
if len(tp_nodes) > 0:
record_changes_to_transkription_position(tp_nodes[0], transkription_position,\
transkription_field.xmin, transkription_field.ymin, namespaces=namespaces)
recorded_ids.append(transkription_position_id)
extra_nodes = [ node for node in\
svg_tree.xpath('//ns:g[@id="Transkription"]/ns:rect[contains(@id, "{0}")]'.format(word_id), namespaces=namespaces)\
if node.get('id') not in recorded_ids ]
if len(extra_nodes) > 0:
for extra_node in extra_nodes:
old_ids = [ inkscape_id.replace('#','') for inkscape_id in\
svg_tree.xpath('//ns:g[@id="Transkription"]/ns:rect[@id="{0}"]/@inkscape:label'.format(extra_node.get('id')),\
namespaces=namespaces) ]
if len(old_ids) > 0 and re.match(r'word_[0-9]+_[0-9]+', old_ids[0]):
old_id_list = old_ids[0].split('_')
ref_word_id = int(old_id_list[1])
ref_tp_id = old_id_list[2]
ref_words = [ word for word in page.words if word.id == ref_word_id ]
if len(ref_words) > 0:
ref_tps = [ tp for tp in ref_words[0].transkription_positions\
if tp.id == ref_tp_id ]
if len(ref_tps) > 0:
ref_words[0].transkription_positions.remove(ref_tps[0])
record_changes_to_transkription_position(extra_node,\
ref_tps[0], transkription_field.xmin, transkription_field.ymin, namespaces=namespaces)
word.transkription_positions.append(ref_tps[0])
for word in page.words:
if word.has_mixed_status('text'):
new_page_words += [ word for word in word.split_according_to_status('text') if word.text is not None and word.text != '' ]
elif len(word.transkription_positions) > 0:
new_text = [ tp.text for tp in word.transkription_positions if tp.text is not None and tp.text != '' ]
if len(new_text) > 0:
word.text = new_text[0]
new_page_words.append(word)
page.words = new_page_words
page.update_and_attach_words2tree(update_function_on_word=update_transkription_position_ids)
page.unlock()
if not UNITTESTING:
write_pretty(xml_element_tree=page.page_tree, file_name=xml_source_file,\
script_name=__file__ + ' -> ' + inspect.currentframe().f_code.co_name, file_type=FILE_TYPE_SVG_WORD_POSITION)
return page
def record_changes_on_xml_file_to_page(xml_source_file, xml_file) -> Page:
"""Copy changes made to xml_file to xml_source_file.
:return: datatypes.page.Page
"""
copy_page = Page(xml_file)
page = Page(xml_source_file)
page.unlock()
back_up(page, xml_file)
page.words = []
for word in copy_page.words:
if word.split_strings is None\
or len(word.split_strings) == 0:
page.words.append(word)
else:
next_word = word
for split_string in word.split_strings:
_, new_word, next_word = next_word.split(split_string)
page.words.append(new_word)
if next_word is not None:
page.words.append(next_word)
page.update_and_attach_words2tree(update_function_on_word=update_transkription_position_ids)
remove_words_if_done = []
for word in page.words:
if 'join_string' in word.__dict__.keys()\
and word.join_string is not None:
if word.id > 0\
and page.words[word.id-1].text + word.text == word.join_string:
page.words[word.id-1].join(word)
remove_words_if_done.append(word)
            elif word.id < len(page.words)-1\
and word.text + page.words[word.id+1].text == word.join_string:
word.join(page.words[word.id+1])
remove_words_if_done.append(page.words[word.id+1])
for word in remove_words_if_done:
page.words.remove(word)
page.update_and_attach_words2tree(update_function_on_word=update_transkription_position_ids)
if not UNITTESTING:
write_pretty(xml_element_tree=page.page_tree, file_name=xml_source_file,\
script_name=__file__ + '({0},{1})'.format(inspect.currentframe().f_code.co_name, xml_file), file_type=FILE_TYPE_SVG_WORD_POSITION)
return page
def record_changes_to_transkription_position(node, transkription_position, xmin=0.0, ymin=0.0, namespaces=None):
"""Record changes made to node to transkription_position.
"""
if namespaces is None:
namespaces = { k if k is not None else 'ns': v for k, v in node.nsmap.items() }
if bool(node.get('x')):
transkription_position.left = float(node.get('x')) - xmin
if bool(node.get('y')):
transkription_position.top = float(node.get('y')) - ymin
if bool(node.get('width')):
transkription_position.width = float(node.get('width'))
if bool(node.get('height')):
transkription_position.height = float(node.get('height'))
if len(node.xpath('./ns:title/text()', namespaces=namespaces)) > 0:
transkription_position.text = node.xpath('./ns:title/text()', namespaces=namespaces)[0]
def replace_chars(words, faksimile_positions, unique_faksimile_words=None):
"""Return unique_faksimile_words and faksimile_positions, with characters changed according to transcription words.
"""
if unique_faksimile_words is None:
unique_faksimile_words = sorted(set(faksimile_position.text for faksimile_position in faksimile_positions),\
key=lambda text: len(text))
for index, word_text in enumerate(unique_faksimile_words):
if len([ word for word in words if word.text == word_text ]) == 0:
if re.match(r'.*".*', word_text)\
and len([ word for word in words if word.text == word_text.replace('"', '“') ]) > 0:
unique_faksimile_words[index] = word_text.replace('"', '“')
elif re.match(r'.*ss.*', word_text)\
and len([ word for word in words if word.text == word_text.replace('ss', 'ß') ]) > 0:
unique_faksimile_words[index] = word_text.replace('ss', 'ß')
elif re.match(r'.*-.*', word_text)\
and len([ word for word in words if word.text == word_text.replace('-', '–') ]) > 0:
unique_faksimile_words[index] = word_text.replace('-', '–')
for faksimile_position in [ faksimile_position for faksimile_position in faksimile_positions\
if faksimile_position.text == word_text ]:
faksimile_position.text = unique_faksimile_words[index]
elif word_text == '-'\
and len([ word for word in words if word.text == '–' ]) > 0:
print([ word.text for word in words if word.text == word_text ])
print([ word.text for word in words if word.text == '–' ])
return faksimile_positions, unique_faksimile_words
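# Usage sketch (mirrors tests_svgscripts/test_util.py): straight quotes are replaced by
# typographic ones when the transcription uses them:
#     >>> word_position = WordPosition(id='rect1159', text='„Gedächtniß"')
#     >>> wps, texts = replace_chars(page.words, [ word_position ])
#     >>> texts[0].endswith('“')
#     True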
-def reset_tp_with_matrix(page, transkription_positions, new_left=0, new_top=-5):
- """Set left = 0, top = -5 for each transkription_position with transform matrix.
+def reset_tp_with_matrix(transkription_positions, new_left=0, new_top=-5, tr_xmin=0.0, tr_ymin=0.0):
+ """Fix transkription_positions that have a transform matrix: shift the matrix by (tr_xmin, tr_ymin) and adjust left/top/bottom accordingly.
"""
- if len(transkription_positions) > 0\
- and (page.svg_image is None\
- or page.svg_image.text_field is None):
+ if len(transkription_positions) > 0:
for tp in transkription_positions:
if tp.transform is not None\
- and tp.transform.isRotationMatrix()\
- and tp.left > 10 and tp.top > 10:
- tp.left = new_left
- tp.top = new_top
+ and tp.transform.isRotationMatrix():
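+ # keep the absolute placement in the transform matrix: shift it by (tr_xmin, tr_ymin)
+ # and express left/bottom as small offsets relative to the shifted matrix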
+ tp.transform.matrix[Matrix.XINDEX] = round(tp.transform.matrix[Matrix.XINDEX] + tr_xmin, 3)
+ tp.left = round(tp.left, 3) - tp.transform.matrix[Matrix.XINDEX]\
+ if abs(round(tp.left, 3) - tp.transform.matrix[Matrix.XINDEX]) > 1\
+ else 0
+ tp.bottom = round(tp.bottom, 3) - tp.transform.matrix[Matrix.YINDEX]
+ tp.transform.matrix[Matrix.YINDEX] = round(tp.transform.matrix[Matrix.YINDEX] + tr_ymin, 3)
+ tp.top = tp.bottom - tp.height + 2
def update_svgposfile_status(file_name, manuscript_file=None, status='changed', append=True):
"""Updates svg position file's status. Changes its status to status if it does not contain 'OK',
else it appends new status to old status.
"""
if isfile(file_name):
parser = ET.XMLParser(remove_blank_text=True)
file_tree = ET.parse(file_name, parser)
old_status = file_tree.getroot().get('status')
if old_status is None or 'OK' not in old_status.split(':'):
file_tree.getroot().set('status', status)
        elif append and status not in old_status.split(':'):
            file_tree.getroot().set('status', old_status + ':' + status)
write_pretty(xml_element_tree=file_tree, file_name=file_name, script_name=__file__, file_type=FILE_TYPE_SVG_WORD_POSITION)
if manuscript_file is not None and isfile(manuscript_file):
page_number = file_tree.getroot().get('number')
update_manuscript_file(manuscript_file, page_number, file_name, status=status)
def update_manuscript_file(manuscript_file, page_number, file_name, status='changed', append=True):
"""Updates manuscript file: adds status information about page.
"""
if isfile(manuscript_file):
parser = ET.XMLParser(remove_blank_text=True)
manuscript_tree = ET.parse(manuscript_file, parser)
if len(manuscript_tree.getroot().xpath('//page[@number="%s"]' % page_number)) > 0:
node = manuscript_tree.getroot().xpath('//page[@number="%s"]' % page_number)[0]
old_status = node.get('status')
if old_status is None or 'OK' not in old_status.split(':'):
node.set('status', status)
            elif append and status not in old_status.split(':'):
                node.set('status', old_status + ':' + status)
if not bool(node.get('output')):
node.set('output', file_name)
else:
pages_node = manuscript_tree.getroot().find('pages')\
if manuscript_tree.getroot().find('pages') is not None\
else ET.SubElement(manuscript_tree.getroot(), 'pages')
new_id = len(pages_node.findall('page')) + 1
ET.SubElement(pages_node, 'page', attrib={'id': str(new_id), 'number': str(page_number), 'status': status, 'output': file_name})
write_pretty(xml_element_tree=manuscript_tree, file_name=manuscript_file, script_name=__file__, file_type=FILE_TYPE_XML_MANUSCRIPT)
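# The manuscript file then contains page entries of the form (illustrative):
#     <page id="5" number="5" status="OK:changed" output="xml/N_VII_1_page005.xml"/>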
Index: svgscripts/convert_wordPositions.py
===================================================================
--- svgscripts/convert_wordPositions.py (revision 102)
+++ svgscripts/convert_wordPositions.py (revision 103)
@@ -1,695 +1,724 @@
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
""" This program can be used to convert the word positions to HTML for testing purposes.
"""
# Copyright (C) University of Basel 2019 {{{1
#
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program.  If not, see <http://www.gnu.org/licenses/> 1}}}
import cairosvg
import getopt
import json
from lxml.html import builder as E
from lxml.html import open_in_browser
import lxml
from pathlib import Path as PathLibPath
from os import sep, listdir, mkdir, path, remove
from os.path import exists, isfile, isdir, dirname
import re
import sys
from svgpathtools import svg_to_paths
import xml.etree.ElementTree as ET
if dirname(__file__) not in sys.path:
sys.path.append(dirname(__file__))
from datatypes.matrix import Matrix
from datatypes.page import Page
from datatypes.page_creator import PageCreator
from datatypes.transkriptionField import TranskriptionField
from datatypes.text_field import TextField
from datatypes.writing_process import WritingProcess
from datatypes.word import Word
__author__ = "Christian Steiner"
__maintainer__ = __author__
__copyright__ = 'University of Basel'
__email__ = "christian.steiner@unibas.ch"
__status__ = "Development"
__license__ = "GPL v3"
__version__ = "0.0.1"
EXIST_DB = 'http://130.60.24.65:8081/exist/rest/db/ProjectData/Nietzsche/'
+LOCAL_SERVER = 'http://localhost:8000/'
class Converter:
"""The converter super class.
"""
def __init__(self, page, non_testing=True, show_word_insertion_mark=False):
self.page = page
self.non_testing = non_testing
self.show_word_insertion_mark = show_word_insertion_mark
def _get_transkription_positions(self, transkription_positions, stage_version=''):
"""Returns the transkription_positions of the indicated stage_version.
"""
convertable_transkription_positions = transkription_positions
if stage_version != '':
convertable_transkription_positions = []
if re.match(r'^\d$', stage_version):
writing_process_id = int(stage_version)
for transkription_position in transkription_positions:
if transkription_position.writing_process_id == writing_process_id:
convertable_transkription_positions.append(transkription_position)
elif re.match(r'^\d\+$', stage_version):
version_range = [ *range(int(stage_version.replace('+','')), len(WritingProcess.VERSION_DESCRIPTION)) ]
for transkription_position in transkription_positions:
if transkription_position.writing_process_id in version_range:
convertable_transkription_positions.append(transkription_position)
elif re.match(r'^\d\-\d$', stage_version):
start_stop = [ int(i) for i in re.split(r'-', stage_version) ]
version_range = [ *range(start_stop[0], start_stop[1]+1) ]
for transkription_position in transkription_positions:
if transkription_position.writing_process_id in version_range:
convertable_transkription_positions.append(transkription_position)
return convertable_transkription_positions
def _get_words(self, words, highlighted_words=None):
"""Return the words that will be hightlighted.
"""
return highlighted_words if highlighted_words is not None else words
def convert(self, output_file=None, stage_version='', highlighted_words=None):
"""Prints all words.
"""
first_word_of_line = None
out = sys.stdout
if output_file is not None:
out = open(output_file, 'w')
for word in self.page.words:
if first_word_of_line is None or first_word_of_line.line_number != word.line_number:
out.write('\n')
first_word_of_line = word
if word.line_number % 2 == 0:
out.write(str(word.line_number).zfill(2) + ' ')
else:
out.write(' ')
if stage_version == '' or len(self._get_transkription_positions(word.transkription_positions, stage_version=stage_version)) > 0:
if word.text is not None:
out.write(word.text + ' ')
        if output_file is not None:
            out.close()
        return 0
@classmethod
def CREATE_CONVERTER(cls, page, non_testing=True, converter_type='', show_word_insertion_mark=False, key=''):
"""Returns a converter of type converter_type.
        :return: SVGConverter for 'SVG', HTMLConverter for 'HTML', Converter otherwise
"""
cls_dict = { subclass.__name__: subclass for subclass in cls.__subclasses__() }
cls_key = converter_type + 'Converter'
if bool(cls_dict.get(cls_key)):
converter_cls = cls_dict[cls_key]
if converter_cls == JSONConverter:
return converter_cls(page, non_testing, key=key)
return converter_cls(page, non_testing, show_word_insertion_mark)
else:
return Converter(page, non_testing, show_word_insertion_mark)
class JSONConverter(Converter):
"""This class can be used to convert a 'svgWordPositions' xml file to a json file.
"""
def __init__(self, page, non_testing=True, key=''):
Converter.__init__(self, page, non_testing, False)
- def _add_word_to_list(self, words, word, text, text_field=None, edited_text=None, earlier_version=None, overwrites_word=None, parent_id=-1):
+ def _add_word_to_list(self, words, word, text, text_field=None, edited_text=None, earlier_version=None, overwrites_word=None, parent_id=-1, faksimile_positions=None):
"""Add word to list.
"""
id = word.id\
if parent_id == -1\
else parent_id
edited_text = word.edited_text\
if edited_text is None\
else edited_text
earlier_version = word.earlier_version\
if earlier_version is None\
else earlier_version
overwrites_word = word.overwrites_word\
if overwrites_word is None\
else overwrites_word
line_number = word.line_number
for tp in word.transkription_positions:
tp_id = f'w{word.id}:tp{tp.id}'\
if parent_id == -1\
else f'w{parent_id}:w{word.id}:tp{tp.id}'
if text_field is not None:
word_dict = { 'id': id, 'text': text, 'left': tp.left + text_field.left, 'top': tp.top + text_field.top,\
'width': tp.width, 'height': tp.height, 'line': line_number, 'tp_id': tp_id, 'deleted': word.deleted }
if tp.transform is not None:
matrix = tp.transform.clone_transformation_matrix()
xmin = text_field.left
ymin = text_field.top
matrix.matrix[Matrix.XINDEX] = round(tp.transform.matrix[Matrix.XINDEX] + xmin, 3)
matrix.matrix[Matrix.YINDEX] = round(tp.transform.matrix[Matrix.YINDEX] + ymin, 3)
word_dict.update({ 'transform': matrix.toString() })
if tp.left > 0:
word_dict.update({ 'left': round(tp.left - tp.transform.matrix[Matrix.XINDEX], 3)})
else:
word_dict.update({ 'left': 0})
word_dict.update({ 'top': round((tp.height-1.5)*-1, 3)})
else:
word_dict = { 'id': id, 'text': text, 'left': tp.left, 'top': tp.top, 'width': tp.width,\
'height': tp.height, 'line': line_number, 'tp_id': tp_id, 'deleted': word.deleted }
if tp.transform is not None:
word_dict.update({ 'transform': tp.transform.toString() })
if edited_text is not None:
word_dict.update({'edited_text': edited_text})
if earlier_version is not None:
word_dict.update({'earlier_version': earlier_version.text })
if overwrites_word is not None:
word_dict.update({'overwrites_word': overwrites_word.text })
if parent_id > -1:
word_dict.update({'part_text': word.text })
words.append(word_dict)
+ if faksimile_positions is not None:
+ faksimile_dict = {}
+ for fp in word.faksimile_positions:
+ faksimile_dict = { 'id': id, 'text': text, 'left': fp.left, 'top': fp.top,\
+ 'width': fp.width, 'height': fp.height, 'line': line_number, 'fp_id': fp.id, 'deleted': word.deleted }
+ if fp.transform is not None:
+ faksimile_dict.update({ 'transform': fp.transform.toString() })
+ if len(faksimile_dict) > 0:
+ if edited_text is not None:
+ faksimile_dict.update({'edited_text': edited_text})
+ if earlier_version is not None:
+ faksimile_dict.update({'earlier_version': earlier_version.text })
+ if overwrites_word is not None:
+ faksimile_dict.update({'overwrites_word': overwrites_word.text })
+ if parent_id > -1:
+ faksimile_dict.update({'part_text': word.text })
+ faksimile_positions.append(faksimile_dict)
for wp in word.word_parts:
self._add_word_to_list(words, wp, text, text_field=text_field, edited_text=edited_text,\
- earlier_version=earlier_version, overwrites_word=overwrites_word, parent_id=word.id)
+ earlier_version=earlier_version, overwrites_word=overwrites_word, parent_id=word.id, faksimile_positions=faksimile_positions)
    def create_json_dict(self) -> dict:
        """Create and return a json dictionary with the keys 'title', 'number', 'words',
        'svg', 'lines', 'faksimile' and 'faksimile_positions'.
        """
words = []
+ faksimile_positions = []
text_field = None
if self.page.svg_image is not None:
if self.page.svg_image.text_field is None:
text_field = self.page.svg_image.text_field = TranskriptionField(self.page.svg_image.file_name).convert_to_text_field()
self.page.svg_image.decontextualize_file_name(update_url=EXIST_DB)
for word in self.page.words:
- self._add_word_to_list(words, word, word.text, text_field=text_field)
+ self._add_word_to_list(words, word, word.text, text_field=text_field, faksimile_positions=faksimile_positions)
lines = []
offset = 0 if text_field is None else text_field.ymin
+ svg_image = self.add_object2dict(self.page.svg_image)
+ if svg_image is not None:
+ svg_image.update({ 'secondaryURL': LOCAL_SERVER + self.page.svg_image.file_name })
+ svg_image.update({ 'x': self.page.svg_image.text_field.left })
+ svg_image.update({ 'y': self.page.svg_image.text_field.top })
+ faksimile_image = self.add_object2dict(self.page.faksimile_image)
+ if faksimile_image is not None:
+ faksimile_image.update({ 'secondaryURL': LOCAL_SERVER + "faksimiles/" + self.page.faksimile_image.file_name })
+ faksimile_image.update({ 'x': 0 })
+ faksimile_image.update({ 'y': 0 })
for line in self.page.lines: lines.append({ 'id': line.id, 'top': line.top + offset, 'bottom': line.bottom })
return { 'title': self.page.title, 'number': self.page.number, 'words': words,\
- 'svg': self.add_object2dict(self.page.svg_image), 'lines': lines }
+ 'svg': svg_image, 'lines': lines, 'faksimile': faksimile_image, 'faksimile_positions': faksimile_positions }
def convert(self, output_file=None, stage_version='', highlighted_words=None):
"""Converts Page to JSON.
"""
if output_file is None:
output_file = 'output.json'
        with open(output_file, 'w+') as json_file:
            json.dump(self.create_json_dict(), json_file)
return 0
def add_object2dict(self, object_instance):
"""Add an object to json_dict and generate json data and interfaces.
        :return: json dict or object_instance
"""
json_dict = {}
object_type = type(object_instance)
if object_type.__module__ == 'builtins':
if object_type != list:
return object_instance
else:
items = []
for item in object_instance:
items.append(self.add_object2dict(item))
                return items
semantic_dictionary = object_type.get_semantic_dictionary()
for key, content_type in [ (key, content.get('class')) for key, content in semantic_dictionary['properties'].items()]:
content = object_instance.__dict__.get(key)
if content_type == list\
and content is not None\
and len(content) > 0\
and type(content[0]).__module__ != 'builtins':
content_list = []
for content_item in content:
content_list.append(self.add_object2dict(content_item))
json_dict.update({key: content_list})
elif content_type.__module__ == 'builtins':
if content is not None:
json_dict.update({key: content})
else:
if content is not None and type(content) == list:
content_list = []
for content_item in content:
content_list.append(self.add_object2dict(content_item))
json_dict.update({key: content_list})
else:
if content is not None:
json_dict.update({key: self.add_object2dict(content)})
return json_dict
class oldJSONConverter(Converter):
"""This class can be used to convert a 'svgWordPositions' xml file to a json file.
"""
PY2TS_DICT = { float: 'number', int: 'number', bool: 'boolean', str: 'string' }
def __init__(self, page, non_testing=True, key=''):
Converter.__init__(self, page, non_testing, False)
self.key = key
self.interface_output_dir = PathLibPath('ts_interfaces')
if not self.interface_output_dir.is_dir():
self.interface_output_dir.mkdir()
elif len(list(self.interface_output_dir.glob('*.ts'))) > 0:
for ts_file in self.interface_output_dir.glob('*.ts'):
remove(ts_file)
def convert(self, output_file=None, stage_version='', highlighted_words=None):
"""Converts Page to JSON.
"""
if output_file is None:
output_file = 'output.json'
class_dict = {}
if self.key != '':
object_instance = self.page.__dict__.get(self.key)
if object_instance is not None:
json_dict = self.add_object2dict(object_instance, class_dict)
if type(json_dict) == list:
json_dict = { self.key : json_dict }
else:
print(f'Page initialized from {self.page.page_tree.docinfo.URL} does not have an object at "{self.key}"!')
return 2
else:
json_dict = self.add_object2dict(self.page, class_dict)
        with open(output_file, "w+") as json_file:
            json.dump(json_dict, json_file)
self.create_imports(class_dict)
return 0
def add_object2dict(self, object_instance, class_dict):
"""Add an object to json_dict and generate json data and interfaces.
        :return: json dict or object_instance
"""
json_dict = {}
interface_list = []
object_type = type(object_instance)
if object_type.__module__ == 'builtins':
if object_type != list:
return object_instance
else:
items = []
for item in object_instance:
items.append(self.add_object2dict(item, class_dict))
if len(items) > 0:
return { self.key: items }
else:
return { self.key: 'null' }
semantic_dictionary = object_type.get_semantic_dictionary()
for key, content_type in [ (key, content.get('class')) for key, content in semantic_dictionary['properties'].items()]:
content = object_instance.__dict__.get(key)
if content_type == list\
and content is not None\
and len(content) > 0\
and type(content[0]).__module__ != 'builtins':
content_list = []
for content_item in content:
content_list.append(self.add_object2dict(content_item, class_dict))
json_dict.update({key: content_list})
interface_list.append(f'{key}: {type(content[0]).__name__}[];')
elif content_type.__module__ == 'builtins':
if content_type != list:
ts_type = self.PY2TS_DICT[content_type]\
if content_type in self.PY2TS_DICT.keys()\
else 'string'
interface_list.append(f'{key}: {ts_type};')
json_dict.update({key: content})
else:
if content is not None and type(content) == list:
interface_list.append(f'{key}: {content_type.__name__}[];')
content_list = []
for content_item in content:
content_list.append(self.add_object2dict(content_item, class_dict))
json_dict.update({key: content_list})
else:
interface_list.append(f'{key}: {content_type.__name__};')
if content is not None:
json_dict.update({key: self.add_object2dict(content, class_dict)})
if object_type not in class_dict.keys():
class_dict.update({object_type: self.create_interface(object_type.__name__, interface_list)})
return json_dict
def create_imports(self, class_dict):
"""Create an ts interface from a list of key and content_types.
[:return:] file_name of interface
"""
ts_file = PathLibPath('ts_imports.ts')
file = open(ts_file, "w+")
file.write(f'//import all interfaces from {self.interface_output_dir} ' + '\n')
        for interface_name, path_name in class_dict.items():
file.write('import {' + interface_name.__name__ + '} from \'./' + str(self.interface_output_dir.joinpath(path_name.stem)) + '\';\n')
file.close()
return ts_file
def create_interface(self, class_name, interface_list) -> PathLibPath:
"""Create an ts interface from a list of key and content_types.
[:return:] file_name of interface
"""
ts_file = self.interface_output_dir.joinpath(PathLibPath(f'{class_name.lower()}.ts'))
import_list = [ import_class_name for import_class_name in\
[ import_class_name.split(': ')[1].replace(';','').replace('[]','') for import_class_name in interface_list ]\
if import_class_name not in set(self.PY2TS_DICT.values()) ]
file = open(ts_file, "w")
for import_class_name in set(import_list):
file.write('import {' + import_class_name + '} from \'./' + import_class_name.lower() + '\';\n')
file.write(f'export interface {class_name} ' + '{\n')
        for interface_string in interface_list:
            file.write('\t' + interface_string + '\n')
file.write('}')
file.close()
return ts_file
class SVGConverter(Converter):
"""This class can be used to convert a 'svgWordPositions' xml file to a svg file that combines text as path and text-as-text.
"""
BG_COLOR = 'yellow'
OPACITY = '0.2'
def __init__(self, page, non_testing=True, show_word_insertion_mark=False, bg_color=BG_COLOR, opacity=OPACITY):
Converter.__init__(self, page, non_testing, show_word_insertion_mark)
self.bg_color = bg_color
self.opacity = opacity
def convert(self, output_file=None, stage_version='', highlighted_words=None):
"""Converts Page to SVG
"""
title = self.page.title if(self.page.title is not None) else 'Test Page'
title = '{}, S. {}'.format(title, self.page.number) if (self.page.number is not None) else title
svg_file = self.page.svg_file
if svg_file is None and self.page.svg_image is not None:
svg_file = self.page.svg_image.file_name
elif svg_file is None:
            msg = f'ERROR: xml_source_file {self.page.page_tree.docinfo.URL} has neither a svg_file nor a svg_image!'
raise Exception(msg)
transkription_field = TranskriptionField(svg_file)
if bool(transkription_field.get_svg_attributes('xmlns')):
ET.register_namespace('', transkription_field.get_svg_attributes('xmlns'))
if bool(transkription_field.get_svg_attributes('xmlns:xlink')):
ET.register_namespace('xlink', transkription_field.get_svg_attributes('xmlns:xlink'))
svg_tree = ET.parse(svg_file)
transkription_node = ET.SubElement(svg_tree.getroot(), 'g', attrib={'id': 'Transkription'})
colors = [ 'yellow', 'orange' ] if self.bg_color == self.BG_COLOR else [ self.bg_color ]
if highlighted_words is not None:
colors = ['yellow']
else:
highlighted_words = []
color_index = 0
for word in self.page.words:
word_id = 'word_' + str(word.id)
for transkription_position in self._get_transkription_positions(word.transkription_positions, stage_version=stage_version):
transkription_position_id = word_id + '_' + str(transkription_position.id)
color = colors[color_index] if word not in highlighted_words else self.bg_color
rect_node = ET.SubElement(transkription_node, 'rect',\
attrib={'id': transkription_position_id, 'x': str(transkription_position.left + transkription_field.xmin),\
'y': str(transkription_position.top + transkription_field.ymin), 'width': str(transkription_position.width),\
'height': str(transkription_position.height), 'fill': color, 'opacity': self.opacity})
if transkription_position.transform is not None:
matrix = transkription_position.transform.clone_transformation_matrix()
matrix.matrix[Matrix.XINDEX] = round(transkription_position.transform.matrix[Matrix.XINDEX] + transkription_field.xmin, 3)
matrix.matrix[Matrix.YINDEX] = round(transkription_position.transform.matrix[Matrix.YINDEX] + transkription_field.ymin, 3)
rect_node.set('transform', matrix.toString())
rect_node.set('x', str(round(transkription_position.left - transkription_position.transform.matrix[Matrix.XINDEX], 3)))
rect_node.set('y', str(round((transkription_position.height-1.5)*-1, 3)))
ET.SubElement(rect_node, 'title').text = word.text
color_index = (color_index + 1) % len(colors)
if output_file is not None:
svg_tree.write(output_file)
return 0
class HTMLConverter(Converter):
"""This class can be used to convert a 'svgWordPositions' xml file to a test HTML file.
"""
CSS = """ .highlight0 { background-color: yellow; opacity: 0.2; }
.highlight1 { background-color: pink; opacity: 0.2; }
.highlight2 { background-color: red; opacity: 0.2; }
.foreign { background-color: blue; opacity: 0.4; }
.overwritten { background-color: green; opacity: 0.4; }
.word-insertion-mark { background-color: orange; opacity: 0.2; }
.deleted { background-color: grey; opacity: 0.2; }
"""
def __init__(self, page, non_testing=True, show_word_insertion_mark=False):
Converter.__init__(self, page, non_testing, show_word_insertion_mark)
self.text_field = TextField()
def convert(self, output_file=None, stage_version='', highlighted_words=None):
"""Converts Page to HTML
"""
title = self.page.title if(self.page.title is not None) else 'Test Page'
title = '{}, S. {}'.format(title, self.page.number) if (self.page.number is not None) else title
if stage_version != '':
title = title + ', Schreibstufe: ' + stage_version
if self.page.svg_image is not None:
width = self.page.svg_image.width
height = self.page.svg_image.height
self.text_field = self.page.svg_image.text_field
svg_file = self.page.svg_image.file_name
            print('Textfield found -> adjusting data')
elif self.page.svg_file is not None:
svg_file = self.page.svg_file
transkription_field = TranskriptionField(svg_file)
width = transkription_field.getWidth()
height = transkription_field.getHeight()
style_content = ' position: relative; width: {}px; height: {}px; background-image: url("{}"); background-size: {}px {}px '\
.format(width, height, path.abspath(svg_file), width, height)
style = E.STYLE('#transkription {' + style_content + '}', HTMLConverter.CSS)
head = E.HEAD(E.TITLE(title),E.META(charset='UTF-8'), style)
transkription = E.DIV(id="transkription")
counter = 0
for word in self.page.words:
highlight_class = 'highlight' + str(counter)\
if not word.deleted else 'deleted'
if highlighted_words is not None\
and word in highlighted_words:
highlight_class = 'highlight2'
earlier_text = '' if word.earlier_version is None else word.earlier_version.text
if earlier_text == '' and len(word.word_parts) > 0:
earlier_versions = [ word for word in word.word_parts if word.earlier_version is not None ]
earlier_text = earlier_versions[0].text if len(earlier_versions) > 0 else ''
if earlier_text != '':
word_title = 'id: {}/line: {}\n0: {}\n1: {}'.format(str(word.id), str(word.line_number), earlier_text, word.text)
else:
word_title = 'id: {}/line: {}\n{}'.format(str(word.id), str(word.line_number), word.text)
if word.edited_text is not None:
word_title += f'\n>{word.edited_text}'
for transkription_position in self._get_transkription_positions(word.transkription_positions, stage_version=stage_version):
self._append2transkription(transkription, highlight_class, word_title, transkription_position)
if word.overwrites_word is not None:
overwritten_title = f'{word.text} overwrites {word.overwrites_word.text}'
for overwritten_transkription_position in word.overwrites_word.transkription_positions:
self._append2transkription(transkription, 'overwritten', overwritten_title, overwritten_transkription_position)
for part_word in word.word_parts:
highlight_class = 'highlight' + str(counter)\
if not part_word.deleted else 'deleted'
for part_transkription_position in self._get_transkription_positions(part_word.transkription_positions, stage_version=stage_version):
self._append2transkription(transkription, highlight_class, word_title, part_transkription_position)
if part_word.overwrites_word is not None:
overwritten_title = f'{word.text} overwrites {part_word.overwrites_word.text}'
for overwritten_transkription_position in part_word.overwrites_word.transkription_positions:
self._append2transkription(transkription, 'overwritten', overwritten_title, overwritten_transkription_position)
counter = (counter + 1) % 2
word_insertion_mark_class = 'word-insertion-mark'
counter = 0
for mark_foreign_hands in self.page.mark_foreign_hands:
highlight_class = 'foreign'
title = 'id: {}/line: {}\n{} {} '.format(str(mark_foreign_hands.id), str(mark_foreign_hands.line_number),\
mark_foreign_hands.foreign_hands_text, mark_foreign_hands.pen)
for transkription_position in mark_foreign_hands.transkription_positions:
self._append2transkription(transkription, highlight_class, title, transkription_position)
if self.show_word_insertion_mark:
for word_insertion_mark in self.page.word_insertion_marks:
wim_title = 'id: {}/line: {}\nword insertion mark'.format(str(word_insertion_mark.id), str(word_insertion_mark.line_number))
style_content = 'position:absolute; top:{0}px; left:{1}px; width:{2}px; height:{3}px;'.format(\
word_insertion_mark.top, word_insertion_mark.left, word_insertion_mark.width, word_insertion_mark.height)
link = E.A(' ', E.CLASS(word_insertion_mark_class), title=wim_title, style=style_content)
transkription.append(link)
html = E.HTML(head,E.BODY(transkription))
bool(self.non_testing) and open_in_browser(html)
if output_file is not None:
with open(output_file, 'wb') as f:
f.write(lxml.html.tostring(html, pretty_print=True, include_meta_content_type=True, encoding='utf-8'))
return 0
def _append2transkription(self, transkription, highlight_class, title, transkription_position):
"""Append content to transkription-div.
"""
style_content = 'position:absolute; top:{0}px; left:{1}px; width:{2}px; height:{3}px;'.format(\
transkription_position.top - self.text_field.top, transkription_position.left - self.text_field.left, transkription_position.width, transkription_position.height)
if transkription_position.transform is not None:
style_content = style_content + ' transform: {}; '.format(transkription_position.transform.toCSSTransformString())
transform_origin_x = (transkription_position.left-round(transkription_position.transform.getX(), 1))*-1\
if (transkription_position.left-round(transkription_position.transform.getX(), 1))*-1 < 0 else 0
style_content = style_content + ' transform-origin: {}px {}px; '.format(transform_origin_x, transkription_position.height)
link = E.A(' ', E.CLASS(highlight_class), title=title, style=style_content)
transkription.append(link)
def create_pdf_with_highlighted_words(xml_source_file=None, page=None, highlighted_words=None, pdf_file_name='output.pdf', bg_color=SVGConverter.BG_COLOR):
"""Creates a pdf file highlighting some words.
"""
if not pdf_file_name.endswith('pdf'):
pdf_file_name = pdf_file_name + '.pdf'
tmp_svg_file = pdf_file_name.replace('.pdf', '.svg')
create_svg_with_highlighted_words(xml_source_file=xml_source_file, page=page, highlighted_words=highlighted_words,\
svg_file_name=tmp_svg_file, bg_color=bg_color)
if isfile(tmp_svg_file):
cairosvg.svg2pdf(url=tmp_svg_file, write_to=pdf_file_name)
remove(tmp_svg_file)
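# Usage sketch (illustrative; 'Nietzsche' stands in for any word text):
#     >>> page = Page('xml/N_VII_1_page005.xml')
#     >>> highlighted = [ word for word in page.words if word.text == 'Nietzsche' ]
#     >>> create_pdf_with_highlighted_words(page=page, highlighted_words=highlighted, pdf_file_name='output.pdf')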
def create_svg_with_highlighted_words(xml_source_file=None, page=None, highlighted_words=None, svg_file_name='output.svg', bg_color=SVGConverter.BG_COLOR):
"""Creates a svg file highlighting some words.
"""
if page is None and xml_source_file is not None:
page = Page(xml_source_file)
converter = SVGConverter(page, bg_color=bg_color)
if not svg_file_name.endswith('svg'):
svg_file_name = svg_file_name + '.svg'
converter.convert(output_file=svg_file_name, highlighted_words=highlighted_words)
def usage():
"""prints information on how to use the script
"""
print(main.__doc__)
def main(argv):
"""This program can be used to convert the word positions to HTML, SVG or TEXT for testing purposes.
svgscripts/convert_wordPositions.py OPTIONS
OPTIONS:
-h|--help: show help
-H|--HTML [default] convert to HTML test file
-k|--key=key option for json converter:
only convert object == page.__dict__[key]
-o|--output=outputFile save output to file outputFile
-P|--PDF convert to PDF test file
-S|--SVG convert to SVG test file
-s|--svg=svgFile: svg web file
-T|--TEXT convert to TEXT output
-t|--text=text highlight word
-w|--word-insertion-mark show word insertion mark on HTML
-v|--version=VERSION show words that belong to writing process VERSION: { 0, 1, 2, 0-1, 0+, etc. }
-x|--testing execute in test mode, do not write to file or open browser
    :return: exit code (int)
    """
"""
convert_to_type = None
key = ''
non_testing = True
output_file = None
page = None
show_word_insertion_mark = False
stage_version = ''
svg_file = None
text = None
try:
opts, args = getopt.getopt(argv, "hk:t:HPSTws:o:v:x", ["help", "key=", "text=", "HTML", "PDF", "SVG", "TEXT", "word-insertion-mark", "svg=", "output=", "version=", "testing"])
except getopt.GetoptError:
usage()
return 2
for opt, arg in opts:
if opt in ('-h', '--help') or not args:
usage()
return 0
elif opt in ('-v', '--version'):
if re.match(r'^(\d|\d\+|\d\-\d)$', arg):
stage_version = arg
else:
raise ValueError('OPTION -v|--version=VERSION does not work with "{}" as value for VERSION!'.format(arg))
elif opt in ('-w', '--word-insertion-mark'):
show_word_insertion_mark = True
elif opt in ('-P', '--PDF'):
convert_to_type = 'PDF'
elif opt in ('-S', '--SVG'):
convert_to_type = 'SVG'
elif opt in ('-T', '--TEXT'):
convert_to_type = 'TEXT'
elif opt in ('-H', '--HTML'):
convert_to_type = 'HTML'
elif opt in ('-x', '--testing'):
non_testing = False
elif opt in ('-s', '--svg'):
svg_file = arg
elif opt in ('-o', '--output'):
output_file = arg
elif opt in ('-k', '--key'):
key = arg
elif opt in ('-t', '--text'):
text = arg
print(arg)
if len(args) < 1:
usage()
return 2
if convert_to_type is None:
if output_file is not None and len(re.split(r'\.', output_file)) > 1:
output_file_part_list = re.split(r'\.', output_file)
convert_to_type = output_file_part_list[len(output_file_part_list)-1].upper()
else:
convert_to_type = 'HTML'
exit_code = 0
for word_position_file in args:
if not isfile(word_position_file):
print("'{}' does not exist!".format(word_position_file))
return 2
if convert_to_type == 'PDF':
if output_file is None:
output_file = 'output.pdf'
highlighted_words = None
if text is not None:
page = Page(word_position_file)
highlighted_words = [ word for word in page.words if word.text == text ]
create_pdf_with_highlighted_words(word_position_file, pdf_file_name=output_file, highlighted_words=highlighted_words)
else:
if svg_file is not None:
if isfile(svg_file):
page = PageCreator(word_position_file, svg_file=svg_file)
else:
print("'{}' does not exist!".format(word_position_file))
return 2
else:
page = Page(word_position_file)
if page.svg_file is None:
print('Please specify a svg file!')
usage()
return 2
highlighted_words = None
if text is not None:
highlighted_words = [ word for word in page.words if word.text == text ]
print([ (word.id, word.text) for word in highlighted_words ])
converter = Converter.CREATE_CONVERTER(page, non_testing=non_testing, converter_type=convert_to_type, show_word_insertion_mark=show_word_insertion_mark, key=key)
exit_code = converter.convert(output_file=output_file, stage_version=stage_version, highlighted_words=highlighted_words)
return exit_code
if __name__ == "__main__":
sys.exit(main(sys.argv[1:]))
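# Example invocations (illustrative):
#     python3 svgscripts/convert_wordPositions.py -H -o output.html xml/N_VII_1_page005.xml
#     python3 svgscripts/convert_wordPositions.py -S -t Nietzsche -o output.svg xml/N_VII_1_page005.xml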
Index: tests_svgscripts/test_util.py
===================================================================
--- tests_svgscripts/test_util.py (revision 102)
+++ tests_svgscripts/test_util.py (revision 103)
@@ -1,259 +1,256 @@
import unittest
from os import sep, path, remove, listdir
from os.path import isdir, isfile, dirname, basename
import shutil
import sys
import lxml.etree as ET
import sys
import tempfile
import warnings
sys.path.append('svgscripts')
import util
from local_config import FAKSIMILE_LOCATION, PDF_READER, SVG_EDITOR, USER_ROOT_LOCATION_DICT
from datatypes.faksimile import FaksimilePage
from datatypes.page import Page
from datatypes.page_creator import PageCreator
from datatypes.positional_word_part import PositionalWordPart
from datatypes.text_field import TextField
from datatypes.transkriptionField import TranskriptionField
from datatypes.word_position import WordPosition
from datatypes.word import Word
sys.path.append('shared_util')
from myxmlwriter import write_pretty, FILE_TYPE_SVG_WORD_POSITION, FILE_TYPE_XML_MANUSCRIPT
sys.path.append('fixes')
from fix_old_data import save_page
class TestCopy(unittest.TestCase):
def setUp(self):
util.UNITTESTING = True
DATADIR = path.dirname(__file__) + sep + 'test_data'
self.test_dir = DATADIR
self.faksimile_dir = DATADIR + sep + 'faksimile_svg'
self.faksimile_file = self.faksimile_dir + sep + 'N-VII-1,5et6.svg'
self.image = DATADIR + sep + 'image.jpg'
self.svg_testrecord = DATADIR + sep + 'TESTRECORD.svg'
self.xml_file = DATADIR + sep + 'N_VII_1_page005.xml'
self.Mp_XIV_page420 = DATADIR + sep + 'Mp_XIV_page420.xml'
self.tmp_dir = tempfile.mkdtemp()
def test_copy(self):
tmp_image = self.tmp_dir + sep + basename(self.image)
target_file = 'asdf.svg'
shutil.copy(self.image, self.tmp_dir)
util.copy_faksimile_svg_file(target_file, faksimile_source_file=self.faksimile_file,\
target_directory=self.tmp_dir, local_image_path=tmp_image)
self.assertEqual(isfile(self.tmp_dir + sep + target_file), True)
util.copy_faksimile_svg_file(faksimile_source_file=self.faksimile_file,\
target_directory=self.tmp_dir, local_image_path=tmp_image)
self.assertEqual(isfile(self.tmp_dir + sep + basename(self.faksimile_file)), True)
with self.assertRaises(Exception):
util.copy_faksimile_svg_file()
with self.assertRaises(Exception):
            util.copy_faksimile_svg_file(faksimile_source_file=self.faksimile_file)
def test_copy_xml(self):
old_page = Page(self.xml_file)
xml_file = util.copy_xml_file_word_pos_only(self.xml_file, self.tmp_dir)
self.assertEqual(isfile(xml_file), True)
page = Page(xml_file)
self.assertEqual(len(page.words), len(old_page.words))
self.assertEqual(len(page.line_numbers), 0)
def test_create_highlighted_svg_file(self):
target_file = self.tmp_dir + sep + basename(self.faksimile_file)
tmp_image = self.tmp_dir + sep + basename(self.image)
faksimile_tree = ET.parse(self.faksimile_file)
namespaces = { k if k is not None else 'ns': v for k, v in faksimile_tree.getroot().nsmap.items() }
node_ids = ['rect947', 'rect951', 'rect953', 'rect955', 'rect959', 'rect961', 'rect963']
highlight_color = 'blue'
util.create_highlighted_svg_file(faksimile_tree, node_ids, target_directory=self.tmp_dir, highlight_color=highlight_color, namespaces=namespaces)
self.assertEqual(isfile(target_file), True)
new_tree = ET.parse(target_file)
for node in new_tree.xpath('//ns:rect[@fill="{0}"]|//ns:path[@fill="{0}"]'.format(highlight_color), namespaces=namespaces):
node_ids.remove(node.get('id'))
self.assertEqual(len(node_ids), 0)
def test_get_empty_node_ids(self):
faksimile_tree = ET.parse(self.faksimile_file)
faksimile_page = FaksimilePage.GET_FAKSIMILEPAGES(faksimile_tree)[0]
empty_node_ids = util.get_empty_node_ids(faksimile_tree, faksimile_page=faksimile_page)
self.assertEqual('rect1085' in empty_node_ids, True)
def test_record_changes(self):
new_tree = ET.parse(self.faksimile_file)
old_tree = ET.parse(self.faksimile_file)
empty_node_id = 'rect1085'
title_node_id = 'test001'
namespaces = { k if k is not None else 'ns': v for k, v in new_tree.getroot().nsmap.items() }
node = new_tree.xpath('//ns:rect[@id="{0}"]'.format(empty_node_id), namespaces=namespaces)[0]
title = ET.SubElement(node, 'title', attrib={ 'id': title_node_id })
title.text = 'test'
new_file = self.tmp_dir + sep + 'new.svg'
old_file = self.tmp_dir + sep + 'old.svg'
util.copy_faksimile_svg_file(target_file=new_file, faksimile_tree=new_tree)
util.copy_faksimile_svg_file(target_file=old_file, faksimile_tree=old_tree)
util.record_changes(old_file, new_file, [ empty_node_id ], namespaces=namespaces)
test_tree = ET.parse(old_file)
self.assertEqual(len(test_tree.xpath('//ns:rect[@id="{0}"]/ns:title[@id="{1}"]'.format(empty_node_id, title_node_id), namespaces=namespaces)), 1)
def test_replace_chars(self):
page = Page(self.xml_file)
faksimile_tree = ET.parse(self.faksimile_file)
namespaces = { k if k is not None else 'ns': v for k, v in faksimile_tree.getroot().nsmap.items() }
word_position = WordPosition(id='rect1159', text='„Gedächtniß"')
wps, texts = util.replace_chars(page.words, [ word_position ])
self.assertEqual(texts[0].endswith('“'), True)
self.assertEqual(wps[0].text.endswith('“'), True)
word_position = WordPosition(id='rect1173', text='-')
wps, texts = util.replace_chars(page.words, [ word_position ])
self.assertEqual(wps[0].text.endswith('–'), True)
def test_mismatch_words(self):
page = Page(self.xml_file)
faksimile_tree = ET.parse(self.faksimile_file)
faksimile_page = FaksimilePage.GET_FAKSIMILEPAGES(faksimile_tree)[0]
page = Page('xml/N_VII_1_page174.xml')
faksimile_tree = ET.parse('faksimile_svg/N-VII-1,173et174.svg')
faksimile_page = FaksimilePage.GET_FAKSIMILEPAGES(faksimile_tree)[0]
self.assertEqual('-' in [ tp.text for tp in faksimile_page.word_positions], True)
wps, texts = util.replace_chars(page.words,faksimile_page.word_positions)
self.assertEqual('–' in texts, True)
self.assertEqual(len([ faksimile_position for faksimile_position in wps\
if faksimile_position.text == '–' ]), 4)
mismatching_words, mismatching_faksimile_positions = util.get_mismatching_ids(page.words, faksimile_page.word_positions)
self.assertEqual(len([word for word in mismatching_words if word.text.endswith('“') ]), 0)
self.assertEqual(len([word for word in mismatching_words if word.text.endswith('–') ]), 0)
def test_process_warnings(self):
with warnings.catch_warnings(record=True) as w:
warnings.simplefilter('default')
warnings.warn('Test1: asdf')
warnings.warn('Test2: asdf')
status = util.process_warnings4status(w, ['Test1', 'Test2' ], 'asdf', 'OK', status_prefix='with warnings')
#print(status)
self.assertTrue('Test1' in status.split(':'))
self.assertTrue('Test2' in status.split(':'))
@unittest.skip('test uses external program, has been tested')
def test_show_files(self):
list_of_files = [ self.test_dir + sep + file for file in listdir(self.test_dir) if file.endswith('pdf') ][0:2]
util.ExternalViewer.show_files(single_file=self.faksimile_file, list_of_files=list_of_files)
def test_record_changes_to_page(self):
page = util.record_changes_on_svg_file_to_page(self.xml_file, self.svg_testrecord, [ 1 ])
old_length = len(page.words)
self.assertEqual(page.words[1].text, 'asdf')
self.assertEqual(page.words[1].transkription_positions[0].width, 353)
page = util.record_changes_on_svg_file_to_page(self.xml_file, self.svg_testrecord, [ 13 ])
self.assertEqual(page.words[13].text, 'er')
self.assertEqual(page.words[14].text, '=')
self.assertEqual(len(page.words), old_length+1)
page = util.record_changes_on_svg_file_to_page(self.xml_file, self.svg_testrecord, [ 64 ])
self.assertEqual(page.words[64].text, 'Simplifications-apparat')
self.assertEqual(len(page.words[64].transkription_positions), 3)
self.assertEqual(len(page.words), old_length-1)
@unittest.skipUnless(__name__ == "__main__", 'tests all words')
def test_extended__record_changes_to_page(self):
page = Page(self.xml_file)
old_length = len(page.words)
page = util.record_changes_on_svg_file_to_page(self.xml_file, self.svg_testrecord)
self.assertEqual(page.words[1].text, 'asdf')
self.assertEqual(page.words[13].text, 'er')
self.assertEqual(page.words[14].text, '=')
self.assertEqual(page.words[65].text, 'Simplifications-apparat')
self.assertEqual(len(page.words), old_length)
def test_copy_faksimile_update_image_location(self):
test_dir = self.tmp_dir #FAKSIMILE_LOCATION + '/Myriam/Fertig/'
util.copy_faksimile_update_image_location(self.faksimile_file, target_directory=test_dir)
with self.assertWarns(UserWarning):
util.copy_faksimile_update_image_location(self.faksimile_file, target_directory=test_dir)
def test_record_changes_on_xml(self):
old_page = Page(self.xml_file)
xml_file = util.copy_xml_file_word_pos_only(self.xml_file, self.tmp_dir)
tree = ET.parse(xml_file)
node = tree.xpath('//word[@id="135"]')[0]
        counter = 0
        while node.get('text') != 'gar' and counter < 5:
counter += 1
nextnode = node.getnext()
node.set('text', node.get('text') + nextnode.get('text'))
for element in nextnode.getchildren():
node.append(element)
nextnode.getparent().remove(nextnode)
write_pretty(xml_element_tree=tree, file_name=xml_file,\
script_name=__file__, file_type=FILE_TYPE_SVG_WORD_POSITION)
new_page = util.record_changes_on_xml_file_to_page(self.xml_file, xml_file)
self.assertEqual(len(new_page.words), len(old_page.words)-2)
self.assertEqual(len([ word for word in new_page.words if word.text == 'gar']), 1)
old_page = Page(self.xml_file)
xml_file = util.copy_xml_file_word_pos_only(self.xml_file, self.tmp_dir)
tree = ET.parse(xml_file)
node = tree.xpath('//word[@id="138"]')[0]
counter = 0
while node.get('text') != 'nichtvorkommt.' and counter < 5:
counter += 1
nextnode = node.getnext()
node.set('text', node.get('text') + nextnode.get('text'))
for element in nextnode.getchildren():
node.append(element)
nextnode.getparent().remove(nextnode)
node.set('split', 'nicht vorkommt.')
write_pretty(xml_element_tree=tree, file_name=xml_file,\
script_name=__file__, file_type=FILE_TYPE_SVG_WORD_POSITION)
joined_page = Page(xml_file)
self.assertEqual(len([word for word in joined_page.words if word.text == 'nichtvorkommt.']), 1)
self.assertEqual(len([word for word in joined_page.words if word.text == 'nichtvorkommt.'][0].split_strings), 2)
self.assertEqual(len(joined_page.words), len(old_page.words)-1)
new_page = util.record_changes_on_xml_file_to_page(self.xml_file, xml_file)
self.assertEqual(len(new_page.words), len(old_page.words))
self.assertEqual(len([word for word in new_page.words if word.text == 'vorkommt.']), 1)
self.assertEqual(len([word for word in old_page.words if word.text == 'nicht']),\
len([word for word in new_page.words if word.text == 'nicht']))
xml_file = util.copy_xml_file_word_pos_only(self.xml_file, self.tmp_dir)
tree = ET.parse(xml_file)
old_page = Page(xml_file)
nodes = tree.xpath('//word[@id>="85" and @id<="87"]')
self.assertEqual(len(nodes), 3)
prevWordText = nodes[0].get('text')
nodes[0].set('join', prevWordText + 'z')
nodes[1].set('split', 'z u')
lastWordText = nodes[2].get('text')
nodes[2].set('join', 'u' + lastWordText)
write_pretty(xml_element_tree=tree, file_name=xml_file,\
script_name=__file__, file_type=FILE_TYPE_SVG_WORD_POSITION)
joined_page = util.record_changes_on_xml_file_to_page(self.xml_file, xml_file)
self.assertEqual(len(joined_page.words), len(old_page.words)-1)
def test_reset_tp_with_matrix(self):
page = Page(self.Mp_XIV_page420)
- util.reset_tp_with_matrix(page, page.words[0].transkription_positions)
+ util.reset_tp_with_matrix(page.words[0].transkription_positions)
self.assertTrue(page.words[0].transkription_positions[0].left > 0 and page.words[0].transkription_positions[0].top > -5)
transformed_words = [w for w in page.words if (len(w.transkription_positions) > 0 and w.transkription_positions[0].transform is not None) ]
- util.reset_tp_with_matrix(page, transformed_words[0].transkription_positions)
+ util.reset_tp_with_matrix(transformed_words[0].transkription_positions)
self.assertEqual(transformed_words[0].transkription_positions[0].left, 0)
- self.assertEqual(transformed_words[0].transkription_positions[0].top, -5)
- page.svg_image.text_field = TextField()
- util.reset_tp_with_matrix(page, transformed_words[1].transkription_positions)
- self.assertTrue(transformed_words[1].transkription_positions[0].left > 0 and transformed_words[1].transkription_positions[0].top > -5)
+ self.assertTrue(transformed_words[0].transkription_positions[0].top < 0)
def test_back_up(self):
test_dir = self.tmp_dir
page = Page(self.xml_file)
target_file_name = util.back_up(page, self.xml_file, bak_dir=test_dir)
self.assertEqual(isfile(target_file_name), True)
svg_tree = ET.parse(page.svg_file)
namespaces = { k if k is not None else 'ns': v for k, v in svg_tree.getroot().nsmap.items() }
util.back_up_svg_file(svg_tree, namespaces)
def tearDown(self):
shutil.rmtree(self.tmp_dir, ignore_errors=True)
if __name__ == "__main__":
unittest.main()
Index: tests_svgscripts/test_convert_wordPositions.py
===================================================================
--- tests_svgscripts/test_convert_wordPositions.py (revision 102)
+++ tests_svgscripts/test_convert_wordPositions.py (revision 103)
@@ -1,72 +1,72 @@
import unittest
from os import sep, path, remove
import lxml.etree as ET
import lxml.html
import sys
sys.path.append('svgscripts')
import convert_wordPositions
from convert_wordPositions import Converter, SVGConverter, HTMLConverter, JSONConverter
from datatypes.page import Page
from datatypes.page_creator import PageCreator
from datatypes.transkription_position import TranskriptionPosition
class TestConverter(unittest.TestCase):
def setUp(self):
DATADIR = path.dirname(__file__) + sep + 'test_data'
self.test_file = DATADIR + sep + 'test.xml'
self.test_svg_file = DATADIR + sep + 'test421.svg'
self.outputfile_txt = 'test.txt'
self.outputfile_html = 'test.html'
self.outputfile_svg = 'test.svg'
self.outputfile_json = 'test.json'
def test_main(self):
argv = ['-x', '-s', self.test_svg_file, self.test_file]
self.assertEqual(convert_wordPositions.main(argv), 0)
argv = ['-x', '-s', self.test_svg_file, '-o', self.outputfile_txt, self.test_file]
self.assertEqual(convert_wordPositions.main(argv), 0)
self.assertEqual(path.isfile(self.outputfile_txt), True)
argv = ['-x', '-s', self.test_svg_file, '-o', self.outputfile_html, self.test_file]
self.assertEqual(convert_wordPositions.main(argv), 0)
self.assertEqual(path.isfile(self.outputfile_html), True)
html_tree = lxml.html.parse(self.outputfile_html)
self.assertEqual(html_tree.getroot().tag, 'html')
argv = ['-x', '-s', self.test_svg_file, '-o', self.outputfile_svg, self.test_file]
self.assertEqual(convert_wordPositions.main(argv), 0)
self.assertEqual(path.isfile(self.outputfile_svg), True)
svg_tree = ET.parse(self.outputfile_svg)
self.assertEqual(svg_tree.getroot().tag, '{http://www.w3.org/2000/svg}svg')
argv = ['-x', '-k', 'number', '-o', self.outputfile_json, self.test_file]
self.assertEqual(convert_wordPositions.main(argv), 0)
def test_json_add_object2dict(self):
page = Page('xml/Mp_XV_page77r.xml')
json = convert_wordPositions.JSONConverter(page, non_testing=False)
- #print(json.add_object2dict(page.lines))
+ #print(json.create_json_dict())
def test_create_converter(self):
page = PageCreator(self.test_file, svg_file=self.test_svg_file)
converter = Converter.CREATE_CONVERTER(page, False, 'SVG')
self.assertEqual(isinstance(converter, SVGConverter), True)
converter = Converter.CREATE_CONVERTER(page, False, 'HTML')
self.assertEqual(isinstance(converter, HTMLConverter), True)
converter = Converter.CREATE_CONVERTER(page, False, 'JSON')
self.assertEqual(isinstance(converter, JSONConverter), True)
converter = Converter.CREATE_CONVERTER(page, False)
self.assertEqual(isinstance(converter, Converter), True)
def test_get_transkription_positions(self):
tp = [ TranskriptionPosition(), TranskriptionPosition(), TranskriptionPosition() ]
page = PageCreator(self.test_file, svg_file=self.test_svg_file)
converter = Converter.CREATE_CONVERTER(page, False, 'SVG')
converter._get_transkription_positions(tp, stage_version='1+')
def tearDown(self):
bool(path.isfile(self.outputfile_txt)) and remove(self.outputfile_txt)
bool(path.isfile(self.outputfile_html)) and remove(self.outputfile_html)
bool(path.isfile(self.outputfile_svg)) and remove(self.outputfile_svg)
if __name__ == "__main__":
unittest.main()
Index: fixes/test_interactive_editor.py
===================================================================
--- fixes/test_interactive_editor.py (revision 102)
+++ fixes/test_interactive_editor.py (revision 103)
@@ -1,110 +1,132 @@
import lxml.etree as ET
from os import sep, path, remove
from os.path import isdir, isfile, dirname, basename
import shutil
import sys
import tempfile
import unittest
import warnings
import interactive_editor
sys.path.append('svgscripts')
from datatypes.faksimile import FaksimilePage
from datatypes.mark_foreign_hands import MarkForeignHands
from datatypes.page import Page
from datatypes.path import Path
from datatypes.positional_word_part import PositionalWordPart
from datatypes.text_connection_mark import TextConnectionMark
from datatypes.transkriptionField import TranskriptionField
from datatypes.word import Word
from datatypes.word_position import WordPosition
from process_words_post_merging import MERGED_DIR
class TestInteractiveEditor(unittest.TestCase):
def setUp(self):
interactive_editor.UNITTESTING = True
DATADIR = path.dirname(__file__) + sep + 'test_data'
self.xml_file = DATADIR + sep + 'N_VII_1_page138.xml'
self.fix_transkription_positions = DATADIR + sep + 'Mp_XIV_page419a.xml'
- @unittest.skip('interactive')
+ #@unittest.skip('interactive')
def test_run(self):
page = Page(self.xml_file)
- interactive_editor.InteractiveShell().run_interactive_editor(page)
+ #interactive_editor.InteractiveShell().run_interactive_editor(page)
def test_json_dict(self):
ro = interactive_editor.ResponseOrganizer()
json_dict = ro.create_json_dict(self.xml_file)
#print(json_dict)
def test_handle_json(self):
ro = interactive_editor.ResponseOrganizer()
json_dict = ro.handle_response({})
self.assertEqual(json_dict['actions']['result'], 'ERROR: there was no key "target_file" in json!')
json_dict = ro.handle_response({'target_file': self.xml_file})
self.assertEqual(json_dict['actions']['result'], 'ERROR: there was no key "date_stamp" in json')
json_dict = ro.handle_response({'target_file': self.xml_file, 'date_stamp': path.getmtime(self.xml_file)})
self.assertEqual(json_dict['actions']['result'], 'Operation "unknown" failed')
page = Page(self.xml_file)
json_dict = ro.handle_response({'target_file': self.xml_file, 'date_stamp': path.getmtime(self.xml_file),\
- 'response_handler': { 'action_name': 'join words'}, 'words': [ { 'id': w.id } for w in page.words[:2] ] })
+ 'response_handler': { 'action_name': 'join words'}, 'words': [ { 'id': w.id, 'tp_id': f'w{w.id}:t0' } for w in page.words[:2] ] })
self.assertEqual(json_dict['actions']['result'], 'Operation "join words" succeeded!')
#self.assertEqual(json_dict['response'], 'ERROR: there was no key "target_file" in json!')
def test_update_word(self):
page = Page(self.xml_file)
word = page.words[0]
rh = interactive_editor.SaveChanges()
- self.assertEqual(rh._update_word(word, { 'id': word.id, 'deleted': False, 'line': 99, 'tp_id': f'w{word.id}:tp0' }), 0)
+ self.assertEqual(rh._update_word(word, { 'id': word.id, 'deleted': False, 'line': 99, 'tp_id': f'w{word.id}:tp0' }, page.words), 0)
self.assertEqual(word.deleted, False)
self.assertEqual(word.line_number, 99)
word = page.words[18]
- self.assertEqual(rh._update_word(word, { 'id': word.id, 'deleted': True, 'line': 99, 'tp_id': f'w{word.id}:w0:tp0' }), 0)
+ self.assertEqual(rh._update_word(word, { 'id': word.id, 'deleted': True, 'line': 99, 'tp_id': f'w{word.id}:w0:tp0' }, page.words), 0)
self.assertEqual(word.word_parts[0].deleted, True)
self.assertEqual(word.word_parts[0].line_number, 99)
+ old_word = word
+ word = page.words[19]
+ self.assertEqual(rh._update_word(word, { 'id': word.id, 'old_id': old_word.id, 'fp_id': old_word.faksimile_positions[0].id }, page.words), 0)
+ self.assertEqual(len(word.faksimile_positions), 2)
+ self.assertEqual(len(old_word.faksimile_positions), 0)
+
+ def test_save_position(self):
+ page = Page(self.xml_file)
+ word = page.words[0]
+ rh = interactive_editor.SavePositions()
+ self.assertEqual(rh._update_word(word,\
+ [{ 'id': word.id, 'left': word.transkription_positions[0].left + 10, 'top': word.transkription_positions[0].top + 10, 'tp_id': f'w{word.id}:tp0' }]), 0)
+ word = page.words[18]
+ self.assertEqual(rh._update_word(word, [{ 'id': word.id, 'left': word.word_parts[0].transkription_positions[0].left + 10,\
+ 'top': word.word_parts[0].transkription_positions[0].top + 10, 'tp_id': f'w{word.id}:w0:tp0' }]), 0)
+
+ def test_get_transkription_words(self):
+ json_dict = { 'words': [{ 'id': 0, 'left': 10, 'top': 10, 'tp_id': 'w0:tp0' }, { 'id': 1, 'left': 10, 'top': 10, 'fp_id': 'rect10' } ] }
+ rh = interactive_editor.ResponseHandler()
+ self.assertEqual(len(rh.get_transkription_words(json_dict)), 1)
def test_dict_contains_keys(self):
a_dict = { 'a': { 'b': { 'c': { 'd': 0 }}}}
key_list = [ 'a', 'b', 'c', 'd' ]
self.assertTrue(interactive_editor.dict_contains_keys(a_dict, key_list))
def test_get_requirement(self):
rh = interactive_editor.ResponseHandler()
json_dict = { 'response_handler': { 'requirements' : [ { 'input': 'asdf', 'name': 'test' } ]}}
name, requirement = rh.get_requirement(json_dict)
self.assertEqual(name, 'test')
self.assertEqual(requirement, 'asdf')
self.assertEqual(rh.get_requirement(json_dict, index=1), (None,None))
def test_split_words_dict(self):
rh = interactive_editor.SplitWords(action_name='split words', description='asdf asdf')
self.assertTrue(interactive_editor.dict_contains_keys(rh.create_json_dict(), ['requirements']))
def test_handle_split_text(self):
page = Page(self.xml_file)
word = page.words[0]
- json_dict = { 'words': [{ 'id': word.id }], 'response_handler': { 'requirements' : [ { 'input': 'h', 'name': 'split_text' } ]}}
+ json_dict = { 'words': [{ 'id': word.id, 'tp_id': f'w{word.id}:t0' }], 'response_handler': { 'requirements' : [ { 'input': 'h', 'name': 'split_text' } ]}}
rh = interactive_editor.SplitWords(action_name='split words', description='asdf asdf')
self.assertEqual(rh.handle_response(page, json_dict), 0)
self.assertEqual(page.words[0].text, 'h')
def test_handle_addbox(self):
page = Page(self.xml_file)
word = page.words[0]
- json_dict = { 'words': [{ 'id': word.id }], 'response_handler': { 'requirements' : [ { 'input': 'test', 'name': 'box_text' } ]}}
+ json_dict = { 'words': [{ 'id': word.id, 'tp_id': f'w{word.id}:t0' }], 'response_handler': { 'requirements' : [ { 'input': 'test', 'name': 'box_text' } ]}}
rh = interactive_editor.AddBox(action_name='add box', description='asdf asdf')
self.assertEqual(rh.handle_response(page, json_dict), 0)
self.assertTrue(page.words[0].overwrites_word is not None)
self.assertEqual(page.words[0].overwrites_word.text, 'test')
word = page.words[1]
- json_dict = { 'words': [{ 'id': word.id }], 'response_handler': { 'requirements' : [ { 'input': 'a', 'name': 'box_text' },\
+ json_dict = { 'words': [{ 'id': word.id, 'tp_id': f'w{word.id}:t0' }], 'response_handler': { 'requirements' : [ { 'input': 'a', 'name': 'box_text' },\
{'input': 'e', 'name': 'overwritten_by'}, {'input': True, 'name': 'is_earlier_version'}]}}
self.assertEqual(rh.handle_response(page, json_dict), 0)
self.assertTrue(page.words[1].earlier_version is not None)
self.assertEqual(page.words[1].earlier_version.text, 'fast')
if __name__ == "__main__":
unittest.main()
Index: fixes/interactive_editor.py
===================================================================
--- fixes/interactive_editor.py (revision 102)
+++ fixes/interactive_editor.py (revision 103)
@@ -1,676 +1,810 @@
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
""" This program can be used to process words after they have been merged with faksimile data.
"""
# Copyright (C) University of Basel 2019 {{{1
#
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program. If not, see <https://www.gnu.org/licenses/>. 1}}}
from colorama import Fore, Style
from datetime import datetime
from deprecated import deprecated
from functools import cmp_to_key
import getopt
import inspect
import lxml.etree as ET
import re
import shutil
import string
from svgpathtools import svg2paths2, svg_to_paths
from svgpathtools.path import Path as SVGPath
from svgpathtools.path import Line
import sys
import tempfile
from operator import attrgetter
import os
from os import listdir, sep, path, setpgrp, devnull
from os.path import exists, isfile, isdir, dirname, basename
from progress.bar import Bar
import warnings
from fix_old_data import save_page
from fix_boxes import attach_box, split_into_parts_and_attach_box
sys.path.append('svgscripts')
from convert_wordPositions import HTMLConverter, JSONConverter
from datatypes.box import Box
from datatypes.faksimile import FaksimilePage
from datatypes.manuscript import ArchivalManuscriptUnity
from datatypes.mark_foreign_hands import MarkForeignHands
from datatypes.page import Page, STATUS_MERGED_OK, STATUS_POSTMERGED_OK
from datatypes.path import Path
from datatypes.text_connection_mark import TextConnectionMark
from datatypes.transkriptionField import TranskriptionField
from datatypes.word import Word, update_transkription_position_ids
from join_faksimileAndTranskription import sort_words
from util import back_up, back_up_svg_file, copy_faksimile_svg_file
from process_files import update_svgposfile_status
from process_words_post_merging import update_faksimile_line_positions, MERGED_DIR
sys.path.append('shared_util')
from myxmlwriter import write_pretty, xml_has_type, FILE_TYPE_SVG_WORD_POSITION, FILE_TYPE_XML_MANUSCRIPT
from main_util import create_function_dictionary
__author__ = "Christian Steiner"
__maintainer__ = __author__
__copyright__ = 'University of Basel'
__email__ = "christian.steiner@unibas.ch"
__status__ = "Development"
__license__ = "GPL v3"
__version__ = "0.0.1"
UNITTESTING = False
MAX_SVG_XY_THRESHOLD = 10
class ResponseHandler:
def __init__(self, response_starts_with=None, dialog_string=None, action_name=None, description=None):
self.action_name = action_name
self.dialog_string = dialog_string
self.description = description
self.response_starts_with = response_starts_with
def create_requirement_list(self) ->list:
"""Create a requirement dictionary.
"""
return []
def create_json_dict(self)->dict:
"""Create a json dictionary.
"""
json_dict = { 'action_name': self.action_name, 'description': self.description }
requirements = self.create_requirement_list()
if len(requirements) > 0:
json_dict.update({ 'requirements': requirements })
return json_dict
+ def get_transkription_words(self, json_dict: dict) ->list:
+ """Return words with transkription positions only.
+ """
+ words = json_dict['words']\
+ if bool(json_dict.get('words'))\
+ else []
+ return [ w for w in words if bool(w.get('tp_id')) ]
+
def get_requirement(self, json_dict: dict, index=0) ->tuple:
"""Return requirement tuple (name, input).
"""
name = requirement = None
if dict_contains_keys(json_dict, ['response_handler','requirements'])\
and index < len(json_dict['response_handler']['requirements']):
requirement_dict = json_dict['response_handler']['requirements'][index]
if dict_contains_keys(requirement_dict, ['name'])\
and dict_contains_keys(requirement_dict, ['input']):
name = requirement_dict['name']
requirement = requirement_dict['input']
return name, requirement
def match(self, response: str) ->bool:
"""Return whether response matchs with handler.
"""
if self.response_starts_with is not None:
return response.startswith(self.response_starts_with)
return True
def print_dialog(self):
"""Print dialog.
"""
if self.dialog_string is not None:
print(f'[{self.dialog_string}]')
def handle_response(self, page: Page, json_dict: dict) -> int:
"""Handle response and return exit code.
"""
- json_word_ids = [ jw.get('id') for jw in json_dict['words'] ]
+ transkription_words = self.get_transkription_words(json_dict)
+ json_word_ids = [ jw.get('id') for jw in transkription_words ]
action_dictionary = { 'words': [ word for word in page.words if word.id in json_word_ids ] }
for index, item in enumerate(self.create_requirement_list()):
name, requirement = self.get_requirement(json_dict, index=index)
action_dictionary.update({name: requirement})
return self.run_change(page, action_dictionary)
def handle_interactive_response(self, page: Page, response: str, shell) -> int:
"""Handle response and return exit code.
"""
return self.run_change(page, {})
def run_change(self, page: Page, action_dictionary: dict) -> int:
"""Run changes on page and return exit code.
"""
exit_code = 0
return exit_code
class JoinWords(ResponseHandler):
def handle_interactive_response(self, page: Page, response: str, shell) -> int:
"""Handle response interactively and return exit code.
"""
action_dictionary = { 'words' : shell._get_words_from_response(re.compile('^\D+\s').sub('', response), page.words),\
'add_white_space_between_words': re.match(r'^\D+\s', response) }
if self.run_change(page, action_dictionary) == 0:
return shell.run_interactive_editor(page)
return 2
def run_change(self, page: Page, action_dictionary: dict) -> int:
"""Run changes on page and return exit code.
"""
exit_code = 0
add_white_space_between_words = action_dictionary['add_white_space_between_words']\
if bool(action_dictionary.get('add_white_space_between_words'))\
else False
words = action_dictionary['words']\
if bool(action_dictionary.get('words'))\
else []
if len(words) > 0:
if len(set([ word.line_number for word in words ])) == 1\
and len(set([ word.deleted for word in words ])) == 1:
new_word = words[0]
for word2join in words[1:]:
page.words.remove(word2join)
new_word.join(word2join, add_white_space_between_words=add_white_space_between_words)
else:
new_word = Word.join_words(words, add_white_space_between_words=add_white_space_between_words)
index = len(page.words)
if words[0] in page.words:
index = page.words.index(words[0])
elif len([ word for word in page.words if words[0] in word.word_parts ]) > 0:
index = page.words.index([ word for word in page.words if words[0] in word.word_parts ][0])
for word2join in words:
if word2join in page.words:
page.words.remove(word2join)
elif len([ word for word in page.words if word2join in word.word_parts ]) > 0:
page.words.remove([ word for word in page.words if word2join in word.word_parts ][0])
page.words.insert(index, new_word)
if not UNITTESTING:
print(f'writing to {page.page_tree.docinfo.URL}')
- save_page(page, attach_first=True, script_name=f'{__file__}:{inspect.currentframe().f_back.f_code.co_name}')
+ save_page(page, backup=True, attach_first=True, script_name=f'{__file__}:{inspect.currentframe().f_back.f_code.co_name}')
page = Page(page.page_tree.docinfo.URL)
else:
exit_code = 2
return exit_code
class SimpleJoinWords(JoinWords):
def match(self, response: str) ->bool:
"""Return whether response matchs with handler.
"""
return re.match(r'\d+', response)
class SaveChanges(ResponseHandler):
RELEVANT_PROPERTIES = [ ('deleted','deleted'), ('line_number','line') ] # 0 = word, 1 = word_dict
def handle_interactive_response(self, page: Page, response: str, shell) -> int:
"""Handle response and return exit code.
"""
self.run_change(page, {})
return shell.run_interactive_editor(page)
- def _update_word(self, word, word_dict) ->int:
+ def _update_transkription_word(self, word, word_dict) ->int:
"""Update properites of word according to word_dict,
return exit_code
"""
exit_code = 0
for relevant_property in self.RELEVANT_PROPERTIES:
if len(word.word_parts) > 0:
if len(word_dict['tp_id'].split(':')) == 3:
wp_index = int(word_dict['tp_id'].split(':')[1].replace('w',''))
word.word_parts[wp_index].__dict__[relevant_property[0]] = word_dict[relevant_property[1]]
else:
return 2
else:
word.__dict__[relevant_property[0]] = word_dict[relevant_property[1]]
return exit_code
+ def _update_faksimile_word(self, word, word_dict, words) ->int:
+ """Update properites of word according to word_dict,
+ return exit_code
+ """
+ exit_code = 0
+ if word_dict.get('old_id') is not None:
+ fp_id = word_dict['fp_id']
+ old_id = int(word_dict['old_id'])
+ if len([w for w in words if w.id == old_id ]) > 0:
+ old_word = [w for w in words if w.id == old_id ][0]
+ faksimile_position = None
+ if len([ fp for fp in old_word.faksimile_positions if fp.id == fp_id ]) > 0:
+ faksimile_position = [ fp for fp in old_word.faksimile_positions if fp.id == fp_id ][0]
+ old_word.faksimile_positions.remove(faksimile_position)
+ elif len([ fp for w in old_word.word_parts for fp in w.faksimile_positions if fp.id == fp_id ]) > 0:
+ for w in old_word.word_parts:
+ for fp in w.faksimile_positions:
+ if fp.id == fp_id:
+ faksimile_position = fp
+ w.faksimile_positions.remove(faksimile_position)
+ break
+ if faksimile_position is not None:
+ word.faksimile_positions.append(faksimile_position)
+ else:
+ return 2
+ else:
+ return 3
+ return exit_code
+
+ def _update_word(self, word, word_dict, words) ->int:
+ """Update properites of word according to word_dict,
+ return exit_code
+ """
+ exit_code = 0
+ if bool(word_dict.get('tp_id')):
+ exit_code = self._update_transkription_word(word, word_dict)
+ if exit_code > 0:
+ return exit_code
+ elif bool(word_dict.get('fp_id')):
+ exit_code = self._update_faksimile_word(word, word_dict, words)
+ if exit_code > 0:
+ return exit_code
+ else:
+ return 2
+ return exit_code
+
def handle_response(self, page: Page, json_dict: dict) -> int:
"""Handle response and return exit code.
"""
- json_word_ids = [ jw.get('id') for jw in json_dict['words'] ]
+ json_word_ids = [ int(jw.get('id')) for jw in json_dict['words'] ]
for word in page.words:
if word.id in json_word_ids:
- word_dict = [ jw for jw in json_dict['words'] if jw.get('id') == word.id ][0]
- if self._update_word(word, word_dict) > 0:
+ word_dict = [ jw for jw in json_dict['words'] if int(jw.get('id')) == word.id ][0]
+ if self._update_word(word, word_dict, page.words) > 0:
return 2
return self.run_change(page, {})
def run_change(self, page: Page, action_dictionary: dict) -> int:
"""Run changes on page and return exit code.
"""
exit_code = 0
if not UNITTESTING:
print(f'writing to {page.page_tree.docinfo.URL}')
- save_page(page, attach_first=True, script_name=f'{__file__}:{inspect.currentframe().f_back.f_code.co_name}')
+ save_page(page, backup=True, attach_first=True, script_name=f'{__file__}:{inspect.currentframe().f_back.f_code.co_name}')
page = Page(page.page_tree.docinfo.URL)
return exit_code
+class SavePositions(SaveChanges):
+ def _update_word(self, word, word_dict_list) ->int:
+ """Update properites of word according to word_dict,
+ return exit_code
+ """
+ exit_code = 0
+ for word_dict in word_dict_list:
+ if bool(word_dict.get('tp_id')):
+ exit_code = self._update_transkription_position(word, word_dict)
+ if exit_code > 0:
+ return exit_code
+ elif bool(word_dict.get('fp_id')):
+ exit_code = self._update_faksimile_position(word, word_dict)
+ if exit_code > 0:
+ return exit_code
+ return exit_code
+
+ def _update_transkription_position(self, word, word_dict) ->int:
+ """Update transkription position properites of word according to word_dict,
+ return exit_code
+ """
+ tp_id_list = word_dict['tp_id'].split(':')
+ if len(tp_id_list) == 3 and len(word.word_parts) > 0:
+ wp_index = int(tp_id_list[1].replace('w',''))
+ tp_index = int(tp_id_list[2].replace('tp',''))
+ if wp_index < len(word.word_parts) and tp_index < len(word.word_parts[wp_index].transkription_positions):
+ word.word_parts[wp_index].transkription_positions[tp_index].left = float(word_dict['left'])
+ word.word_parts[wp_index].transkription_positions[tp_index].top = float(word_dict['top'])
+ word.word_parts[wp_index].transkription_positions[tp_index].bottom = word.word_parts[wp_index].transkription_positions[tp_index].top\
+ + word.word_parts[wp_index].transkription_positions[tp_index].height
+ else:
+ return 2
+ elif len(tp_id_list) == 2:
+ tp_index = int(tp_id_list[1].replace('tp',''))
+ if tp_index < len(word.transkription_positions):
+ word.transkription_positions[tp_index].left = float(word_dict['left'])
+ word.transkription_positions[tp_index].top = float(word_dict['top'])
+ word.transkription_positions[tp_index].bottom = word.transkription_positions[tp_index].top\
+ + word.transkription_positions[tp_index].height
+ else:
+ return 2
+ else:
+ return 2
+ return 0
+
+ def _update_faksimile_position(self, word, word_dict) ->int:
+ """Update faksimile position properites of word according to word_dict,
+ return exit_code
+ """
+ exit_code = 0
+ fp_id = word_dict['fp_id']
+ faksimile_position = None
+ if len([ fp for fp in word.faksimile_positions if fp.id == fp_id ]) > 0:
+ faksimile_position = [ fp for fp in word.faksimile_positions if fp.id == fp_id ][0]
+ if len([ fp for w in word.word_parts for fp in w.faksimile_positions if fp.id == fp_id ]) > 0:
+ faksimile_position = [ fp for w in word.word_parts for fp in w.faksimile_positions if fp.id == fp_id ][0]
+ if faksimile_position is not None:
+ faksimile_position.left = float(word_dict['left'])
+ faksimile_position.top = float(word_dict['top'])
+ faksimile_position.bottom = faksimile_position.top + faksimile_position.height
+ else:
+ return 2
+ return exit_code
+
+ def handle_response(self, page: Page, json_dict: dict) -> int:
+ """Handle response and return exit code.
+ """
+ json_word_ids = [ int(jw.get('id')) for jw in json_dict['words'] ]
+ for word in page.words:
+ if word.id in json_word_ids:
+ word_dict_list = [ jw for jw in json_dict['words'] if int(jw.get('id')) == word.id ]
+ if self._update_word(word, word_dict_list) > 0:
+ return 2
+ return self.run_change(page, {})
+
class Reload(ResponseHandler):
def handle_interactive_response(self, page: Page, response: str, shell) -> int:
"""Handle response and return exit code.
"""
return shell.run_interactive_editor(Page(page.page_tree.docinfo.URL))
class RestoreBackup(ResponseHandler):
def handle_interactive_response(self, page: Page, response: str, shell) -> int:
"""Handle response and return exit code.
"""
if page.bak_file is not None:
return shell.run_interactive_editor(Page(page.bak_file))
else:
print('Could not restore backup file, please restore manually!')
return 2
class ChangeLine2Value(ResponseHandler):
def handle_interactive_response(self, page: Page, response: str, shell) -> int:
"""Handle response and return exit code.
"""
words = []
line_number = -1
if re.match(r'l:\d+\s\d+', response):
line_number = int(response.replace('l:', '').split(' ')[0])
words = shell._get_words_from_response(re.compile('l:\d+\s').sub('', response), page.words)
else:
if not re.match(r'l:\d+$', response):
new_response_line = input('Specify new line number>')
if re.match(r'^\d+$', new_response_line):
line_number = int(new_response_line)
else:
line_number = int(response.replace('l:', ''))
new_response = input(f'Specify ids of words for which line number should be changed to {line_number}>')
if re.match(r'\d+', new_response):
words = shell._get_words_from_response(new_response, page.words)
action_dictionary = { 'words': words, 'line_number' : line_number }
if self.run_change(page, action_dictionary) == 0:
return shell.run_interactive_editor(page)
return 2
def run_change(self, page: Page, action_dictionary: dict) -> int:
"""Run changes on page and return exit code.
"""
exit_code = 0
line_number = action_dictionary['line_number']\
if bool(action_dictionary.get('line_number'))\
else -1
words = action_dictionary['words']\
if bool(action_dictionary.get('words'))\
else []
if line_number != -1:
for word in words: word.line_number = line_number
if not UNITTESTING:
print(f'writing to {page.page_tree.docinfo.URL}')
- save_page(page, attach_first=True, script_name=f'{__file__}:{inspect.currentframe().f_back.f_code.co_name}')
+ save_page(page, backup=True, attach_first=True, script_name=f'{__file__}:{inspect.currentframe().f_back.f_code.co_name}')
page = Page(page.page_tree.docinfo.URL)
else:
exit_code = 2
return exit_code
class CreateCorrectionHistory(ResponseHandler):
def handle_interactive_response(self, page: Page, response: str, shell) -> int:
"""Handle response and return exit code.
"""
words = []
if re.match(r'c\w*\s\d+', response):
words = shell._get_words_from_response(re.compile('c\w*\s').sub('', response), page.words)
else:
new_response = input(f'Specify ids of words to create a correction history. >')
if re.match(r'\d+', new_response):
words = shell._get_words_from_response(new_response, page.words)
action_dictionary = { 'words': words }
if self.run_change(page, action_dictionary) == 0:
return shell.run_interactive_editor(page)
return 2
def run_change(self, page: Page, action_dictionary: dict) -> int:
"""Run changes on page and return exit code.
"""
exit_code = 0
words = action_dictionary['words']\
if bool(action_dictionary.get('words'))\
else []
if len(words) > 0:
for word in words: word.create_correction_history()
if not UNITTESTING:
print(f'writing to {page.page_tree.docinfo.URL}')
- save_page(page, attach_first=True, script_name=f'{__file__}:{inspect.currentframe().f_back.f_code.co_name}')
+ save_page(page, backup=True, attach_first=True, script_name=f'{__file__}:{inspect.currentframe().f_back.f_code.co_name}')
page = Page(page.page_tree.docinfo.URL)
else:
exit_code = 2
return exit_code
class DeleteCorrectionHistory(ResponseHandler):
def handle_interactive_response(self, page: Page, response: str, shell) -> int:
"""Handle response interactively and return exit code.
"""
words = []
if re.match(r'D\w*\s\d+', response):
words = shell._get_words_from_response(re.compile('D\w*\s').sub('', response), page.words)
else:
new_response = input(f'Specify ids of words to delete their correction history. >')
if re.match(r'\d+', new_response):
words = shell._get_words_from_response(new_response, page.words)
action_dictionary = { 'words' : words }
if self.run_change(page, action_dictionary) == 0:
return shell.run_interactive_editor(page)
return 2
def run_change(self, page: Page, action_dictionary: dict) -> int:
"""Run changes on page and return exit code.
"""
exit_code = 0
words = action_dictionary['words']\
if bool(action_dictionary.get('words'))\
else []
if len(words) > 0:
for word in words:
print(word.text)
word.earlier_version = None
word.corrections = []
if not UNITTESTING:
print(f'writing to {page.page_tree.docinfo.URL}')
- save_page(page, attach_first=True, script_name=f'{__file__}:{inspect.currentframe().f_back.f_code.co_name}')
+ save_page(page, backup=True, attach_first=True, script_name=f'{__file__}:{inspect.currentframe().f_back.f_code.co_name}')
page = Page(page.page_tree.docinfo.URL)
else:
exit_code = 2
return exit_code
class ChangeDeletionStatus(ResponseHandler):
def handle_interactive_response(self, page: Page, response: str, shell) -> int:
"""Handle response and return exit code.
"""
words = []
if re.match(r'[du]\w*\s\d+', response):
words = shell._get_words_from_response(re.compile('[du]\w*\s').sub('', response), page.words)
else:
deletion_target = 'delete' if response.startswith('d') else 'undelete'
new_response = input(f'Specify ids of words to {deletion_target}. >')
if re.match(r'\d+', new_response):
words = shell._get_words_from_response(new_response, page.words)
action_dictionary = { 'words': words, 'deleted': response.startswith('d') }
if self.run_change(page, action_dictionary) == 0:
return shell.run_interactive_editor(page)
return 2
def run_change(self, page: Page, action_dictionary: dict) -> int:
"""Run changes on page and return exit code.
"""
exit_code = 0
words = action_dictionary['words']\
if bool(action_dictionary.get('words'))\
else []
word_should_be_deleted = bool(action_dictionary.get('deleted'))
if len(words) > 0:
for word in words: word.deleted = word_should_be_deleted
if not UNITTESTING:
print(f'writing to {page.page_tree.docinfo.URL}')
- save_page(page, attach_first=True, script_name=f'{__file__}:{inspect.currentframe().f_back.f_code.co_name}')
+ save_page(page, backup=True, attach_first=True, script_name=f'{__file__}:{inspect.currentframe().f_back.f_code.co_name}')
page = Page(page.page_tree.docinfo.URL)
else:
exit_code = 2
return exit_code
class SplitWords(ResponseHandler):
def _split_word(self, page, word, split_text):
"""Split word.
"""
index = page.words.index(word)
_, left, right = word.split(split_text)
page.words[index] = left
page.words.insert(index+1, right)
def create_requirement_list(self) ->list:
"""Create a requirement dictionary.
"""
return [{ 'name': 'split_text', 'type': 'string', 'input': None }]
def handle_interactive_response(self, page: Page, response: str, shell) -> int:
"""Handle response and return exit code.
"""
words = []
if re.match(r's\s\w+\s\d+', response):
words = shell._get_words_from_response(re.compile('s\s\w+\s').sub('', response), page.words)
split_text = response.split(' ')[1]
else:
split_text = input('Input split text>')
new_response = input(f'Specify ids of words to split. >')
if re.match(r'\d+', new_response):
words = shell._get_words_from_response(new_response, page.words)
action_dictionary = { 'words': words, 'split_text': split_text }
if self.run_change(page, action_dictionary) == 0:
return shell.run_interactive_editor(page)
return 2
def run_change(self, page: Page, action_dictionary: dict) -> int:
"""Run changes on page and return exit code.
"""
exit_code = 0
words = action_dictionary['words']\
if bool(action_dictionary.get('words'))\
else []
split_text = action_dictionary['split_text']\
if bool(action_dictionary.get('split_text'))\
else ''
if len(words) > 0 and split_text != '':
for word in words: self._split_word(page, word, split_text)
if not UNITTESTING:
print(f'writing to {page.page_tree.docinfo.URL}')
- save_page(page, attach_first=True, script_name=f'{__file__}:{inspect.currentframe().f_back.f_code.co_name}')
+ save_page(page, backup=True, attach_first=True, script_name=f'{__file__}:{inspect.currentframe().f_back.f_code.co_name}')
page = Page(page.page_tree.docinfo.URL)
else:
exit_code = 2
return exit_code
class AddBox(ResponseHandler):
def create_requirement_list(self) ->list:
"""Create a requirement dictionary.
"""
return [{ 'name': 'box_text', 'type': 'string', 'input': None },\
{ 'name': 'overwritten_by', 'type': 'string', 'input': None },\
{ 'name': 'is_earlier_version', 'type': 'boolean', 'input': False }]
def run_change(self, page: Page, action_dictionary: dict) -> int:
"""Run changes on page and return exit code.
"""
exit_code = 0
words = action_dictionary['words']\
if bool(action_dictionary.get('words'))\
else []
missing_text = action_dictionary.get('box_text')
is_earlier_version = action_dictionary.get('is_earlier_version')
overwritten_by = action_dictionary.get('overwritten_by')
if len(words) > 0 and missing_text is not None:
for word in words:
if overwritten_by is not None:
split_into_parts_and_attach_box(word, 0, missing_text, is_earlier_version, overwritten_by)
else:
attach_box(word, 0, missing_text, False)
word.create_correction_history()
if len(word.corrections) > 0:
for wp in word.word_parts:
wp.overwrites_word = None
if not UNITTESTING:
print(f'writing to {page.page_tree.docinfo.URL}')
- save_page(page, attach_first=True, script_name=f'{__file__}:{inspect.currentframe().f_back.f_code.co_name}')
+ save_page(page, backup=True, attach_first=True, script_name=f'{__file__}:{inspect.currentframe().f_back.f_code.co_name}')
page = Page(page.page_tree.docinfo.URL)
else:
exit_code = 2
return exit_code
class ResponseOrganizer:
RESULT = 'result'
def __init__(self):
self.response_handler_dictionary = {}
self._add_response_handler(JoinWords(action_name='join words', description='join words'))
self._add_response_handler(SplitWords(action_name='split words', description='split word according to split text'))
self._add_response_handler(CreateCorrectionHistory(action_name='create correction history', description='creates a correction history for selected words'))
self._add_response_handler(DeleteCorrectionHistory(action_name='delete correction history', description='deletes the correction history of selected words'))
self._add_response_handler(AddBox(action_name='add box', description='add box with overwritten text'))
self._add_response_handler(SaveChanges(action_name='save changes', description='save change to line number/deletion status for word(s)' ))
+ self._add_response_handler(SavePositions(action_name='save positions', description='save new transkription position(s)' ))
def _add_response_handler(self, response_handler: ResponseHandler):
"""Add response_handler to response_handler_dictionary.
"""
self.response_handler_dictionary.update({response_handler.action_name: response_handler})
def create_json_dict(self, xml_file: str, last_operation_result=None) ->dict:
"""Return a json dict of page with information about action.
"""
page = Page(xml_file)
replace_ligatures(page)
converter = JSONConverter(page)
json_dict = converter.create_json_dict()
action_dict = { 'target_file': xml_file,\
'date_stamp': os.path.getmtime(xml_file) }
if last_operation_result is not None:
action_dict.update({self.RESULT: last_operation_result })
response_handlers = []
for response_handler in self.response_handler_dictionary.values():
response_handlers.append(response_handler.create_json_dict())
action_dict.update({ 'response_handlers': response_handlers })
json_dict.update({ 'actions': action_dict})
return json_dict
def handle_response(self, json_dict: dict) ->dict:
"""Handle response in json_dict and return new data json_dict.
"""
if bool(json_dict.get('target_file')):
target_file = json_dict['target_file']
if bool(json_dict.get('date_stamp')):
current_stamp = os.path.getmtime(target_file)
if current_stamp <= json_dict['date_stamp']:
exit_code = 2
operation = 'unknown'
if bool(json_dict.get('response_handler'))\
and bool(self.response_handler_dictionary.get(json_dict['response_handler']['action_name'])):
operation = json_dict['response_handler']['action_name']
response_handler = self.response_handler_dictionary[operation]
exit_code = response_handler.handle_response(Page(target_file), json_dict)
message = f'Operation "{operation}" succeeded!' if exit_code == 0 else f'Operation "{operation}" failed'
return self.create_json_dict(target_file, last_operation_result=message)
else:
return self.create_json_dict(target_file,\
last_operation_result=f'FAIL: file {target_file} was changed between operations!')
else:
return self.create_json_dict(target_file,\
last_operation_result='ERROR: there was no key "date_stamp" in json')
else:
return { 'actions': { self.RESULT: 'ERROR: there was no key "target_file" in json!' }}
class InteractiveShell:
def __init__(self):
self.response_handlers = []
self.response_handlers.append(SimpleJoinWords(dialog_string='specify ids of words to join [default]'))
self.response_handlers.append(RestoreBackup(response_starts_with='b', dialog_string='b=restore backup'))
self.response_handlers.append(CreateCorrectionHistory(response_starts_with='c', dialog_string='c=create correction history [+ ids]'))
self.response_handlers.append(DeleteCorrectionHistory(response_starts_with='D', dialog_string='D=delete correction history [+ ids]'))
self.response_handlers.append(ChangeDeletionStatus(response_starts_with='d', dialog_string='d=mark deleted [+ ids]'))
self.response_handlers.append(SaveChanges(response_starts_with='i', dialog_string='i=fix ids' ))
self.response_handlers.append(ChangeLine2Value(response_starts_with='l', dialog_string='l[:value]=change line to value for ids' ))
self.response_handlers.append(Reload(response_starts_with='r', dialog_string='r=reload xml file'))
self.response_handlers.append(SplitWords(response_starts_with='s', dialog_string='s=split and join word ("s splittext id")'))
self.response_handlers.append(ChangeDeletionStatus(response_starts_with='u', dialog_string='u=undelete [+ ids]'))
self.response_handlers.append(JoinWords(response_starts_with='w', dialog_string='w=join words with whitespace between them [+ ids]'))
self.response_handlers.append(ResponseHandler())
def _get_words_from_response(self, response, words) ->list:
"""Return a list of word that correspond to indices
"""
if re.match(r'\d+-\d+', response)\
or re.match(r'\d+\+', response):
index_boundaries = []
if response[-1] == '+':
index_boundaries.append(int(response[:response.index('+')]))
index_boundaries.append(index_boundaries[0]+1)
else:
index_boundaries = [ int(i) for i in response.split('-') ]
index_boundaries_length_diff = len(response.split('-')[0]) - len(response.split('-')[1])
if index_boundaries_length_diff > 0:
index_boundaries[1] = int(response.split('-')[0][:index_boundaries_length_diff] + response.split('-')[1])
indices = [ i for i in range(index_boundaries[0], index_boundaries[1]+1) ]
if index_boundaries[0] > index_boundaries[1]:
indices = [ index_boundaries[0] ]
while indices[-1] > index_boundaries[1]:
indices.append(indices[-1]-1)
else:
indices = [ int(i) for i in response.split(' ') ]
result_words = []
for index in indices:
if len([ word for word in words if word.id == index ]) > 0:
result_words += [ word for word in words if word.id == index ]
return result_words
def run_interactive_editor(self, page) -> int:
"""Run interactive shell.
"""
replace_ligatures(page)
HTMLConverter(page).convert()
for response_handler in self.response_handlers: response_handler.print_dialog()
response = input('>')
for response_handler in self.response_handlers:
if response_handler.match(response):
return response_handler.handle_interactive_response(page, response, self)
def replace_ligatures(page):
"""Replace ligatures
"""
if len([ word for word in page.words if re.match(r'.*[ﬁﬂ]', word.text) ]) > 0:
for word in [ word for word in page.words if re.match(r'.*ﬁ', word.text) ]:
word.text = word.text.replace('ﬁ', 'fi')
for word in [ word for word in page.words if re.match(r'.*ﬂ', word.text) ]:
word.text = word.text.replace('ﬂ', 'fl')
def dict_contains_keys(a_dict, key_list)->bool:
"""Return whether dict a_dict contains key path given by key_list.
"""
if len(key_list) == 0:
return True
else:
if key_list[0] in a_dict.keys():
return dict_contains_keys(a_dict[key_list[0]], key_list[1:])
return False
def usage():
"""prints information on how to use the script
"""
print(main.__doc__)
def main(argv):
"""This program can be used to fix faksimile position ->set them to their absolute value.
fixes/interactive_editor.py [OPTIONS]
a xml file about a manuscript, containing information about its pages.
a xml file about a page, containing information about svg word positions.
OPTIONS:
-h|--help show help
:return: exit code (int)
"""
try:
opts, args = getopt.getopt(argv, "h", ["help"])
except getopt.GetoptError:
usage()
return 2
for opt, arg in opts:
if opt in ('-h', '--help'):
usage()
return 0
if len(args) < 1:
usage()
return 2
exit_status = 0
xml_file = args[0]
if isfile(xml_file):
counter = 0
shell = InteractiveShell()
for page in Page.get_pages_from_xml_file(xml_file, status_contains=STATUS_MERGED_OK):
if not UNITTESTING:
print(Fore.CYAN + f'Processing {page.title}, {page.number} with interactive editor ...' + Style.RESET_ALL)
back_up(page, page.xml_file)
counter += 1 if shell.run_interactive_editor(page) == 0 else 0
if not UNITTESTING:
print(Style.RESET_ALL + f'[{counter} pages changed by interactive shell]')
else:
raise FileNotFoundError('File {} does not exist!'.format(xml_file))
return exit_status
if __name__ == "__main__":
sys.exit(main(sys.argv[1:]))
Index: fixes/fix_old_data.py
===================================================================
--- fixes/fix_old_data.py (revision 102)
+++ fixes/fix_old_data.py (revision 103)
@@ -1,470 +1,487 @@
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
""" This program can be used to fix old data.
"""
# Copyright (C) University of Basel 2019 {{{1
#
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program. If not, see <https://www.gnu.org/licenses/>. 1}}}
from colorama import Fore, Style
from deprecated import deprecated
from functools import cmp_to_key
import getopt
import inspect
import lxml.etree as ET
import re
import shutil
import string
from svgpathtools import svg2paths2, svg_to_paths
from svgpathtools.path import Path as SVGPath
from svgpathtools.path import Line
import sys
import tempfile
from operator import attrgetter
import os
from os import listdir, sep, path, setpgrp, devnull
from os.path import exists, isfile, isdir, dirname, basename
from progress.bar import Bar
import warnings
sys.path.append('svgscripts')
from convert_wordPositions import HTMLConverter
from datatypes.box import Box
from datatypes.faksimile import FaksimilePage
from datatypes.manuscript import ArchivalManuscriptUnity
from datatypes.mark_foreign_hands import MarkForeignHands
from datatypes.matrix import Matrix
from datatypes.image import SVGImage # assumption: module path of the SVGImage class used in fix_transkription_positions below
from datatypes.page import Page, STATUS_MERGED_OK, STATUS_POSTMERGED_OK, FILE_TYPE_SVG_WORD_POSITION, FILE_TYPE_XML_MANUSCRIPT
from datatypes.path import Path
from datatypes.word import Word
from datatypes.text_connection_mark import TextConnectionMark
from datatypes.transkriptionField import TranskriptionField
from datatypes.word import Word, update_transkription_position_ids
from join_faksimileAndTranskription import sort_words
from util import back_up, back_up_svg_file, copy_faksimile_svg_file, reset_tp_with_matrix
from process_files import update_svgposfile_status
from process_words_post_merging import update_faksimile_line_positions, MERGED_DIR
sys.path.append('shared_util')
from myxmlwriter import write_pretty, xml_has_type, FILE_TYPE_SVG_WORD_POSITION, FILE_TYPE_XML_MANUSCRIPT
-from main_util import create_function_dictionary
+from main_util import create_function_dictionary, get_manuscript_files
__author__ = "Christian Steiner"
__maintainer__ = __author__
__copyright__ = 'University of Basel'
__email__ = "christian.steiner@unibas.ch"
__status__ = "Development"
__license__ = "GPL v3"
__version__ = "0.0.1"
UNITTESTING = False
MAX_SVG_XY_THRESHOLD = 10
#TODO: fix all svg graphical files: change xlink:href to href!!!!
def convert_old_matrix(tp, xmin, ymin) ->(Matrix, float, float):
"""Return new matrix, x and y for old transkription_position.
"""
matrix = tp.transform.clone_transformation_matrix()
matrix.matrix[Matrix.XINDEX] = round(tp.transform.matrix[Matrix.XINDEX] + xmin, 3)
matrix.matrix[Matrix.YINDEX] = round(tp.transform.matrix[Matrix.YINDEX] + ymin, 3)
x = round(tp.left - tp.transform.matrix[Matrix.XINDEX], 3)\
if tp.left > 0\
else 0
y = round((tp.height-1.5)*-1, 3)
return matrix, x, y
def save_page(page, attach_first=False, backup=False, script_name=None):
"""Write page to xml file
"""
if backup:
back_up(page, page.xml_file)
if attach_first:
page.update_and_attach_words2tree()
if script_name is None:
script_name = f'{__file__}:{inspect.currentframe().f_back.f_code.co_name}'
write_pretty(xml_element_tree=page.page_tree, file_name=page.page_tree.docinfo.URL,\
script_name=script_name, file_type=FILE_TYPE_SVG_WORD_POSITION)
def page_already_changed(page) -> bool:
"""Return whether page has alreadybeen changed by function
"""
return len(\
page.page_tree.xpath(f'//metadata/modifiedBy[@script="{__file__}:{inspect.currentframe().f_back.f_code.co_name}"]')\
) > 0
def fix_faksimile_line_position(page, redo=False) -> bool:
"""Create a faksimile line position.
"""
if not redo and page_already_changed(page):
return False
update_faksimile_line_positions(page)
if not UNITTESTING:
save_page(page)
return True
def check_faksimile_positions(page, redo=False) -> bool:
"""Check faksimile line position.
"""
if len(page.page_tree.xpath('//data-source/@file')) > 0:
svg_file = page.page_tree.xpath('//data-source/@file')[0]
svg_tree = ET.parse(svg_file)
positions_are_equal_counter = 0
page_changed = False
for faksimile_page in FaksimilePage.GET_FAKSIMILEPAGES(svg_tree):
if page.title == faksimile_page.title\
and page.number == faksimile_page.page_number:
#print([fp.id for fp in faksimile_page.word_positions ])
for word in page.words:
for fp in word.faksimile_positions:
rect_fps = [ rfp for rfp in faksimile_page.word_positions if rfp.id == fp.id ]
if len(rect_fps) > 0:
rfp = rect_fps[0]
if fp.left != rfp.left or fp.top != rfp.top:
#print(f'{fp.id}: {fp.left}/{rfp.left} {fp.top}/{rfp.top}')
fp.left = rfp.left
fp.top = rfp.top
fp.bottom = fp.top + rfp.height
word.attach_word_to_tree(page.page_tree)
page_changed = True
else:
positions_are_equal_counter += 1
print(f'{positions_are_equal_counter}/{len(page.words)} are equal')
if page_changed and not UNITTESTING:
save_page(page)
return page_changed
def fix_faksimile_positions(page, redo=False) -> bool:
"""Set faksimile positions to absolute values.
[:return:] fixed
"""
if not redo and len(page.page_tree.xpath(f'//metadata/modifiedBy[@script="{__file__}"]')) > 0:
return False
x_min = page.text_field.xmin
y_min = page.text_field.ymin
for word in page.words:
for fp in word.faksimile_positions:
fp.left = fp.left + x_min
fp.top = fp.top + y_min
fp.bottom = fp.bottom + y_min
word.attach_word_to_tree(page.page_tree)
if not UNITTESTING:
print(f'writing to {page.page_tree.docinfo.URL}')
write_pretty(xml_element_tree=page.page_tree, file_name=page.page_tree.docinfo.URL,\
script_name=__file__, file_type=FILE_TYPE_SVG_WORD_POSITION)
return True
def _fix_tp_of_word(page, word, text_field):
"""Fix transkription positions ->set relative to 0,0 instead of text_field.left,text_field.top
"""
for tp in word.transkription_positions:
tp.left += text_field.left
tp.top += text_field.top
- reset_tp_with_matrix(page, word.transkription_positions)
+ reset_tp_with_matrix(word.transkription_positions)
if type(word) == Word:
words_in_word = word.word_parts + [ item for item in word.__dict__.values() if type(item) == Word ]
for wp in words_in_word:
_fix_tp_of_word(page, wp, text_field)
+def fix_tp_with_matrix(page, redo=False) -> bool:
+ """Fix transkription positions with rotation matrix ->set left to 0 and top to -5.
+
+ [:return:] fixed
+ """
+ xmin = 0 if page.svg_image is None or page.svg_image.text_field is None else page.svg_image.text_field.left
+ ymin = 0 if page.svg_image is None or page.svg_image.text_field is None else page.svg_image.text_field.top
+ for word in page.words:
+ reset_tp_with_matrix(word.transkription_positions, tr_xmin=xmin, tr_ymin=ymin)
+ for wp in word.word_parts:
+ reset_tp_with_matrix(wp.transkription_positions, tr_xmin=xmin, tr_ymin=ymin)
+ if not UNITTESTING:
+ print(f'writing to {page.page_tree.docinfo.URL}')
+ save_page(page, attach_first=True)
+ return True
+
def fix_transkription_positions(page, redo=False) -> bool:
"""Fix transkription positions ->set relative to 0,0 instead of text_field.left,text_field.top
[:return:] fixed
"""
if page.svg_image is None\
or page.svg_image.text_field is None:
if page.svg_image is None:
if page.svg_file is not None:
transkription_field = TranskriptionField(page.svg_file)
width = round(transkription_field.documentWidth, 3)
height = round(transkription_field.documentHeight, 3)
page.svg_image = SVGImage(file_name=page.svg_file, width=width,\
height=height, text_field=transkription_field.convert_to_text_field())
page.svg_image.attach_object_to_tree(page.page_tree)
else:
raise Exception(f'ERROR page {page.page_tree.docinfo.URL} does not have a svg_file!')
elif page.svg_image.text_field is None:
page.svg_image.text_field = TranskriptionField(page.svg_image.file_name).convert_to_text_field()
page.svg_image.attach_object_to_tree(page.page_tree)
for line_number in page.line_numbers:
line_number.top += page.svg_image.text_field.top
line_number.bottom += page.svg_image.text_field.top
line_number.attach_object_to_tree(page.page_tree)
for word in page.words:
_fix_tp_of_word(page, word, page.svg_image.text_field)
for mark in page.mark_foreign_hands:
_fix_tp_of_word(page, mark, page.svg_image.text_field)
for tcm in page.text_connection_marks:
_fix_tp_of_word(page, tcm, page.svg_image.text_field)
if not UNITTESTING:
print(f'writing to {page.page_tree.docinfo.URL}')
save_page(page, attach_first=True)
return True
return False
def merge_transkription_positions(page, redo=False) -> bool:
"""Fix transkription positions of merged words
[:return:] fixed
"""
if not isdir(dirname(page.page_tree.docinfo.URL) + sep + MERGED_DIR)\
or not isfile(dirname(page.page_tree.docinfo.URL) + sep + MERGED_DIR + sep + basename(page.page_tree.docinfo.URL)):
return False
merged_page = Page(dirname(page.page_tree.docinfo.URL) + sep + MERGED_DIR + sep + basename(page.page_tree.docinfo.URL))
sync_dictionary = sync_words_linewise(merged_page.words, page.words, merged_page.line_numbers)
words = []
for source_word in merged_page.words:
words.append(source_word)
if bool(sync_dictionary.get(source_word)):
_sync_transkriptions_with_words(source_word, sync_dictionary)
if source_word.text != ''.join([ t.get_text() for t in source_word.transkription_positions ]):
text = ''.join([ t.get_text() for t in source_word.transkription_positions ])
print(f'{source_word.line_number}: {source_word.text} has transkription_positions with text "{text}".')
response = input('Change? [Y/n]>')
if not response.startswith('n'):
new_sync_dictionary = sync_words_linewise(merged_page.words, page.words,\
[ line for line in merged_page.line_numbers if line.id == source_word.line_number ], force_sync_on_word=source_word)
if bool(new_sync_dictionary.get(source_word)):
_sync_transkriptions_with_words(source_word, new_sync_dictionary)
else:
                        raise Exception(f'Could not find source_word {source_word.text} in {new_sync_dictionary}!')
page.words = words
page.update_and_attach_words2tree()
if not UNITTESTING:
print(f'writing to {page.page_tree.docinfo.URL}')
save_page(page)
return True
def fix_graphical_svg_file(page, redo=False) -> bool:
    """Fix glyphs of words for which there is a changed-word or deleted-word node in page.page_tree.
    """
svg_tree = ET.parse(page.svg_file)
transkription_field = TranskriptionField(page.source)
namespaces = { k if k is not None else 'ns': v for k, v in svg_tree.getroot().nsmap.items() }
back_up_svg_file(svg_tree, namespaces=namespaces)
tr_xmin = transkription_field.xmin if (page.svg_image is None or page.svg_image.text_field is None) else 0
tr_ymin = transkription_field.ymin if (page.svg_image is None or page.svg_image.text_field is None) else 0
for deleted_word_node in page.page_tree.xpath('//deleted-word'):
deleted_word = Word.create_cls(deleted_word_node)
_run_function_on_nodes_for_word(svg_tree, namespaces, deleted_word, tr_xmin, tr_ymin, _set_node_attribute_to, 'visibility', 'hidden')
for changed_word_node in page.page_tree.xpath('//changed-word'):
changed_word = Word.create_cls(changed_word_node)
try:
word = [ word for word in page.words if word.id == changed_word.id and word.text == changed_word.text ][0]
left_difference = word.transkription_positions[0].left - changed_word.transkription_positions[0].left
_run_function_on_nodes_for_word(svg_tree, namespaces, word, tr_xmin, tr_ymin, _add_value2attribute, 'x', left_difference)
except IndexError:
warnings.warn(f'There is no word for changed_word {changed_word.id}: "{changed_word.text}" in {page.page_tree.docinfo.URL}!')
copy_faksimile_svg_file(target_file=page.svg_file, faksimile_tree=svg_tree, namespaces=namespaces)
def _add_value2attribute(node, attribute, value):
"""Add left_difference to x of node.
"""
node.set(attribute, str(float(node.get(attribute)) + value))
node.set('changed', 'true')
def _get_nodes_with_symbol_id(svg_tree, namespaces, symbol_id, svg_x, svg_y, threshold=0.1) -> list:
"""Return nodes with symbol_id n x = svg_x and y = svg_y.
"""
nodes = [ node for node in svg_tree.xpath(\
f'//ns:use[@xlink:href="#{symbol_id}" and @x > {svg_x-threshold} and @x < {svg_x+threshold} and @y > {svg_y-threshold} and @y < {svg_y+threshold} ]',\
namespaces=namespaces) if not bool(node.get('changed')) ]
if len(nodes) == 0 and threshold < MAX_SVG_XY_THRESHOLD:
return _get_nodes_with_symbol_id(svg_tree, namespaces, symbol_id, svg_x, svg_y, threshold=threshold+1)
return nodes
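For illustration, a minimal, self-contained sketch of the widening lookup above, using a hypothetical in-memory SVG with a single glyph reference; it relies on the module's MAX_SVG_XY_THRESHOLD constant being above 0.1:

import lxml.etree as ET

svg = ET.fromstring(
    '<svg xmlns="http://www.w3.org/2000/svg"'
    ' xmlns:xlink="http://www.w3.org/1999/xlink">'
    '<use xlink:href="#glyph0-1" x="100.45" y="200.1"/></svg>')
namespaces = {'ns': 'http://www.w3.org/2000/svg',
              'xlink': 'http://www.w3.org/1999/xlink'}
# The first pass (threshold=0.1) misses the node at x=100.45; the recursive
# call widens the window to 1.1 and finds it.
nodes = _get_nodes_with_symbol_id(ET.ElementTree(svg), namespaces, 'glyph0-1', 100.0, 200.0)
print(len(nodes))  # -> 1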
def _run_function_on_nodes_for_word(svg_tree, namespaces, word, tr_xmin, tr_ymin, function_on_node, attribute, value):
"""Run function on nodes for words.
"""
for tp in word.transkription_positions:
for pwp in tp.positional_word_parts:
symbol_id = pwp.symbol_id
svg_x = pwp.left + tr_xmin
svg_y = pwp.bottom + tr_ymin
nodes = _get_nodes_with_symbol_id(svg_tree, namespaces, symbol_id, svg_x, svg_y)
if len(nodes) > 0:
node = nodes[0]
function_on_node(node, attribute, value)
def _set_node_attribute_to(node, attribute, value):
"""Set attribute of node to value.
"""
node.set(attribute, str(value))
node.set('changed', 'true')
def sync_words_linewise(source_words, target_words, lines, force_sync_on_word=None) -> dict:
"""Sync words an create a dictionary with source_words as keys, refering to a list of corresponding words.
"""
result_dict = {}
for word in target_words + source_words: word.processed = False
for line in lines:
source_words_on_line = sorted([ word for word in source_words if word.line_number == line.id ], key=lambda word: word.transkription_positions[0].left)
target_words_on_line = sorted([ word for word in target_words if word.line_number == line.id ], key=lambda word: word.transkription_positions[0].left)
if len(target_words_on_line) == len(source_words_on_line):
_sync_same_length(result_dict, source_words_on_line, target_words_on_line, force_sync_on_word=force_sync_on_word)
elif len(source_words_on_line) < len(target_words_on_line):
_sync_more_target_words(result_dict, source_words_on_line, target_words_on_line, force_sync_on_word=force_sync_on_word)
else:
            warnings.warn(f'Line {line.id}: more source words than target words, sync skipped for this line.')
return result_dict
def _force_sync_on_word(force_sync_on_word, target_words_on_line, result_dict):
"""Force sync on word.
"""
unprocessed_target_words = [t_word for t_word in target_words_on_line if not t_word.processed]
if len(unprocessed_target_words) > 0:
print([ (i, t_word.text) for i, t_word in enumerate(unprocessed_target_words)])
response = input(f'Please specify indices of words to sync {force_sync_on_word.text} with: [default:0-{len(unprocessed_target_words)-1}]>')
indices = [ i for i in range(0, len(unprocessed_target_words)) ]
if re.match(r'\d+-\d+', response):
index_strings = response.split('-')
indices = [ i for i in range(int(index_strings[0]), int(index_strings[1])+1) ]
elif response != '':
indices = [ int(i) for i in response.split(' ') ]
target_words = []
for i in indices: target_words.append(unprocessed_target_words[i])
result_dict.update({ force_sync_on_word: target_words })
else:
raise Exception(f'There are no unprocessed target_words for {force_sync_on_word.text} on line {force_sync_on_word.line_number}!')
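A standalone sketch of the response formats the prompt above accepts (hypothetical inputs, parsing logic mirrored from the function):

import re

# '' selects the default range, 'M-N' an inclusive range, 'I J ...' explicit indices.
for response in ['', '1-3', '0 2']:
    indices = list(range(0, 4))  # default: all four unprocessed words
    if re.match(r'\d+-\d+', response):
        lo, hi = response.split('-')
        indices = list(range(int(lo), int(hi) + 1))
    elif response != '':
        indices = [int(i) for i in response.split(' ')]
    print(repr(response), '->', indices)
# '' -> [0, 1, 2, 3]; '1-3' -> [1, 2, 3]; '0 2' -> [0, 2]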
def _sync_transkriptions_with_words(word, sync_dictionary):
"""Sync transkription_positions of word with syncronized words.
"""
word.transkription_positions = []
for target_word in sync_dictionary[word]:
word.transkription_positions += target_word.transkription_positions
def _sync_more_target_words(result_dict, source_words_on_line, target_words_on_line, force_sync_on_word=None):
"""Sync if there are more target words.
"""
current_source_word = None
for target_word in target_words_on_line:
if current_source_word is not None\
and current_source_word.text.startswith(''.join([ w.text for w in result_dict[current_source_word]]) + target_word.text):
result_dict[current_source_word].append(target_word)
target_word.processed = True
if current_source_word.text == ''.join([ w.text for w in result_dict[current_source_word]]):
current_source_word = None
elif len([ s_word for s_word in source_words_on_line if not s_word.processed and s_word.text == target_word.text ]) > 0:
source_word = [ s_word for s_word in source_words_on_line if not s_word.processed and s_word.text == target_word.text ][0]
target_word.processed = True
source_word.processed = True
result_dict.update({ source_word: [ target_word ] })
elif len([ s_word for s_word in source_words_on_line if not s_word.processed and s_word.text.startswith(target_word.text) ]) > 0:
current_source_word = [ s_word for s_word in source_words_on_line if not s_word.processed and s_word.text.startswith(target_word.text) ][0]
current_source_word.processed = True
target_word.processed = True
result_dict.update({ current_source_word: [ target_word ] })
else:
msg = f'On line {target_word.line_number}: target_word "{target_word.text}" does not have a sibling in {[ s.text for s in source_words_on_line if not s.processed ]}'
warnings.warn(msg)
if force_sync_on_word is not None:
_force_sync_on_word(force_sync_on_word, target_words_on_line, result_dict)
def _sync_same_length(result_dict, source_words_on_line, target_words_on_line, force_sync_on_word=None):
"""Sync same length
"""
for i, word in enumerate(source_words_on_line):
if word.text == target_words_on_line[i].text:
word.processed = True
target_words_on_line[i].processed = True
result_dict.update({ word: [ target_words_on_line[i] ] })
elif len([ t_word for t_word in target_words_on_line if not t_word.processed and t_word.text == word.text ]) > 0:
target_word = [ t_word for t_word in target_words_on_line if not t_word.processed and t_word.text == word.text ][0]
word.processed = True
target_word.processed = True
result_dict.update({ word: [ target_word ] })
else:
msg = f'On line {word.line_number}: source_word "{word.text}" does not have a sibling in {[ s.text for s in target_words_on_line]}'
warnings.warn(msg)
if force_sync_on_word is not None:
_force_sync_on_word(force_sync_on_word, target_words_on_line, result_dict)
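To make the sync contract concrete, a self-contained sketch with stub objects (the real Word and line classes live in svgscripts/datatypes and carry many more attributes): one merged source word is matched to the two target fragments it was split into.

from dataclasses import dataclass

@dataclass(eq=False)  # identity hashing, so stubs can serve as dict keys
class StubPosition:
    left: float

@dataclass(eq=False)
class StubWord:
    text: str
    line_number: int
    transkription_positions: list
    processed: bool = False

@dataclass(eq=False)
class StubLine:
    id: int

source = [StubWord('Nietzsche', 1, [StubPosition(10.0)])]
target = [StubWord('Nietz', 1, [StubPosition(10.0)]),
          StubWord('sche', 1, [StubPosition(42.0)])]
result = sync_words_linewise(source, target, [StubLine(1)])
print({ s.text: [t.text for t in ts] for s, ts in result.items() })
# -> {'Nietzsche': ['Nietz', 'sche']}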
def usage():
"""prints information on how to use the script
"""
print(main.__doc__)
def main(argv):
"""This program can be used to fix old data.
svgscripts/fix_old_data.py [OPTIONS]
    an xml file about a manuscript, containing information about its pages.
    an xml file about a page, containing information about svg word positions.
OPTIONS:
-h|--help show help
-c|--check-faksimile-positions check whether faksimile positions have been updated
-l|--faksimile-line-position create faksimile line positions
-p|--faksimile-positions fix old faksimile positions
-r|--redo rerun
    -s|--fix-graphical-svg fix the position of glyph 'use' elements for words marked by 'changed-word' and 'deleted-word' nodes in the xml file.
- -p|--transkription-positions fix old transkription positions ->set to 0,0 instead of text_field.0,0
+ -t|--transkription-positions fix old transkription positions ->set to 0,0 instead of text_field.0,0
+ -M|--matrix fix old transkription positions with transform matrix
:return: exit code (int)
"""
function_list = []
function_dict = create_function_dictionary(['-c', '--check-faksimile-positions'], check_faksimile_positions)
function_dict = create_function_dictionary(['-l', '--faksimile-line-position'], fix_faksimile_line_position, function_dictionary=function_dict)
function_dict = create_function_dictionary(['-p', '--faksimile-positions'], fix_faksimile_positions, function_dictionary=function_dict)
function_dict = create_function_dictionary(['-m', '--merge-positions'], merge_transkription_positions, function_dictionary=function_dict)
function_dict = create_function_dictionary(['-s', '--fix-graphical-svg'], fix_graphical_svg_file, function_dictionary=function_dict)
- function_dict = create_function_dictionary(['default', '-t', '--transkription-positions'], fix_transkription_positions, function_dictionary=function_dict)
+ function_dict = create_function_dictionary(['-t', '--transkription-positions'], fix_transkription_positions, function_dictionary=function_dict)
+ function_dict = create_function_dictionary(['default', '-M', '--matrix'], fix_tp_with_matrix, function_dictionary=function_dict)
    redo = False
try:
- opts, args = getopt.getopt(argv, "hcplrmst", ["help", "check-faksimile-positions", "faksimile-positions", "faksimile-line-position",\
- "redo", "merge-positions", "fix-graphical-svg", "transkription-positions" ])
+ opts, args = getopt.getopt(argv, "hcplrmstM", ["help", "check-faksimile-positions", "faksimile-positions", "faksimile-line-position",\
+ "redo", "merge-positions", "fix-graphical-svg", "transkription-positions", 'matrix' ])
except getopt.GetoptError:
usage()
return 2
for opt, arg in opts:
if opt in ('-h', '--help'):
usage()
return 0
elif opt in ('-r', '--redo'):
            redo = True
elif opt in function_dict.keys():
function_list.append(function_dict[opt])
if len(function_list) == 0:
function_list.append(function_dict['default'])
if len(args) < 1:
usage()
return 2
exit_status = 0
- xml_file = args[0]
- for xml_file in args:
+ for xml_file in get_manuscript_files(args):
if isfile(xml_file):
counters = { f.__name__: 0 for f in function_list }
for current_function in function_list:
status_contains = STATUS_MERGED_OK if 'faksimile' in current_function.__name__ else 'OK'
for page in Page.get_pages_from_xml_file(xml_file, status_contains=status_contains):
if not UNITTESTING:
print(Fore.CYAN + f'Processing {page.title}, {page.number} with function {current_function.__name__} ...' + Style.RESET_ALL)
back_up(page, page.xml_file)
counters[current_function.__name__] += 1 if current_function(page, redo=redo) else 0
if not UNITTESTING:
for function_name, counter in counters.items():
print(Style.RESET_ALL + f'[{counter} pages changed by {function_name}]')
else:
raise FileNotFoundError('File {} does not exist!'.format(xml_file))
return exit_status
if __name__ == "__main__":
sys.exit(main(sys.argv[1:]))
Index: py2ttl/convert.py
===================================================================
--- py2ttl/convert.py (revision 102)
+++ py2ttl/convert.py (revision 103)
@@ -1,113 +1,115 @@
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
""" This program can be used to convert py objects to ontology and data in turtle format.
"""
# Copyright (C) University of Basel 2019 {{{1
#
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program. If not, see <https://www.gnu.org/licenses/>. 1}}}
from colorama import Fore, Style
import getopt
import lxml.etree as ET
from os import sep, path, listdir
from os.path import isfile, isdir, dirname, basename
from progress.bar import Bar
import re
import sys
sys.path.append('svgscripts')
from datatypes.manuscript import ArchivalManuscriptUnity
if dirname(__file__) not in sys.path:
sys.path.append(dirname(__file__))
from class_spec import SemanticClass
from config import check_config_files_exist, get_datatypes_dir, PROJECT_NAME, PROJECT_ONTOLOGY_FILE, PROJECT_URL
from py2ttl_data import Py2TTLDataConverter
from py2ttl_ontology import Py2TTLOntologyConverter
sys.path.append('shared_util')
from myxmlwriter import xml2dict
+from main_util import get_manuscript_files
__author__ = "Christian Steiner"
__maintainer__ = __author__
__copyright__ = 'University of Basel'
__email__ = "christian.steiner@unibas.ch"
__status__ = "Development"
__license__ = "GPL v3"
__version__ = "0.0.1"
+FILE_TYPE_XML_PROJECT = "xmlProjectFile"
def usage():
"""prints information on how to use the script
"""
print(main.__doc__)
def main(argv):
"""This program can be used to convert py objects to a owl:Ontology and rdf data in turtle format.
py2ttl/py2ttl_data.py [OPTIONS] [ ...]
xml file of type shared_util.myxmlwriter.FILE_TYPE_XML_MANUSCRIPT.
OPTIONS:
-h|--help: show help
    -i|--include-status=STATUS include pages with status = STATUS. STATUS is a ':' separated string of status, e.g. 'OK:faksimile merged'.
:return: exit code (int)
"""
check_config_files_exist()
datatypes_dir = get_datatypes_dir()
source_ontology_file = PROJECT_ONTOLOGY_FILE
target_ontology_file = '.{0}{1}-ontology_autogenerated.ttl'.format(sep, PROJECT_NAME)
manuscript_file = None
- page_status_list = None
+ page_status_list = [ 'OK', 'faksimile merged' ]
try:
opts, args = getopt.getopt(argv, "hi:", ["help", "include-status="])
except getopt.GetoptError:
usage()
return 2
for opt, arg in opts:
if opt in ('-h', '--help'):
usage()
return 0
elif opt in ('-i', '--include-status'):
page_status_list = arg.split(':')
if len(args) < 1 :
usage()
return 2
ontology_created = False
ontology_converter = Py2TTLOntologyConverter(project_ontology_file=source_ontology_file)
output = 2
- for manuscript_file in args:
+ for manuscript_file in get_manuscript_files(args):
if not isfile(manuscript_file):
usage()
return 2
if not ontology_created:
print(Fore.CYAN + 'Create ontology from "{}" ...'.format(manuscript_file))
if ontology_converter.create_ontology(datatypes_dir, target_ontology_file) == 0:
print(Fore.GREEN + '[Ontology file {0} created]'.format(target_ontology_file))
ontology_created = True
else:
return 2
print(Fore.CYAN + 'Create data from "{}" ...'.format(manuscript_file))
data_converter = Py2TTLDataConverter(manuscript_file, mapping_dictionary=ontology_converter.uri_mapping4cls_and_properties)
output = data_converter.convert(page_status_list=page_status_list)
return output
if __name__ == "__main__":
sys.exit(main(sys.argv[1:]))
Index: py2ttl/config.py
===================================================================
--- py2ttl/config.py (revision 102)
+++ py2ttl/config.py (revision 103)
@@ -1,40 +1,40 @@
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
from os.path import isfile, isdir, exists
import re
PROJECT_NAME = 'tln'
PROJECT_URL = 'http://www.knora.org/ontology/0068/nietzsche'
DATA_URL = 'http://rdfh.ch/projects/0068'
ONTOLOGY_DIR = './ontologies' # local ontology dir, script will read only
KNORA_BASE_ONTOLOGY_FILE = '{}/knora-ontologies/knora-base.ttl'.format(ONTOLOGY_DIR)
SHARED_ONTOLOGIES_DIR = '{}/Ontologies-shared'.format(ONTOLOGY_DIR)
PROJECT_ONTOLOGY_FILE = './Friedrich-Nietzsche-late-work-ontology.ttl'
-PROJECT_ONTOLOGY_FILE_URL = 'https://c4scdn.ch/file/data/v6tjganrzg2nk3fuukgy/PHID-FILE-lcacdm2atc73ladd3ajq/Friedrich-Nietzsche-late-work-ontology.ttl'
+PROJECT_ONTOLOGY_FILE_URL = 'https://raw.githubusercontent.com/knisterstern/nietzsche-stub/main/Friedrich-Nietzsche-late-work-ontology.ttl'
DATATYPES_DIR = './svgscripts/datatypes' # optional in config file, can be overwritten by passing a datatypes dir to py2ttl/py2ttl.py
def check_config_files_exist():
"""Checks whether all files exist that are specified in this file by uppercase variables ending in 'DIR' or 'FILE'.
:return: exit code (int)
"""
for key in [ key for key in globals().keys() if re.match(r'^[A-Z_-]+(DIR|FILE)$', key) ]:
if not exists(globals().get(key)):
raise FileNotFoundError('Key {} does not specify an existing file or directory'.format(key))
if key.endswith('DIR') and not isdir(globals().get(key)):
raise NotADirectoryError('Key {} does not specify an existing directory'.format(key))
return 0
def get_datatypes_dir():
"""Returns value of DATATYPES_DIR if set, else None.
"""
if 'DATATYPES_DIR' in globals().keys():
return DATATYPES_DIR.replace('./','')
    else:
        return None
Index: py2ttl/py2ttl_ontology.py
===================================================================
--- py2ttl/py2ttl_ontology.py (revision 102)
+++ py2ttl/py2ttl_ontology.py (revision 103)
@@ -1,369 +1,369 @@
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
""" This program can be used to convert py classes that are
subclasses of class_spec.SemanticClass to
a owl ontology in turtle format.
"""
# Copyright (C) University of Basel 2019 {{{1
#
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program. If not, see <https://www.gnu.org/licenses/>. 1}}}
import getopt
import importlib
import importlib.util
import inspect
import lxml.etree as ET
from os import sep, path, listdir
from os.path import isfile, isdir, dirname, basename
from progress.bar import Bar
from rdflib import Graph, URIRef, Literal, BNode, OWL, RDF, RDFS, XSD
import re
import requests
import sys
import warnings
if dirname(__file__) not in sys.path:
sys.path.append(dirname(__file__))
from class_spec import SemanticClass, UnSemanticClass
-from config import check_config_files_exist, get_datatypes_dir, PROJECT_NAME, PROJECT_ONTOLOGY_FILE, PROJECT_ONTOLOGY_FILE_URL, PROJECT_URL
+from config import check_config_files_exist, get_datatypes_dir, PROJECT_NAME, PROJECT_ONTOLOGY_FILE, PROJECT_URL, PROJECT_ONTOLOGY_FILE_URL
from data_handler import RDFDataHandler
sys.path.append('shared_util')
from myxmlwriter import dict2xml
__author__ = "Christian Steiner"
__maintainer__ = __author__
__copyright__ = 'University of Basel'
__email__ = "christian.steiner@unibas.ch"
__status__ = "Development"
__license__ = "GPL v3"
__version__ = "0.0.1"
class Py2TTLOntologyConverter:
"""This class can be used convert semantic_dictionaries to a owl ontology in turtle format.
"""
UNITTESTING = False
INFERRED_SUB_CLASS = RDFS.subClassOf * '*'
def __init__(self, project_ontology_file=None):
self.class_uri_dict = {}
self.uri_mapping4cls_and_properties = {}
self.project_graph = Graph()
self.base_uriref = URIRef(PROJECT_URL)
self.project_name = PROJECT_NAME
self.ns = { self.base_uriref + '#': self.project_name }
if project_ontology_file is not None and isfile(project_ontology_file):
if project_ontology_file == PROJECT_ONTOLOGY_FILE:
r = requests.get(PROJECT_ONTOLOGY_FILE_URL)
with open(project_ontology_file, 'wb') as f:
f.write(r.content)
- print(f'{project_ontology_file} updated from c4science repository')
+ print(f'{project_ontology_file} updated from github repository')
self.project_graph.parse(project_ontology_file, format="turtle")
if len(self.project_graph) > 0:
self.base_uriref = self.project_graph.value(predicate=RDF.type, object=OWL.Ontology, any=False)
self.ns = { uriref: ns for ns, uriref in self.project_graph.namespace_manager.namespaces() }
self.project_name = self.ns.get(self.base_uriref + '#')
self.project_graph.bind(self.project_name, self.base_uriref + '#')
self.uri_mapping4cls_and_properties.update({ 'ontology': { 'project_name': self.project_name, 'project_uri': self.base_uriref + '#' }})
self.uri_mapping4cls_and_properties.update({ 'classes': {} })
def addClass2Graph(self, cls, semantic_dict=None) -> (URIRef, type):
"""Add a class to project_graph.
:return: (cls_uri (URIRef), super_cls (cls))
"""
if semantic_dict is None:
semantic_dict = cls.get_semantic_dictionary()
comment, label = self.get_comment_label(cls)
cls_uri = URIRef(self.base_uriref + '#' + cls.__name__)
self.project_graph.add((cls_uri, RDF.type, OWL.Class))
self.project_graph.add((cls_uri, RDFS.isDefinedBy, self.base_uriref))
if comment != '':
self.project_graph.add((cls_uri, RDFS.comment, Literal(comment, lang='en')))
if label != '':
self.project_graph.add((cls_uri, RDFS.label, Literal(label, lang='en')))
super_uri = None
super_cls = None
if bool(semantic_dict[SemanticClass.CLASS_KEY].get(SemanticClass.TYPE)):
super_cls = semantic_dict[SemanticClass.CLASS_KEY].get(SemanticClass.TYPE)
super_uri = self.createClassAndProperties(super_cls)
if super_uri is not None:
self.project_graph.add((cls_uri, RDFS.subClassOf, super_uri))
if SemanticClass.SUBCLASS_OF in semantic_dict[SemanticClass.CLASS_KEY].keys()\
and len(semantic_dict[SemanticClass.CLASS_KEY][SemanticClass.SUBCLASS_OF]) > 0:
for super_uri_string in semantic_dict[SemanticClass.CLASS_KEY].get(SemanticClass.SUBCLASS_OF):
super_uri = URIRef(super_uri_string)
if not (cls_uri, self.INFERRED_SUB_CLASS, super_uri) in self.project_graph:
self.project_graph.add((cls_uri, RDFS.subClassOf, super_uri))
return cls_uri, super_cls
def addProperty2Graph(self, property_uri, domain_uri, range_uri, info_dict, property_type=OWL.ObjectProperty):
"""Add a property to self.project_graph.
"""
label = 'has ' + property_uri.split('#')[1].replace('has','')\
if SemanticClass.PROPERTY_LABEL not in info_dict.keys() else info_dict[SemanticClass.PROPERTY_LABEL]
self.project_graph.add((property_uri, RDF.type, property_type))
self.project_graph.add((property_uri, RDFS.isDefinedBy, self.base_uriref))
self.project_graph.add((property_uri, RDFS.domain, domain_uri))
self.project_graph.add((property_uri, RDFS.range, range_uri))
if SemanticClass.PROPERTY_COMMENT in info_dict.keys():
comment = info_dict[SemanticClass.PROPERTY_COMMENT]
self.project_graph.add((property_uri, RDFS.comment, Literal(comment, lang='en')))
self.project_graph.add((property_uri, RDFS.label, Literal(label, lang='en')))
if SemanticClass.CARDINALITY in info_dict.keys()\
and info_dict[SemanticClass.CARDINALITY] > 0:
self.addRestriction2Class(domain_uri, property_uri, info_dict)
def addRestriction2Class(self, cls_uri, property_uri, info_dict):
"""Adds restriction on property_uri to class cls_uri.
"""
if SemanticClass.CARDINALITY in info_dict.keys()\
and info_dict[SemanticClass.CARDINALITY] > 0:
if (cls_uri, None, None) not in self.project_graph:
warnings.warn('{} not in graph!'.format(cls_uri))
restriction = BNode()
cardinality_restriction = URIRef(OWL + info_dict[SemanticClass.CARDINALITY_RESTRICTION])\
if SemanticClass.CARDINALITY_RESTRICTION in info_dict.keys()\
else OWL.cardinality
cardinality = info_dict[SemanticClass.CARDINALITY]
self.project_graph.add((cls_uri, RDFS.subClassOf, restriction))
self.project_graph.add((restriction, RDF.type, OWL.Restriction))
self.project_graph.add((restriction, OWL.onProperty, property_uri))
self.project_graph.add((restriction, cardinality_restriction, Literal(str(cardinality), datatype=XSD.nonNegativeInteger)))
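For orientation, a minimal rdflib sketch (hypothetical URIs) of the blank-node restriction pattern this method adds; serializing it shows the shape that ends up in the ontology file:

from rdflib import Graph, URIRef, BNode, Literal, OWL, RDF, RDFS, XSD

g = Graph()
cls_uri = URIRef('http://example.org/ontology#Whole')         # hypothetical class
property_uri = URIRef('http://example.org/ontology#hasPart')  # hypothetical property
restriction = BNode()
g.add((cls_uri, RDFS.subClassOf, restriction))
g.add((restriction, RDF.type, OWL.Restriction))
g.add((restriction, OWL.onProperty, property_uri))
g.add((restriction, OWL.cardinality, Literal('1', datatype=XSD.nonNegativeInteger)))
print(g.serialize(format='turtle'))
# ns1:Whole rdfs:subClassOf [ a owl:Restriction ;
#         owl:cardinality "1"^^xsd:nonNegativeInteger ;
#         owl:onProperty ns1:hasPart ] .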
def create_ontology(self, datatypes_dir, target_ontology_file):
"""Convert all classes contained in datatypes_dir that are subclasses of class_spec.SemanticClass to rdf.
:return: exit code (int)
"""
if isdir(datatypes_dir):
semantic_classes = self.get_semantic_classes(datatypes_dir)
if not Py2TTLOntologyConverter.UNITTESTING:
bar = Bar('creating classes and properties', max=len(semantic_classes))
for cls in semantic_classes:
self.createClassAndProperties(cls)
                if not Py2TTLOntologyConverter.UNITTESTING:
                    bar.next()
            if not Py2TTLOntologyConverter.UNITTESTING:
                bar.finish()
self.uri_mapping4cls_and_properties['ontology'].update({'ontology_file': target_ontology_file})
            with open(target_ontology_file, 'wb+') as f:
                f.write(self.project_graph.serialize(format="turtle"))
if not Py2TTLOntologyConverter.UNITTESTING:
xml_file = 'mapping_file4' + datatypes_dir.replace(sep, '.') + '2' + target_ontology_file.replace('.' + sep, '').replace(sep, '.').replace('.ttl', '.xml')
dict2xml(self.uri_mapping4cls_and_properties, xml_file)
else:
print('Error: dir {} does not exist!'.format(datatypes_dir))
            usage()
return 1
return 0
def createClassAndProperties(self, cls):
"""Creates a owl:Class and some owl:ObjectProperty from semantic_dictionary of a python class.
"""
if not cls.__name__ in self.class_uri_dict:
self.class_uri_dict.update({cls.__name__: cls})
semantic_dict = cls.get_semantic_dictionary()
cls_uri, super_cls = self.addClass2Graph(cls, semantic_dict)
uri_mapping4properties = {}
for property_key in self._get_semantic_dictionary_keys_super_first(semantic_dict['properties']):
super_semantic_dict = {} if super_cls is None else super_cls.get_semantic_dictionary()
if len(super_semantic_dict) == 0 or not bool(super_semantic_dict['properties'].get(property_key)):
property_dict4key = semantic_dict['properties'].get(property_key)
property_cls = property_dict4key.get('class')
subject_uri, property_uri = self.createProperty(cls_uri, property_key, property_cls, property_dict4key)
uri_mapping4properties.update({ property_key: property_uri })
elif bool(self.uri_mapping4cls_and_properties.get('classes').get(super_cls.__name__).get('properties').get(property_key)):
property_uri = self.uri_mapping4cls_and_properties['classes'][super_cls.__name__]['properties'][property_key]
uri_mapping4properties.update({ property_key: property_uri})
self.uri_mapping4cls_and_properties.get('classes').update({ cls.__name__: { 'class_uri': cls_uri, 'properties': uri_mapping4properties }})
return URIRef(self.base_uriref + '#' + cls.__name__)
def createProperty(self, domain_uri, property_name, range_cls, info_dict) -> (URIRef, URIRef):
"""Creates a owl:ObjectProperty.
:return: tuple of domain_uri (rdflib.URIRef) and property_uri (rdflib.URIRef) of created property
"""
name = self.createPropertyName(property_name=property_name)\
if SemanticClass.PROPERTY_NAME not in info_dict.keys() else info_dict[SemanticClass.PROPERTY_NAME]
property_uri = URIRef(self.base_uriref + '#' + name)
inferredSubClass = RDFS.subClassOf * '*'
range_uri = URIRef(self.base_uriref + '#' + range_cls.__name__)
super_property_uri = None
if SemanticClass.SUBPROPERTYOF in info_dict.keys():
super_property_uri = URIRef(info_dict[SemanticClass.SUBPROPERTYOF])
elif SemanticClass.SUPER_PROPERTY in info_dict.keys():
domain_uri, super_property_uri = self.createProperty(domain_uri,\
info_dict[SemanticClass.SUPER_PROPERTY].get(SemanticClass.PROPERTY_NAME),\
range_cls, info_dict[SemanticClass.SUPER_PROPERTY])
if (property_uri, None, None) not in self.project_graph:
property_type = OWL.ObjectProperty
if range_cls.__module__ == 'builtins':
if range_cls != list:
property_type = OWL.DatatypeProperty
range_uri = RDFDataHandler.SIMPLE_DATA_TYPE_MAPPING.get(range_cls)
if range_uri == XSD.string and property_name == 'URL':
range_uri = XSD.anyURI
self.addProperty2Graph(property_uri, domain_uri, range_uri, info_dict, property_type=property_type)
        elif not any((domain_uri, inferredSubClass, o) in self.project_graph\
                for o in self.project_graph.objects(property_uri, RDFS.domain)):
# if domain_uri is NOT a subclass of a cls specified by RDFS.domain
if SemanticClass.CARDINALITY in info_dict.keys()\
and info_dict[SemanticClass.CARDINALITY] > 0:
self.addRestriction2Class(domain_uri, property_uri, info_dict)
self.project_graph.add((property_uri, RDFS.domain, domain_uri))
if super_property_uri is not None\
and (property_uri, RDFS.subPropertyOf, super_property_uri) not in self.project_graph:
self.project_graph.add((property_uri, RDFS.subPropertyOf, super_property_uri))
return domain_uri, property_uri
def createPropertyName(self, property_name=None, subject_uri=None, object_uri=None, connector='BelongsTo', prefix='has'):
"""Returns a property name.
"""
if property_name is not None:
property_name = ''.join([ property_name.split('_')[0].lower() ] + [ text.capitalize() for text in property_name.split('_')[1:] ])
return prefix + property_name[0].upper() + property_name[1:] if property_name[0].islower()\
else prefix + property_name
elif subject_uri is not None:
property_name = subject_uri.split('#')[1] + self.createPropertyName(object_uri=object_uri, prefix=connector)
return property_name[0].lower() + property_name[1:]
elif object_uri is not None:
return prefix + object_uri.split('#')[1]
else:
return prefix
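A quick sketch of the naming scheme; the converter is instantiated without a project ontology file, which createPropertyName does not need anyway:

c = Py2TTLOntologyConverter()
print(c.createPropertyName(property_name='line_number'))           # -> 'hasLineNumber'
print(c.createPropertyName(property_name='text'))                  # -> 'hasText'
print(c.createPropertyName(object_uri='http://example.org#Word'))  # -> 'hasWord'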
def get_comment_label(self, cls):
"""Returns comment and label from cls __doc__.
"""
comment = cls.__doc__.replace('\n','').lstrip()
label = cls.__name__
if '.' in cls.__doc__:
comment = [ text for text in cls.__doc__.split('\n') if text != '' ][0].lstrip()
if '@label' in cls.__doc__:
                m = re.search(r'(@label[:]*\s)(.*[\.]*)', cls.__doc__)
label_tag, label = m.groups()
elif re.search('([A-Z][a-z]+)', label):
                m = re.search(r'([A-Z]\w+)([A-Z]\w+)', label)
label = ' '.join([ text.lower() for text in re.split(r'([A-Z][a-z]+)', label) if text != '' ])
return comment, label
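Similarly for comment/label derivation, a sketch with a hypothetical stand-in class: the first docstring sentence becomes the comment, and a camel-cased name without an @label tag is split into lowercase words:

class TextField:
    """A rectangular area on an image.
    """

c = Py2TTLOntologyConverter()
print(c.get_comment_label(TextField))
# -> ('A rectangular area on an image.', 'text field')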
def get_semantic_classes(self, datatypes_dir):
"""Returns a list of all classes that are contained in datatypes_dir that are subclasses of class_spec.SemanticClass.
:return: a list of (str_name, class)
"""
base_dir = dirname(dirname(__file__))
sys.path.append(base_dir)
root_modul_name = datatypes_dir.replace('/','.')
files = [ file.replace('.py','') for file in listdir(datatypes_dir) if file.endswith('.py') and not file.startswith('test_') and not file.startswith('_')]
all_modules = []
for name in files:
all_modules.append(importlib.import_module('{}.{}'.format(root_modul_name, name)))
all_classes = []
for modul in all_modules:
all_classes += inspect.getmembers(modul, inspect.isclass)
all_classes = sorted(set(all_classes), key=lambda current_class: current_class[0])
semantic_classes = [ cls for name, cls in all_classes if issubclass(cls, SemanticClass)\
and not issubclass(cls, UnSemanticClass)\
and not (cls == SemanticClass)]
return semantic_classes
def _get_builtin_cls_keys(self, property_dict):
"""Returns a list of keys for classes that are builtin.
"""
builtin_cls_keys = []
for key in property_dict.keys():
property_cls = property_dict.get(key).get('class')\
if type(property_dict.get(key)) is dict\
else property_dict.get(key)[0]
if type(property_cls) != dict\
and property_cls.__module__ == 'builtins':
builtin_cls_keys.append(key)
return builtin_cls_keys
def _get_semantic_dictionary_keys_super_first(self, property_dict):
"""Sorts the keys of the property part of a semantic dictionary
and returns the keys for super classes before keys of subclasses.
:return: a sorted list of keys.
"""
builtin_cls_keys = self._get_builtin_cls_keys(property_dict)
complex_cls_keys = []
for key in [ key for key in property_dict.keys()\
if key not in builtin_cls_keys ]:
current_cls = property_dict.get(key).get('class')
key_inserted = False
for index, cls_key in enumerate(complex_cls_keys):
potential_sub_cls = property_dict.get(cls_key).get('class')
if issubclass(potential_sub_cls, current_cls):
complex_cls_keys.insert(index, key)
key_inserted = True
break
if not key_inserted:
complex_cls_keys.append(key)
return builtin_cls_keys + complex_cls_keys
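The ordering guarantee is easiest to see with dummy classes (a sketch: builtin-typed keys come first, then superclass-typed keys before subclass-typed ones):

class A: pass
class B(A): pass

property_dict = {
    'b_key': {'class': B},   # subclass-typed key, listed first on purpose
    'a_key': {'class': A},
    'n_key': {'class': int}, # builtin -> sorted to the front
}
c = Py2TTLOntologyConverter()
print(c._get_semantic_dictionary_keys_super_first(property_dict))
# -> ['n_key', 'a_key', 'b_key']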
def usage():
"""prints information on how to use the script
"""
print(main.__doc__)
def main(argv):
"""This program can be used to convert py classes that are subclasses of class_spec.SemanticClass to owl:Class
and its properties to owl:ObjectProperty.
py2ttl/py2ttl_ontology.py [OPTIONS ]
[optional] directory containing datatypes that are subclasses of class_spec.SemanticClass.
Overwrites DATATYPES_DIR in py2ttl/config.py.
OPTIONS:
-h|--help: show help
-s|--source=source_ontology_file source ontology ttl file, option overwrites PROJECT_ONTOLOGY_FILE in py2ttl/config.py
-t|--target=target_ontology_file target ontology ttl file, default: 'PROJECT_PREFIX-ontology_autogenerated.ttl'
:return: exit code (int)
"""
check_config_files_exist()
datatypes_dir = get_datatypes_dir()
source_ontology_file = PROJECT_ONTOLOGY_FILE
target_ontology_file = ''
try:
opts, args = getopt.getopt(argv, "hs:t:", ["help","source=", "target="])
except getopt.GetoptError:
usage()
return 2
for opt, arg in opts:
if opt in ('-h', '--help'):
usage()
return 0
elif opt in ('-t', '--target'):
target_ontology_file = arg
elif opt in ('-s', '--source'):
source_ontology_file = arg
converter = Py2TTLOntologyConverter(project_ontology_file=source_ontology_file)
if len(args) > 0:
datatypes_dir = args[0]
if target_ontology_file == '':
target_ontology_file = '.{0}{1}-ontology_autogenerated.ttl'.format(sep, converter.project_name)
return converter.create_ontology(datatypes_dir, target_ontology_file)
if __name__ == "__main__":
sys.exit(main(sys.argv[1:]))