From d8b52bdac98e2d228e970f77473cf17c1b8ceaa5 Mon Sep 17 00:00:00 2001
From: Sebastian <sebastian.spaar@ariadne.ai>
Date: Mon, 15 Apr 2019 17:42:20 +0200
Subject: [PATCH] Initial code

---
 LICENSE                   |  20 +
 README.rst                |  76 ++++
 setup.py                  |  16 +
 treeconvert/__init__.py   |   0
 treeconvert/__main__.py   |  73 ++++
 treeconvert/conversion.py | 109 +++++
 treeconvert/declxml.py    | 870 ++++++++++++++++++++++++++++++++++++++
 treeconvert/nml.py        | 128 ++++++
 treeconvert/swc.py        |  98 +++++
 9 files changed, 1390 insertions(+)
 create mode 100644 LICENSE
 create mode 100644 README.rst
 create mode 100644 setup.py
 create mode 100644 treeconvert/__init__.py
 create mode 100644 treeconvert/__main__.py
 create mode 100644 treeconvert/conversion.py
 create mode 100644 treeconvert/declxml.py
 create mode 100644 treeconvert/nml.py
 create mode 100644 treeconvert/swc.py

diff --git a/LICENSE b/LICENSE
new file mode 100644
index 0000000..b608b85
--- /dev/null
+++ b/LICENSE
@@ -0,0 +1,20 @@
+Copyright (C) 2019 ariadne-service gmbh
+
+This software is provided 'as-is', without any express or implied
+warranty.  In no event will the authors be held liable for any damages
+arising from the use of this software.
+
+Permission is granted to anyone to use this software for any purpose,
+including commercial applications, and to alter it and redistribute it
+freely, subject to the following restrictions:
+
+1. The origin of this software must not be misrepresented; you must not
+   claim that you wrote the original software. If you use this software
+   in a product, an acknowledgment in the product documentation would be
+   appreciated but is not required.
+2. Altered source versions must be plainly marked as such, and must not be
+   misrepresented as being the original software.
+3. This notice may not be removed or altered from any source distribution.
+
+ariadne-service gmbh ariadne.ai
+Sebastian Spaar sebastian.spaar@ariadne.ai
diff --git a/README.rst b/README.rst
new file mode 100644
index 0000000..5d313d8
--- /dev/null
+++ b/README.rst
@@ -0,0 +1,76 @@
+===========
+treeconvert
+===========
+
+``treeconvert`` converts NML files [1]_ to SWC [2]_. This allows you to view
+skeletal reconstructions created in (Py)KNOSSOS in viewers for SWC files.
+
+The current version (0.9) is currently a little bit restricted:
+
+- Conversion is only possible from (Py)KNOSSOS NML to SWC, not back.
+- SWC’s *structure identifier* is ``UNDEFINED`` for all edges.
+
+If the NML file consists of multiple trees, a separate SWC file will get
+created for each one.
+
+.. [1] For more information about NML files, visit https://github.com/scalableminds/nml-spec.
+.. [2] http://www.neuronland.org/NLMorphologyConverter/MorphologyFormats/SWC/Spec.html
+
+
+Installation
+============
+
+``treeconvert`` only has a single dependency: ``declxml``. For convenience,
+``declxml`` is included directly inside ``treeconvert``'s source tree.
+
+The ``setup.py`` installs a ``treeconvert`` binary that you can use from your
+``PATH``.
+
+Alternatively, go to `Releases <https://github.com/ariadne-service/treeconvert/releases>`_
+to download a self-contained zip file.
+
+To execute the ``.pyz`` file, execute it with python: ``python3 treeconvert.pyz -h``.
+
+
+Requirements
+============
+
+Minimum Python version is 3.7.
+
+
+Usage
+=====
+
+::
+
+	$ python3 cmutil.pyz -h
+	usage: treeconvert.pyz [-h] --from {NML,PYKNOSSOS_NML} --to {SWC} [--force]
+	                       input_file
+
+	Convert annotation files between various formats.
+
+	positional arguments:
+	  input_file            Input file. Output file will be created automatically
+	                        with extension `.[--to]'.
+
+	optional arguments:
+	  -h, --help            show this help message and exit
+	  --from {NML,PYKNOSSOS_NML}
+	                        input format
+	  --to {SWC}            output format
+	  --force               overwrite existing output files.
+
+	If the output format is SWC, and if there are multiple trees in the input
+	file, treeconvert will create a file for each tree, and append the filename
+	with its index.
+
+There a subtle differences between NML files created from KNOSSOS and those
+created from PyKNOSSOS. Because of this, the input format must either be
+``nml`` or ``pyknossos_nml``.
+
+
+License
+=======
+
+Other than ``declxml`` (released under MIT License), all of ``treeconvert``’s
+files are released under the zlib license (c.f. ``LICENSE``).
diff --git a/setup.py b/setup.py
new file mode 100644
index 0000000..fd51e6a
--- /dev/null
+++ b/setup.py
@@ -0,0 +1,16 @@
+from setuptools import setup
+
+setup(name='treeconvert',
+      version='0.9',
+      description='Convert NML files to SWC files',
+      url='https://github.com/ariadne-service/treeconvert',
+      author='ariadne-service gmbh',
+      author_email='contact@ariadne.ai',
+      license='zlib',
+      packages=['treeconvert'],
+      entry_points={
+          'console_scripts': [
+              'treeconvert = treeconvert.__main__'
+          ]
+      },
+      install_requires=['declxml'])
diff --git a/treeconvert/__init__.py b/treeconvert/__init__.py
new file mode 100644
index 0000000..e69de29
diff --git a/treeconvert/__main__.py b/treeconvert/__main__.py
new file mode 100644
index 0000000..5055d78
--- /dev/null
+++ b/treeconvert/__main__.py
@@ -0,0 +1,73 @@
+# This file is part of treeconvert.
+#
+# Copyright (C) 2019 ariadne-service gmbh
+#
+# This software is provided 'as-is', without any express or implied
+# warranty.  In no event will the authors be held liable for any damages
+# arising from the use of this software.
+#
+# Permission is granted to anyone to use this software for any purpose,
+# including commercial applications, and to alter it and redistribute it
+# freely, subject to the following restrictions:
+#
+# 1. The origin of this software must not be misrepresented; you must not
+#    claim that you wrote the original software. If you use this software
+#    in a product, an acknowledgment in the product documentation would be
+#    appreciated but is not required.
+# 2. Altered source versions must be plainly marked as such, and must not be
+#    misrepresented as being the original software.
+# 3. This notice may not be removed or altered from any source distribution.
+#
+# ariadne-service gmbh ariadne.ai
+# Sebastian Spaar sebastian.spaar@ariadne.ai
+
+from argparse import ArgumentParser
+from pathlib import Path
+from os.path import isfile
+from sys import exit, stderr
+
+from treeconvert.conversion import FileFormats, nml_to_swc, nml_to_dict
+
+parser = ArgumentParser(
+    description='Convert annotation files between various formats.',
+    epilog='If the output format is SWC, and if there are multiple trees in '
+           'the input file, treeconvert will create a file for each tree, '
+           'and append the filename with its index.'
+)
+parser.add_argument('--from', type=FileFormats.argparse, dest='from_format',
+                    help='input format', required=True,
+                    choices=(FileFormats.NML, FileFormats.PYKNOSSOS_NML))
+parser.add_argument('--to', type=FileFormats.argparse, dest='to_format',
+                    help='output format', required=True,
+                    choices=(FileFormats.SWC,))
+parser.add_argument('--force', action='store_true',
+                    help='overwrite existing output files.')
+parser.add_argument('input_file', type=str,
+                    help='Input file. Output file will be created '
+                         'automatically with extension `.[--to]\'.')
+
+args = parser.parse_args()
+
+input_file = Path(args.input_file)
+with input_file.open() as f:
+    content = f.read()
+
+nml = nml_to_dict(content, args.from_format == FileFormats.PYKNOSSOS_NML)
+
+for i, thing in enumerate(nml['things']):
+    swc = nml_to_swc(nml['things'][i])
+
+    if len(nml['things']) == 1:
+        output_file = f'{input_file.stem}.swc'
+    else:
+        # Append index to filename
+        output_file = f'{input_file.stem}.swc.{i + 1}'
+
+    if args.force is False and isfile(output_file):
+        print(f'There is already a file called {output_file}! '
+              f'Use `--force\' to overwrite it.', file=stderr)
+        exit(-1)
+
+    with open(output_file, 'w') as f:
+        f.write(str(swc))
+        f.write('\n')  # so that file ends with empty line
diff --git a/treeconvert/conversion.py b/treeconvert/conversion.py
new file mode 100644
index 0000000..4aeaadb
--- /dev/null
+++ b/treeconvert/conversion.py
@@ -0,0 +1,109 @@
+# This file is part of treeconvert.
+#
+# Copyright (C) 2019 ariadne-service gmbh
+#
+# This software is provided 'as-is', without any express or implied
+# warranty.  In no event will the authors be held liable for any damages
+# arising from the use of this software.
+#
+# Permission is granted to anyone to use this software for any purpose,
+# including commercial applications, and to alter it and redistribute it
+# freely, subject to the following restrictions:
+#
+# 1. The origin of this software must not be misrepresented; you must not
+#    claim that you wrote the original software. If you use this software
+#    in a product, an acknowledgment in the product documentation would be
+#    appreciated but is not required.
+# 2. Altered source versions must be plainly marked as such, and must not be
+#    misrepresented as being the original software.
+# 3. This notice may not be removed or altered from any source distribution.
+#
+# ariadne-service gmbh ariadne.ai
+# Sebastian Spaar sebastian.spaar@ariadne.ai
+
+import sys
+from collections import defaultdict, deque
+from enum import Enum
+from itertools import groupby, chain
+from operator import itemgetter
+
+import declxml
+
+from treeconvert.nml import things_processor, pyknossos_things_processor
+from treeconvert.swc import SwcData, Edge
+
+
+class FileFormats(Enum):
+    NML = 'nml'
+    PYKNOSSOS_NML = 'pyknossos_nml'
+    SWC = 'swc'
+
+    def __str__(self):
+        return self.name
+
+    def __repr__(self):
+        return str(self)
+
+    @staticmethod
+    def argparse(s):
+        try:
+            return FileFormats[s.upper()]
+        except KeyError:
+            return s
+
+
+class ParseError(Exception):
+    """Raised when NML XML could not be parsed correctly."""
+
+
+def nml_to_dict(xml_str: str, is_pyknossos=False) -> dict:
+    """Converts NML into a Python dict."""
+    try:
+        _ = declxml.parse_from_string(
+            things_processor if not is_pyknossos else pyknossos_things_processor,
+            xml_str
+        )
+        return _
+    except declxml.XmlError as error:
+        print(error, file=sys.stderr)
+        raise ParseError(str(error))
+
+
+def nml_to_swc(nml: dict) -> SwcData:
+    nodes = {node['id']: node for node in nml['nodes']}
+    targets = defaultdict(list, {
+        target: [edge['source'] for edge in list(edges)]
+        for target, edges in groupby(
+            sorted(nml['edges'], key=itemgetter('target')),
+            itemgetter('target')
+        )})
+    sources = defaultdict(list, {
+        source: [edge['target'] for edge in list(edges)]
+        for source, edges in groupby(
+            sorted(nml['edges'], key=itemgetter('source')),
+            itemgetter('source')
+        )})
+    neighbors = {node: set(sources[node] + targets[node]) for node in chain(nodes)}
+
+    try:
+        first_node = set(nodes.keys() - targets.keys()).pop()
+    except KeyError:
+        # No root node found, so take random node from nml['nodes'].
+        first_node = set(nodes).pop()
+
+    swc = SwcData()
+    swc.append(Edge.from_nml_entry(nodes[first_node], -1))
+
+    next_nodes = deque([first_node])
+    visited = set()
+
+    while len(next_nodes) > 0:
+        node = next_nodes.popleft()
+        visited.add(node)
+
+        for neighbor in neighbors[node]:
+            if neighbor in visited:
+                continue
+            next_nodes.append(neighbor)
+            swc.append(Edge.from_nml_entry(nodes[neighbor], node))
+    return swc
diff --git a/treeconvert/declxml.py b/treeconvert/declxml.py
new file mode 100644
index 0000000..fad6829
--- /dev/null
+++ b/treeconvert/declxml.py
@@ -0,0 +1,870 @@
+"""
+declxml is a library for declaratively processing XML documents.
+
+Processors
+---------------
+The declxml library uses processors to define the structure of XML documents. Processors can be
+divided into two categories: *primitive processors* and *aggregate processors*.
+
+Primitive Processors
+----------------------
+Primitive processors are used to parse and serialize simple, primitive values. The following module
+functions are used to construct primitive processors:
+
+.. autofunction:: declxml.boolean
+.. autofunction:: declxml.floating_point
+.. autofunction:: declxml.integer
+.. autofunction:: declxml.string
+
+Aggregate Processors
+---------------------
+Aggregate processors are composed of other processors. These processors are used for values such as
+dictionaries, arrays, and user objects.
+
+.. autofunction:: declxml.array
+.. autofunction:: declxml.dictionary
+.. autofunction:: declxml.named_tuple
+.. autofunction:: declxml.user_object
+
+Parsing
+----------
+.. autofunction:: declxml.parse_from_file
+.. autofunction:: declxml.parse_from_string
+
+Serialization
+---------------
+.. autofunction:: declxml.serialize_to_file
+.. autofunction:: declxml.serialize_to_string
+
+Exceptions
+------------
+.. autoexception:: declxml.XmlError
+.. autoexception:: declxml.InvalidPrimitiveValue
+.. autoexception:: declxml.InvalidRootProcessor
+.. autoexception:: declxml.MissingValue
+"""
+from collections import namedtuple
+import warnings
+import xml.dom.minidom as minidom
+import xml.etree.ElementTree as ET
+
+
+class XmlError(Exception):
+    """Base error class representing errors processing XML data"""
+
+
+class InvalidPrimitiveValue(XmlError):
+    """Represents errors due to invalid primitive values"""
+
+
+class InvalidRootProcessor(XmlError):
+    """Represents errors due to invalid root processors"""
+
+
+class MissingValue(XmlError):
+    """Represents errors due to missing required values"""
+
+
+def parse_from_file(root_processor, xml_file_path):
+    """
+    Parses the XML file using the processor starting from the root of the document.
+
+    :param root_processor: Root processor of the XML document.
+    :param xml_file_path: Path to XML file to parse.
+
+    :return: Parsed value.
+    """
+    with open(xml_file_path, 'rb') as xml_file:
+        xml_string = xml_file.read()
+
+    parsed_value = parse_from_string(root_processor, xml_string)
+
+    return parsed_value
+
+
+def parse_from_string(root_processor, xml_string):
+    """
+    Parses the XML string using the processor starting from the root of the document.
+
+    :param xml_string: XML string to parse.
+
+    See also :func:`declxml.parse_from_file`
+    """
+    if not _is_valid_root_processor(root_processor):
+        raise InvalidRootProcessor('Invalid root processor')
+
+    root = ET.fromstring(xml_string)
+    _xml_namespace_strip(root)
+
+    state = _ProcessorState()
+    return root_processor.parse_at_root(root, state)
+
+
+def serialize_to_file(root_processor, value, xml_file_path, indent=None):
+    """
+    Serializes the value to an XML file using the root processor.
+
+    :param root_processor: Root processor of the XML document.
+    :param value: Value to serialize.
+    :param xml_file_path: Path to the XML file to which the serialized value will be written.
+    :param indent: If specified, then the XML will be formatted with the specified indentation.
+    """
+    serialized_value = serialize_to_string(root_processor, value, indent)
+
+    with open(xml_file_path, 'wb') as xml_file:
+        xml_file.write(serialized_value)
+
+
+def serialize_to_string(root_processor, value, indent=None):
+    """
+    Serializes the value to an XML string using the root processor.
+
+    :return: The serialized XML string.
+
+    See also :func:`declxml.serialize_to_file`
+    """
+    if not _is_valid_root_processor(root_processor):
+        raise InvalidRootProcessor('Invalid root processor')
+
+    state = _ProcessorState()
+    state.push_location(root_processor.element_path)
+
+    root = root_processor.serialize(value, state)
+
+    state.pop_location()
+
+    serialized_value = ET.tostring(root)
+
+    # Since element tree does not support pretty printing XML, we use minidom to do the pretty
+    # printing
+    if indent:
+        serialized_value = minidom.parseString(serialized_value).toprettyxml(indent=indent)
+
+    return serialized_value
+
+
+def array(item_processor, alias=None, nested=None, omit_empty=False):
+    """
+    Creates an array processor that can be used to parse and serialize array
+    data.
+
+    XML arrays may be nested within an array element, or they may be embedded
+    within their parent. A nested array would look like:
+
+    .. sourcecode:: xml
+
+        <root-element>
+            <some-element>ABC</some-element>
+            <nested-array>
+                <array-item>0</array-item>
+                <array-item>1</array-item>
+            </nested-array>
+        </root-element>
+
+    The corresponding embedded array would look like:
+
+    .. sourcecode:: xml
+
+        <root-element>
+            <some-element>ABC</some-element>
+            <array-item>0</array-item>
+            <array-item>1</array-item>
+        </root-element>
+
+
+    An array is considered required when its item processor is configured as being
+    required.
+
+    :param item_processor: A declxml processor object for the items of the array.
+    :param alias: If specified, the name given to the array when read from XML.
+        If not specified, then the name of the item processor is used instead.
+    :param nested: If the array is a nested array, then this should be the name of
+        the element under which all array items are located. If not specified, then
+        the array is treated as an embedded array. Can also be specified using supported
+        XPath syntax.
+    :param omit_empty: If True, then nested arrays will be omitted when serializing if
+        they are empty. Only valid when nested is specified. Note that an empty array
+        may only be omitted if it is not itself contained within an array. That is,
+        for an array of arrays, any empty arrays in the outer array will always be
+        serialized to prevent information about the original array from being lost
+        when serializing.
+
+    :return: A declxml processor object.
+    """
+    return _Array(item_processor, alias, nested, omit_empty)
+
+
+def boolean(element_name, attribute=None, required=True, alias=None, default=False, omit_empty=False):
+    """
+    Creates a processor for boolean values.
+
+    :param element_name: Name of the XML element containing the value. Can also be specified
+        using supported XPath syntax.
+    :param attribute: If specified, then the value is searched for under the
+        attribute within the element specified by element_name. If not specified,
+        then the value is searched for as the contents of the element specified by
+        element_name.
+    :param required: Indicates whether the value is required when parsing and serializing.
+    :param alias: If specified, then this is used as the name of the value when read from
+        XML. If not specified, then the element_name is used as the name of the value.
+    :param default: Default value to use if the element is not present. This option is only
+        valid if required is specified as False.
+    :param omit_empty: If True, then Falsey values will be omitted when serializing to XML. Note
+        that Falsey values are never omitted when they are elements of an array. Falsey values can
+        be omitted only when they are standalone elements.
+
+    :return: A declxml processor object.
+    """
+    return _PrimitiveValue(element_name, _parse_boolean, attribute, required, alias, default, omit_empty)
+
+
+def dictionary(element_name, children, required=True, alias=None):
+    """
+    Creates a processor for dictionary values.
+
+    :param element_name: Name of the XML element containing the dictionary value. Can also be
+        specified using supported XPath syntax.
+    :param children: List of declxml processor objects for processing the children
+        contained within the dictionary.
+    :param required: Indicates whether the value is required when parsing and serializing.
+    :param alias: If specified, then this is used as the name of the value when read from
+        XML. If not specified, then the element_name is used as the name of the value.
+
+    :return: A declxml processor object.
+    """
+    return _Dictionary(element_name, children, required, alias)
+
+
+def floating_point(element_name, attribute=None, required=True, alias=None, default=0.0, omit_empty=False):
+    """
+    Creates a processor for floating point values.
+
+    See also :func:`declxml.boolean`
+    """
+    value_parser = _number_parser(float)
+    return _PrimitiveValue(element_name, value_parser, attribute, required, alias, default, omit_empty)
+
+
+def integer(element_name, attribute=None, required=True, alias=None, default=0, omit_empty=False):
+    """
+    Creates a processor for integer values.
+
+    See also :func:`declxml.boolean`
+    """
+    value_parser = _number_parser(int)
+    return _PrimitiveValue(element_name, value_parser, attribute, required, alias, default, omit_empty)
+
+
+def named_tuple(element_name, tuple_type, child_processors, required=True, alias=None):
+    """
+    Creates a processor for namedtuple values.
+
+    :param tuple_type: The namedtuple type.
+
+    See also :func:`declxml.dictionary`
+    """
+    converter = _named_tuple_converter(tuple_type)
+    return _Aggregate(element_name, converter, child_processors, required, alias)
+
+
+def string(element_name, attribute=None, required=True, alias=None, default='', omit_empty=False, strip_whitespace=True):
+    """
+    Creates a processor for string values.
+
+    :param strip_whitespace: Indicates whether leading and trailing whitespace should be stripped
+        from parsed string values.
+
+    See also :func:`declxml.boolean`
+    """
+    value_parser = _string_parser(strip_whitespace)
+    return _PrimitiveValue(element_name, value_parser, attribute, required, alias, default, omit_empty)
+
+
+def user_object(element_name, cls, child_processors, required=True, alias=None):
+    """
+    Creates a processor for user objects.
+
+    :param cls: Class object with a no-argument constructor or other callable no-argument object.
+
+    See also :func:`declxml.dictionary`
+    """
+    converter = _user_object_converter(cls)
+    return _Aggregate(element_name, converter, child_processors, required, alias)
+
+
+# Defines pair of functions to convert between aggregates and dictionaries
+_AggregateConverter = namedtuple('_AggregateConverter', ['from_dict', 'to_dict'])
+
+
+class _Aggregate(object):
+    """An XML processor for processing aggregates"""
+
+    def __init__(self, element_path, converter, child_processors, required=True, alias=None):
+        self.element_path = element_path
+        self._converter = converter
+        self.required = required
+        self._dictionary = _Dictionary(element_path, child_processors, required, alias)
+        if alias:
+            self.alias = alias
+        else:
+            self.alias = element_path
+
+    def parse_at_element(self, element, state):
+        """Parses the provided element as an aggregate"""
+        parsed_dict = self._dictionary.parse_at_element(element, state)
+        return self._converter.from_dict(parsed_dict)
+
+    def parse_at_root(self, root, state):
+        """Parses the root XML element as an aggregate"""
+        parsed_dict = self._dictionary.parse_at_root(root, state)
+        return self._converter.from_dict(parsed_dict)
+
+    def parse_from_parent(self, parent, state):
+        """Parses the aggregate from the provided parent XML element"""
+        parsed_dict = self._dictionary.parse_from_parent(parent, state)
+        return self._converter.from_dict(parsed_dict)
+
+    def serialize(self, value, state):
+        """Serializes the value to a new element and returns the element."""
+        dict_value = self._converter.to_dict(value)
+        return self._dictionary.serialize(dict_value, state)
+
+    def serialize_on_parent(self, parent, value, state):
+        """Serializes the value and adds it to the parent"""
+        dict_value = self._converter.to_dict(value)
+        self._dictionary.serialize_on_parent(parent, dict_value, state)
+
+
+class _Array(object):
+    """An XML processor for Array values"""
+
+    def __init__(self, item_processor, alias=None, nested=None, omit_empty=False):
+        self._item_processor = item_processor
+        self._nested = nested
+        self.required = item_processor.required
+
+        if alias:
+            self.alias = alias
+        elif nested:
+            self.alias = nested
+        else:
+            self.alias = item_processor.alias
+
+        if self._nested:
+            self.element_path = self._nested
+        else:
+            self.element_path = '.'  # Array is embedded directly on parent
+
+        self._item_path = self.element_path + '/' + self._item_processor.element_path
+
+        if not nested or self.required:
+            self.omit_empty = False
+            if omit_empty:
+                warnings.warn('omit_empty ignored for non-nested and/or required arrays')
+        else:
+            self.omit_empty = omit_empty
+
+    def parse_at_element(self, element, state):
+        """Parses the provided element as an array"""
+        item_iter = element.findall(self._item_processor.element_path)
+        return self._parse(item_iter, state)
+
+    def parse_at_root(self, root, state):
+        """Parses the root XML element as an array"""
+        if not self._nested:
+            raise InvalidRootProcessor('Non-nested array "{}" cannot be root element'.format(
+                self.alias))
+
+        parsed_array = []
+
+        array_element = _element_find_from_root(root, self._nested)
+        if array_element is not None:
+            state.push_location(self._nested)
+            parsed_array = self.parse_at_element(array_element, state)
+            state.pop_location()
+        elif self.required:
+            raise MissingValue('Missing required array at root: "{}"'.format(self._nested))
+
+        return parsed_array
+
+    def parse_from_parent(self, parent, state):
+        """Parses the array data from the provided parent XML element"""
+        item_iter = parent.findall(self._item_path)
+        return self._parse(item_iter, state)
+
+    def serialize(self, value, state):
+        """
+        Serializes the value into a new Element object and returns it.
+        """
+        if self._nested is None:
+            state.raise_error(InvalidRootProcessor,
+                              'Cannot directly serialize a non-nested array "{}"'
+                              .format(self.alias))
+
+        if not value and self.required:
+            state.raise_error(MissingValue, 'Missing required array: "{}"'.format(
+                self.alias))
+
+        start_element, end_element = _element_path_create_new(self._nested)
+        self._serialize(end_element, value, state)
+
+        return start_element
+
+    def serialize_on_parent(self, parent, value, state):
+        """Serializes value and appends it to the parent element"""
+        if not value and self.required:
+            state.raise_error(MissingValue, 'Missing required array: "{}"'.format(
+                self.alias))
+
+        if not value and self.omit_empty:
+            return  # Do nothing
+
+        if self._nested is not None:
+            array_parent = _element_get_or_add_from_parent(parent, self._nested)
+        else:
+            # Embedded array has all items serialized directly on the parent.
+            array_parent = parent
+
+        self._serialize(array_parent, value, state)
+
+    def _parse(self, item_iter, state):
+        """
+        Parses the array data by using the provided iterator of XML elements to iterate over
+        the item elements.
+        """
+        parsed_array = []
+
+        for i, item in enumerate(item_iter):
+            state.push_location(self._item_processor.element_path, i)
+            parsed_array.append(self._item_processor.parse_at_element(item, state))
+            state.pop_location()
+
+        if not parsed_array and self.required:
+            state.raise_error(MissingValue, 'Missing required array "{}"'.format(self.alias))
+
+        return parsed_array
+
+    def _serialize(self, array_parent, value, state):
+        """Serializes the array value adding it to the array parent element"""
+        if not value:
+            # Nothing to do. Avoid attempting to iterate over a possibly
+            # None value.
+            return
+
+        for i, item_value in enumerate(value):
+            state.push_location(self._item_processor.element_path, i)
+            item_element = self._item_processor.serialize(item_value, state)
+            array_parent.append(item_element)
+            state.pop_location()
+
+
+class _Dictionary(object):
+    """An XML processor for dictionary values"""
+
+    def __init__(self, element_path, child_processors, required=True, alias=None):
+        self.element_path = element_path
+        self._child_processors = child_processors
+        self.required = required
+        if alias:
+            self.alias = alias
+        else:
+            self.alias = element_path
+
+    def parse_at_element(self, element, state):
+        """Parses the provided element as a dictionary"""
+        parsed_dict = {}
+
+        if element is not None:
+            for child in self._child_processors:
+                state.push_location(child.element_path)
+                parsed_dict[child.alias] = child.parse_from_parent(element, state)
+                state.pop_location()
+        elif self.required:
+            state.raise_error(MissingValue, 'Missing required aggregate "{}"'.format(self.element_path))
+
+        return parsed_dict
+
+    def parse_at_root(self, root, state):
+        """Parses the root XML element as a dictionary"""
+        parsed_dict = {}
+
+        dict_element = _element_find_from_root(root, self.element_path)
+        if dict_element is not None:
+            state.push_location(self.element_path)
+            parsed_dict = self.parse_at_element(dict_element, state)
+            state.pop_location()
+        elif self.required:
+            raise MissingValue('Missing required root aggregate "{}"'.format(self.element_path))
+
+        return parsed_dict
+
+    def parse_from_parent(self, parent, state):
+        """Parses the dictionary data from the provided parent XML element"""
+        element = parent.find(self.element_path)
+        return self.parse_at_element(element, state)
+
+    def serialize(self, value, state):
+        """
+        Serializes the value to a new element and returns the element.
+        """
+        if not value and self.required:
+            state.raise_error(MissingValue, 'Missing required aggregate "{}"'.format(self.element_path))
+
+        start_element, end_element = _element_path_create_new(self.element_path)
+        self._serialize(end_element, value, state)
+        return start_element
+
+    def serialize_on_parent(self, parent, value, state):
+        """Serializes the value and adds it to the parent"""
+        if not value and self.required:
+            state.raise_error(MissingValue, 'Missing required aggregate "{}"'.format(
+                self.element_path))
+
+        if not value:
+            return  # Do Nothing
+
+        element = _element_get_or_add_from_parent(parent, self.element_path)
+        self._serialize(element, value, state)
+
+    def _serialize(self, element, value, state):
+        """Serializes the dictionary appending all serialized children to the element"""
+        for child in self._child_processors:
+            state.push_location(child.element_path)
+            child_value = value.get(child.alias)
+            child.serialize_on_parent(element, child_value, state)
+            state.pop_location()
+
+
+class _PrimitiveValue(object):
+    """An XML processor for processing primitive values"""
+
+    def __init__(self, element_path, parser_func, attribute=None, required=True, alias=None, default=None, omit_empty=False):
+        """
+        :param element_path: Path to XML element containing the value.
+        :param parser_func: Function to parse the raw XML value. Should take a string and return
+            the value parsed from the raw string.
+        :param required: Indicates whether the value is required.
+        :param alias: Alternative name to give to the value. If not specified, element_path is used.
+        :param default: Default value. Only valid if required is False.
+        :param omit_empty: Omit the value when serializing if it is a falsey value. Only valid if required is
+            False.
+        """
+        self.element_path = element_path
+        self._parser_func = parser_func
+        self._attribute = attribute
+        self.required = required
+        self._default = default
+
+        if alias:
+            self.alias = alias
+        elif attribute:
+            self.alias = attribute
+        else:
+            self.alias = element_path
+
+        # If a value is required, then it will never be omitted when serialized. This
+        # is to ensure that data that is serialized by a processor can also be parsed
+        # by a processor. Omitting required values would lead to an error when attempting
+        # to parse the XML data. For primitives, a value must be None to be considered
+        # missing, but is considered empty if it is falsey.
+        if required:
+            self.omit_empty = False
+            if omit_empty:
+                warnings.warn('omit_empty ignored on primitive values when required is specified')
+        else:
+            self.omit_empty = omit_empty
+
+
+    def parse_at_element(self, element, state):
+        """Parses the primitive value at the given XML element"""
+        parsed_value = self._default
+
+        if element is not None:
+            if self._attribute:
+                parsed_value = self._parse_attribute(element, state)
+            else:
+                parsed_value = self._parser_func(element.text, state)
+        elif self.required:
+            state.raise_error(MissingValue, 'Missing required element "{}"'.format(self.element_path))
+
+        return parsed_value
+
+    def parse_from_parent(self, parent, state):
+        """Parses the primitive value under the provided parent XML element"""
+        element = parent.find(self.element_path)
+        return self.parse_at_element(element, state)
+
+    def serialize(self, value, _state):
+        """
+        Serializes the value into a new element object and returns the element. If the omit_empty
+        option was specified and the value is falsey, then this will return None.
+        """
+        # For primitive values, this is only called when the value is part of an array,
+        # in which case we do not need to check for missing or omitted values.
+        start_element, end_element = _element_path_create_new(self.element_path)
+        self._serialize(end_element, value)
+        return start_element
+
+    def serialize_on_parent(self, parent, value, state):
+        """Serializes the value adding it to the parent element"""
+        # Note that falsey values are not treated as missing, but they may be omitted.
+        if value is None and self.required:
+            state.raise_error(MissingValue, self._missing_value_message(parent))
+
+        if not value and self.omit_empty:
+            return  # Do Nothing
+
+        element = _element_get_or_add_from_parent(parent, self.element_path)
+        self._serialize(element, value)
+
+    def _missing_value_message(self, parent):
+        """Returns the message to use to report that value needed for serialization is missing"""
+        if self._attribute is None:
+            message = 'Missing required value for element "{}"'.format(self.element_path)
+        else:
+            if self.element_path == '.':
+                parent_name = parent.tag
+            else:
+                parent_name = self.element_path
+
+            message = 'Missing required value for attribute "{}" on element "{}"'.format(
+                self._attribute, parent_name)
+
+        return message
+
+    def _parse_attribute(self, element, state):
+        """Parses the primitive value within the XML element's attribute"""
+        parsed_value = self._default
+        attribute_value = element.get(self._attribute, None)
+        if attribute_value:
+            parsed_value = self._parser_func(attribute_value, state)
+        elif self.required:
+            state.raise_error(MissingValue, 'Missing required attribute "{}" on element "{}"'.format(
+                self._attribute, element.tag))
+
+        return parsed_value
+
+    def _serialize(self, element, value):
+        """Serializes the value to the element"""
+        # A value is only considered missing, and hence eligible to be replaced by its
+        # default only if it is None. Falsey values are not considered missing and are
+        # not replaced by the default.
+        if value is None:
+            if self._default is None:
+                serialized_value = ''
+            else:
+                serialized_value = str(self._default)
+        else:
+            serialized_value = str(value)
+
+        if self._attribute:
+            element.set(self._attribute, serialized_value)
+        else:
+            element.text = serialized_value
+
+
+class _ProcessorState(object):
+    """Keeps track of the state of the processor in order to provide useful error messages"""
+
+    _Location = namedtuple('_ProcessorLocation', [
+        'element',
+        'array_index',
+    ])
+
+    def __init__(self):
+        self._locations = []
+
+    def pop_location(self):
+        """Pops the most recently pushed location from the state's stack of locations"""
+        return self._locations.pop()
+
+    def push_location(self, element_path, array_index=None):
+        """Pushes an item onto the state's stack of locations"""
+        location = _ProcessorState._Location(element=element_path, array_index=array_index)
+        self._locations.append(location)
+
+    def raise_error(self, exception_type, message):
+        """Raises the given exception type and includes the current state information with the error message"""
+        error_message = '{} at {}'.format(message, self.__repr__())
+        raise exception_type(error_message)
+
+    def __repr__(self):
+        # Exclude the any locations specified with a dot which just means the "current location" from
+        # the path string.
+        location_strings = (_ProcessorState._location_to_string(location) for location in self._locations if
+                            location.element != '.')
+        return '/'.join(location_strings)
+
+    @staticmethod
+    def _location_to_string(location):
+        if location.array_index is not None:
+            location_str = '{}[{}]'.format(location.element, location.array_index)
+        else:
+            location_str = location.element
+
+        return location_str
+
+
+def _element_append_path(start_element, element_names):
+    """
+    Appends the list of element names as a path to the provided start element. Returns the final
+    element along the path.
+    """
+    end_element = start_element
+    for element_name in element_names:
+        new_element = ET.Element(element_name)
+        end_element.append(new_element)
+        end_element = new_element
+
+    return end_element
+
+
+def _element_find_from_root(root, element_path):
+    """
+    Finds the element specified by the given path starting from the root element of the
+    document. The first component of the element path is expected to be the name of the
+    root element. Returns None if the element is not found.
+    """
+    element = None
+
+    element_names = element_path.split('/')
+    if element_names[0] == root.tag:
+        if len(element_names) > 1:
+            element = root.find('/'.join(element_names[1:]))
+        else:
+            element = root
+
+    return element
+
+
+def _element_get_or_add_from_parent(parent, element_path):
+    """
+    Ensures all elements specified in the given path relative to the provided parent element exist,
+    creating new elements along the path only when needed. Returns the final element specified by
+    the path.
+    """
+    element_names = element_path.split('/')
+
+    # Starting from the parent, walk the element path until we find the first element in the path
+    # that does not exist. Create that element and all the elements following it in the path. If
+    # all elements along the path exist, then we will simply walk the full path to the final
+    # element we want to return.
+    previous_element = parent
+    for i, element_name in enumerate(element_names):
+        existing_element = previous_element.find(element_name)
+        if existing_element is None:
+            existing_element = _element_append_path(previous_element, element_names[i:])
+            break
+
+        previous_element = existing_element
+
+    return existing_element
+
+
+def _element_path_create_new(element_path):
+    """
+    Creates an entirely new element path. Returns a tuple where the first item is the first element
+    in the path, and the second item is the final element in the path.
+    """
+    element_names = element_path.split('/')
+
+    start_element = ET.Element(element_names[0])
+    end_element = _element_append_path(start_element, element_names[1:])
+
+    return (start_element, end_element)
+
+
+def _is_valid_root_processor(processor):
+    """Returns True if the given XML processor can be used as a root processor"""
+    return hasattr(processor, 'parse_at_root')
+
+
+def _named_tuple_converter(tuple_type):
+    """Returns an _AggregateConverter for named tuples of the given type"""
+    def _from_dict(dict_value):
+        return tuple_type(**dict_value)
+
+    def _to_dict(value):
+        if value:
+            return value._asdict()
+        else:
+            return {}
+
+    converter = _AggregateConverter(from_dict=_from_dict, to_dict=_to_dict)
+    return converter
+
+
+def _number_parser(str_to_number_func):
+    """Returns a function to parse numbers"""
+    def _parse_number_value(element_text, state):
+        try:
+            value = str_to_number_func(element_text)
+        except (ValueError, TypeError):
+            state.raise_error(InvalidPrimitiveValue,
+                              'Invalid numeric value "{}"'.format(element_text))
+
+        return value
+
+    return _parse_number_value
+
+
+def _parse_boolean(element_text, state):
+    """Parses the raw XML string as a boolean value"""
+    lowered_text = element_text.lower()
+    if lowered_text == 'true':
+        value = True
+    elif lowered_text == 'false':
+        value = False
+    else:
+        state.raise_error(InvalidPrimitiveValue, 'Invalid boolean value "{}"'.format(element_text))
+
+    return value
+
+
+def _string_parser(strip_whitespace):
+    """Returns a parser function for parsing string values"""
+    def _parse_string_value(element_text, _state):
+        if element_text is None:
+            value = ''
+        elif strip_whitespace:
+            value = element_text.strip()
+        else:
+            value = element_text
+
+        return value
+
+    return _parse_string_value
+
+
+def _user_object_converter(cls):
+    """Returns an _AggregateConverter for a user object of the given class"""
+    def _from_dict(dict_value):
+        object_value = cls()
+
+        for field_name, field_value in dict_value.items():
+            setattr(object_value, field_name, field_value)
+
+        return object_value
+
+    def _to_dict(value):
+        if value:
+            return value.__dict__
+        else:
+            return {}
+
+    converter = _AggregateConverter(from_dict=_from_dict, to_dict=_to_dict)
+    return converter
+
+
+def _xml_namespace_strip(root):
+    """Strips the XML namespace prefix from all element tags under the given root Element"""
+    if '}' not in root.tag:
+        return  # Nothing to do, no namespace present
+
+    for element in root.iter():
+        if '}' in element.tag:
+            element.tag = element.tag.split('}')[1]
+        else: # pragma: no cover
+            # We should never get here. If there is a namespace, then the namespace should be
+            # included in all elements.
+            pass
diff --git a/treeconvert/nml.py b/treeconvert/nml.py
new file mode 100644
index 0000000..803a66c
--- /dev/null
+++ b/treeconvert/nml.py
@@ -0,0 +1,128 @@
+# This file is part of treeconvert.
+#
+# Copyright (C) 2019 ariadne-service gmbh
+#
+# This software is provided 'as-is', without any express or implied
+# warranty.  In no event will the authors be held liable for any damages
+# arising from the use of this software.
+#
+# Permission is granted to anyone to use this software for any purpose,
+# including commercial applications, and to alter it and redistribute it
+# freely, subject to the following restrictions:
+#
+# 1. The origin of this software must not be misrepresented; you must not
+#    claim that you wrote the original software. If you use this software
+#    in a product, an acknowledgment in the product documentation would be
+#    appreciated but is not required.
+# 2. Altered source versions must be plainly marked as such, and must not be
+#    misrepresented as being the original software.
+# 3. This notice may not be removed or altered from any source distribution.
+#
+# ariadne-service gmbh ariadne.ai
+# Sebastian Spaar sebastian.spaar@ariadne.ai
+
+
+import declxml
+
+parameters = declxml.dictionary('parameters', [
+    declxml.dictionary('experiment', [
+        declxml.string('.', attribute='name')
+    ], required=False),
+    declxml.dictionary('lastsavedin', [
+        declxml.string('.', attribute='version')
+    ], required=False),
+    declxml.dictionary('createdin', [
+        declxml.string('.', attribute='version')
+    ], required=False),
+    declxml.dictionary('guiMode', [
+        declxml.string('.', attribute='mode')
+    ], required=False),
+    declxml.dictionary('dataset', [
+        declxml.string('.', attribute='path'),
+        declxml.integer('.', attribute='overlay')
+    ], required=False),
+], required=False)
+
+node_processor = declxml.dictionary('node', [
+    declxml.integer('.', attribute='id'),
+    declxml.floating_point('.', attribute='radius', required=False, default=1.0),
+    declxml.integer('.', attribute='x', required=False),
+    declxml.integer('.', attribute='y', required=False),
+    declxml.integer('.', attribute='z', required=False),
+    declxml.integer('.', attribute='inVp', required=False),
+    declxml.integer('.', attribute='inMag', required=False),
+    declxml.integer('.', attribute='time', required=False),
+    declxml.string('.', attribute='comment', required=False)
+], required=False)
+
+pyknossos_node_processor = declxml.dictionary('node', [
+    declxml.integer('.', attribute='id'),
+    declxml.floating_point('.', attribute='radius', required=False, default=1.0),
+    declxml.floating_point('.', attribute='x', required=False),
+    declxml.floating_point('.', attribute='y', required=False),
+    declxml.floating_point('.', attribute='z', required=False),
+    declxml.integer('.', attribute='inVp', required=False),
+    declxml.integer('.', attribute='inMag', required=False),
+    declxml.integer('.', attribute='time', required=False),
+    declxml.string('.', attribute='comment', required=False)
+], required=False)
+
+nodes_processor = declxml.array(node_processor, nested='nodes')
+
+pyknossos_nodes_processor = declxml.array(pyknossos_node_processor, nested='nodes')
+
+edge_processor = declxml.dictionary('edge', [
+    declxml.integer('.', attribute='source'),
+    declxml.integer('.', attribute='target')
+], required=False)
+
+edges_processor = declxml.array(edge_processor, nested='edges')
+
+thing_processor = declxml.dictionary('thing', [
+    declxml.integer('.', attribute='id'),
+    declxml.floating_point('.', attribute='color.r', required=False),
+    declxml.floating_point('.', attribute='color.g', required=False),
+    declxml.floating_point('.', attribute='color.b', required=False),
+    declxml.integer('.', attribute='neuron_id', required=False, omit_empty=True, default=100),
+    declxml.integer('.', attribute='skeleton_id', required=False, omit_empty=True, default=99),
+    nodes_processor,
+    edges_processor
+])
+
+pyknossos_thing_processor = declxml.dictionary('thing', [
+    declxml.floating_point('.', attribute='id'),
+    declxml.floating_point('.', attribute='color.r', required=False),
+    declxml.floating_point('.', attribute='color.g', required=False),
+    declxml.floating_point('.', attribute='color.b', required=False),
+    declxml.integer('.', attribute='neuron_id', required=False, omit_empty=True),
+    declxml.integer('.', attribute='skeleton_id', required=False, omit_empty=True),
+    pyknossos_nodes_processor,
+    edges_processor
+])
+
+comment_processor = declxml.dictionary('comment', [
+    declxml.integer('.', attribute='node'),
+    declxml.string('.', attribute='content')
+], required=False)
+
+comments_processor = declxml.array(comment_processor, nested='comments')
+
+branchpoint_processor = declxml.dictionary('branchpoint', [
+    declxml.integer('.', attribute='id')
+], required=False)
+
+branchpoints_processor = declxml.array(branchpoint_processor, nested='branchpoints')
+
+things_processor = declxml.dictionary('things', [
+    parameters,
+    declxml.array(thing_processor, alias='things'),
+    comments_processor,
+    branchpoints_processor
+])
+
+pyknossos_things_processor = declxml.dictionary('things', [
+    parameters,
+    declxml.array(pyknossos_thing_processor, alias='things'),
+    comments_processor,
+    branchpoints_processor
+])
diff --git a/treeconvert/swc.py b/treeconvert/swc.py
new file mode 100644
index 0000000..34ab800
--- /dev/null
+++ b/treeconvert/swc.py
@@ -0,0 +1,98 @@
+# This file is part of treeconvert.
+#
+# Copyright (C) 2019 ariadne-service gmbh
+#
+# This software is provided 'as-is', without any express or implied
+# warranty.  In no event will the authors be held liable for any damages
+# arising from the use of this software.
+#
+# Permission is granted to anyone to use this software for any purpose,
+# including commercial applications, and to alter it and redistribute it
+# freely, subject to the following restrictions:
+#
+# 1. The origin of this software must not be misrepresented; you must not
+#    claim that you wrote the original software. If you use this software
+#    in a product, an acknowledgment in the product documentation would be
+#    appreciated but is not required.
+# 2. Altered source versions must be plainly marked as such, and must not be
+#    misrepresented as being the original software.
+# 3. This notice may not be removed or altered from any source distribution.
+#
+# ariadne-service gmbh ariadne.ai
+# Sebastian Spaar sebastian.spaar@ariadne.ai
+
+import collections
+from dataclasses import dataclass
+from enum import IntEnum
+
+
+class StructureIdentifier(IntEnum):
+    """Standardized identifiers for SWC (www.neuromorpho.org) -
+
+    """
+    UNDEFINED = 0
+    SOMA = 1
+    AXON = 2
+    BASAL_DENDRITE = 3
+    APICAL_DENDRITE = 4
+    CUSTOM = 5
+
+    @classmethod
+    def _missing_(cls, value):
+        return StructureIdentifier.CUSTOM
+
+    def __str__(self):
+        return str(self.value)
+
+
+@dataclass
+class Edge:
+    """http://www.neuronland.org/NLMorphologyConverter/MorphologyFormats/SWC/Spec.html
+
+    """
+    sample_number: int
+    structure_identifier: StructureIdentifier
+    x_position: float
+    y_position: float
+    z_position: float
+    radius: float
+    parent_sample: int
+
+    def __str__(self):
+        return ' '.join(str(x) for x in vars(self).values())
+
+    @classmethod
+    def from_nml_entry(cls, node: dict, parent_id: int):
+        try:
+            structure_identifier = StructureIdentifier(node['comment'])
+        except KeyError:
+            structure_identifier = StructureIdentifier(0)
+        return Edge(node['id'], structure_identifier,
+                    node['x'], node['y'], node['z'], node['radius'], parent_id)
+
+
+class SwcData(collections.abc.MutableSequence):
+    def __init__(self, *args):
+        self.nodes = []
+        self.extend(list(args))
+
+    def insert(self, index: int, item: Edge) -> None:
+        if not isinstance(item, Edge):
+            raise TypeError(f'Item must be of type {Edge}!')
+        self.nodes.append(item)
+
+    def __getitem__(self, i: int) -> Edge:
+        return self.nodes[i]
+
+    def __setitem__(self, i: int, o: Edge) -> None:
+        self.insert(i, o)
+
+    def __delitem__(self, i: int) -> None:
+        del self.nodes[i]
+
+    def __len__(self) -> int:
+        return len(self.nodes)
+
+    def __str__(self):
+        # This returns a complete SWC file by combining all of its Edges
+        return '\n'.join(str(edge) for edge in self)