From 915826fd9144809f33a9ecdc8beb4b244581a045 Mon Sep 17 00:00:00 2001
From: Daniel Friesel
Date: Thu, 2 Jul 2020 09:35:25 +0200
Subject: Remove verbose arg from tests

---
 test/test_ptamodel.py | 24 ++++++++++++------------
 1 file changed, 12 insertions(+), 12 deletions(-)

diff --git a/test/test_ptamodel.py b/test/test_ptamodel.py
index 7d501e6..7e398bd 100755
--- a/test/test_ptamodel.py
+++ b/test/test_ptamodel.py
@@ -9,9 +9,9 @@ import pytest
 class TestModels(unittest.TestCase):
     def test_model_singlefile_rf24(self):
         raw_data = RawData(['test-data/20170220_164723_RF24_int_A.tar'])
-        preprocessed_data = raw_data.get_preprocessed_data(verbose=False)
+        preprocessed_data = raw_data.get_preprocessed_data()
         by_name, parameters, arg_count = pta_trace_to_aggregate(preprocessed_data)
-        model = PTAModel(by_name, parameters, arg_count, verbose=False)
+        model = PTAModel(by_name, parameters, arg_count)
         self.assertEqual(model.states(), 'POWERDOWN RX STANDBY1 TX'.split(' '))
         self.assertEqual(model.transitions(), 'begin epilogue powerDown powerUp setDataRate_num setPALevel_num startListening stopListening write_nb'.split(' '))
         static_model = model.get_static()
@@ -78,9 +78,9 @@ class TestModels(unittest.TestCase):

     def test_model_singlefile_mmparam(self):
         raw_data = RawData(['test-data/20161221_123347_mmparam.tar'])
-        preprocessed_data = raw_data.get_preprocessed_data(verbose=False)
+        preprocessed_data = raw_data.get_preprocessed_data()
         by_name, parameters, arg_count = pta_trace_to_aggregate(preprocessed_data)
-        model = PTAModel(by_name, parameters, arg_count, verbose=False)
+        model = PTAModel(by_name, parameters, arg_count)
         self.assertEqual(model.states(), 'OFF ON'.split(' '))
         self.assertEqual(model.transitions(), 'off setBrightness'.split(' '))
         static_model = model.get_static()
@@ -109,9 +109,9 @@ class TestModels(unittest.TestCase):
             'test-data/20170116_131306_LM75x.tar',
         ]
         raw_data = RawData(testfiles)
-        preprocessed_data = raw_data.get_preprocessed_data(verbose=False)
+        preprocessed_data = raw_data.get_preprocessed_data()
         by_name, parameters, arg_count = pta_trace_to_aggregate(preprocessed_data)
-        model = PTAModel(by_name, parameters, arg_count, verbose=False)
+        model = PTAModel(by_name, parameters, arg_count)
         self.assertEqual(model.states(), 'ACTIVE POWEROFF'.split(' '))
         self.assertEqual(model.transitions(), 'getTemp setHyst setOS shutdown start'.split(' '))
         static_model = model.get_static()
@@ -139,9 +139,9 @@ class TestModels(unittest.TestCase):
             'test-data/20170116_151348_sharpLS013B4DN.tar',
         ]
         raw_data = RawData(testfiles)
-        preprocessed_data = raw_data.get_preprocessed_data(verbose=False)
+        preprocessed_data = raw_data.get_preprocessed_data()
         by_name, parameters, arg_count = pta_trace_to_aggregate(preprocessed_data)
-        model = PTAModel(by_name, parameters, arg_count, verbose=False)
+        model = PTAModel(by_name, parameters, arg_count)
         self.assertEqual(model.states(), 'DISABLED ENABLED'.split(' '))
         self.assertEqual(model.transitions(), 'clear disable enable ioInit sendLine toggleVCOM'.split(' '))
         static_model = model.get_static()
@@ -172,9 +172,9 @@ class TestModels(unittest.TestCase):
             'test-data/20170116_142654_mmstatic.tar',
         ]
         raw_data = RawData(testfiles)
-        preprocessed_data = raw_data.get_preprocessed_data(verbose=False)
+        preprocessed_data = raw_data.get_preprocessed_data()
         by_name, parameters, arg_count = pta_trace_to_aggregate(preprocessed_data)
-        model = PTAModel(by_name, parameters, arg_count, verbose=False)
+        model = PTAModel(by_name, parameters, arg_count)
         self.assertEqual(model.states(), 'B G OFF R'.split(' '))
         self.assertEqual(model.transitions(), 'blue green off red'.split(' '))
         static_model = model.get_static()
@@ -206,9 +206,9 @@ class TestModels(unittest.TestCase):
             'test-data/20170125_154019_cc1200.tar',
         ]
         raw_data = RawData(testfiles)
-        preprocessed_data = raw_data.get_preprocessed_data(verbose=False)
+        preprocessed_data = raw_data.get_preprocessed_data()
         by_name, parameters, arg_count = pta_trace_to_aggregate(preprocessed_data)
-        model = PTAModel(by_name, parameters, arg_count, verbose=False)
+        model = PTAModel(by_name, parameters, arg_count)
         self.assertEqual(model.states(), 'IDLE RX SLEEP SLEEP_EWOR SYNTH_ON TX XOFF'.split(' '))
         self.assertEqual(model.transitions(), 'crystal_off eWOR idle init prepare_xmit receive send setSymbolRate setTxPower sleep txDone'.split(' '))
         static_model = model.get_static()
-- 
cgit v1.2.3

From f1a9e8b419c3b0836989565fa462d7c67a4bc9b9 Mon Sep 17 00:00:00 2001
From: Daniel Friesel
Date: Thu, 2 Jul 2020 09:35:48 +0200
Subject: blacken test code

---
 test/test_codegen.py       | 170 +++++---
 test/test_pta.py           | 917 ++++++++++++++++++++++++++------------------
 test/test_ptamodel.py      | 505 ++++++++++++++++---------
 test/test_timingharness.py | 201 ++++++----
 4 files changed, 1089 insertions(+), 704 deletions(-)

diff --git a/test/test_codegen.py b/test/test_codegen.py index 981117b..ce565d6 100755 --- a/test/test_codegen.py +++ b/test/test_codegen.py @@ -5,84 +5,74 @@ from dfatool.codegen import get_simulated_accountingmethod import unittest example_json_1 = { - 'parameters': ['datarate', 'txbytes', 'txpower'], - 'initial_param_values': [None, None, None], - 'state': { - 'IDLE': { - 'power': { - 'static': 5, - } - }, - 'TX': { - 'power': { - 'static': 100, - 'function': { - 'raw': 'regression_arg(0) + regression_arg(1)' - ' * parameter(txpower)', - 'regression_args': [100, 2] + "parameters": ["datarate", "txbytes", "txpower"], + "initial_param_values": [None, None, None], + "state": { + "IDLE": {"power": {"static": 5,}}, + "TX": { + "power": { + "static": 100, + "function": { + "raw": "regression_arg(0) + regression_arg(1)" + " * parameter(txpower)", + "regression_args": [100, 2], }, } }, }, - 'transitions': [ + "transitions": [ { - 'name': 'init', - 'origin': ['UNINITIALIZED', 'IDLE'], - 'destination': 'IDLE', - 'duration': { - 'static': 50000, - }, - 'set_param': { - 'txpower': 10 - }, + "name": "init", + "origin": ["UNINITIALIZED", "IDLE"], + "destination": "IDLE", + "duration": {"static": 50000,}, + "set_param": {"txpower": 10}, }, { - 'name': 'setTxPower', - 'origin': 'IDLE', - 'destination': 'IDLE', - 'duration': {'static': 120}, - 'energy ': {'static': 10000}, - 'arg_to_param_map': {0: 'txpower'}, - 'argument_values': [[10, 20, 30]], + "name": "setTxPower", + "origin": "IDLE", + "destination": "IDLE", + "duration": {"static": 120}, + "energy ": {"static": 10000}, + "arg_to_param_map": {0: "txpower"}, + "argument_values": [[10, 20, 30]], }, { - 'name': 'send', - 'origin': 'IDLE', - 'destination': 'TX', - 'duration': { - 'static': 10, - 'function': { - 'raw': 'regression_arg(0) + regression_arg(1)' - ' * function_arg(1)', - 'regression_args': [48, 8], + "name": "send", + "origin": "IDLE", + "destination": "TX", + "duration": { + "static": 10, + "function": { + "raw": "regression_arg(0) + regression_arg(1)" " * function_arg(1)", + "regression_args": [48, 8], }, }, - 'energy': { - 'static': 3, - 'function': { - 'raw': 'regression_arg(0) + regression_arg(1)' - ' * 
function_arg(1)', - 'regression_args': [3, 5], + "energy": { + "static": 3, + "function": { + "raw": "regression_arg(0) + regression_arg(1)" " * function_arg(1)", + "regression_args": [3, 5], }, }, - 'arg_to_param_map': {1: 'txbytes'}, - 'argument_values': [['"foo"', '"hodor"'], [3, 5]], - 'argument_combination': 'zip', + "arg_to_param_map": {1: "txbytes"}, + "argument_values": [['"foo"', '"hodor"'], [3, 5]], + "argument_combination": "zip", }, { - 'name': 'txComplete', - 'origin': 'TX', - 'destination': 'IDLE', - 'is_interrupt': 1, - 'timeout': { - 'static': 2000, - 'function': { - 'raw': 'regression_arg(0) + regression_arg(1)' - ' * parameter(txbytes)', - 'regression_args': [500, 16], + "name": "txComplete", + "origin": "TX", + "destination": "IDLE", + "is_interrupt": 1, + "timeout": { + "static": 2000, + "function": { + "raw": "regression_arg(0) + regression_arg(1)" + " * parameter(txbytes)", + "regression_args": [500, 16], }, }, - } + }, ], } @@ -91,9 +81,11 @@ class TestCG(unittest.TestCase): def test_statetransition_immediate(self): pta = PTA.from_json(example_json_1) pta.set_random_energy_model() - pta.state['IDLE'].power.value = 9 - cg = get_simulated_accountingmethod('static_statetransition_immediate')(pta, 1000000, 'uint8_t', 'uint8_t', 'uint8_t', 'uint8_t') - cg.current_state = pta.state['IDLE'] + pta.state["IDLE"].power.value = 9 + cg = get_simulated_accountingmethod("static_statetransition_immediate")( + pta, 1000000, "uint8_t", "uint8_t", "uint8_t", "uint8_t" + ) + cg.current_state = pta.state["IDLE"] cg.sleep(7) self.assertEqual(cg.get_energy(), 9 * 7) pta.transitions[1].energy.value = 123 @@ -102,8 +94,10 @@ class TestCG(unittest.TestCase): cg.pass_transition(pta.transitions[1]) self.assertEqual(cg.get_energy(), (9 * 7 + 123 + 123) % 256) - cg = get_simulated_accountingmethod('static_statetransition_immediate')(pta, 100000, 'uint8_t', 'uint8_t', 'uint8_t', 'uint8_t') - cg.current_state = pta.state['IDLE'] + cg = get_simulated_accountingmethod("static_statetransition_immediate")( + pta, 100000, "uint8_t", "uint8_t", "uint8_t", "uint8_t" + ) + cg.current_state = pta.state["IDLE"] cg.sleep(7) self.assertEqual(cg.get_energy(), 0) cg.sleep(15) @@ -111,8 +105,10 @@ class TestCG(unittest.TestCase): cg.sleep(90) self.assertEqual(cg.get_energy(), 900 % 256) - cg = get_simulated_accountingmethod('static_statetransition_immediate')(pta, 100000, 'uint8_t', 'uint8_t', 'uint8_t', 'uint16_t') - cg.current_state = pta.state['IDLE'] + cg = get_simulated_accountingmethod("static_statetransition_immediate")( + pta, 100000, "uint8_t", "uint8_t", "uint8_t", "uint16_t" + ) + cg.current_state = pta.state["IDLE"] cg.sleep(7) self.assertEqual(cg.get_energy(), 0) cg.sleep(15) @@ -120,10 +116,12 @@ class TestCG(unittest.TestCase): cg.sleep(90) self.assertEqual(cg.get_energy(), 900) - pta.state['IDLE'].power.value = 9 # -> 90 uW + pta.state["IDLE"].power.value = 9 # -> 90 uW pta.transitions[1].energy.value = 1 # -> 100 pJ - cg = get_simulated_accountingmethod('static_statetransition_immediate')(pta, 1000000, 'uint8_t', 'uint8_t', 'uint8_t', 'uint8_t', 1e-5, 1e-5, 1e-10) - cg.current_state = pta.state['IDLE'] + cg = get_simulated_accountingmethod("static_statetransition_immediate")( + pta, 1000000, "uint8_t", "uint8_t", "uint8_t", "uint8_t", 1e-5, 1e-5, 1e-10 + ) + cg.current_state = pta.state["IDLE"] cg.sleep(10) # 10 us self.assertEqual(cg.get_energy(), 90 * 10) cg.pass_transition(pta.transitions[1]) @@ -134,9 +132,11 @@ class TestCG(unittest.TestCase): def test_statetransition(self): pta = 
PTA.from_json(example_json_1) pta.set_random_energy_model() - pta.state['IDLE'].power.value = 9 - cg = get_simulated_accountingmethod('static_statetransition')(pta, 1000000, 'uint8_t', 'uint8_t', 'uint8_t', 'uint8_t') - cg.current_state = pta.state['IDLE'] + pta.state["IDLE"].power.value = 9 + cg = get_simulated_accountingmethod("static_statetransition")( + pta, 1000000, "uint8_t", "uint8_t", "uint8_t", "uint8_t" + ) + cg.current_state = pta.state["IDLE"] cg.sleep(7) self.assertEqual(cg.get_energy(), 9 * 7) pta.transitions[1].energy.value = 123 @@ -148,9 +148,11 @@ class TestCG(unittest.TestCase): def test_state_immediate(self): pta = PTA.from_json(example_json_1) pta.set_random_energy_model() - pta.state['IDLE'].power.value = 9 - cg = get_simulated_accountingmethod('static_state_immediate')(pta, 1000000, 'uint8_t', 'uint8_t', 'uint8_t', 'uint8_t') - cg.current_state = pta.state['IDLE'] + pta.state["IDLE"].power.value = 9 + cg = get_simulated_accountingmethod("static_state_immediate")( + pta, 1000000, "uint8_t", "uint8_t", "uint8_t", "uint8_t" + ) + cg.current_state = pta.state["IDLE"] cg.sleep(7) self.assertEqual(cg.get_energy(), 9 * 7) pta.transitions[1].energy.value = 123 @@ -162,9 +164,11 @@ class TestCG(unittest.TestCase): def test_state(self): pta = PTA.from_json(example_json_1) pta.set_random_energy_model() - pta.state['IDLE'].power.value = 9 - cg = get_simulated_accountingmethod('static_state')(pta, 1000000, 'uint8_t', 'uint8_t', 'uint8_t', 'uint8_t') - cg.current_state = pta.state['IDLE'] + pta.state["IDLE"].power.value = 9 + cg = get_simulated_accountingmethod("static_state")( + pta, 1000000, "uint8_t", "uint8_t", "uint8_t", "uint8_t" + ) + cg.current_state = pta.state["IDLE"] cg.sleep(7) self.assertEqual(cg.get_energy(), 9 * 7) pta.transitions[1].energy.value = 123 @@ -173,8 +177,10 @@ class TestCG(unittest.TestCase): cg.pass_transition(pta.transitions[1]) self.assertEqual(cg.get_energy(), 9 * 7) - cg = get_simulated_accountingmethod('static_state')(pta, 1000000, 'uint8_t', 'uint16_t', 'uint16_t', 'uint16_t') + cg = get_simulated_accountingmethod("static_state")( + pta, 1000000, "uint8_t", "uint16_t", "uint16_t", "uint16_t" + ) -if __name__ == '__main__': +if __name__ == "__main__": unittest.main() diff --git a/test/test_pta.py b/test/test_pta.py index 9f0778d..d43e702 100755 --- a/test/test_pta.py +++ b/test/test_pta.py @@ -5,88 +5,79 @@ import unittest import yaml example_json_1 = { - 'parameters': ['datarate', 'txbytes', 'txpower'], - 'initial_param_values': [None, None, None], - 'state': { - 'IDLE': { - 'power': { - 'static': 5, - } - }, - 'TX': { - 'power': { - 'static': 10000, - 'function': { - 'raw': 'regression_arg(0) + regression_arg(1)' - ' * parameter(txpower)', - 'regression_args': [10000, 2] + "parameters": ["datarate", "txbytes", "txpower"], + "initial_param_values": [None, None, None], + "state": { + "IDLE": {"power": {"static": 5,}}, + "TX": { + "power": { + "static": 10000, + "function": { + "raw": "regression_arg(0) + regression_arg(1)" + " * parameter(txpower)", + "regression_args": [10000, 2], }, } }, }, - 'transitions': [ + "transitions": [ { - 'name': 'init', - 'origin': ['UNINITIALIZED', 'IDLE'], - 'destination': 'IDLE', - 'duration': { - 'static': 50000, - }, - 'set_param': { - 'txpower': 10 - }, + "name": "init", + "origin": ["UNINITIALIZED", "IDLE"], + "destination": "IDLE", + "duration": {"static": 50000,}, + "set_param": {"txpower": 10}, }, { - 'name': 'setTxPower', - 'origin': 'IDLE', - 'destination': 'IDLE', - 'duration': {'static': 120}, - 'energy 
': {'static': 10000}, - 'arg_to_param_map': {0: 'txpower'}, - 'argument_values': [[10, 20, 30]], + "name": "setTxPower", + "origin": "IDLE", + "destination": "IDLE", + "duration": {"static": 120}, + "energy ": {"static": 10000}, + "arg_to_param_map": {0: "txpower"}, + "argument_values": [[10, 20, 30]], }, { - 'name': 'send', - 'origin': 'IDLE', - 'destination': 'TX', - 'duration': { - 'static': 10, - 'function': { - 'raw': 'regression_arg(0) + regression_arg(1)' - ' * function_arg(1)', - 'regression_args': [48, 8], + "name": "send", + "origin": "IDLE", + "destination": "TX", + "duration": { + "static": 10, + "function": { + "raw": "regression_arg(0) + regression_arg(1)" " * function_arg(1)", + "regression_args": [48, 8], }, }, - 'energy': { - 'static': 3, - 'function': { - 'raw': 'regression_arg(0) + regression_arg(1)' - ' * function_arg(1)', - 'regression_args': [3, 5], + "energy": { + "static": 3, + "function": { + "raw": "regression_arg(0) + regression_arg(1)" " * function_arg(1)", + "regression_args": [3, 5], }, }, - 'arg_to_param_map': {1: 'txbytes'}, - 'argument_values': [['"foo"', '"hodor"'], [3, 5]], - 'argument_combination': 'zip', + "arg_to_param_map": {1: "txbytes"}, + "argument_values": [['"foo"', '"hodor"'], [3, 5]], + "argument_combination": "zip", }, { - 'name': 'txComplete', - 'origin': 'TX', - 'destination': 'IDLE', - 'is_interrupt': 1, - 'timeout': { - 'static': 2000, - 'function': { - 'raw': 'regression_arg(0) + regression_arg(1)' - ' * parameter(txbytes)', - 'regression_args': [500, 16], + "name": "txComplete", + "origin": "TX", + "destination": "IDLE", + "is_interrupt": 1, + "timeout": { + "static": 2000, + "function": { + "raw": "regression_arg(0) + regression_arg(1)" + " * parameter(txbytes)", + "regression_args": [500, 16], }, }, - } + }, ], } -example_yaml_1 = yaml.safe_load(""" +example_yaml_1 = yaml.safe_load( + """ codegen: instance: cc1200 @@ -124,9 +115,11 @@ transition: src: [TX] dst: IDLE is_interrupt: true -""") +""" +) -example_yaml_2 = yaml.safe_load(""" +example_yaml_2 = yaml.safe_load( + """ codegen: instance: cc1200 @@ -169,9 +162,11 @@ transition: src: [TX] dst: IDLE is_interrupt: true -""") +""" +) -example_yaml_3 = yaml.safe_load(""" +example_yaml_3 = yaml.safe_load( + """ codegen: instance: nrf24l01 includes: ['driver/nrf24l01.h'] @@ -260,12 +255,17 @@ transition: - name: blocking values: [1, 1, 1, 1, 1, 1] argument_combination: zip -""") +""" +) -def dfs_tran_to_name(runs: list, with_args: bool = False, with_param: bool = False) -> list: +def dfs_tran_to_name( + runs: list, with_args: bool = False, with_param: bool = False +) -> list: if with_param: - return list(map(lambda run: list(map(lambda x: (x[0].name, x[1], x[2]), run)), runs)) + return list( + map(lambda run: list(map(lambda x: (x[0].name, x[1], x[2]), run)), runs) + ) if with_args: return list(map(lambda run: list(map(lambda x: (x[0].name, x[1]), run)), runs)) return list(map(lambda run: list(map(lambda x: (x[0].name), run)), runs)) @@ -273,117 +273,175 @@ def dfs_tran_to_name(runs: list, with_args: bool = False, with_param: bool = Fal class TestPTA(unittest.TestCase): def test_dfs(self): - pta = PTA(['IDLE', 'TX']) - pta.add_transition('UNINITIALIZED', 'IDLE', 'init') - pta.add_transition('IDLE', 'TX', 'send') - pta.add_transition('TX', 'IDLE', 'txComplete') - self.assertEqual(dfs_tran_to_name(pta.dfs(0), False), [['init']]) - self.assertEqual(dfs_tran_to_name(pta.dfs(1), False), [['init', 'send']]) - self.assertEqual(dfs_tran_to_name(pta.dfs(2), False), [['init', 'send', 
'txComplete']]) - self.assertEqual(dfs_tran_to_name(pta.dfs(3), False), [['init', 'send', 'txComplete', 'send']]) - - pta = PTA(['IDLE']) - pta.add_transition('UNINITIALIZED', 'IDLE', 'init') - pta.add_transition('IDLE', 'IDLE', 'set1') - pta.add_transition('IDLE', 'IDLE', 'set2') - self.assertEqual(dfs_tran_to_name(pta.dfs(0), False), [['init']]) - self.assertEqual(sorted(dfs_tran_to_name(pta.dfs(1), False)), [['init', 'set1'], ['init', 'set2']]) - self.assertEqual(sorted(dfs_tran_to_name(pta.dfs(2), False)), [['init', 'set1', 'set1'], - ['init', 'set1', 'set2'], - ['init', 'set2', 'set1'], - ['init', 'set2', 'set2']]) + pta = PTA(["IDLE", "TX"]) + pta.add_transition("UNINITIALIZED", "IDLE", "init") + pta.add_transition("IDLE", "TX", "send") + pta.add_transition("TX", "IDLE", "txComplete") + self.assertEqual(dfs_tran_to_name(pta.dfs(0), False), [["init"]]) + self.assertEqual(dfs_tran_to_name(pta.dfs(1), False), [["init", "send"]]) + self.assertEqual( + dfs_tran_to_name(pta.dfs(2), False), [["init", "send", "txComplete"]] + ) + self.assertEqual( + dfs_tran_to_name(pta.dfs(3), False), + [["init", "send", "txComplete", "send"]], + ) + + pta = PTA(["IDLE"]) + pta.add_transition("UNINITIALIZED", "IDLE", "init") + pta.add_transition("IDLE", "IDLE", "set1") + pta.add_transition("IDLE", "IDLE", "set2") + self.assertEqual(dfs_tran_to_name(pta.dfs(0), False), [["init"]]) + self.assertEqual( + sorted(dfs_tran_to_name(pta.dfs(1), False)), + [["init", "set1"], ["init", "set2"]], + ) + self.assertEqual( + sorted(dfs_tran_to_name(pta.dfs(2), False)), + [ + ["init", "set1", "set1"], + ["init", "set1", "set2"], + ["init", "set2", "set1"], + ["init", "set2", "set2"], + ], + ) def test_dfs_trace_filter(self): - pta = PTA(['IDLE']) - pta.add_transition('UNINITIALIZED', 'IDLE', 'init') - pta.add_transition('IDLE', 'IDLE', 'set1') - pta.add_transition('IDLE', 'IDLE', 'set2') - self.assertEqual(sorted(dfs_tran_to_name(pta.dfs(2, trace_filter=[['init', 'set1', 'set2'], ['init', 'set2', 'set1']]), False)), - [['init', 'set1', 'set2'], ['init', 'set2', 'set1']]) - self.assertEqual(sorted(dfs_tran_to_name(pta.dfs(2, trace_filter=[['init', 'set1', '$'], ['init', 'set2', '$']]), False)), - [['init', 'set1'], ['init', 'set2']]) + pta = PTA(["IDLE"]) + pta.add_transition("UNINITIALIZED", "IDLE", "init") + pta.add_transition("IDLE", "IDLE", "set1") + pta.add_transition("IDLE", "IDLE", "set2") + self.assertEqual( + sorted( + dfs_tran_to_name( + pta.dfs( + 2, + trace_filter=[ + ["init", "set1", "set2"], + ["init", "set2", "set1"], + ], + ), + False, + ) + ), + [["init", "set1", "set2"], ["init", "set2", "set1"]], + ) + self.assertEqual( + sorted( + dfs_tran_to_name( + pta.dfs( + 2, trace_filter=[["init", "set1", "$"], ["init", "set2", "$"]] + ), + False, + ) + ), + [["init", "set1"], ["init", "set2"]], + ) def test_dfs_accepting(self): - pta = PTA(['IDLE', 'TX'], accepting_states=['IDLE']) - pta.add_transition('UNINITIALIZED', 'IDLE', 'init') - pta.add_transition('IDLE', 'TX', 'send') - pta.add_transition('TX', 'IDLE', 'txComplete') - self.assertEqual(dfs_tran_to_name(pta.dfs(0), False), [['init']]) + pta = PTA(["IDLE", "TX"], accepting_states=["IDLE"]) + pta.add_transition("UNINITIALIZED", "IDLE", "init") + pta.add_transition("IDLE", "TX", "send") + pta.add_transition("TX", "IDLE", "txComplete") + self.assertEqual(dfs_tran_to_name(pta.dfs(0), False), [["init"]]) self.assertEqual(dfs_tran_to_name(pta.dfs(1), False), []) - self.assertEqual(dfs_tran_to_name(pta.dfs(2), False), [['init', 'send', 'txComplete']]) + 
self.assertEqual( + dfs_tran_to_name(pta.dfs(2), False), [["init", "send", "txComplete"]] + ) self.assertEqual(dfs_tran_to_name(pta.dfs(3), False), []) def test_dfs_objects(self): - pta = PTA(['IDLE', 'TX']) - pta.add_transition('UNINITIALIZED', 'IDLE', 'init') - pta.add_transition('IDLE', 'TX', 'send') - pta.add_transition('TX', 'IDLE', 'txComplete') + pta = PTA(["IDLE", "TX"]) + pta.add_transition("UNINITIALIZED", "IDLE", "init") + pta.add_transition("IDLE", "TX", "send") + pta.add_transition("TX", "IDLE", "txComplete") traces = list(pta.dfs(2)) self.assertEqual(len(traces), 1) trace = traces[0] self.assertEqual(len(trace), 3) - self.assertEqual(trace[0][0].name, 'init') - self.assertEqual(trace[1][0].name, 'send') - self.assertEqual(trace[2][0].name, 'txComplete') + self.assertEqual(trace[0][0].name, "init") + self.assertEqual(trace[1][0].name, "send") + self.assertEqual(trace[2][0].name, "txComplete") self.assertEqual(pta.get_transition_id(trace[0][0]), 0) self.assertEqual(pta.get_transition_id(trace[1][0]), 1) self.assertEqual(pta.get_transition_id(trace[2][0]), 2) def test_dfs_with_sleep(self): - pta = PTA(['IDLE', 'TX']) - pta.add_transition('UNINITIALIZED', 'IDLE', 'init') - pta.add_transition('IDLE', 'TX', 'send') - pta.add_transition('TX', 'IDLE', 'txComplete') + pta = PTA(["IDLE", "TX"]) + pta.add_transition("UNINITIALIZED", "IDLE", "init") + pta.add_transition("IDLE", "TX", "send") + pta.add_transition("TX", "IDLE", "txComplete") traces = list(pta.dfs(2, sleep=10)) self.assertEqual(len(traces), 1) trace = traces[0] self.assertEqual(len(trace), 6) self.assertIsNone(trace[0][0]) - self.assertEqual(trace[1][0].name, 'init') + self.assertEqual(trace[1][0].name, "init") self.assertIsNone(trace[2][0]) - self.assertEqual(trace[3][0].name, 'send') + self.assertEqual(trace[3][0].name, "send") self.assertIsNone(trace[4][0]) - self.assertEqual(trace[5][0].name, 'txComplete') + self.assertEqual(trace[5][0].name, "txComplete") self.assertEqual(pta.get_transition_id(trace[1][0]), 0) self.assertEqual(pta.get_transition_id(trace[3][0]), 1) self.assertEqual(pta.get_transition_id(trace[5][0]), 2) def test_bfs(self): - pta = PTA(['IDLE', 'TX']) - pta.add_transition('UNINITIALIZED', 'IDLE', 'init') - pta.add_transition('IDLE', 'TX', 'send') - pta.add_transition('TX', 'IDLE', 'txComplete') - self.assertEqual(dfs_tran_to_name(pta.bfs(0), False), [['init']]) - self.assertEqual(dfs_tran_to_name(pta.bfs(1), False), [['init'], ['init', 'send']]) - self.assertEqual(dfs_tran_to_name(pta.bfs(2), False), [['init'], ['init', 'send'], ['init', 'send', 'txComplete']]) - self.assertEqual(dfs_tran_to_name(pta.bfs(3), False), [['init'], ['init', 'send'], ['init', 'send', 'txComplete'], ['init', 'send', 'txComplete', 'send']]) - - pta = PTA(['IDLE']) - pta.add_transition('UNINITIALIZED', 'IDLE', 'init') - pta.add_transition('IDLE', 'IDLE', 'set1') - pta.add_transition('IDLE', 'IDLE', 'set2') - self.assertEqual(dfs_tran_to_name(pta.bfs(0), False), [['init']]) - self.assertEqual(sorted(dfs_tran_to_name(pta.bfs(1), False)), [['init'], ['init', 'set1'], ['init', 'set2']]) - self.assertEqual(sorted(dfs_tran_to_name(pta.bfs(2), False)), [['init'], - ['init', 'set1'], - ['init', 'set1', 'set1'], - ['init', 'set1', 'set2'], - ['init', 'set2'], - ['init', 'set2', 'set1'], - ['init', 'set2', 'set2']]) + pta = PTA(["IDLE", "TX"]) + pta.add_transition("UNINITIALIZED", "IDLE", "init") + pta.add_transition("IDLE", "TX", "send") + pta.add_transition("TX", "IDLE", "txComplete") + self.assertEqual(dfs_tran_to_name(pta.bfs(0), 
False), [["init"]]) + self.assertEqual( + dfs_tran_to_name(pta.bfs(1), False), [["init"], ["init", "send"]] + ) + self.assertEqual( + dfs_tran_to_name(pta.bfs(2), False), + [["init"], ["init", "send"], ["init", "send", "txComplete"]], + ) + self.assertEqual( + dfs_tran_to_name(pta.bfs(3), False), + [ + ["init"], + ["init", "send"], + ["init", "send", "txComplete"], + ["init", "send", "txComplete", "send"], + ], + ) + + pta = PTA(["IDLE"]) + pta.add_transition("UNINITIALIZED", "IDLE", "init") + pta.add_transition("IDLE", "IDLE", "set1") + pta.add_transition("IDLE", "IDLE", "set2") + self.assertEqual(dfs_tran_to_name(pta.bfs(0), False), [["init"]]) + self.assertEqual( + sorted(dfs_tran_to_name(pta.bfs(1), False)), + [["init"], ["init", "set1"], ["init", "set2"]], + ) + self.assertEqual( + sorted(dfs_tran_to_name(pta.bfs(2), False)), + [ + ["init"], + ["init", "set1"], + ["init", "set1", "set1"], + ["init", "set1", "set2"], + ["init", "set2"], + ["init", "set2", "set1"], + ["init", "set2", "set2"], + ], + ) def test_from_json(self): pta = PTA.from_json(example_json_1) - self.assertEqual(pta.parameters, ['datarate', 'txbytes', 'txpower']) - self.assertEqual(pta.state['UNINITIALIZED'].name, 'UNINITIALIZED') - self.assertEqual(pta.state['IDLE'].name, 'IDLE') - self.assertEqual(pta.state['TX'].name, 'TX') + self.assertEqual(pta.parameters, ["datarate", "txbytes", "txpower"]) + self.assertEqual(pta.state["UNINITIALIZED"].name, "UNINITIALIZED") + self.assertEqual(pta.state["IDLE"].name, "IDLE") + self.assertEqual(pta.state["TX"].name, "TX") self.assertEqual(len(pta.transitions), 5) - self.assertEqual(pta.transitions[0].name, 'init') - self.assertEqual(pta.transitions[1].name, 'init') - self.assertEqual(pta.transitions[2].name, 'setTxPower') - self.assertEqual(pta.transitions[3].name, 'send') - self.assertEqual(pta.transitions[4].name, 'txComplete') + self.assertEqual(pta.transitions[0].name, "init") + self.assertEqual(pta.transitions[1].name, "init") + self.assertEqual(pta.transitions[2].name, "setTxPower") + self.assertEqual(pta.transitions[3].name, "send") + self.assertEqual(pta.transitions[4].name, "txComplete") # def test_to_json(self): # pta = PTA.from_json(example_json_1) @@ -394,368 +452,471 @@ class TestPTA(unittest.TestCase): def test_from_json_dfs_arg(self): pta = PTA.from_json(example_json_1) - self.assertEqual(sorted(dfs_tran_to_name(pta.dfs(1), False)), [['init', 'init'], ['init', 'send'], ['init', 'setTxPower']]) - self.assertEqual(sorted(dfs_tran_to_name(pta.dfs(1, with_arguments=True), True)), - [ - [('init', ()), ('init', ())], - [('init', ()), ('send', ('"foo"', 3))], - [('init', ()), ('send', ('"hodor"', 5))], - [('init', ()), ('setTxPower', (10,))], - [('init', ()), ('setTxPower', (20,))], - [('init', ()), ('setTxPower', (30,))], - ] + self.assertEqual( + sorted(dfs_tran_to_name(pta.dfs(1), False)), + [["init", "init"], ["init", "send"], ["init", "setTxPower"]], + ) + self.assertEqual( + sorted(dfs_tran_to_name(pta.dfs(1, with_arguments=True), True)), + [ + [("init", ()), ("init", ())], + [("init", ()), ("send", ('"foo"', 3))], + [("init", ()), ("send", ('"hodor"', 5))], + [("init", ()), ("setTxPower", (10,))], + [("init", ()), ("setTxPower", (20,))], + [("init", ()), ("setTxPower", (30,))], + ], ) def test_from_json_dfs_param(self): pta = PTA.from_json(example_json_1) no_param = { - 'datarate': None, - 'txbytes': None, - 'txpower': 10, + "datarate": None, + "txbytes": None, + "txpower": 10, } param_tx3 = { - 'datarate': None, - 'txbytes': 3, - 'txpower': 10, + "datarate": None, 
+ "txbytes": 3, + "txpower": 10, } param_tx5 = { - 'datarate': None, - 'txbytes': 5, - 'txpower': 10, + "datarate": None, + "txbytes": 5, + "txpower": 10, } param_txp10 = { - 'datarate': None, - 'txbytes': None, - 'txpower': 10, + "datarate": None, + "txbytes": None, + "txpower": 10, } param_txp20 = { - 'datarate': None, - 'txbytes': None, - 'txpower': 20, + "datarate": None, + "txbytes": None, + "txpower": 20, } param_txp30 = { - 'datarate': None, - 'txbytes': None, - 'txpower': 30, + "datarate": None, + "txbytes": None, + "txpower": 30, } - self.assertEqual(sorted(dfs_tran_to_name(pta.dfs(1, with_arguments=True, with_parameters=True), True, True)), - [ - [('init', (), no_param), ('init', (), no_param)], - [('init', (), no_param), ('send', ('"foo"', 3), param_tx3)], - [('init', (), no_param), ('send', ('"hodor"', 5), param_tx5)], - [('init', (), no_param), ('setTxPower', (10,), param_txp10)], - [('init', (), no_param), ('setTxPower', (20,), param_txp20)], - [('init', (), no_param), ('setTxPower', (30,), param_txp30)], - ] + self.assertEqual( + sorted( + dfs_tran_to_name( + pta.dfs(1, with_arguments=True, with_parameters=True), True, True + ) + ), + [ + [("init", (), no_param), ("init", (), no_param)], + [("init", (), no_param), ("send", ('"foo"', 3), param_tx3)], + [("init", (), no_param), ("send", ('"hodor"', 5), param_tx5)], + [("init", (), no_param), ("setTxPower", (10,), param_txp10)], + [("init", (), no_param), ("setTxPower", (20,), param_txp20)], + [("init", (), no_param), ("setTxPower", (30,), param_txp30)], + ], ) def test_from_json_function(self): pta = PTA.from_json(example_json_1) - self.assertEqual(pta.state['TX'].get_energy(1000, {'datarate': 10, 'txbytes': 6, 'txpower': 10}), 1000 * (10000 + 2 * 10)) - self.assertEqual(pta.transitions[4].get_timeout({'datarate': 10, 'txbytes': 6, 'txpower': 10}), 500 + 16 * 6) + self.assertEqual( + pta.state["TX"].get_energy( + 1000, {"datarate": 10, "txbytes": 6, "txpower": 10} + ), + 1000 * (10000 + 2 * 10), + ) + self.assertEqual( + pta.transitions[4].get_timeout( + {"datarate": 10, "txbytes": 6, "txpower": 10} + ), + 500 + 16 * 6, + ) def test_from_yaml_dfs_param(self): pta = PTA.from_yaml(example_yaml_1) no_param = { - 'datarate': None, - 'txbytes': None, - 'txpower': None, + "datarate": None, + "txbytes": None, + "txpower": None, } param_tx3 = { - 'datarate': None, - 'txbytes': 3, - 'txpower': None, + "datarate": None, + "txbytes": 3, + "txpower": None, } param_tx5 = { - 'datarate': None, - 'txbytes': 5, - 'txpower': None, + "datarate": None, + "txbytes": 5, + "txpower": None, } param_txp10 = { - 'datarate': None, - 'txbytes': None, - 'txpower': 10, + "datarate": None, + "txbytes": None, + "txpower": 10, } param_txp20 = { - 'datarate': None, - 'txbytes': None, - 'txpower': 20, + "datarate": None, + "txbytes": None, + "txpower": 20, } param_txp30 = { - 'datarate': None, - 'txbytes': None, - 'txpower': 30, + "datarate": None, + "txbytes": None, + "txpower": 30, } - self.assertEqual(sorted(dfs_tran_to_name(pta.dfs(1, with_arguments=True, with_parameters=True), True, True)), - [ - [('init', (), no_param), ('init', (), no_param)], - [('init', (), no_param), ('send', ('"foo"', 3), param_tx3)], - [('init', (), no_param), ('send', ('"hodor"', 5), param_tx5)], - [('init', (), no_param), ('setTxPower', (10,), param_txp10)], - [('init', (), no_param), ('setTxPower', (20,), param_txp20)], - [('init', (), no_param), ('setTxPower', (30,), param_txp30)], - ] + self.assertEqual( + sorted( + dfs_tran_to_name( + pta.dfs(1, with_arguments=True, 
with_parameters=True), True, True + ) + ), + [ + [("init", (), no_param), ("init", (), no_param)], + [("init", (), no_param), ("send", ('"foo"', 3), param_tx3)], + [("init", (), no_param), ("send", ('"hodor"', 5), param_tx5)], + [("init", (), no_param), ("setTxPower", (10,), param_txp10)], + [("init", (), no_param), ("setTxPower", (20,), param_txp20)], + [("init", (), no_param), ("setTxPower", (30,), param_txp30)], + ], ) def test_normalization(self): pta = PTA.from_yaml(example_yaml_2) no_param = { - 'datarate': None, - 'txbytes': None, - 'txpower': None, + "datarate": None, + "txbytes": None, + "txpower": None, } param_tx3 = { - 'datarate': None, - 'txbytes': 3, - 'txpower': None, + "datarate": None, + "txbytes": 3, + "txpower": None, } param_tx6 = { - 'datarate': None, - 'txbytes': 6, - 'txpower': None, + "datarate": None, + "txbytes": 6, + "txpower": None, } param_txp10 = { - 'datarate': None, - 'txbytes': None, - 'txpower': -6, + "datarate": None, + "txbytes": None, + "txpower": -6, } param_txp20 = { - 'datarate': None, - 'txbytes': None, - 'txpower': 4, + "datarate": None, + "txbytes": None, + "txpower": 4, } param_txp30 = { - 'datarate': None, - 'txbytes': None, - 'txpower': 14, + "datarate": None, + "txbytes": None, + "txpower": 14, } - self.assertEqual(sorted(dfs_tran_to_name(pta.dfs(1, with_arguments=True, with_parameters=True), True, True)), - [ - [('init', (), no_param), ('init', (), no_param)], - [('init', (), no_param), ('send', ('FOO',), param_tx3)], - [('init', (), no_param), ('send', ('LONGER',), param_tx6)], - [('init', (), no_param), ('setTxPower', (10,), param_txp10)], - [('init', (), no_param), ('setTxPower', (20,), param_txp20)], - [('init', (), no_param), ('setTxPower', (30,), param_txp30)], - ] + self.assertEqual( + sorted( + dfs_tran_to_name( + pta.dfs(1, with_arguments=True, with_parameters=True), True, True + ) + ), + [ + [("init", (), no_param), ("init", (), no_param)], + [("init", (), no_param), ("send", ("FOO",), param_tx3)], + [("init", (), no_param), ("send", ("LONGER",), param_tx6)], + [("init", (), no_param), ("setTxPower", (10,), param_txp10)], + [("init", (), no_param), ("setTxPower", (20,), param_txp20)], + [("init", (), no_param), ("setTxPower", (30,), param_txp30)], + ], ) def test_shrink(self): pta = PTA.from_yaml(example_yaml_3) pta.shrink_argument_values() - self.assertEqual(pta.transitions[0].name, 'setAutoAck') - self.assertEqual(pta.transitions[1].name, 'setPALevel') - self.assertEqual(pta.transitions[2].name, 'setRetries') - self.assertEqual(pta.transitions[3].name, 'setup') - self.assertEqual(pta.transitions[4].name, 'setup') - self.assertEqual(pta.transitions[5].name, 'write') + self.assertEqual(pta.transitions[0].name, "setAutoAck") + self.assertEqual(pta.transitions[1].name, "setPALevel") + self.assertEqual(pta.transitions[2].name, "setRetries") + self.assertEqual(pta.transitions[3].name, "setup") + self.assertEqual(pta.transitions[4].name, "setup") + self.assertEqual(pta.transitions[5].name, "write") self.assertEqual(pta.transitions[0].argument_values, [[0, 1]]) - self.assertEqual(pta.transitions[1].argument_values, [['Nrf24l01::RF24_PA_MIN', 'Nrf24l01::RF24_PA_MAX']]) + self.assertEqual( + pta.transitions[1].argument_values, + [["Nrf24l01::RF24_PA_MIN", "Nrf24l01::RF24_PA_MAX"]], + ) self.assertEqual(pta.transitions[2].argument_values, [[0, 15], [0, 15]]) - self.assertEqual(pta.transitions[5].argument_values, [['"foo"', '"foo"', '"foofoofoo"', '"foofoofoo"', '"123456789012345678901234567890"', - '"123456789012345678901234567890"'], [3, 3, 
9, 9, 30, 30], [0, 1, 0, 1, 0, 1], [1, 1, 1, 1, 1, 1]]) + self.assertEqual( + pta.transitions[5].argument_values, + [ + [ + '"foo"', + '"foo"', + '"foofoofoo"', + '"foofoofoo"', + '"123456789012345678901234567890"', + '"123456789012345678901234567890"', + ], + [3, 3, 9, 9, 30, 30], + [0, 1, 0, 1, 0, 1], + [1, 1, 1, 1, 1, 1], + ], + ) def test_simulation(self): pta = PTA() - pta.add_state('IDLE', power=5) - pta.add_state('TX', power=100) - pta.add_transition('UNINITIALIZED', 'IDLE', 'init', duration=50000) - pta.add_transition('IDLE', 'TX', 'send', energy=3, duration=10) - pta.add_transition('TX', 'IDLE', 'txComplete', timeout=2000, is_interrupt=True) + pta.add_state("IDLE", power=5) + pta.add_state("TX", power=100) + pta.add_transition("UNINITIALIZED", "IDLE", "init", duration=50000) + pta.add_transition("IDLE", "TX", "send", energy=3, duration=10) + pta.add_transition("TX", "IDLE", "txComplete", timeout=2000, is_interrupt=True) trace = [ - ['init'], + ["init"], [None, 10000000], - ['send', 'foo', 3], + ["send", "foo", 3], [None, 5000000], - ['send', 'foo', 3] + ["send", "foo", 3], ] - expected_energy = 5. * 10000000 + 3 + 100 * 2000 + 5 * 5000000 + 3 + 100 * 2000 + expected_energy = 5.0 * 10000000 + 3 + 100 * 2000 + 5 * 5000000 + 3 + 100 * 2000 expected_duration = 50000 + 10000000 + 10 + 2000 + 5000000 + 10 + 2000 result = pta.simulate(trace) self.assertAlmostEqual(result.energy, expected_energy * 1e-12, places=12) self.assertAlmostEqual(result.duration, expected_duration * 1e-6, places=6) - self.assertEqual(result.end_state.name, 'IDLE') + self.assertEqual(result.end_state.name, "IDLE") self.assertEqual(result.parameters, {}) def test_simulation_param_none(self): - pta = PTA(parameters=['txpower', 'length']) - pta.add_state('IDLE', power=5) - pta.add_state('TX', power=100) - pta.add_transition('UNINITIALIZED', 'IDLE', 'init', energy=500000, duration=50000) - pta.add_transition('IDLE', 'TX', 'send', energy=3, duration=10) - pta.add_transition('TX', 'IDLE', 'txComplete', timeout=2000, is_interrupt=True) + pta = PTA(parameters=["txpower", "length"]) + pta.add_state("IDLE", power=5) + pta.add_state("TX", power=100) + pta.add_transition( + "UNINITIALIZED", "IDLE", "init", energy=500000, duration=50000 + ) + pta.add_transition("IDLE", "TX", "send", energy=3, duration=10) + pta.add_transition("TX", "IDLE", "txComplete", timeout=2000, is_interrupt=True) trace = [ - ['init'], + ["init"], ] expected_energy = 500000 expected_duration = 50000 result = pta.simulate(trace) self.assertAlmostEqual(result.energy, expected_energy * 1e-12, places=12) self.assertAlmostEqual(result.duration, expected_duration * 1e-6, places=6) - self.assertEqual(result.end_state.name, 'IDLE') - self.assertEqual(result.parameters, { - 'txpower': None, - 'length': None - }) + self.assertEqual(result.end_state.name, "IDLE") + self.assertEqual(result.parameters, {"txpower": None, "length": None}) def test_simulation_param_update_function(self): - pta = PTA(parameters=['txpower', 'length']) - pta.add_state('IDLE', power=5) - pta.add_state('TX', power=100) - pta.add_transition('UNINITIALIZED', 'IDLE', 'init', energy=500000, duration=50000) - pta.add_transition('IDLE', 'IDLE', 'setTxPower', energy=10000, duration=120, - param_update_function=lambda param, arg: {**param, 'txpower': arg[0]}) - pta.add_transition('IDLE', 'TX', 'send', energy=3, duration=10) - pta.add_transition('TX', 'IDLE', 'txComplete', timeout=2000, is_interrupt=True) - trace = [ - ['init'], - ['setTxPower', 10] - ] + pta = PTA(parameters=["txpower", "length"]) + 
pta.add_state("IDLE", power=5) + pta.add_state("TX", power=100) + pta.add_transition( + "UNINITIALIZED", "IDLE", "init", energy=500000, duration=50000 + ) + pta.add_transition( + "IDLE", + "IDLE", + "setTxPower", + energy=10000, + duration=120, + param_update_function=lambda param, arg: {**param, "txpower": arg[0]}, + ) + pta.add_transition("IDLE", "TX", "send", energy=3, duration=10) + pta.add_transition("TX", "IDLE", "txComplete", timeout=2000, is_interrupt=True) + trace = [["init"], ["setTxPower", 10]] expected_energy = 510000 expected_duration = 50120 result = pta.simulate(trace) self.assertAlmostEqual(result.energy, expected_energy * 1e-12, places=12) self.assertAlmostEqual(result.duration, expected_duration * 1e-6, places=6) - self.assertEqual(result.end_state.name, 'IDLE') - self.assertEqual(result.parameters, { - 'txpower': 10, - 'length': None - }) + self.assertEqual(result.end_state.name, "IDLE") + self.assertEqual(result.parameters, {"txpower": 10, "length": None}) def test_simulation_arg_to_param_map(self): - pta = PTA(parameters=['txpower', 'length']) - pta.add_state('IDLE', power=5) - pta.add_state('TX', power=100) - pta.add_transition('UNINITIALIZED', 'IDLE', 'init', energy=500000, duration=50000) - pta.add_transition('IDLE', 'IDLE', 'setTxPower', energy=10000, duration=120, - arg_to_param_map={0: 'txpower'}) - pta.add_transition('IDLE', 'TX', 'send', energy=3, duration=10) - pta.add_transition('TX', 'IDLE', 'txComplete', timeout=2000, is_interrupt=True) - trace = [ - ['init'], - ['setTxPower', 10] - ] + pta = PTA(parameters=["txpower", "length"]) + pta.add_state("IDLE", power=5) + pta.add_state("TX", power=100) + pta.add_transition( + "UNINITIALIZED", "IDLE", "init", energy=500000, duration=50000 + ) + pta.add_transition( + "IDLE", + "IDLE", + "setTxPower", + energy=10000, + duration=120, + arg_to_param_map={0: "txpower"}, + ) + pta.add_transition("IDLE", "TX", "send", energy=3, duration=10) + pta.add_transition("TX", "IDLE", "txComplete", timeout=2000, is_interrupt=True) + trace = [["init"], ["setTxPower", 10]] expected_energy = 510000 expected_duration = 50120 result = pta.simulate(trace) self.assertAlmostEqual(result.energy, expected_energy * 1e-12, places=12) self.assertAlmostEqual(result.duration, expected_duration * 1e-6, places=6) - self.assertEqual(result.end_state.name, 'IDLE') - self.assertEqual(result.parameters, { - 'txpower': 10, - 'length': None - }) + self.assertEqual(result.end_state.name, "IDLE") + self.assertEqual(result.parameters, {"txpower": 10, "length": None}) def test_simulation_set_param(self): - pta = PTA(parameters=['txpower', 'length']) - pta.add_state('IDLE', power=5) - pta.add_state('TX', power=100) - pta.add_transition('UNINITIALIZED', 'IDLE', 'init', energy=500000, duration=50000, set_param={'txpower': 10}) + pta = PTA(parameters=["txpower", "length"]) + pta.add_state("IDLE", power=5) + pta.add_state("TX", power=100) + pta.add_transition( + "UNINITIALIZED", + "IDLE", + "init", + energy=500000, + duration=50000, + set_param={"txpower": 10}, + ) trace = [ - ['init'], + ["init"], ] expected_energy = 500000 expected_duration = 50000 result = pta.simulate(trace) self.assertAlmostEqual(result.energy, expected_energy * 1e-12, places=12) self.assertAlmostEqual(result.duration, expected_duration * 1e-6, places=6) - self.assertEqual(result.end_state.name, 'IDLE') - self.assertEqual(result.parameters, { - 'txpower': 10, - 'length': None - }) + self.assertEqual(result.end_state.name, "IDLE") + self.assertEqual(result.parameters, {"txpower": 10, "length": 
None}) def test_simulation_arg_function(self): - pta = PTA(parameters=['txpower', 'length']) - pta.add_state('IDLE', power=5) - pta.add_state('TX', power=100) - pta.add_transition('UNINITIALIZED', 'IDLE', 'init', energy=500000, duration=50000) - pta.add_transition('IDLE', 'IDLE', 'setTxPower', energy=10000, duration=120, - param_update_function=lambda param, arg: {**param, 'txpower': arg[0]}) - pta.add_transition('IDLE', 'TX', 'send', energy=3, duration=10, - energy_function=lambda param, arg: 3 + 5 * arg[1], - duration_function=lambda param, arg: 48 + 8 * arg[1]) - pta.add_transition('TX', 'IDLE', 'txComplete', timeout=2000, is_interrupt=True) + pta = PTA(parameters=["txpower", "length"]) + pta.add_state("IDLE", power=5) + pta.add_state("TX", power=100) + pta.add_transition( + "UNINITIALIZED", "IDLE", "init", energy=500000, duration=50000 + ) + pta.add_transition( + "IDLE", + "IDLE", + "setTxPower", + energy=10000, + duration=120, + param_update_function=lambda param, arg: {**param, "txpower": arg[0]}, + ) + pta.add_transition( + "IDLE", + "TX", + "send", + energy=3, + duration=10, + energy_function=lambda param, arg: 3 + 5 * arg[1], + duration_function=lambda param, arg: 48 + 8 * arg[1], + ) + pta.add_transition("TX", "IDLE", "txComplete", timeout=2000, is_interrupt=True) trace = [ - ['init'], - ['setTxPower', 10], - ['send', 'foo', 3], + ["init"], + ["setTxPower", 10], + ["send", "foo", 3], ] expected_energy = 500000 + 10000 + (3 + 5 * 3) + (2000 * 100) expected_duration = 50000 + 120 + (48 + 8 * 3) + 2000 result = pta.simulate(trace) self.assertAlmostEqual(result.energy, expected_energy * 1e-12, places=12) self.assertAlmostEqual(result.duration, expected_duration * 1e-6, places=6) - self.assertEqual(result.end_state.name, 'IDLE') - self.assertEqual(result.parameters, { - 'txpower': 10, - 'length': None - }) - - pta = PTA(parameters=['txpower', 'length']) - pta.add_state('IDLE', power=5) - pta.add_state('TX', power=100) - pta.add_transition('UNINITIALIZED', 'IDLE', 'init', energy=500000, duration=50000) - pta.add_transition('IDLE', 'IDLE', 'setTxPower', energy=10000, duration=120, - param_update_function=lambda param, arg: {**param, 'txpower': arg[0]}) - pta.add_transition('IDLE', 'TX', 'send', energy=3, duration=10, - energy_function=lambda param, arg: 3 + 5 * arg[1], - duration_function=lambda param, arg: 48 + 8 * arg[1]) - pta.add_transition('TX', 'IDLE', 'txComplete', timeout=2000, is_interrupt=True) + self.assertEqual(result.end_state.name, "IDLE") + self.assertEqual(result.parameters, {"txpower": 10, "length": None}) + + pta = PTA(parameters=["txpower", "length"]) + pta.add_state("IDLE", power=5) + pta.add_state("TX", power=100) + pta.add_transition( + "UNINITIALIZED", "IDLE", "init", energy=500000, duration=50000 + ) + pta.add_transition( + "IDLE", + "IDLE", + "setTxPower", + energy=10000, + duration=120, + param_update_function=lambda param, arg: {**param, "txpower": arg[0]}, + ) + pta.add_transition( + "IDLE", + "TX", + "send", + energy=3, + duration=10, + energy_function=lambda param, arg: 3 + 5 * arg[1], + duration_function=lambda param, arg: 48 + 8 * arg[1], + ) + pta.add_transition("TX", "IDLE", "txComplete", timeout=2000, is_interrupt=True) trace = [ - ['init'], - ['setTxPower', 10], - ['send', 'foobar', 6], + ["init"], + ["setTxPower", 10], + ["send", "foobar", 6], ] expected_energy = 500000 + 10000 + (3 + 5 * 6) + (2000 * 100) expected_duration = 50000 + 120 + (48 + 8 * 6) + 2000 result = pta.simulate(trace) self.assertAlmostEqual(result.energy, expected_energy * 1e-12, 
places=12) self.assertAlmostEqual(result.duration, expected_duration * 1e-6, places=6) - self.assertEqual(result.end_state.name, 'IDLE') - self.assertEqual(result.parameters, { - 'txpower': 10, - 'length': None - }) + self.assertEqual(result.end_state.name, "IDLE") + self.assertEqual(result.parameters, {"txpower": 10, "length": None}) def test_simulation_param_function(self): - pta = PTA(parameters=['length', 'txpower']) - pta.add_state('IDLE', power=5) - pta.add_state('TX', power=100, - power_function=lambda param, arg: 1000 + 2 * param[1]) - pta.add_transition('UNINITIALIZED', 'IDLE', 'init', energy=500000, duration=50000) - pta.add_transition('IDLE', 'IDLE', 'setTxPower', energy=10000, duration=120, - param_update_function=lambda param, arg: {**param, 'txpower': arg[0]}) - pta.add_transition('IDLE', 'TX', 'send', energy=3, duration=10, - energy_function=lambda param, arg: 3 + 5 * arg[1], - param_update_function=lambda param, arg: {**param, 'length': arg[1]}) - pta.add_transition('TX', 'IDLE', 'txComplete', timeout=2000, is_interrupt=True, - timeout_function=lambda param, arg: 500 + 16 * param[0]) + pta = PTA(parameters=["length", "txpower"]) + pta.add_state("IDLE", power=5) + pta.add_state( + "TX", power=100, power_function=lambda param, arg: 1000 + 2 * param[1] + ) + pta.add_transition( + "UNINITIALIZED", "IDLE", "init", energy=500000, duration=50000 + ) + pta.add_transition( + "IDLE", + "IDLE", + "setTxPower", + energy=10000, + duration=120, + param_update_function=lambda param, arg: {**param, "txpower": arg[0]}, + ) + pta.add_transition( + "IDLE", + "TX", + "send", + energy=3, + duration=10, + energy_function=lambda param, arg: 3 + 5 * arg[1], + param_update_function=lambda param, arg: {**param, "length": arg[1]}, + ) + pta.add_transition( + "TX", + "IDLE", + "txComplete", + timeout=2000, + is_interrupt=True, + timeout_function=lambda param, arg: 500 + 16 * param[0], + ) trace = [ - ['init'], - ['setTxPower', 10], - ['send', 'foo', 3], + ["init"], + ["setTxPower", 10], + ["send", "foo", 3], ] - expected_energy = 500000 + 10000 + (3 + 5 * 3) + (1000 + 2 * 10) * (500 + 16 * 3) + expected_energy = ( + 500000 + 10000 + (3 + 5 * 3) + (1000 + 2 * 10) * (500 + 16 * 3) + ) expected_duration = 50000 + 120 + 10 + (500 + 16 * 3) result = pta.simulate(trace) self.assertAlmostEqual(result.energy, expected_energy * 1e-12, places=12) self.assertAlmostEqual(result.duration, expected_duration * 1e-6, places=6) - self.assertEqual(result.end_state.name, 'IDLE') - self.assertEqual(result.parameters, { - 'txpower': 10, - 'length': 3 - }) + self.assertEqual(result.end_state.name, "IDLE") + self.assertEqual(result.parameters, {"txpower": 10, "length": 3}) def test_get_X_expensive_state(self): pta = PTA.from_json(example_json_1) - self.assertEqual(pta.get_least_expensive_state(), pta.state['IDLE']) - self.assertEqual(pta.get_most_expensive_state(), pta.state['TX']) + self.assertEqual(pta.get_least_expensive_state(), pta.state["IDLE"]) + self.assertEqual(pta.get_most_expensive_state(), pta.state["TX"]) # self.assertAlmostEqual(pta.min_duration_until_energy_overflow(), (2**32 - 1) * 1e-12 / 10e-3, places=9) # self.assertAlmostEqual(pta.min_duration_until_energy_overflow(energy_granularity=1e-9), (2**32 - 1) * 1e-9 / 10e-3, places=9) - self.assertAlmostEqual(pta.max_duration_until_energy_overflow(), (2**32 - 1) * 1e-12 / 5e-6, places=9) - self.assertAlmostEqual(pta.max_duration_until_energy_overflow(energy_granularity=1e-9), (2**32 - 1) * 1e-9 / 5e-6, places=9) + self.assertAlmostEqual( + 
pta.max_duration_until_energy_overflow(), + (2 ** 32 - 1) * 1e-12 / 5e-6, + places=9, + ) + self.assertAlmostEqual( + pta.max_duration_until_energy_overflow(energy_granularity=1e-9), + (2 ** 32 - 1) * 1e-9 / 5e-6, + places=9, + ) -if __name__ == '__main__': +if __name__ == "__main__": unittest.main() diff --git a/test/test_ptamodel.py b/test/test_ptamodel.py index 7e398bd..3237450 100755 --- a/test/test_ptamodel.py +++ b/test/test_ptamodel.py @@ -8,241 +8,384 @@ import pytest class TestModels(unittest.TestCase): def test_model_singlefile_rf24(self): - raw_data = RawData(['test-data/20170220_164723_RF24_int_A.tar']) + raw_data = RawData(["test-data/20170220_164723_RF24_int_A.tar"]) preprocessed_data = raw_data.get_preprocessed_data() by_name, parameters, arg_count = pta_trace_to_aggregate(preprocessed_data) model = PTAModel(by_name, parameters, arg_count) - self.assertEqual(model.states(), 'POWERDOWN RX STANDBY1 TX'.split(' ')) - self.assertEqual(model.transitions(), 'begin epilogue powerDown powerUp setDataRate_num setPALevel_num startListening stopListening write_nb'.split(' ')) + self.assertEqual(model.states(), "POWERDOWN RX STANDBY1 TX".split(" ")) + self.assertEqual( + model.transitions(), + "begin epilogue powerDown powerUp setDataRate_num setPALevel_num startListening stopListening write_nb".split( + " " + ), + ) static_model = model.get_static() - self.assertAlmostEqual(static_model('POWERDOWN', 'power'), 0, places=0) - self.assertAlmostEqual(static_model('RX', 'power'), 52254, places=0) - self.assertAlmostEqual(static_model('STANDBY1', 'power'), 7, places=0) - self.assertAlmostEqual(static_model('TX', 'power'), 18414, places=0) - self.assertAlmostEqual(static_model('begin', 'energy'), 1652249, places=0) - self.assertAlmostEqual(static_model('epilogue', 'energy'), 15449, places=0) - self.assertAlmostEqual(static_model('powerDown', 'energy'), 4547, places=0) - self.assertAlmostEqual(static_model('powerUp', 'energy'), 1641765, places=0) - self.assertAlmostEqual(static_model('setDataRate_num', 'energy'), 7749, places=0) - self.assertAlmostEqual(static_model('setPALevel_num', 'energy'), 4700, places=0) - self.assertAlmostEqual(static_model('startListening', 'energy'), 4309602, places=0) - self.assertAlmostEqual(static_model('stopListening', 'energy'), 193775, places=0) - self.assertAlmostEqual(static_model('write_nb', 'energy'), 218339, places=0) - self.assertAlmostEqual(static_model('begin', 'rel_energy_prev'), 1649571, places=0) - self.assertAlmostEqual(static_model('epilogue', 'rel_energy_prev'), -744114, places=0) - self.assertAlmostEqual(static_model('powerDown', 'rel_energy_prev'), 3854, places=0) - self.assertAlmostEqual(static_model('powerUp', 'rel_energy_prev'), 1641381, places=0) - self.assertAlmostEqual(static_model('setDataRate_num', 'rel_energy_prev'), 6777, places=0) - self.assertAlmostEqual(static_model('setPALevel_num', 'rel_energy_prev'), 3728, places=0) - self.assertAlmostEqual(static_model('startListening', 'rel_energy_prev'), 4307769, places=0) - self.assertAlmostEqual(static_model('stopListening', 'rel_energy_prev'), -13533693, places=0) - self.assertAlmostEqual(static_model('write_nb', 'rel_energy_prev'), 214618, places=0) - self.assertAlmostEqual(static_model('begin', 'duration'), 19830, places=0) - self.assertAlmostEqual(static_model('epilogue', 'duration'), 40, places=0) - self.assertAlmostEqual(static_model('powerDown', 'duration'), 90, places=0) - self.assertAlmostEqual(static_model('powerUp', 'duration'), 10030, places=0) - 
self.assertAlmostEqual(static_model('setDataRate_num', 'duration'), 140, places=0) - self.assertAlmostEqual(static_model('setPALevel_num', 'duration'), 90, places=0) - self.assertAlmostEqual(static_model('startListening', 'duration'), 260, places=0) - self.assertAlmostEqual(static_model('stopListening', 'duration'), 260, places=0) - self.assertAlmostEqual(static_model('write_nb', 'duration'), 510, places=0) - - self.assertAlmostEqual(model.stats.param_dependence_ratio('POWERDOWN', 'power', 'datarate'), 0, places=2) - self.assertAlmostEqual(model.stats.param_dependence_ratio('POWERDOWN', 'power', 'txbytes'), 0, places=2) - self.assertAlmostEqual(model.stats.param_dependence_ratio('POWERDOWN', 'power', 'txpower'), 0, places=2) - self.assertAlmostEqual(model.stats.param_dependence_ratio('RX', 'power', 'datarate'), 0.99, places=2) - self.assertAlmostEqual(model.stats.param_dependence_ratio('RX', 'power', 'txbytes'), 0, places=2) - self.assertAlmostEqual(model.stats.param_dependence_ratio('RX', 'power', 'txpower'), 0.01, places=2) - self.assertAlmostEqual(model.stats.param_dependence_ratio('STANDBY1', 'power', 'datarate'), 0.04, places=2) - self.assertAlmostEqual(model.stats.param_dependence_ratio('STANDBY1', 'power', 'txbytes'), 0.35, places=2) - self.assertAlmostEqual(model.stats.param_dependence_ratio('STANDBY1', 'power', 'txpower'), 0.32, places=2) - self.assertAlmostEqual(model.stats.param_dependence_ratio('TX', 'power', 'datarate'), 1, places=2) - self.assertAlmostEqual(model.stats.param_dependence_ratio('TX', 'power', 'txbytes'), 0.09, places=2) - self.assertAlmostEqual(model.stats.param_dependence_ratio('TX', 'power', 'txpower'), 1, places=2) + self.assertAlmostEqual(static_model("POWERDOWN", "power"), 0, places=0) + self.assertAlmostEqual(static_model("RX", "power"), 52254, places=0) + self.assertAlmostEqual(static_model("STANDBY1", "power"), 7, places=0) + self.assertAlmostEqual(static_model("TX", "power"), 18414, places=0) + self.assertAlmostEqual(static_model("begin", "energy"), 1652249, places=0) + self.assertAlmostEqual(static_model("epilogue", "energy"), 15449, places=0) + self.assertAlmostEqual(static_model("powerDown", "energy"), 4547, places=0) + self.assertAlmostEqual(static_model("powerUp", "energy"), 1641765, places=0) + self.assertAlmostEqual( + static_model("setDataRate_num", "energy"), 7749, places=0 + ) + self.assertAlmostEqual(static_model("setPALevel_num", "energy"), 4700, places=0) + self.assertAlmostEqual( + static_model("startListening", "energy"), 4309602, places=0 + ) + self.assertAlmostEqual( + static_model("stopListening", "energy"), 193775, places=0 + ) + self.assertAlmostEqual(static_model("write_nb", "energy"), 218339, places=0) + self.assertAlmostEqual( + static_model("begin", "rel_energy_prev"), 1649571, places=0 + ) + self.assertAlmostEqual( + static_model("epilogue", "rel_energy_prev"), -744114, places=0 + ) + self.assertAlmostEqual( + static_model("powerDown", "rel_energy_prev"), 3854, places=0 + ) + self.assertAlmostEqual( + static_model("powerUp", "rel_energy_prev"), 1641381, places=0 + ) + self.assertAlmostEqual( + static_model("setDataRate_num", "rel_energy_prev"), 6777, places=0 + ) + self.assertAlmostEqual( + static_model("setPALevel_num", "rel_energy_prev"), 3728, places=0 + ) + self.assertAlmostEqual( + static_model("startListening", "rel_energy_prev"), 4307769, places=0 + ) + self.assertAlmostEqual( + static_model("stopListening", "rel_energy_prev"), -13533693, places=0 + ) + self.assertAlmostEqual( + static_model("write_nb", 
"rel_energy_prev"), 214618, places=0 + ) + self.assertAlmostEqual(static_model("begin", "duration"), 19830, places=0) + self.assertAlmostEqual(static_model("epilogue", "duration"), 40, places=0) + self.assertAlmostEqual(static_model("powerDown", "duration"), 90, places=0) + self.assertAlmostEqual(static_model("powerUp", "duration"), 10030, places=0) + self.assertAlmostEqual( + static_model("setDataRate_num", "duration"), 140, places=0 + ) + self.assertAlmostEqual(static_model("setPALevel_num", "duration"), 90, places=0) + self.assertAlmostEqual( + static_model("startListening", "duration"), 260, places=0 + ) + self.assertAlmostEqual(static_model("stopListening", "duration"), 260, places=0) + self.assertAlmostEqual(static_model("write_nb", "duration"), 510, places=0) + + self.assertAlmostEqual( + model.stats.param_dependence_ratio("POWERDOWN", "power", "datarate"), + 0, + places=2, + ) + self.assertAlmostEqual( + model.stats.param_dependence_ratio("POWERDOWN", "power", "txbytes"), + 0, + places=2, + ) + self.assertAlmostEqual( + model.stats.param_dependence_ratio("POWERDOWN", "power", "txpower"), + 0, + places=2, + ) + self.assertAlmostEqual( + model.stats.param_dependence_ratio("RX", "power", "datarate"), + 0.99, + places=2, + ) + self.assertAlmostEqual( + model.stats.param_dependence_ratio("RX", "power", "txbytes"), 0, places=2 + ) + self.assertAlmostEqual( + model.stats.param_dependence_ratio("RX", "power", "txpower"), 0.01, places=2 + ) + self.assertAlmostEqual( + model.stats.param_dependence_ratio("STANDBY1", "power", "datarate"), + 0.04, + places=2, + ) + self.assertAlmostEqual( + model.stats.param_dependence_ratio("STANDBY1", "power", "txbytes"), + 0.35, + places=2, + ) + self.assertAlmostEqual( + model.stats.param_dependence_ratio("STANDBY1", "power", "txpower"), + 0.32, + places=2, + ) + self.assertAlmostEqual( + model.stats.param_dependence_ratio("TX", "power", "datarate"), 1, places=2 + ) + self.assertAlmostEqual( + model.stats.param_dependence_ratio("TX", "power", "txbytes"), 0.09, places=2 + ) + self.assertAlmostEqual( + model.stats.param_dependence_ratio("TX", "power", "txpower"), 1, places=2 + ) param_model, param_info = model.get_fitted() - self.assertEqual(param_info('POWERDOWN', 'power'), None) - self.assertEqual(param_info('RX', 'power')['function']._model_str, - '0 + regression_arg(0) + regression_arg(1) * np.sqrt(parameter(datarate))') - self.assertAlmostEqual(param_info('RX', 'power')['function']._regression_args[0], 48530.7, places=0) - self.assertAlmostEqual(param_info('RX', 'power')['function']._regression_args[1], 117, places=0) - self.assertEqual(param_info('STANDBY1', 'power'), None) - self.assertEqual(param_info('TX', 'power')['function']._model_str, - '0 + regression_arg(0) + regression_arg(1) * 1/(parameter(datarate)) + regression_arg(2) * parameter(txpower) + regression_arg(3) * 1/(parameter(datarate)) * parameter(txpower)') - self.assertEqual(param_info('epilogue', 'timeout')['function']._model_str, - '0 + regression_arg(0) + regression_arg(1) * 1/(parameter(datarate))') - self.assertEqual(param_info('stopListening', 'duration')['function']._model_str, - '0 + regression_arg(0) + regression_arg(1) * 1/(parameter(datarate))') - - self.assertAlmostEqual(param_model('RX', 'power', param=[1, None, None]), 48647, places=-1) + self.assertEqual(param_info("POWERDOWN", "power"), None) + self.assertEqual( + param_info("RX", "power")["function"]._model_str, + "0 + regression_arg(0) + regression_arg(1) * np.sqrt(parameter(datarate))", + ) + self.assertAlmostEqual( + 
param_info("RX", "power")["function"]._regression_args[0], 48530.7, places=0 + ) + self.assertAlmostEqual( + param_info("RX", "power")["function"]._regression_args[1], 117, places=0 + ) + self.assertEqual(param_info("STANDBY1", "power"), None) + self.assertEqual( + param_info("TX", "power")["function"]._model_str, + "0 + regression_arg(0) + regression_arg(1) * 1/(parameter(datarate)) + regression_arg(2) * parameter(txpower) + regression_arg(3) * 1/(parameter(datarate)) * parameter(txpower)", + ) + self.assertEqual( + param_info("epilogue", "timeout")["function"]._model_str, + "0 + regression_arg(0) + regression_arg(1) * 1/(parameter(datarate))", + ) + self.assertEqual( + param_info("stopListening", "duration")["function"]._model_str, + "0 + regression_arg(0) + regression_arg(1) * 1/(parameter(datarate))", + ) + + self.assertAlmostEqual( + param_model("RX", "power", param=[1, None, None]), 48647, places=-1 + ) def test_model_singlefile_mmparam(self): - raw_data = RawData(['test-data/20161221_123347_mmparam.tar']) + raw_data = RawData(["test-data/20161221_123347_mmparam.tar"]) preprocessed_data = raw_data.get_preprocessed_data() by_name, parameters, arg_count = pta_trace_to_aggregate(preprocessed_data) model = PTAModel(by_name, parameters, arg_count) - self.assertEqual(model.states(), 'OFF ON'.split(' ')) - self.assertEqual(model.transitions(), 'off setBrightness'.split(' ')) + self.assertEqual(model.states(), "OFF ON".split(" ")) + self.assertEqual(model.transitions(), "off setBrightness".split(" ")) static_model = model.get_static() - self.assertAlmostEqual(static_model('OFF', 'power'), 7124, places=0) - self.assertAlmostEqual(static_model('ON', 'power'), 17866, places=0) - self.assertAlmostEqual(static_model('off', 'energy'), 268079197, places=0) - self.assertAlmostEqual(static_model('setBrightness', 'energy'), 168912773, places=0) - self.assertAlmostEqual(static_model('off', 'rel_energy_prev'), 105040198, places=0) - self.assertAlmostEqual(static_model('setBrightness', 'rel_energy_prev'), 103745586, places=0) - self.assertAlmostEqual(static_model('off', 'duration'), 9130, places=0) - self.assertAlmostEqual(static_model('setBrightness', 'duration'), 9130, places=0) + self.assertAlmostEqual(static_model("OFF", "power"), 7124, places=0) + self.assertAlmostEqual(static_model("ON", "power"), 17866, places=0) + self.assertAlmostEqual(static_model("off", "energy"), 268079197, places=0) + self.assertAlmostEqual( + static_model("setBrightness", "energy"), 168912773, places=0 + ) + self.assertAlmostEqual( + static_model("off", "rel_energy_prev"), 105040198, places=0 + ) + self.assertAlmostEqual( + static_model("setBrightness", "rel_energy_prev"), 103745586, places=0 + ) + self.assertAlmostEqual(static_model("off", "duration"), 9130, places=0) + self.assertAlmostEqual( + static_model("setBrightness", "duration"), 9130, places=0 + ) param_lut_model = model.get_param_lut() - self.assertAlmostEqual(param_lut_model('OFF', 'power', param=[None, None]), 7124, places=0) + self.assertAlmostEqual( + param_lut_model("OFF", "power", param=[None, None]), 7124, places=0 + ) with self.assertRaises(KeyError): - param_lut_model('ON', 'power', param=[None, None]) - param_lut_model('ON', 'power', param=['a']) - param_lut_model('ON', 'power', param=[0]) - self.assertTrue(param_lut_model('ON', 'power', param=[0, 0])) + param_lut_model("ON", "power", param=[None, None]) + param_lut_model("ON", "power", param=["a"]) + param_lut_model("ON", "power", param=[0]) + self.assertTrue(param_lut_model("ON", "power", param=[0, 
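+                # unlike the lookups above, [0, 0] was actually measured,
+                # so this LUT lookup succeeds: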
0])) param_lut_model = model.get_param_lut(fallback=True) - self.assertAlmostEqual(param_lut_model('ON', 'power', param=[None, None]), 17866, places=0) + self.assertAlmostEqual( + param_lut_model("ON", "power", param=[None, None]), 17866, places=0 + ) def test_model_multifile_lm75x(self): testfiles = [ - 'test-data/20170116_124500_LM75x.tar', - 'test-data/20170116_131306_LM75x.tar', + "test-data/20170116_124500_LM75x.tar", + "test-data/20170116_131306_LM75x.tar", ] raw_data = RawData(testfiles) preprocessed_data = raw_data.get_preprocessed_data() by_name, parameters, arg_count = pta_trace_to_aggregate(preprocessed_data) model = PTAModel(by_name, parameters, arg_count) - self.assertEqual(model.states(), 'ACTIVE POWEROFF'.split(' ')) - self.assertEqual(model.transitions(), 'getTemp setHyst setOS shutdown start'.split(' ')) + self.assertEqual(model.states(), "ACTIVE POWEROFF".split(" ")) + self.assertEqual( + model.transitions(), "getTemp setHyst setOS shutdown start".split(" ") + ) static_model = model.get_static() - self.assertAlmostEqual(static_model('ACTIVE', 'power'), 332, places=0) - self.assertAlmostEqual(static_model('POWEROFF', 'power'), 7, places=0) - self.assertAlmostEqual(static_model('getTemp', 'energy'), 26016748, places=0) - self.assertAlmostEqual(static_model('setHyst', 'energy'), 22082226, places=0) - self.assertAlmostEqual(static_model('setOS', 'energy'), 21774238, places=0) - self.assertAlmostEqual(static_model('shutdown', 'energy'), 11808160, places=0) - self.assertAlmostEqual(static_model('start', 'energy'), 12445302, places=0) - self.assertAlmostEqual(static_model('getTemp', 'rel_energy_prev'), 21722720, places=0) - self.assertAlmostEqual(static_model('setHyst', 'rel_energy_prev'), 19001499, places=0) - self.assertAlmostEqual(static_model('setOS', 'rel_energy_prev'), 18693283, places=0) - self.assertAlmostEqual(static_model('shutdown', 'rel_energy_prev'), 11746224, places=0) - self.assertAlmostEqual(static_model('start', 'rel_energy_prev'), 12391462, places=0) - self.assertAlmostEqual(static_model('getTemp', 'duration'), 12740, places=0) - self.assertAlmostEqual(static_model('setHyst', 'duration'), 9140, places=0) - self.assertAlmostEqual(static_model('setOS', 'duration'), 9140, places=0) - self.assertAlmostEqual(static_model('shutdown', 'duration'), 6980, places=0) - self.assertAlmostEqual(static_model('start', 'duration'), 6980, places=0) + self.assertAlmostEqual(static_model("ACTIVE", "power"), 332, places=0) + self.assertAlmostEqual(static_model("POWEROFF", "power"), 7, places=0) + self.assertAlmostEqual(static_model("getTemp", "energy"), 26016748, places=0) + self.assertAlmostEqual(static_model("setHyst", "energy"), 22082226, places=0) + self.assertAlmostEqual(static_model("setOS", "energy"), 21774238, places=0) + self.assertAlmostEqual(static_model("shutdown", "energy"), 11808160, places=0) + self.assertAlmostEqual(static_model("start", "energy"), 12445302, places=0) + self.assertAlmostEqual( + static_model("getTemp", "rel_energy_prev"), 21722720, places=0 + ) + self.assertAlmostEqual( + static_model("setHyst", "rel_energy_prev"), 19001499, places=0 + ) + self.assertAlmostEqual( + static_model("setOS", "rel_energy_prev"), 18693283, places=0 + ) + self.assertAlmostEqual( + static_model("shutdown", "rel_energy_prev"), 11746224, places=0 + ) + self.assertAlmostEqual( + static_model("start", "rel_energy_prev"), 12391462, places=0 + ) + self.assertAlmostEqual(static_model("getTemp", "duration"), 12740, places=0) + self.assertAlmostEqual(static_model("setHyst", 
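+            # setHyst and setOS presumably issue the same kind of register
+            # write; their durations and energies are nearly identical: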
"duration"), 9140, places=0) + self.assertAlmostEqual(static_model("setOS", "duration"), 9140, places=0) + self.assertAlmostEqual(static_model("shutdown", "duration"), 6980, places=0) + self.assertAlmostEqual(static_model("start", "duration"), 6980, places=0) def test_model_multifile_sharp(self): testfiles = [ - 'test-data/20170116_145420_sharpLS013B4DN.tar', - 'test-data/20170116_151348_sharpLS013B4DN.tar', + "test-data/20170116_145420_sharpLS013B4DN.tar", + "test-data/20170116_151348_sharpLS013B4DN.tar", ] raw_data = RawData(testfiles) preprocessed_data = raw_data.get_preprocessed_data() by_name, parameters, arg_count = pta_trace_to_aggregate(preprocessed_data) model = PTAModel(by_name, parameters, arg_count) - self.assertEqual(model.states(), 'DISABLED ENABLED'.split(' ')) - self.assertEqual(model.transitions(), 'clear disable enable ioInit sendLine toggleVCOM'.split(' ')) + self.assertEqual(model.states(), "DISABLED ENABLED".split(" ")) + self.assertEqual( + model.transitions(), + "clear disable enable ioInit sendLine toggleVCOM".split(" "), + ) static_model = model.get_static() - self.assertAlmostEqual(static_model('DISABLED', 'power'), 22, places=0) - self.assertAlmostEqual(static_model('ENABLED', 'power'), 24, places=0) - self.assertAlmostEqual(static_model('clear', 'energy'), 14059, places=0) - self.assertAlmostEqual(static_model('disable', 'energy'), 0, places=0) - self.assertAlmostEqual(static_model('enable', 'energy'), 0, places=0) - self.assertAlmostEqual(static_model('ioInit', 'energy'), 0, places=0) - self.assertAlmostEqual(static_model('sendLine', 'energy'), 37874, places=0) - self.assertAlmostEqual(static_model('toggleVCOM', 'energy'), 30991, places=0) - self.assertAlmostEqual(static_model('clear', 'rel_energy_prev'), 13329, places=0) - self.assertAlmostEqual(static_model('disable', 'rel_energy_prev'), 0, places=0) - self.assertAlmostEqual(static_model('enable', 'rel_energy_prev'), 0, places=0) - self.assertAlmostEqual(static_model('ioInit', 'rel_energy_prev'), 0, places=0) - self.assertAlmostEqual(static_model('sendLine', 'rel_energy_prev'), 33447, places=0) - self.assertAlmostEqual(static_model('toggleVCOM', 'rel_energy_prev'), 30242, places=0) - self.assertAlmostEqual(static_model('clear', 'duration'), 30, places=0) - self.assertAlmostEqual(static_model('disable', 'duration'), 0, places=0) - self.assertAlmostEqual(static_model('enable', 'duration'), 0, places=0) - self.assertAlmostEqual(static_model('ioInit', 'duration'), 0, places=0) - self.assertAlmostEqual(static_model('sendLine', 'duration'), 180, places=0) - self.assertAlmostEqual(static_model('toggleVCOM', 'duration'), 30, places=0) + self.assertAlmostEqual(static_model("DISABLED", "power"), 22, places=0) + self.assertAlmostEqual(static_model("ENABLED", "power"), 24, places=0) + self.assertAlmostEqual(static_model("clear", "energy"), 14059, places=0) + self.assertAlmostEqual(static_model("disable", "energy"), 0, places=0) + self.assertAlmostEqual(static_model("enable", "energy"), 0, places=0) + self.assertAlmostEqual(static_model("ioInit", "energy"), 0, places=0) + self.assertAlmostEqual(static_model("sendLine", "energy"), 37874, places=0) + self.assertAlmostEqual(static_model("toggleVCOM", "energy"), 30991, places=0) + self.assertAlmostEqual( + static_model("clear", "rel_energy_prev"), 13329, places=0 + ) + self.assertAlmostEqual(static_model("disable", "rel_energy_prev"), 0, places=0) + self.assertAlmostEqual(static_model("enable", "rel_energy_prev"), 0, places=0) + self.assertAlmostEqual(static_model("ioInit", 
"rel_energy_prev"), 0, places=0) + self.assertAlmostEqual( + static_model("sendLine", "rel_energy_prev"), 33447, places=0 + ) + self.assertAlmostEqual( + static_model("toggleVCOM", "rel_energy_prev"), 30242, places=0 + ) + self.assertAlmostEqual(static_model("clear", "duration"), 30, places=0) + self.assertAlmostEqual(static_model("disable", "duration"), 0, places=0) + self.assertAlmostEqual(static_model("enable", "duration"), 0, places=0) + self.assertAlmostEqual(static_model("ioInit", "duration"), 0, places=0) + self.assertAlmostEqual(static_model("sendLine", "duration"), 180, places=0) + self.assertAlmostEqual(static_model("toggleVCOM", "duration"), 30, places=0) def test_model_multifile_mmstatic(self): testfiles = [ - 'test-data/20170116_143516_mmstatic.tar', - 'test-data/20170116_142654_mmstatic.tar', + "test-data/20170116_143516_mmstatic.tar", + "test-data/20170116_142654_mmstatic.tar", ] raw_data = RawData(testfiles) preprocessed_data = raw_data.get_preprocessed_data() by_name, parameters, arg_count = pta_trace_to_aggregate(preprocessed_data) model = PTAModel(by_name, parameters, arg_count) - self.assertEqual(model.states(), 'B G OFF R'.split(' ')) - self.assertEqual(model.transitions(), 'blue green off red'.split(' ')) + self.assertEqual(model.states(), "B G OFF R".split(" ")) + self.assertEqual(model.transitions(), "blue green off red".split(" ")) static_model = model.get_static() - self.assertAlmostEqual(static_model('B', 'power'), 29443, places=0) - self.assertAlmostEqual(static_model('G', 'power'), 29432, places=0) - self.assertAlmostEqual(static_model('OFF', 'power'), 7057, places=0) - self.assertAlmostEqual(static_model('R', 'power'), 49068, places=0) - self.assertAlmostEqual(static_model('blue', 'energy'), 374440955, places=0) - self.assertAlmostEqual(static_model('green', 'energy'), 372026027, places=0) - self.assertAlmostEqual(static_model('off', 'energy'), 372999554, places=0) - self.assertAlmostEqual(static_model('red', 'energy'), 378936634, places=0) - self.assertAlmostEqual(static_model('blue', 'rel_energy_prev'), 105535587, places=0) - self.assertAlmostEqual(static_model('green', 'rel_energy_prev'), 102999371, places=0) - self.assertAlmostEqual(static_model('off', 'rel_energy_prev'), 103613698, places=0) - self.assertAlmostEqual(static_model('red', 'rel_energy_prev'), 110474331, places=0) - self.assertAlmostEqual(static_model('blue', 'duration'), 9140, places=0) - self.assertAlmostEqual(static_model('green', 'duration'), 9140, places=0) - self.assertAlmostEqual(static_model('off', 'duration'), 9140, places=0) - self.assertAlmostEqual(static_model('red', 'duration'), 9140, places=0) - - @pytest.mark.skipif('TEST_SLOW' not in os.environ, reason="slow test, set TEST_SLOW=1 to run") + self.assertAlmostEqual(static_model("B", "power"), 29443, places=0) + self.assertAlmostEqual(static_model("G", "power"), 29432, places=0) + self.assertAlmostEqual(static_model("OFF", "power"), 7057, places=0) + self.assertAlmostEqual(static_model("R", "power"), 49068, places=0) + self.assertAlmostEqual(static_model("blue", "energy"), 374440955, places=0) + self.assertAlmostEqual(static_model("green", "energy"), 372026027, places=0) + self.assertAlmostEqual(static_model("off", "energy"), 372999554, places=0) + self.assertAlmostEqual(static_model("red", "energy"), 378936634, places=0) + self.assertAlmostEqual( + static_model("blue", "rel_energy_prev"), 105535587, places=0 + ) + self.assertAlmostEqual( + static_model("green", "rel_energy_prev"), 102999371, places=0 + ) + self.assertAlmostEqual( 
+ static_model("off", "rel_energy_prev"), 103613698, places=0 + ) + self.assertAlmostEqual( + static_model("red", "rel_energy_prev"), 110474331, places=0 + ) + self.assertAlmostEqual(static_model("blue", "duration"), 9140, places=0) + self.assertAlmostEqual(static_model("green", "duration"), 9140, places=0) + self.assertAlmostEqual(static_model("off", "duration"), 9140, places=0) + self.assertAlmostEqual(static_model("red", "duration"), 9140, places=0) + + @pytest.mark.skipif( + "TEST_SLOW" not in os.environ, reason="slow test, set TEST_SLOW=1 to run" + ) def test_model_multifile_cc1200(self): testfiles = [ - 'test-data/20170125_125433_cc1200.tar', - 'test-data/20170125_142420_cc1200.tar', - 'test-data/20170125_144957_cc1200.tar', - 'test-data/20170125_151149_cc1200.tar', - 'test-data/20170125_151824_cc1200.tar', - 'test-data/20170125_154019_cc1200.tar', + "test-data/20170125_125433_cc1200.tar", + "test-data/20170125_142420_cc1200.tar", + "test-data/20170125_144957_cc1200.tar", + "test-data/20170125_151149_cc1200.tar", + "test-data/20170125_151824_cc1200.tar", + "test-data/20170125_154019_cc1200.tar", ] raw_data = RawData(testfiles) preprocessed_data = raw_data.get_preprocessed_data() by_name, parameters, arg_count = pta_trace_to_aggregate(preprocessed_data) model = PTAModel(by_name, parameters, arg_count) - self.assertEqual(model.states(), 'IDLE RX SLEEP SLEEP_EWOR SYNTH_ON TX XOFF'.split(' ')) - self.assertEqual(model.transitions(), 'crystal_off eWOR idle init prepare_xmit receive send setSymbolRate setTxPower sleep txDone'.split(' ')) + self.assertEqual( + model.states(), "IDLE RX SLEEP SLEEP_EWOR SYNTH_ON TX XOFF".split(" ") + ) + self.assertEqual( + model.transitions(), + "crystal_off eWOR idle init prepare_xmit receive send setSymbolRate setTxPower sleep txDone".split( + " " + ), + ) static_model = model.get_static() - self.assertAlmostEqual(static_model('IDLE', 'power'), 9500, places=0) - self.assertAlmostEqual(static_model('RX', 'power'), 85177, places=0) - self.assertAlmostEqual(static_model('SLEEP', 'power'), 143, places=0) - self.assertAlmostEqual(static_model('SLEEP_EWOR', 'power'), 81801, places=0) - self.assertAlmostEqual(static_model('SYNTH_ON', 'power'), 60036, places=0) - self.assertAlmostEqual(static_model('TX', 'power'), 92461, places=0) - self.assertAlmostEqual(static_model('XOFF', 'power'), 780, places=0) - self.assertAlmostEqual(static_model('crystal_off', 'energy'), 114658, places=0) - self.assertAlmostEqual(static_model('eWOR', 'energy'), 317556, places=0) - self.assertAlmostEqual(static_model('idle', 'energy'), 717713, places=0) - self.assertAlmostEqual(static_model('init', 'energy'), 23028941, places=0) - self.assertAlmostEqual(static_model('prepare_xmit', 'energy'), 378552, places=0) - self.assertAlmostEqual(static_model('receive', 'energy'), 380335, places=0) - self.assertAlmostEqual(static_model('send', 'energy'), 4282597, places=0) - self.assertAlmostEqual(static_model('setSymbolRate', 'energy'), 962060, places=0) - self.assertAlmostEqual(static_model('setTxPower', 'energy'), 288701, places=0) - self.assertAlmostEqual(static_model('sleep', 'energy'), 104445, places=0) - self.assertEqual(static_model('txDone', 'energy'), 0) + self.assertAlmostEqual(static_model("IDLE", "power"), 9500, places=0) + self.assertAlmostEqual(static_model("RX", "power"), 85177, places=0) + self.assertAlmostEqual(static_model("SLEEP", "power"), 143, places=0) + self.assertAlmostEqual(static_model("SLEEP_EWOR", "power"), 81801, places=0) + self.assertAlmostEqual(static_model("SYNTH_ON", 
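+            # state power estimates range from SLEEP (143) up to TX (92461),
+            # a factor of roughly 650: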
"power"), 60036, places=0) + self.assertAlmostEqual(static_model("TX", "power"), 92461, places=0) + self.assertAlmostEqual(static_model("XOFF", "power"), 780, places=0) + self.assertAlmostEqual(static_model("crystal_off", "energy"), 114658, places=0) + self.assertAlmostEqual(static_model("eWOR", "energy"), 317556, places=0) + self.assertAlmostEqual(static_model("idle", "energy"), 717713, places=0) + self.assertAlmostEqual(static_model("init", "energy"), 23028941, places=0) + self.assertAlmostEqual(static_model("prepare_xmit", "energy"), 378552, places=0) + self.assertAlmostEqual(static_model("receive", "energy"), 380335, places=0) + self.assertAlmostEqual(static_model("send", "energy"), 4282597, places=0) + self.assertAlmostEqual( + static_model("setSymbolRate", "energy"), 962060, places=0 + ) + self.assertAlmostEqual(static_model("setTxPower", "energy"), 288701, places=0) + self.assertAlmostEqual(static_model("sleep", "energy"), 104445, places=0) + self.assertEqual(static_model("txDone", "energy"), 0) param_model, param_info = model.get_fitted() - self.assertEqual(param_info('IDLE', 'power'), None) - self.assertEqual(param_info('RX', 'power')['function']._model_str, - '0 + regression_arg(0) + regression_arg(1) * np.log(parameter(symbolrate) + 1)') - self.assertEqual(param_info('SLEEP', 'power'), None) - self.assertEqual(param_info('SLEEP_EWOR', 'power'), None) - self.assertEqual(param_info('SYNTH_ON', 'power'), None) - self.assertEqual(param_info('XOFF', 'power'), None) + self.assertEqual(param_info("IDLE", "power"), None) + self.assertEqual( + param_info("RX", "power")["function"]._model_str, + "0 + regression_arg(0) + regression_arg(1) * np.log(parameter(symbolrate) + 1)", + ) + self.assertEqual(param_info("SLEEP", "power"), None) + self.assertEqual(param_info("SLEEP_EWOR", "power"), None) + self.assertEqual(param_info("SYNTH_ON", "power"), None) + self.assertEqual(param_info("XOFF", "power"), None) - self.assertAlmostEqual(param_info('RX', 'power')['function']._regression_args[0], 84415, places=0) - self.assertAlmostEqual(param_info('RX', 'power')['function']._regression_args[1], 206, places=0) + self.assertAlmostEqual( + param_info("RX", "power")["function"]._regression_args[0], 84415, places=0 + ) + self.assertAlmostEqual( + param_info("RX", "power")["function"]._regression_args[1], 206, places=0 + ) -if __name__ == '__main__': +if __name__ == "__main__": unittest.main() diff --git a/test/test_timingharness.py b/test/test_timingharness.py index 9c49b46..29e21f8 100755 --- a/test/test_timingharness.py +++ b/test/test_timingharness.py @@ -7,89 +7,164 @@ import unittest class TestModels(unittest.TestCase): def test_model_singlefile_rf24(self): - raw_data = TimingData(['test-data/20190815_111745_nRF24_no-rx.json']) + raw_data = TimingData(["test-data/20190815_111745_nRF24_no-rx.json"]) preprocessed_data = raw_data.get_preprocessed_data() by_name, parameters, arg_count = pta_trace_to_aggregate(preprocessed_data) model = AnalyticModel(by_name, parameters, arg_count) - self.assertEqual(model.names, 'setPALevel setRetries setup write'.split(' ')) + self.assertEqual(model.names, "setPALevel setRetries setup write".split(" ")) static_model = model.get_static() - self.assertAlmostEqual(static_model('setPALevel', 'duration'), 146, places=0) - self.assertAlmostEqual(static_model('setRetries', 'duration'), 73, places=0) - self.assertAlmostEqual(static_model('setup', 'duration'), 6533, places=0) - self.assertAlmostEqual(static_model('write', 'duration'), 12634, places=0) - - for transition in 
'setPALevel setRetries setup write'.split(' '): - self.assertAlmostEqual(model.stats.param_dependence_ratio(transition, 'duration', 'channel'), 0, places=2) + self.assertAlmostEqual(static_model("setPALevel", "duration"), 146, places=0) + self.assertAlmostEqual(static_model("setRetries", "duration"), 73, places=0) + self.assertAlmostEqual(static_model("setup", "duration"), 6533, places=0) + self.assertAlmostEqual(static_model("write", "duration"), 12634, places=0) + + for transition in "setPALevel setRetries setup write".split(" "): + self.assertAlmostEqual( + model.stats.param_dependence_ratio(transition, "duration", "channel"), + 0, + places=2, + ) param_model, param_info = model.get_fitted() - self.assertEqual(param_info('setPALevel', 'duration'), None) - self.assertEqual(param_info('setRetries', 'duration'), None) - self.assertEqual(param_info('setup', 'duration'), None) - self.assertEqual(param_info('write', 'duration')['function']._model_str, '0 + regression_arg(0) + regression_arg(1) * parameter(max_retry_count) + regression_arg(2) * parameter(retry_delay) + regression_arg(3) * parameter(max_retry_count) * parameter(retry_delay)') - - self.assertAlmostEqual(param_info('write', 'duration')['function']._regression_args[0], 1163, places=0) - self.assertAlmostEqual(param_info('write', 'duration')['function']._regression_args[1], 464, places=0) - self.assertAlmostEqual(param_info('write', 'duration')['function']._regression_args[2], 1, places=0) - self.assertAlmostEqual(param_info('write', 'duration')['function']._regression_args[3], 1, places=0) + self.assertEqual(param_info("setPALevel", "duration"), None) + self.assertEqual(param_info("setRetries", "duration"), None) + self.assertEqual(param_info("setup", "duration"), None) + self.assertEqual( + param_info("write", "duration")["function"]._model_str, + "0 + regression_arg(0) + regression_arg(1) * parameter(max_retry_count) + regression_arg(2) * parameter(retry_delay) + regression_arg(3) * parameter(max_retry_count) * parameter(retry_delay)", + ) + + self.assertAlmostEqual( + param_info("write", "duration")["function"]._regression_args[0], + 1163, + places=0, + ) + self.assertAlmostEqual( + param_info("write", "duration")["function"]._regression_args[1], + 464, + places=0, + ) + self.assertAlmostEqual( + param_info("write", "duration")["function"]._regression_args[2], 1, places=0 + ) + self.assertAlmostEqual( + param_info("write", "duration")["function"]._regression_args[3], 1, places=0 + ) def test_dependent_parameter_pruning(self): - raw_data = TimingData(['test-data/20190815_103347_nRF24_no-rx.json']) + raw_data = TimingData(["test-data/20190815_103347_nRF24_no-rx.json"]) preprocessed_data = raw_data.get_preprocessed_data() by_name, parameters, arg_count = pta_trace_to_aggregate(preprocessed_data) prune_dependent_parameters(by_name, parameters) model = AnalyticModel(by_name, parameters, arg_count) - self.assertEqual(model.names, 'getObserveTx setPALevel setRetries setup write'.split(' ')) + self.assertEqual( + model.names, "getObserveTx setPALevel setRetries setup write".split(" ") + ) static_model = model.get_static() - self.assertAlmostEqual(static_model('getObserveTx', 'duration'), 75, places=0) - self.assertAlmostEqual(static_model('setPALevel', 'duration'), 146, places=0) - self.assertAlmostEqual(static_model('setRetries', 'duration'), 73, places=0) - self.assertAlmostEqual(static_model('setup', 'duration'), 6533, places=0) - self.assertAlmostEqual(static_model('write', 'duration'), 12634, places=0) - - for transition in 
'getObserveTx setPALevel setRetries setup write'.split(' '): - self.assertAlmostEqual(model.stats.param_dependence_ratio(transition, 'duration', 'channel'), 0, places=2) + self.assertAlmostEqual(static_model("getObserveTx", "duration"), 75, places=0) + self.assertAlmostEqual(static_model("setPALevel", "duration"), 146, places=0) + self.assertAlmostEqual(static_model("setRetries", "duration"), 73, places=0) + self.assertAlmostEqual(static_model("setup", "duration"), 6533, places=0) + self.assertAlmostEqual(static_model("write", "duration"), 12634, places=0) + + for transition in "getObserveTx setPALevel setRetries setup write".split(" "): + self.assertAlmostEqual( + model.stats.param_dependence_ratio(transition, "duration", "channel"), + 0, + places=2, + ) param_model, param_info = model.get_fitted() - self.assertEqual(param_info('getObserveTx', 'duration'), None) - self.assertEqual(param_info('setPALevel', 'duration'), None) - self.assertEqual(param_info('setRetries', 'duration'), None) - self.assertEqual(param_info('setup', 'duration'), None) - self.assertEqual(param_info('write', 'duration')['function']._model_str, '0 + regression_arg(0) + regression_arg(1) * parameter(max_retry_count) + regression_arg(2) * parameter(retry_delay) + regression_arg(3) * parameter(max_retry_count) * parameter(retry_delay)') - - self.assertAlmostEqual(param_info('write', 'duration')['function']._regression_args[0], 1163, places=0) - self.assertAlmostEqual(param_info('write', 'duration')['function']._regression_args[1], 464, places=0) - self.assertAlmostEqual(param_info('write', 'duration')['function']._regression_args[2], 1, places=0) - self.assertAlmostEqual(param_info('write', 'duration')['function']._regression_args[3], 1, places=0) + self.assertEqual(param_info("getObserveTx", "duration"), None) + self.assertEqual(param_info("setPALevel", "duration"), None) + self.assertEqual(param_info("setRetries", "duration"), None) + self.assertEqual(param_info("setup", "duration"), None) + self.assertEqual( + param_info("write", "duration")["function"]._model_str, + "0 + regression_arg(0) + regression_arg(1) * parameter(max_retry_count) + regression_arg(2) * parameter(retry_delay) + regression_arg(3) * parameter(max_retry_count) * parameter(retry_delay)", + ) + + self.assertAlmostEqual( + param_info("write", "duration")["function"]._regression_args[0], + 1163, + places=0, + ) + self.assertAlmostEqual( + param_info("write", "duration")["function"]._regression_args[1], + 464, + places=0, + ) + self.assertAlmostEqual( + param_info("write", "duration")["function"]._regression_args[2], 1, places=0 + ) + self.assertAlmostEqual( + param_info("write", "duration")["function"]._regression_args[3], 1, places=0 + ) def test_function_override(self): - raw_data = TimingData(['test-data/20190815_122531_nRF24_no-rx.json']) + raw_data = TimingData(["test-data/20190815_122531_nRF24_no-rx.json"]) preprocessed_data = raw_data.get_preprocessed_data() by_name, parameters, arg_count = pta_trace_to_aggregate(preprocessed_data) - model = AnalyticModel(by_name, parameters, arg_count, function_override={('write', 'duration'): '(parameter(auto_ack!) 
* (regression_arg(0) + regression_arg(1) * parameter(max_retry_count) + regression_arg(2) * parameter(retry_delay) + regression_arg(3) * parameter(max_retry_count) * parameter(retry_delay))) + ((1 - parameter(auto_ack!)) * regression_arg(4))'}) - self.assertEqual(model.names, 'setAutoAck setPALevel setRetries setup write'.split(' ')) + model = AnalyticModel( + by_name, + parameters, + arg_count, + function_override={ + ( + "write", + "duration", + ): "(parameter(auto_ack!) * (regression_arg(0) + regression_arg(1) * parameter(max_retry_count) + regression_arg(2) * parameter(retry_delay) + regression_arg(3) * parameter(max_retry_count) * parameter(retry_delay))) + ((1 - parameter(auto_ack!)) * regression_arg(4))" + }, + ) + self.assertEqual( + model.names, "setAutoAck setPALevel setRetries setup write".split(" ") + ) static_model = model.get_static() - self.assertAlmostEqual(static_model('setAutoAck', 'duration'), 72, places=0) - self.assertAlmostEqual(static_model('setPALevel', 'duration'), 146, places=0) - self.assertAlmostEqual(static_model('setRetries', 'duration'), 73, places=0) - self.assertAlmostEqual(static_model('setup', 'duration'), 6533, places=0) - self.assertAlmostEqual(static_model('write', 'duration'), 1181, places=0) - - for transition in 'setAutoAck setPALevel setRetries setup write'.split(' '): - self.assertAlmostEqual(model.stats.param_dependence_ratio(transition, 'duration', 'channel'), 0, places=2) + self.assertAlmostEqual(static_model("setAutoAck", "duration"), 72, places=0) + self.assertAlmostEqual(static_model("setPALevel", "duration"), 146, places=0) + self.assertAlmostEqual(static_model("setRetries", "duration"), 73, places=0) + self.assertAlmostEqual(static_model("setup", "duration"), 6533, places=0) + self.assertAlmostEqual(static_model("write", "duration"), 1181, places=0) + + for transition in "setAutoAck setPALevel setRetries setup write".split(" "): + self.assertAlmostEqual( + model.stats.param_dependence_ratio(transition, "duration", "channel"), + 0, + places=2, + ) param_model, param_info = model.get_fitted() - self.assertEqual(param_info('setAutoAck', 'duration'), None) - self.assertEqual(param_info('setPALevel', 'duration'), None) - self.assertEqual(param_info('setRetries', 'duration'), None) - self.assertEqual(param_info('setup', 'duration'), None) - self.assertEqual(param_info('write', 'duration')['function']._model_str, '(parameter(auto_ack!) 
* (regression_arg(0) + regression_arg(1) * parameter(max_retry_count) + regression_arg(2) * parameter(retry_delay) + regression_arg(3) * parameter(max_retry_count) * parameter(retry_delay))) + ((1 - parameter(auto_ack!)) * regression_arg(4))') - - self.assertAlmostEqual(param_info('write', 'duration')['function']._regression_args[0], 1162, places=0) - self.assertAlmostEqual(param_info('write', 'duration')['function']._regression_args[1], 464, places=0) - self.assertAlmostEqual(param_info('write', 'duration')['function']._regression_args[2], 1, places=0) - self.assertAlmostEqual(param_info('write', 'duration')['function']._regression_args[3], 1, places=0) - self.assertAlmostEqual(param_info('write', 'duration')['function']._regression_args[4], 1086, places=0) - - -if __name__ == '__main__': + self.assertEqual(param_info("setAutoAck", "duration"), None) + self.assertEqual(param_info("setPALevel", "duration"), None) + self.assertEqual(param_info("setRetries", "duration"), None) + self.assertEqual(param_info("setup", "duration"), None) + self.assertEqual( + param_info("write", "duration")["function"]._model_str, + "(parameter(auto_ack!) * (regression_arg(0) + regression_arg(1) * parameter(max_retry_count) + regression_arg(2) * parameter(retry_delay) + regression_arg(3) * parameter(max_retry_count) * parameter(retry_delay))) + ((1 - parameter(auto_ack!)) * regression_arg(4))", + ) + + self.assertAlmostEqual( + param_info("write", "duration")["function"]._regression_args[0], + 1162, + places=0, + ) + self.assertAlmostEqual( + param_info("write", "duration")["function"]._regression_args[1], + 464, + places=0, + ) + self.assertAlmostEqual( + param_info("write", "duration")["function"]._regression_args[2], 1, places=0 + ) + self.assertAlmostEqual( + param_info("write", "duration")["function"]._regression_args[3], 1, places=0 + ) + self.assertAlmostEqual( + param_info("write", "duration")["function"]._regression_args[4], + 1086, + places=0, + ) + + +if __name__ == "__main__": unittest.main() -- cgit v1.2.3 From adaa03cf0247b065e6b3863cf16ad88ee24f5169 Mon Sep 17 00:00:00 2001 From: Daniel Friesel Date: Fri, 3 Jul 2020 12:26:50 +0200 Subject: AnalyticFunction: Remove _ prefix from public attributes --- bin/analyze-archive.py | 8 ++++---- bin/analyze-timing.py | 4 ++-- bin/eval-outlier-removal.py | 16 ++++++++-------- lib/automata.py | 6 +++--- lib/functions.py | 20 ++++++++++---------- test/test_parameters.py | 2 +- test/test_ptamodel.py | 18 +++++++++--------- test/test_timingharness.py | 32 ++++++++++++++++---------------- 8 files changed, 53 insertions(+), 53 deletions(-) (limited to 'test/test_ptamodel.py') diff --git a/bin/analyze-archive.py b/bin/analyze-archive.py index bf3ab64..e23fb9e 100755 --- a/bin/analyze-archive.py +++ b/bin/analyze-archive.py @@ -645,13 +645,13 @@ if __name__ == "__main__": if param_info(state, attribute): print( "{:10s}: {}".format( - state, param_info(state, attribute)["function"]._model_str + state, param_info(state, attribute)["function"].model_function ) ) print( "{:10s} {}".format( "", - param_info(state, attribute)["function"]._regression_args, + param_info(state, attribute)["function"].model_args, ) ) for trans in model.transitions(): @@ -661,14 +661,14 @@ if __name__ == "__main__": "{:10s}: {:10s}: {}".format( trans, attribute, - param_info(trans, attribute)["function"]._model_str, + param_info(trans, attribute)["function"].model_function, ) ) print( "{:10s} {:10s} {}".format( "", "", - param_info(trans, attribute)["function"]._regression_args, + 
param_info(trans, attribute)["function"].model_args, ) ) diff --git a/bin/analyze-timing.py b/bin/analyze-timing.py index 4039f45..924388d 100755 --- a/bin/analyze-timing.py +++ b/bin/analyze-timing.py @@ -423,14 +423,14 @@ if __name__ == "__main__": "{:10s}: {:10s}: {}".format( trans, attribute, - param_info(trans, attribute)["function"]._model_str, + param_info(trans, attribute)["function"].model_function, ) ) print( "{:10s} {:10s} {}".format( "", "", - param_info(trans, attribute)["function"]._regression_args, + param_info(trans, attribute)["function"].model_args, ) ) diff --git a/bin/eval-outlier-removal.py b/bin/eval-outlier-removal.py index 14f0e60..b091ea4 100755 --- a/bin/eval-outlier-removal.py +++ b/bin/eval-outlier-removal.py @@ -141,12 +141,12 @@ if __name__ == "__main__": if param_i1(state, attribute): print( "{:10s}: {}".format( - state, param_i1(state, attribute)["function"]._model_str + state, param_i1(state, attribute)["function"].model_function ) ) print( "{:10s} {}".format( - "", param_i1(state, attribute)["function"]._regression_args + "", param_i1(state, attribute)["function"].model_args ) ) for trans in m1.transitions(): @@ -162,12 +162,12 @@ if __name__ == "__main__": "{:10s}: {:10s}: {}".format( trans, attribute, - param_i1(trans, attribute)["function"]._model_str, + param_i1(trans, attribute)["function"].model_function, ) ) print( "{:10s} {:10s} {}".format( - "", "", param_i1(trans, attribute)["function"]._regression_args + "", "", param_i1(trans, attribute)["function"].model_args ) ) param_m2, param_i2 = m2.get_fitted() @@ -176,12 +176,12 @@ if __name__ == "__main__": if param_i2(state, attribute): print( "{:10s}: {}".format( - state, param_i2(state, attribute)["function"]._model_str + state, param_i2(state, attribute)["function"].model_function ) ) print( "{:10s} {}".format( - "", param_i2(state, attribute)["function"]._regression_args + "", param_i2(state, attribute)["function"].model_args ) ) for trans in m2.transitions(): @@ -197,12 +197,12 @@ if __name__ == "__main__": "{:10s}: {:10s}: {}".format( trans, attribute, - param_i2(trans, attribute)["function"]._model_str, + param_i2(trans, attribute)["function"].model_function, ) ) print( "{:10s} {:10s} {}".format( - "", "", param_i2(trans, attribute)["function"]._regression_args + "", "", param_i2(trans, attribute)["function"].model_args ) ) diff --git a/lib/automata.py b/lib/automata.py index 69b3969..ebe1871 100755 --- a/lib/automata.py +++ b/lib/automata.py @@ -103,7 +103,7 @@ class PTAAttribute: def __repr__(self): if self.function is not None: return "PTAATtribute<{:.0f}, {}>".format( - self.value, self.function._model_str + self.value, self.function.model_function ) return "PTAATtribute<{:.0f}, None>".format(self.value) @@ -137,8 +137,8 @@ class PTAAttribute: } if self.function: ret["function"] = { - "raw": self.function._model_str, - "regression_args": list(self.function._regression_args), + "raw": self.function.model_function, + "regression_args": list(self.function.model_args), } ret["function_error"] = self.function_error return ret diff --git a/lib/functions.py b/lib/functions.py index 0b849bd..99ba17d 100644 --- a/lib/functions.py +++ b/lib/functions.py @@ -141,7 +141,7 @@ class AnalyticFunction: """ self._parameter_names = parameters self._num_args = num_args - self._model_str = function_str + self.model_function = function_str rawfunction = function_str self._dependson = [False] * (len(parameters) + num_args) self.fit_success = False @@ -174,12 +174,12 @@ class AnalyticFunction: self._function = 
function_str if regression_args: - self._regression_args = regression_args.copy() + self.model_args = regression_args.copy() self._fit_success = True elif type(function_str) == str: - self._regression_args = list(np.ones((num_vars))) + self.model_args = list(np.ones((num_vars))) else: - self._regression_args = [] + self.model_args = [] def get_fit_data(self, by_param, state_or_tran, model_attribute): """ @@ -260,22 +260,22 @@ class AnalyticFunction: error_function = lambda P, X, y: self._function(P, X) - y try: res = optimize.least_squares( - error_function, self._regression_args, args=(X, Y), xtol=2e-15 + error_function, self.model_args, args=(X, Y), xtol=2e-15 ) except ValueError as err: logger.warning( "Fit failed for {}/{}: {} (function: {})".format( - state_or_tran, model_attribute, err, self._model_str + state_or_tran, model_attribute, err, self.model_function ), ) return if res.status > 0: - self._regression_args = res.x + self.model_args = res.x self.fit_success = True else: logger.warning( "Fit failed for {}/{}: {} (function: {})".format( - state_or_tran, model_attribute, res.message, self._model_str + state_or_tran, model_attribute, res.message, self.model_function ), ) else: @@ -308,9 +308,9 @@ class AnalyticFunction: corresponds to lexically first parameter, etc. :param arg_list: argument values (list of float), if arguments are used. """ - if len(self._regression_args) == 0: + if len(self.model_args) == 0: return self._function(param_list, arg_list) - return self._function(self._regression_args, param_list) + return self._function(self.model_args, param_list) class analytic: diff --git a/test/test_parameters.py b/test/test_parameters.py index 5d7ec84..baf1c99 100755 --- a/test/test_parameters.py +++ b/test/test_parameters.py @@ -63,7 +63,7 @@ class TestModels(unittest.TestCase): combined_fit = analytic.function_powerset(fit_result, parameter_names, 0) self.assertEqual( - combined_fit._model_str, + combined_fit.model_function, "0 + regression_arg(0) + regression_arg(1) * parameter(p_linear)", ) self.assertEqual( diff --git a/test/test_ptamodel.py b/test/test_ptamodel.py index 3237450..9abe3c0 100755 --- a/test/test_ptamodel.py +++ b/test/test_ptamodel.py @@ -134,26 +134,26 @@ class TestModels(unittest.TestCase): param_model, param_info = model.get_fitted() self.assertEqual(param_info("POWERDOWN", "power"), None) self.assertEqual( - param_info("RX", "power")["function"]._model_str, + param_info("RX", "power")["function"].model_function, "0 + regression_arg(0) + regression_arg(1) * np.sqrt(parameter(datarate))", ) self.assertAlmostEqual( - param_info("RX", "power")["function"]._regression_args[0], 48530.7, places=0 + param_info("RX", "power")["function"].model_args[0], 48530.7, places=0 ) self.assertAlmostEqual( - param_info("RX", "power")["function"]._regression_args[1], 117, places=0 + param_info("RX", "power")["function"].model_args[1], 117, places=0 ) self.assertEqual(param_info("STANDBY1", "power"), None) self.assertEqual( - param_info("TX", "power")["function"]._model_str, + param_info("TX", "power")["function"].model_function, "0 + regression_arg(0) + regression_arg(1) * 1/(parameter(datarate)) + regression_arg(2) * parameter(txpower) + regression_arg(3) * 1/(parameter(datarate)) * parameter(txpower)", ) self.assertEqual( - param_info("epilogue", "timeout")["function"]._model_str, + param_info("epilogue", "timeout")["function"].model_function, "0 + regression_arg(0) + regression_arg(1) * 1/(parameter(datarate))", ) self.assertEqual( - param_info("stopListening", 
"duration")["function"]._model_str, + param_info("stopListening", "duration")["function"].model_function, "0 + regression_arg(0) + regression_arg(1) * 1/(parameter(datarate))", ) @@ -371,7 +371,7 @@ class TestModels(unittest.TestCase): param_model, param_info = model.get_fitted() self.assertEqual(param_info("IDLE", "power"), None) self.assertEqual( - param_info("RX", "power")["function"]._model_str, + param_info("RX", "power")["function"].model_function, "0 + regression_arg(0) + regression_arg(1) * np.log(parameter(symbolrate) + 1)", ) self.assertEqual(param_info("SLEEP", "power"), None) @@ -380,10 +380,10 @@ class TestModels(unittest.TestCase): self.assertEqual(param_info("XOFF", "power"), None) self.assertAlmostEqual( - param_info("RX", "power")["function"]._regression_args[0], 84415, places=0 + param_info("RX", "power")["function"].model_args[0], 84415, places=0 ) self.assertAlmostEqual( - param_info("RX", "power")["function"]._regression_args[1], 206, places=0 + param_info("RX", "power")["function"].model_args[1], 206, places=0 ) diff --git a/test/test_timingharness.py b/test/test_timingharness.py index 29e21f8..13289ea 100755 --- a/test/test_timingharness.py +++ b/test/test_timingharness.py @@ -30,25 +30,25 @@ class TestModels(unittest.TestCase): self.assertEqual(param_info("setRetries", "duration"), None) self.assertEqual(param_info("setup", "duration"), None) self.assertEqual( - param_info("write", "duration")["function"]._model_str, + param_info("write", "duration")["function"].model_function, "0 + regression_arg(0) + regression_arg(1) * parameter(max_retry_count) + regression_arg(2) * parameter(retry_delay) + regression_arg(3) * parameter(max_retry_count) * parameter(retry_delay)", ) self.assertAlmostEqual( - param_info("write", "duration")["function"]._regression_args[0], + param_info("write", "duration")["function"].model_args[0], 1163, places=0, ) self.assertAlmostEqual( - param_info("write", "duration")["function"]._regression_args[1], + param_info("write", "duration")["function"].model_args[1], 464, places=0, ) self.assertAlmostEqual( - param_info("write", "duration")["function"]._regression_args[2], 1, places=0 + param_info("write", "duration")["function"].model_args[2], 1, places=0 ) self.assertAlmostEqual( - param_info("write", "duration")["function"]._regression_args[3], 1, places=0 + param_info("write", "duration")["function"].model_args[3], 1, places=0 ) def test_dependent_parameter_pruning(self): @@ -80,25 +80,25 @@ class TestModels(unittest.TestCase): self.assertEqual(param_info("setRetries", "duration"), None) self.assertEqual(param_info("setup", "duration"), None) self.assertEqual( - param_info("write", "duration")["function"]._model_str, + param_info("write", "duration")["function"].model_function, "0 + regression_arg(0) + regression_arg(1) * parameter(max_retry_count) + regression_arg(2) * parameter(retry_delay) + regression_arg(3) * parameter(max_retry_count) * parameter(retry_delay)", ) self.assertAlmostEqual( - param_info("write", "duration")["function"]._regression_args[0], + param_info("write", "duration")["function"].model_args[0], 1163, places=0, ) self.assertAlmostEqual( - param_info("write", "duration")["function"]._regression_args[1], + param_info("write", "duration")["function"].model_args[1], 464, places=0, ) self.assertAlmostEqual( - param_info("write", "duration")["function"]._regression_args[2], 1, places=0 + param_info("write", "duration")["function"].model_args[2], 1, places=0 ) self.assertAlmostEqual( - param_info("write", 
"duration")["function"]._regression_args[3], 1, places=0 + param_info("write", "duration")["function"].model_args[3], 1, places=0 ) def test_function_override(self): @@ -139,28 +139,28 @@ class TestModels(unittest.TestCase): self.assertEqual(param_info("setRetries", "duration"), None) self.assertEqual(param_info("setup", "duration"), None) self.assertEqual( - param_info("write", "duration")["function"]._model_str, + param_info("write", "duration")["function"].model_function, "(parameter(auto_ack!) * (regression_arg(0) + regression_arg(1) * parameter(max_retry_count) + regression_arg(2) * parameter(retry_delay) + regression_arg(3) * parameter(max_retry_count) * parameter(retry_delay))) + ((1 - parameter(auto_ack!)) * regression_arg(4))", ) self.assertAlmostEqual( - param_info("write", "duration")["function"]._regression_args[0], + param_info("write", "duration")["function"].model_args[0], 1162, places=0, ) self.assertAlmostEqual( - param_info("write", "duration")["function"]._regression_args[1], + param_info("write", "duration")["function"].model_args[1], 464, places=0, ) self.assertAlmostEqual( - param_info("write", "duration")["function"]._regression_args[2], 1, places=0 + param_info("write", "duration")["function"].model_args[2], 1, places=0 ) self.assertAlmostEqual( - param_info("write", "duration")["function"]._regression_args[3], 1, places=0 + param_info("write", "duration")["function"].model_args[3], 1, places=0 ) self.assertAlmostEqual( - param_info("write", "duration")["function"]._regression_args[4], + param_info("write", "duration")["function"].model_args[4], 1086, places=0, ) -- cgit v1.2.3 From d7ca9acbb668d4c73f07eddf0278c08bbdae7be7 Mon Sep 17 00:00:00 2001 From: Daniel Friesel Date: Mon, 6 Jul 2020 11:47:05 +0200 Subject: Move ParamFit, PTAModel, AnalyticModel to model.py module --- bin/analyze-archive.py | 3 +- bin/analyze-timing.py | 3 +- bin/eval-online-model-accuracy.py | 2 +- bin/eval-outlier-removal.py | 3 +- bin/eval-rel-energy.py | 3 +- bin/gptest.py | 3 +- bin/mimosa-etv | 163 +++-- bin/test_corrcoef.py | 3 +- lib/dfatool.py | 1171 ------------------------------------ lib/model.py | 1186 +++++++++++++++++++++++++++++++++++++ test/test_parameters.py | 6 +- test/test_ptamodel.py | 3 +- test/test_timingharness.py | 3 +- 13 files changed, 1310 insertions(+), 1242 deletions(-) create mode 100644 lib/model.py (limited to 'test/test_ptamodel.py') diff --git a/bin/analyze-archive.py b/bin/analyze-archive.py index bf9e511..e9d70f6 100755 --- a/bin/analyze-archive.py +++ b/bin/analyze-archive.py @@ -113,8 +113,9 @@ import random import re import sys from dfatool import plotter -from dfatool.dfatool import PTAModel, RawData, pta_trace_to_aggregate +from dfatool.dfatool import RawData, pta_trace_to_aggregate from dfatool.dfatool import gplearn_to_function +from dfatool.model import PTAModel from dfatool.validation import CrossValidator from dfatool.utils import filter_aggregate_by_param from dfatool.automata import PTA diff --git a/bin/analyze-timing.py b/bin/analyze-timing.py index 8c7ee5b..9271787 100755 --- a/bin/analyze-timing.py +++ b/bin/analyze-timing.py @@ -78,8 +78,9 @@ import json import re import sys from dfatool import plotter -from dfatool.dfatool import AnalyticModel, TimingData, pta_trace_to_aggregate +from dfatool.dfatool import TimingData, pta_trace_to_aggregate from dfatool.dfatool import gplearn_to_function +from dfatool.model import AnalyticModel from dfatool.validation import CrossValidator from dfatool.utils import filter_aggregate_by_param from 
dfatool.parameters import prune_dependent_parameters diff --git a/bin/eval-online-model-accuracy.py b/bin/eval-online-model-accuracy.py index 202ac28..97fd8e2 100755 --- a/bin/eval-online-model-accuracy.py +++ b/bin/eval-online-model-accuracy.py @@ -28,7 +28,7 @@ import itertools import yaml from dfatool.automata import PTA from dfatool.codegen import get_simulated_accountingmethod -from dfatool.dfatool import regression_measures +from dfatool.model import regression_measures import numpy as np opt = dict() diff --git a/bin/eval-outlier-removal.py b/bin/eval-outlier-removal.py index b091ea4..b81c33a 100755 --- a/bin/eval-outlier-removal.py +++ b/bin/eval-outlier-removal.py @@ -3,7 +3,8 @@ import getopt import re import sys -from dfatool.dfatool import PTAModel, RawData, pta_trace_to_aggregate +from dfatool.dfatool import RawData, pta_trace_to_aggregate +from dfatool.model import PTAModel opt = dict() diff --git a/bin/eval-rel-energy.py b/bin/eval-rel-energy.py index 8a2be13..2af2cff 100755 --- a/bin/eval-rel-energy.py +++ b/bin/eval-rel-energy.py @@ -3,7 +3,8 @@ import getopt import re import sys -from dfatool.dfatool import PTAModel, RawData, pta_trace_to_aggregate +from dfatool.dfatool import RawData, pta_trace_to_aggregate +from dfatool.model import PTAModel opt = dict() diff --git a/bin/gptest.py b/bin/gptest.py index 82b4575..bcfb7aa 100755 --- a/bin/gptest.py +++ b/bin/gptest.py @@ -3,11 +3,10 @@ import sys import numpy as np from dfatool.dfatool import ( - PTAModel, RawData, - regression_measures, pta_trace_to_aggregate, ) +from dfatool.model import PTAModel, regression_measures from gplearn.genetic import SymbolicRegressor from multiprocessing import Pool diff --git a/bin/mimosa-etv b/bin/mimosa-etv index e23b46c..431e275 100755 --- a/bin/mimosa-etv +++ b/bin/mimosa-etv @@ -8,13 +8,16 @@ import numpy as np import os import re import sys -from dfatool.dfatool import aggregate_measures, MIMOSA +from dfatool.dfatool import MIMOSA +from dfatool.model import aggregate_measures from dfatool.utils import running_mean opt = dict() + def show_help(): - print('''mimosa-etv - MIMOSA Analyzer and Visualizer + print( + """mimosa-etv - MIMOSA Analyzer and Visualizer USAGE @@ -41,7 +44,9 @@ OPTIONS Show power/time plot --stat Show mean voltage, current, and power as well as total energy consumption. 
- ''') + """ + ) + def peak_search(data, lower, upper, direction_function): while upper - lower > 1e-6: @@ -58,6 +63,7 @@ def peak_search(data, lower, upper, direction_function): upper = bs_test return None + def peak_search2(data, lower, upper, check_function): for power in np.arange(lower, upper, 1e-6): peakcount = itertools.groupby(data, lambda x: x >= power) @@ -67,38 +73,39 @@ def peak_search2(data, lower, upper, check_function): return power return None -if __name__ == '__main__': + +if __name__ == "__main__": try: - optspec = ('help skip= threshold= threshold-peakcount= plot stat') - raw_opts, args = getopt.getopt(sys.argv[1:], "", optspec.split(' ')) + optspec = "help skip= threshold= threshold-peakcount= plot stat" + raw_opts, args = getopt.getopt(sys.argv[1:], "", optspec.split(" ")) for option, parameter in raw_opts: - optname = re.sub(r'^--', '', option) + optname = re.sub(r"^--", "", option) opt[optname] = parameter - if 'help' in opt: + if "help" in opt: show_help() sys.exit(0) - if 'skip' in opt: - opt['skip'] = int(opt['skip']) + if "skip" in opt: + opt["skip"] = int(opt["skip"]) else: - opt['skip'] = 0 + opt["skip"] = 0 - if 'threshold' in opt and opt['threshold'] != 'mean': - opt['threshold'] = float(opt['threshold']) + if "threshold" in opt and opt["threshold"] != "mean": + opt["threshold"] = float(opt["threshold"]) - if 'threshold-peakcount' in opt: - opt['threshold-peakcount'] = int(opt['threshold-peakcount']) + if "threshold-peakcount" in opt: + opt["threshold-peakcount"] = int(opt["threshold-peakcount"]) except getopt.GetoptError as err: print(err) sys.exit(2) except IndexError: - print('Usage: mimosa-etv ') + print("Usage: mimosa-etv ") sys.exit(2) except ValueError: - print('Error: duration or skip is not a number') + print("Error: duration or skip is not a number") sys.exit(2) voltage, shunt, inputfile = args @@ -110,7 +117,7 @@ if __name__ == '__main__': currents = mim.charge_to_current_nocal(charges) * 1e-6 powers = currents * voltage - if 'threshold-peakcount' in opt: + if "threshold-peakcount" in opt: bs_mean = np.mean(powers) # Finding the correct threshold is tricky. If #peaks < peakcont, our @@ -126,42 +133,59 @@ if __name__ == '__main__': # #peaks != peakcount and threshold >= mean, we go down. 
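        # Note that the peak count is not monotonic in the threshold, so this
        # search may fail.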
# If that doesn't work, we fall back to a linear search in 1 µW steps
        def direction_function(peakcount, power):
-            if peakcount == opt['threshold-peakcount']:
+            if peakcount == opt["threshold-peakcount"]:
                 return 0
             if power < bs_mean:
                 return 1
             return -1
+
         threshold = peak_search(powers, np.min(powers), np.max(powers), direction_function)
         if threshold == None:
-            threshold = peak_search2(powers, np.min(powers), np.max(powers), direction_function)
+            threshold = peak_search2(
+                powers, np.min(powers), np.max(powers), direction_function
+            )

         if threshold != None:
-            print('Threshold set to {:.0f} µW : {:.9f}'.format(threshold * 1e6, threshold))
-            opt['threshold'] = threshold
+            print(
+                "Threshold set to {:.0f} µW : {:.9f}".format(
+                    threshold * 1e6, threshold
+                )
+            )
+            opt["threshold"] = threshold
         else:
-            print('Found no working threshold')
+            print("Found no working threshold")

-    if 'threshold' in opt:
-        if opt['threshold'] == 'mean':
-            opt['threshold'] = np.mean(powers)
-            print('Threshold set to {:.0f} µW : {:.9f}'.format(opt['threshold'] * 1e6, opt['threshold']))
+    if "threshold" in opt:
+        if opt["threshold"] == "mean":
+            opt["threshold"] = np.mean(powers)
+            print(
+                "Threshold set to {:.0f} µW : {:.9f}".format(
+                    opt["threshold"] * 1e6, opt["threshold"]
+                )
+            )

         baseline_mean = 0
-        if np.any(powers < opt['threshold']):
-            baseline_mean = np.mean(powers[powers < opt['threshold']])
-            print('Baseline mean: {:.0f} µW : {:.9f}'.format(
-                baseline_mean * 1e6, baseline_mean))
-        if np.any(powers >= opt['threshold']):
-            print('Peak mean: {:.0f} µW : {:.9f}'.format(
-                np.mean(powers[powers >= opt['threshold']]) * 1e6,
-                np.mean(powers[powers >= opt['threshold']])))
+        if np.any(powers < opt["threshold"]):
+            baseline_mean = np.mean(powers[powers < opt["threshold"]])
+            print(
+                "Baseline mean: {:.0f} µW : {:.9f}".format(
+                    baseline_mean * 1e6, baseline_mean
+                )
+            )
+        if np.any(powers >= opt["threshold"]):
+            print(
+                "Peak mean: {:.0f} µW : {:.9f}".format(
+                    np.mean(powers[powers >= opt["threshold"]]) * 1e6,
+                    np.mean(powers[powers >= opt["threshold"]]),
+                )
+            )

         peaks = []
         peak_start = -1
         for i, dp in enumerate(powers):
-            if dp >= opt['threshold'] and peak_start == -1:
+            if dp >= opt["threshold"] and peak_start == -1:
                 peak_start = i
-            elif dp < opt['threshold'] and peak_start != -1:
+            elif dp < opt["threshold"] and peak_start != -1:
                 peaks.append((peak_start, i))
                 peak_start = -1

@@ -170,32 +194,55 @@ if __name__ == '__main__':
         for peak in peaks:
             duration = (peak[1] - peak[0]) * 1e-5
             total_energy += np.mean(powers[peak[0] : peak[1]]) * duration
-            delta_energy += (np.mean(powers[peak[0] : peak[1]]) - baseline_mean) * duration
+            delta_energy += (
+                np.mean(powers[peak[0] : peak[1]]) - baseline_mean
+            ) * duration
             delta_powers = powers[peak[0] : peak[1]] - baseline_mean
-            print('{:.2f}ms peak ({:f} -> {:f})'.format(duration * 1000,
-                peak[0], peak[1]))
-            print(' {:f} µJ / mean {:f} µW'.format(
-                np.mean(powers[peak[0] : peak[1]]) * duration * 1e6,
-                np.mean(powers[peak[0] : peak[1]]) * 1e6 ))
+            print(
+                "{:.2f}ms peak ({:f} -> {:f})".format(duration * 1000,
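+                # peak[0] and peak[1] are sample indices; one sample covers 1e-5 s: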
total_energy / len(peaks))) - print('Average per-peak energy (delta over baseline): {:.0f} µJ : {:.9f}'.format( - delta_energy * 1e6 / len(peaks), delta_energy / len(peaks))) - - - if 'stat' in opt: + print( + " {:f} µW delta mean = {:0.1f}% / {:f} µW error".format( + np.mean(delta_powers) * 1e6, + measures["smape"], + measures["rmsd"] * 1e6, + ) + ) + print( + "Peak energy mean: {:.0f} µJ : {:.9f}".format( + total_energy * 1e6 / len(peaks), total_energy / len(peaks) + ) + ) + print( + "Average per-peak energy (delta over baseline): {:.0f} µJ : {:.9f}".format( + delta_energy * 1e6 / len(peaks), delta_energy / len(peaks) + ) + ) + + if "stat" in opt: mean_current = np.mean(currents) mean_power = np.mean(powers) - print('Mean current: {:.0f} µA : {:.9f}'.format(mean_current * 1e6, mean_current)) - print('Mean power: {:.0f} µW : {:.9f}'.format(mean_power * 1e6, mean_power)) - - if 'plot' in opt: + print( + "Mean current: {:.0f} µA : {:.9f}".format( + mean_current * 1e6, mean_current + ) + ) + print( + "Mean power: {:.0f} µW : {:.9f}".format(mean_power * 1e6, mean_power) + ) + + if "plot" in opt: timestamps = np.arange(len(powers)) * 1e-5 - pwrhandle, = plt.plot(timestamps, powers, 'b-', label='U*I', markersize=1) + (pwrhandle,) = plt.plot(timestamps, powers, "b-", label="U*I", markersize=1) plt.legend(handles=[pwrhandle]) - plt.xlabel('Time [s]') - plt.ylabel('Power [W]') + plt.xlabel("Time [s]") + plt.ylabel("Power [W]") plt.grid(True) plt.show() diff --git a/bin/test_corrcoef.py b/bin/test_corrcoef.py index 0b1ca54..75b5d0d 100755 --- a/bin/test_corrcoef.py +++ b/bin/test_corrcoef.py @@ -4,8 +4,9 @@ import getopt import re import sys from dfatool import plotter -from dfatool.dfatool import PTAModel, RawData, pta_trace_to_aggregate +from dfatool.dfatool import RawData, pta_trace_to_aggregate from dfatool.dfatool import gplearn_to_function +from dfatool.model import PTAModel opt = dict() diff --git a/lib/dfatool.py b/lib/dfatool.py index 392f5a6..20e198d 100644 --- a/lib/dfatool.py +++ b/lib/dfatool.py @@ -92,77 +92,6 @@ def mean_or_none(arr): return -1 -def aggregate_measures(aggregate: float, actual: list) -> dict: - """ - Calculate error measures for model value on data list. - - arguments: - aggregate -- model value (float or int) - actual -- real-world / reference values (list of float or int) - - return value: - See regression_measures - """ - aggregate_array = np.array([aggregate] * len(actual)) - return regression_measures(aggregate_array, np.array(actual)) - - -def regression_measures(predicted: np.ndarray, actual: np.ndarray): - """ - Calculate error measures by comparing model values to reference values. 
- - arguments: - predicted -- model values (np.ndarray) - actual -- real-world / reference values (np.ndarray) - - Returns a dict containing the following measures: - mae -- Mean Absolute Error - mape -- Mean Absolute Percentage Error, - if all items in actual are non-zero (NaN otherwise) - smape -- Symmetric Mean Absolute Percentage Error, - if no 0,0-pairs are present in actual and predicted (NaN otherwise) - msd -- Mean Square Deviation - rmsd -- Root Mean Square Deviation - ssr -- Sum of Squared Residuals - rsq -- R^2 measure, see sklearn.metrics.r2_score - count -- Number of values - """ - if type(predicted) != np.ndarray: - raise ValueError("first arg must be ndarray, is {}".format(type(predicted))) - if type(actual) != np.ndarray: - raise ValueError("second arg must be ndarray, is {}".format(type(actual))) - deviations = predicted - actual - # mean = np.mean(actual) - if len(deviations) == 0: - return {} - measures = { - "mae": np.mean(np.abs(deviations), dtype=np.float64), - "msd": np.mean(deviations ** 2, dtype=np.float64), - "rmsd": np.sqrt(np.mean(deviations ** 2), dtype=np.float64), - "ssr": np.sum(deviations ** 2, dtype=np.float64), - "rsq": r2_score(actual, predicted), - "count": len(actual), - } - - # rsq_quotient = np.sum((actual - mean)**2, dtype=np.float64) * np.sum((predicted - mean)**2, dtype=np.float64) - - if np.all(actual != 0): - measures["mape"] = np.mean(np.abs(deviations / actual)) * 100 # bad measure - else: - measures["mape"] = np.nan - if np.all(np.abs(predicted) + np.abs(actual) != 0): - measures["smape"] = ( - np.mean(np.abs(deviations) / ((np.abs(predicted) + np.abs(actual)) / 2)) - * 100 - ) - else: - measures["smape"] = np.nan - # if np.all(rsq_quotient != 0): - # measures['rsq'] = (np.sum((actual - mean) * (predicted - mean), dtype=np.float64)**2) / rsq_quotient - - return measures - - class KeysightCSV: """Simple loader for Keysight CSV data, as exported by the windows software.""" @@ -1191,581 +1120,6 @@ class RawData: } -class ParallelParamFit: - """ - Fit a set of functions on parameterized measurements. - - One parameter is variale, all others are fixed. Reports the best-fitting - function type for each parameter. - """ - - def __init__(self, by_param): - """Create a new ParallelParamFit object.""" - self.fit_queue = [] - self.by_param = by_param - - def enqueue( - self, - state_or_tran, - attribute, - param_index, - param_name, - safe_functions_enabled=False, - param_filter=None, - ): - """ - Add state_or_tran/attribute/param_name to fit queue. - - This causes fit() to compute the best-fitting function for this model part. - """ - self.fit_queue.append( - { - "key": [state_or_tran, attribute, param_name, param_filter], - "args": [ - self.by_param, - state_or_tran, - attribute, - param_index, - safe_functions_enabled, - param_filter, - ], - } - ) - - def fit(self): - """ - Fit functions on previously enqueue data. - - Fitting is one in parallel with one process per core. - - Results can be accessed using the public ParallelParamFit.results object. - """ - with Pool() as pool: - self.results = pool.map(_try_fits_parallel, self.fit_queue) - - def get_result(self, name, attribute, param_filter: dict = None): - """ - Parse and sanitize fit results for state/transition/... 'name' and model attribute 'attribute'. - - Filters out results where the best function is worse (or not much better than) static mean/median estimates. - - :param name: state/transition/... name, e.g. 'TX' - :param attribute: model attribute, e.g. 
'duration' - :param param_filter: - :returns: dict with fit result (see `_try_fits`) for each successfully fitted parameter. E.g. {'param 1': {'best' : 'function name', ...} } - """ - fit_result = dict() - for result in self.results: - if ( - result["key"][0] == name - and result["key"][1] == attribute - and result["key"][3] == param_filter - and result["result"]["best"] is not None - ): # dürfte an ['best'] != None liegen-> Fit für gefilterten Kram schlägt fehl? - this_result = result["result"] - if this_result["best_rmsd"] >= min( - this_result["mean_rmsd"], this_result["median_rmsd"] - ): - logger.debug( - "Not modeling {} {} as function of {}: best ({:.0f}) is worse than ref ({:.0f}, {:.0f})".format( - name, - attribute, - result["key"][2], - this_result["best_rmsd"], - this_result["mean_rmsd"], - this_result["median_rmsd"], - ) - ) - # See notes on depends_on_param - elif this_result["best_rmsd"] >= 0.8 * min( - this_result["mean_rmsd"], this_result["median_rmsd"] - ): - logger.debug( - "Not modeling {} {} as function of {}: best ({:.0f}) is not much better than ref ({:.0f}, {:.0f})".format( - name, - attribute, - result["key"][2], - this_result["best_rmsd"], - this_result["mean_rmsd"], - this_result["median_rmsd"], - ) - ) - else: - fit_result[result["key"][2]] = this_result - return fit_result - - -def _try_fits_parallel(arg): - """ - Call _try_fits(*arg['args']) and return arg['key'] and the _try_fits result. - - Must be a global function as it is called from a multiprocessing Pool. - """ - return {"key": arg["key"], "result": _try_fits(*arg["args"])} - - -def _try_fits( - by_param, - state_or_tran, - model_attribute, - param_index, - safe_functions_enabled=False, - param_filter: dict = None, -): - """ - Determine goodness-of-fit for prediction of `by_param[(state_or_tran, *)][model_attribute]` dependence on `param_index` using various functions. - - This is done by varying `param_index` while keeping all other parameters constant and doing one least squares optimization for each function and for each combination of the remaining parameters. - The value of the parameter corresponding to `param_index` (e.g. txpower or packet length) is the sole input to the model function. - Only numeric parameter values (as determined by `utils.is_numeric`) are used for fitting, non-numeric values such as None or enum strings are ignored. - Fitting is only performed if at least three distinct parameter values exist in `by_param[(state_or_tran, *)]`. - - :returns: a dictionary with the following elements: - best -- name of the best-fitting function (see `analytic.functions`). `None` in case of insufficient data. - best_rmsd -- mean Root Mean Square Deviation of best-fitting function over all combinations of the remaining parameters - mean_rmsd -- mean Root Mean Square Deviation of a reference model using the mean of its respective input data as model value - median_rmsd -- mean Root Mean Square Deviation of a reference model using the median of its respective input data as model value - results -- mean goodness-of-fit measures for the individual functions. See `analytic.functions` for keys and `aggregate_measures` for values - - :param by_param: measurements partitioned by state/transition/... name and parameter values. - Example: `{('foo', (0, 2)): {'bar': [2]}, ('foo', (0, 4)): {'bar': [4]}, ('foo', (0, 6)): {'bar': [6]}}` - - :param state_or_tran: state/transition/... name for which goodness-of-fit will be calculated (first element of by_param key tuple). 
- Example: `'foo'` - - :param model_attribute: attribute for which goodness-of-fit will be calculated. - Example: `'bar'` - - :param param_index: index of the parameter used as model input - :param safe_functions_enabled: Include "safe" variants of functions with limited argument range. - :param param_filter: Only use measurements whose parameters match param_filter for fitting. - """ - - functions = analytic.functions(safe_functions_enabled=safe_functions_enabled) - - for param_key in filter(lambda x: x[0] == state_or_tran, by_param.keys()): - # We might remove elements from 'functions' while iterating over - # its keys. A generator will not allow this, so we need to - # convert to a list. - function_names = list(functions.keys()) - for function_name in function_names: - function_object = functions[function_name] - if is_numeric(param_key[1][param_index]) and not function_object.is_valid( - param_key[1][param_index] - ): - functions.pop(function_name, None) - - raw_results = dict() - raw_results_by_param = dict() - ref_results = {"mean": list(), "median": list()} - results = dict() - results_by_param = dict() - - seen_parameter_combinations = set() - - # for each parameter combination: - for param_key in filter( - lambda x: x[0] == state_or_tran - and remove_index_from_tuple(x[1], param_index) - not in seen_parameter_combinations - and len(by_param[x]["param"]) - and match_parameter_values(by_param[x]["param"][0], param_filter), - by_param.keys(), - ): - X = [] - Y = [] - num_valid = 0 - num_total = 0 - - # Ensure that each parameter combination is only optimized once. Otherwise, with parameters (1, 2, 5), (1, 3, 5), (1, 4, 5) and param_index == 1, - # the parameter combination (1, *, 5) would be optimized three times, both wasting time and biasing results towards more frequently occuring combinations of non-param_index parameters - seen_parameter_combinations.add( - remove_index_from_tuple(param_key[1], param_index) - ) - - # for each value of the parameter denoted by param_index (all other parameters remain the same): - for k, v in filter( - lambda kv: param_slice_eq(kv[0], param_key, param_index), by_param.items() - ): - num_total += 1 - if is_numeric(k[1][param_index]): - num_valid += 1 - X.extend([float(k[1][param_index])] * len(v[model_attribute])) - Y.extend(v[model_attribute]) - - if num_valid > 2: - X = np.array(X) - Y = np.array(Y) - other_parameters = remove_index_from_tuple(k[1], param_index) - raw_results_by_param[other_parameters] = dict() - results_by_param[other_parameters] = dict() - for function_name, param_function in functions.items(): - if function_name not in raw_results: - raw_results[function_name] = dict() - error_function = param_function.error_function - res = optimize.least_squares( - error_function, [0, 1], args=(X, Y), xtol=2e-15 - ) - measures = regression_measures(param_function.eval(res.x, X), Y) - raw_results_by_param[other_parameters][function_name] = measures - for measure, error_rate in measures.items(): - if measure not in raw_results[function_name]: - raw_results[function_name][measure] = list() - raw_results[function_name][measure].append(error_rate) - # print(function_name, res, measures) - mean_measures = aggregate_measures(np.mean(Y), Y) - ref_results["mean"].append(mean_measures["rmsd"]) - raw_results_by_param[other_parameters]["mean"] = mean_measures - median_measures = aggregate_measures(np.median(Y), Y) - ref_results["median"].append(median_measures["rmsd"]) - raw_results_by_param[other_parameters]["median"] = median_measures - - if not 
len(ref_results["mean"]): - # Insufficient data for fitting - # print('[W] Insufficient data for fitting {}/{}/{}'.format(state_or_tran, model_attribute, param_index)) - return {"best": None, "best_rmsd": np.inf, "results": results} - - for ( - other_parameter_combination, - other_parameter_results, - ) in raw_results_by_param.items(): - best_fit_val = np.inf - best_fit_name = None - results = dict() - for function_name, result in other_parameter_results.items(): - if len(result) > 0: - results[function_name] = result - rmsd = result["rmsd"] - if rmsd < best_fit_val: - best_fit_val = rmsd - best_fit_name = function_name - results_by_param[other_parameter_combination] = { - "best": best_fit_name, - "best_rmsd": best_fit_val, - "mean_rmsd": results["mean"]["rmsd"], - "median_rmsd": results["median"]["rmsd"], - "results": results, - } - - best_fit_val = np.inf - best_fit_name = None - results = dict() - for function_name, result in raw_results.items(): - if len(result) > 0: - results[function_name] = {} - for measure in result.keys(): - results[function_name][measure] = np.mean(result[measure]) - rmsd = results[function_name]["rmsd"] - if rmsd < best_fit_val: - best_fit_val = rmsd - best_fit_name = function_name - - return { - "best": best_fit_name, - "best_rmsd": best_fit_val, - "mean_rmsd": np.mean(ref_results["mean"]), - "median_rmsd": np.mean(ref_results["median"]), - "results": results, - "results_by_other_param": results_by_param, - } - - -def _num_args_from_by_name(by_name): - num_args = dict() - for key, value in by_name.items(): - if "args" in value: - num_args[key] = len(value["args"][0]) - return num_args - - -class AnalyticModel: - u""" - Parameter-aware analytic energy/data size/... model. - - Supports both static and parameter-based model attributes, and automatic detection of parameter-dependence. - - These provide measurements aggregated by (function/state/...) name - and (for by_param) parameter values. Layout: - dictionary with one key per name ('send', 'TX', ...) or - one key per name and parameter combination - (('send', (1, 2)), ('send', (2, 3)), ('TX', (1, 2)), ('TX', (2, 3)), ...). - - Parameter values must be ordered corresponding to the lexically sorted parameter names. - - Each element is in turn a dict with the following elements: - - param: list of parameter values in each measurement (-> list of lists) - - attributes: list of keys that should be analyzed, - e.g. ['power', 'duration'] - - for each attribute mentioned in 'attributes': A list with measurements. - All list except for 'attributes' must have the same length. - - For example: - parameters = ['foo_count', 'irrelevant'] - by_name = { - 'foo' : [1, 1, 2], - 'bar' : [5, 6, 7], - 'attributes' : ['foo', 'bar'], - 'param' : [[1, 0], [1, 0], [2, 0]] - } - - methods: - get_static -- return static (parameter-unaware) model. - get_param_lut -- return parameter-aware look-up-table model. Cannot model parameter combinations not present in by_param. - get_fitted -- return parameter-aware model using fitted functions for behaviour prediction. - - variables: - names -- function/state/... names (i.e., the keys of by_name) - parameters -- parameter names - stats -- ParamStats object providing parameter-dependency statistics for each name and attribute - assess -- calculate model quality - """ - - def __init__( - self, - by_name, - parameters, - arg_count=None, - function_override=dict(), - use_corrcoef=False, - ): - """ - Create a new AnalyticModel and compute parameter statistics. 
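For orientation, constructing and querying the model documented here might look as follows. This is a minimal sketch with hypothetical measurements; it assumes that ParamStats copes with such a tiny data set, and the import path follows the new lib/model.py module introduced further down in this commit:

    from dfatool.model import AnalyticModel

    parameters = ["txbytes"]
    by_name = {
        "send": {
            "param": [[16], [16], [32], [32], [64], [64]],
            "attributes": ["duration"],
            "duration": [540, 560, 600, 620, 700, 720],
        }
    }
    model = AnalyticModel(by_name, parameters)
    static = model.get_static()
    print(static("send", "duration"))  # median of all six measurements: 610.0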
- - :param by_name: measurements aggregated by (function/state/...) name. - Layout: dictionary with one key per name ('send', 'TX', ...) or - one key per name and parameter combination - (('send', (1, 2)), ('send', (2, 3)), ('TX', (1, 2)), ('TX', (2, 3)), ...). - - Parameter values must be ordered corresponding to the lexically sorted parameter names. - - Each element is in turn a dict with the following elements: - - param: list of parameter values in each measurement (-> list of lists) - - attributes: list of keys that should be analyzed, - e.g. ['power', 'duration'] - - for each attribute mentioned in 'attributes': A list with measurements. - All list except for 'attributes' must have the same length. - - For example: - parameters = ['foo_count', 'irrelevant'] - by_name = { - 'foo' : [1, 1, 2], - 'duration' : [5, 6, 7], - 'attributes' : ['foo', 'duration'], - 'param' : [[1, 0], [1, 0], [2, 0]] - # foo_count-^ ^-irrelevant - } - :param parameters: List of parameter names - :param function_override: dict of overrides for automatic parameter function generation. - If (state or transition name, model attribute) is present in function_override, - the corresponding text string is the function used for analytic (parameter-aware/fitted) - modeling of this attribute. It is passed to AnalyticFunction, see - there for the required format. Note that this happens regardless of - parameter dependency detection: The provided analytic function will be assigned - even if it seems like the model attribute is static / parameter-independent. - :param use_corrcoef: use correlation coefficient instead of stddev comparison to detect whether a model attribute depends on a parameter - """ - self.cache = dict() - self.by_name = by_name - self.by_param = by_name_to_by_param(by_name) - self.names = sorted(by_name.keys()) - self.parameters = sorted(parameters) - self.function_override = function_override.copy() - self._use_corrcoef = use_corrcoef - self._num_args = arg_count - if self._num_args is None: - self._num_args = _num_args_from_by_name(by_name) - - self.stats = ParamStats( - self.by_name, - self.by_param, - self.parameters, - self._num_args, - use_corrcoef=use_corrcoef, - ) - - def _get_model_from_dict(self, model_dict, model_function): - model = {} - for name, elem in model_dict.items(): - model[name] = {} - for key in elem["attributes"]: - try: - model[name][key] = model_function(elem[key]) - except RuntimeWarning: - logger.warning("Got no data for {} {}".format(name, key)) - except FloatingPointError as fpe: - logger.warning("Got no data for {} {}: {}".format(name, key, fpe)) - return model - - def param_index(self, param_name): - if param_name in self.parameters: - return self.parameters.index(param_name) - return len(self.parameters) + int(param_name) - - def param_name(self, param_index): - if param_index < len(self.parameters): - return self.parameters[param_index] - return str(param_index) - - def get_static(self, use_mean=False): - """ - Get static model function: name, attribute -> model value. - - Uses the median of by_name for modeling. - """ - getter_function = np.median - - if use_mean: - getter_function = np.mean - - static_model = self._get_model_from_dict(self.by_name, getter_function) - - def static_model_getter(name, key, **kwargs): - return static_model[name][key] - - return static_model_getter - - def get_param_lut(self, fallback=False): - """ - Get parameter-look-up-table model function: name, attribute, parameter values -> model value. 
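Continuing the sketch from above, the difference between strict and fallback look-up would be (values hypothetical):

    lut = model.get_param_lut()
    print(lut("send", "duration", param=[16]))      # median of [540, 560]: 550.0
    try:
        lut("send", "duration", param=[128])        # combination not in by_param
    except KeyError:
        print("unknown parameter combination")
    lut_fallback = model.get_param_lut(fallback=True)
    print(lut_fallback("send", "duration", param=[128]))  # static fallback: 610.0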
- - The function can only give model values for parameter combinations - present in by_param. By default, it raises KeyError for other values. - - arguments: - fallback -- Fall back to the (non-parameter-aware) static model when encountering unknown parameter values - """ - static_model = self._get_model_from_dict(self.by_name, np.median) - lut_model = self._get_model_from_dict(self.by_param, np.median) - - def lut_median_getter(name, key, param, arg=[], **kwargs): - param.extend(map(soft_cast_int, arg)) - try: - return lut_model[(name, tuple(param))][key] - except KeyError: - if fallback: - return static_model[name][key] - raise - - return lut_median_getter - - def get_fitted(self, safe_functions_enabled=False): - """ - Get paramete-aware model function and model information function. - - Returns two functions: - model_function(name, attribute, param=parameter values) -> model value. - model_info(name, attribute) -> {'fit_result' : ..., 'function' : ... } or None - """ - if "fitted_model_getter" in self.cache and "fitted_info_getter" in self.cache: - return self.cache["fitted_model_getter"], self.cache["fitted_info_getter"] - - static_model = self._get_model_from_dict(self.by_name, np.median) - param_model = dict([[name, {}] for name in self.by_name.keys()]) - paramfit = ParallelParamFit(self.by_param) - - for name in self.by_name.keys(): - for attribute in self.by_name[name]["attributes"]: - for param_index, param in enumerate(self.parameters): - if self.stats.depends_on_param(name, attribute, param): - paramfit.enqueue(name, attribute, param_index, param, False) - if arg_support_enabled and name in self._num_args: - for arg_index in range(self._num_args[name]): - if self.stats.depends_on_arg(name, attribute, arg_index): - paramfit.enqueue( - name, - attribute, - len(self.parameters) + arg_index, - arg_index, - False, - ) - - paramfit.fit() - - for name in self.by_name.keys(): - num_args = 0 - if name in self._num_args: - num_args = self._num_args[name] - for attribute in self.by_name[name]["attributes"]: - fit_result = paramfit.get_result(name, attribute) - - if (name, attribute) in self.function_override: - function_str = self.function_override[(name, attribute)] - x = AnalyticFunction(function_str, self.parameters, num_args) - x.fit(self.by_param, name, attribute) - if x.fit_success: - param_model[name][attribute] = { - "fit_result": fit_result, - "function": x, - } - elif len(fit_result.keys()): - x = analytic.function_powerset( - fit_result, self.parameters, num_args - ) - x.fit(self.by_param, name, attribute) - - if x.fit_success: - param_model[name][attribute] = { - "fit_result": fit_result, - "function": x, - } - - def model_getter(name, key, **kwargs): - if "arg" in kwargs and "param" in kwargs: - kwargs["param"].extend(map(soft_cast_int, kwargs["arg"])) - if key in param_model[name]: - param_list = kwargs["param"] - param_function = param_model[name][key]["function"] - if param_function.is_predictable(param_list): - return param_function.eval(param_list) - return static_model[name][key] - - def info_getter(name, key): - if key in param_model[name]: - return param_model[name][key] - return None - - self.cache["fitted_model_getter"] = model_getter - self.cache["fitted_info_getter"] = info_getter - - return model_getter, info_getter - - def assess(self, model_function): - """ - Calculate MAE, SMAPE, etc. of model_function for each by_name entry. - - state/transition/... name and parameter values are fed into model_function. 
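Any callable with the getter signature used throughout this class can be assessed. A sketch, reusing the hypothetical model from above; note that assessing a model on its own training data only reports in-sample error, per the cross-validation caveat below:

    static = model.get_static()
    quality = model.assess(static)
    measures = quality["by_name"]["send"]["duration"]
    print(measures["mae"], measures["smape"])  # error measures from regression_measures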
- The by_name entries of this AnalyticModel are used as ground truth and - compared with the values predicted by model_function. - - For proper model assessments, the data used to generate model_function - and the data fed into this AnalyticModel instance must be mutually - exclusive (e.g. by performing cross validation). Otherwise, - overfitting cannot be detected. - """ - detailed_results = {} - for name, elem in sorted(self.by_name.items()): - detailed_results[name] = {} - for attribute in elem["attributes"]: - predicted_data = np.array( - list( - map( - lambda i: model_function( - name, attribute, param=elem["param"][i] - ), - range(len(elem[attribute])), - ) - ) - ) - measures = regression_measures(predicted_data, elem[attribute]) - detailed_results[name][attribute] = measures - - return {"by_name": detailed_results} - - def to_json(self): - # TODO - pass - - def _add_trace_data_to_aggregate(aggregate, key, element): # Only cares about element['isa'], element['offline_aggregates'], and # element['plan']['level'] @@ -1867,531 +1221,6 @@ def pta_trace_to_aggregate(traces, ignore_trace_indexes=[]): return by_name, parameter_names, arg_count -class PTAModel: - u""" - Parameter-aware PTA-based energy model. - - Supports both static and parameter-based model attributes, and automatic detection of parameter-dependence. - - The model heavily relies on two internal data structures: - PTAModel.by_name and PTAModel.by_param. - - These provide measurements aggregated by state/transition name - and (for by_param) parameter values. Layout: - dictionary with one key per state/transition ('send', 'TX', ...) or - one key per state/transition and parameter combination - (('send', (1, 2)), ('send', (2, 3)), ('TX', (1, 2)), ('TX', (2, 3)), ...). - For by_param, parameter values are ordered corresponding to the lexically sorted parameter names. - - Each element is in turn a dict with the following elements: - - isa: 'state' or 'transition' - - power: list of mean power measurements in µW - - duration: list of durations in µs - - power_std: list of stddev of power per state/transition - - energy: consumed energy (power*duration) in pJ - - paramkeys: list of parameter names in each measurement (-> list of lists) - - param: list of parameter values in each measurement (-> list of lists) - - attributes: list of keys that should be analyzed, - e.g. ['power', 'duration'] - additionally, only if isa == 'transition': - - timeout: list of duration of previous state in µs - - rel_energy_prev: transition energy relative to previous state mean power in pJ - - rel_energy_next: transition energy relative to next state mean power in pJ - """ - - def __init__( - self, - by_name, - parameters, - arg_count, - traces=[], - ignore_trace_indexes=[], - discard_outliers=None, - function_override={}, - use_corrcoef=False, - pta=None, - ): - """ - Prepare a new PTA energy model. - - Actual model generation is done on-demand by calling the respective functions. - - arguments: - by_name -- state/transition measurements aggregated by name, as returned by pta_trace_to_aggregate. - parameters -- list of parameter names, as returned by pta_trace_to_aggregate - arg_count -- function arguments, as returned by pta_trace_to_aggregate - traces -- list of preprocessed DFA traces, as returned by RawData.get_preprocessed_data() - ignore_trace_indexes -- list of trace indexes. The corresponding traces will be ignored. - discard_outliers -- currently not supported: threshold for outlier detection and removel (float). 
- Outlier detection is performed individually for each state/transition in each trace, - so it only works if the benchmark ran several times. - Given "data" (a set of measurements of the same thing, e.g. TX duration in the third benchmark trace), - "m" (the median of all attribute measurements with the same parameters, which may include data from other traces), - a data point X is considered an outlier if - | 0.6745 * (X - m) / median(|data - m|) | > discard_outliers . - function_override -- dict of overrides for automatic parameter function generation. - If (state or transition name, model attribute) is present in function_override, - the corresponding text string is the function used for analytic (parameter-aware/fitted) - modeling of this attribute. It is passed to AnalyticFunction, see - there for the required format. Note that this happens regardless of - parameter dependency detection: The provided analytic function will be assigned - even if it seems like the model attribute is static / parameter-independent. - use_corrcoef -- use correlation coefficient instead of stddev comparison - to detect whether a model attribute depends on a parameter - pta -- hardware model as `PTA` object - """ - self.by_name = by_name - self.by_param = by_name_to_by_param(by_name) - self._parameter_names = sorted(parameters) - self._num_args = arg_count - self._use_corrcoef = use_corrcoef - self.traces = traces - self.stats = ParamStats( - self.by_name, - self.by_param, - self._parameter_names, - self._num_args, - self._use_corrcoef, - ) - self.cache = {} - np.seterr("raise") - self._outlier_threshold = discard_outliers - self.function_override = function_override.copy() - self.pta = pta - self.ignore_trace_indexes = ignore_trace_indexes - self._aggregate_to_ndarray(self.by_name) - - def _aggregate_to_ndarray(self, aggregate): - for elem in aggregate.values(): - for key in elem["attributes"]: - elem[key] = np.array(elem[key]) - - # This heuristic is very similar to the "function is not much better than - # median" checks in get_fitted. So far, doing it here as well is mostly - # a performance and not an algorithm quality decision. - # --df, 2018-04-18 - def depends_on_param(self, state_or_trans, key, param): - return self.stats.depends_on_param(state_or_trans, key, param) - - # See notes on depends_on_param - def depends_on_arg(self, state_or_trans, key, param): - return self.stats.depends_on_arg(state_or_trans, key, param) - - def _get_model_from_dict(self, model_dict, model_function): - model = {} - for name, elem in model_dict.items(): - model[name] = {} - for key in elem["attributes"]: - try: - model[name][key] = model_function(elem[key]) - except RuntimeWarning: - logger.warning("Got no data for {} {}".format(name, key)) - except FloatingPointError as fpe: - logger.warning("Got no data for {} {}: {}".format(name, key, fpe)) - return model - - def get_static(self, use_mean=False): - """ - Get static model function: name, attribute -> model value. - - Uses the median of by_name for modeling, unless `use_mean` is set. - """ - getter_function = np.median - - if use_mean: - getter_function = np.mean - - static_model = self._get_model_from_dict(self.by_name, getter_function) - - def static_model_getter(name, key, **kwargs): - return static_model[name][key] - - return static_model_getter - - def get_param_lut(self, fallback=False): - """ - Get parameter-look-up-table model function: name, attribute, parameter values -> model value. 
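For context, the pipeline that produces these constructor arguments is the one named in the docstring above. As a sketch (the archive name is hypothetical; the imports follow this commit's module split):

    from dfatool.dfatool import RawData, pta_trace_to_aggregate
    from dfatool.model import PTAModel

    raw_data = RawData(["benchmark.tar"])
    traces = raw_data.get_preprocessed_data()
    by_name, parameters, arg_count = pta_trace_to_aggregate(traces)
    model = PTAModel(by_name, parameters, arg_count, traces=traces)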
- - The function can only give model values for parameter combinations - present in by_param. By default, it raises KeyError for other values. - - arguments: - fallback -- Fall back to the (non-parameter-aware) static model when encountering unknown parameter values - """ - static_model = self._get_model_from_dict(self.by_name, np.median) - lut_model = self._get_model_from_dict(self.by_param, np.median) - - def lut_median_getter(name, key, param, arg=[], **kwargs): - param.extend(map(soft_cast_int, arg)) - try: - return lut_model[(name, tuple(param))][key] - except KeyError: - if fallback: - return static_model[name][key] - raise - - return lut_median_getter - - def param_index(self, param_name): - if param_name in self._parameter_names: - return self._parameter_names.index(param_name) - return len(self._parameter_names) + int(param_name) - - def param_name(self, param_index): - if param_index < len(self._parameter_names): - return self._parameter_names[param_index] - return str(param_index) - - def get_fitted(self, safe_functions_enabled=False): - """ - Get parameter-aware model function and model information function. - - Returns two functions: - model_function(name, attribute, param=parameter values) -> model value. - model_info(name, attribute) -> {'fit_result' : ..., 'function' : ... } or None - """ - if "fitted_model_getter" in self.cache and "fitted_info_getter" in self.cache: - return self.cache["fitted_model_getter"], self.cache["fitted_info_getter"] - - static_model = self._get_model_from_dict(self.by_name, np.median) - param_model = dict( - [[state_or_tran, {}] for state_or_tran in self.by_name.keys()] - ) - paramfit = ParallelParamFit(self.by_param) - for state_or_tran in self.by_name.keys(): - for model_attribute in self.by_name[state_or_tran]["attributes"]: - fit_results = {} - for parameter_index, parameter_name in enumerate(self._parameter_names): - if self.depends_on_param( - state_or_tran, model_attribute, parameter_name - ): - paramfit.enqueue( - state_or_tran, - model_attribute, - parameter_index, - parameter_name, - safe_functions_enabled, - ) - for ( - codependent_param_dict - ) in self.stats.codependent_parameter_value_dicts( - state_or_tran, model_attribute, parameter_name - ): - paramfit.enqueue( - state_or_tran, - model_attribute, - parameter_index, - parameter_name, - safe_functions_enabled, - codependent_param_dict, - ) - if ( - arg_support_enabled - and self.by_name[state_or_tran]["isa"] == "transition" - ): - for arg_index in range(self._num_args[state_or_tran]): - if self.depends_on_arg( - state_or_tran, model_attribute, arg_index - ): - paramfit.enqueue( - state_or_tran, - model_attribute, - len(self._parameter_names) + arg_index, - arg_index, - safe_functions_enabled, - ) - paramfit.fit() - - for state_or_tran in self.by_name.keys(): - num_args = 0 - if ( - arg_support_enabled - and self.by_name[state_or_tran]["isa"] == "transition" - ): - num_args = self._num_args[state_or_tran] - for model_attribute in self.by_name[state_or_tran]["attributes"]: - fit_results = paramfit.get_result(state_or_tran, model_attribute) - - for parameter_name in self._parameter_names: - if self.depends_on_param( - state_or_tran, model_attribute, parameter_name - ): - for ( - codependent_param_dict - ) in self.stats.codependent_parameter_value_dicts( - state_or_tran, model_attribute, parameter_name - ): - pass - # FIXME paramfit.get_result hat ja gar keinen Parameter als Argument... 
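The function_override branch below expects (name, attribute) keys mapping to an AnalyticFunction definition string. A sketch; the exact string syntax is an assumption here and should be checked against the AnalyticFunction documentation:

    function_override = {
        # assumed AnalyticFunction syntax: regression_arg(i) for fitted
        # coefficients, parameter(name) for model parameters
        ("TX", "power"): "regression_arg(0) + regression_arg(1) * parameter(txpower)",
    }
    model = PTAModel(by_name, parameters, arg_count, function_override=function_override)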
- - if (state_or_tran, model_attribute) in self.function_override: - function_str = self.function_override[ - (state_or_tran, model_attribute) - ] - x = AnalyticFunction(function_str, self._parameter_names, num_args) - x.fit(self.by_param, state_or_tran, model_attribute) - if x.fit_success: - param_model[state_or_tran][model_attribute] = { - "fit_result": fit_results, - "function": x, - } - elif len(fit_results.keys()): - x = analytic.function_powerset( - fit_results, self._parameter_names, num_args - ) - x.fit(self.by_param, state_or_tran, model_attribute) - if x.fit_success: - param_model[state_or_tran][model_attribute] = { - "fit_result": fit_results, - "function": x, - } - - def model_getter(name, key, **kwargs): - if "arg" in kwargs and "param" in kwargs: - kwargs["param"].extend(map(soft_cast_int, kwargs["arg"])) - if key in param_model[name]: - param_list = kwargs["param"] - param_function = param_model[name][key]["function"] - if param_function.is_predictable(param_list): - return param_function.eval(param_list) - return static_model[name][key] - - def info_getter(name, key): - if key in param_model[name]: - return param_model[name][key] - return None - - self.cache["fitted_model_getter"] = model_getter - self.cache["fitted_info_getter"] = info_getter - - return model_getter, info_getter - - def to_json(self): - static_model = self.get_static() - static_quality = self.assess(static_model) - param_model, param_info = self.get_fitted() - analytic_quality = self.assess(param_model) - self.pta.update( - static_model, - param_info, - static_error=static_quality["by_name"], - analytic_error=analytic_quality["by_name"], - ) - return self.pta.to_json() - - def states(self): - """Return sorted list of state names.""" - return sorted( - list( - filter(lambda k: self.by_name[k]["isa"] == "state", self.by_name.keys()) - ) - ) - - def transitions(self): - """Return sorted list of transition names.""" - return sorted( - list( - filter( - lambda k: self.by_name[k]["isa"] == "transition", - self.by_name.keys(), - ) - ) - ) - - def states_and_transitions(self): - """Return list of states and transition names.""" - ret = self.states() - ret.extend(self.transitions()) - return ret - - def parameters(self): - return self._parameter_names - - def attributes(self, state_or_trans): - return self.by_name[state_or_trans]["attributes"] - - def assess(self, model_function): - """ - Calculate MAE, SMAPE, etc. of model_function for each by_name entry. - - state/transition/... name and parameter values are fed into model_function. - The by_name entries of this PTAModel are used as ground truth and - compared with the values predicted by model_function. - - For proper model assessments, the data used to generate model_function - and the data fed into this AnalyticModel instance must be mutually - exclusive (e.g. by performing cross validation). Otherwise, - overfitting cannot be detected. 
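The held-out evaluation pattern implied by this caveat, as a sketch (train_model and holdout_model are assumed to be PTAModel instances built from two disjoint measurement sets, e.g. separate benchmark runs):

    fitted_model, fitted_info = train_model.get_fitted()
    quality = holdout_model.assess(fitted_model)
    print(quality["by_name"]["TX"]["power"]["smape"])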
- """ - detailed_results = {} - for name, elem in sorted(self.by_name.items()): - detailed_results[name] = {} - for key in elem["attributes"]: - predicted_data = np.array( - list( - map( - lambda i: model_function(name, key, param=elem["param"][i]), - range(len(elem[key])), - ) - ) - ) - measures = regression_measures(predicted_data, elem[key]) - detailed_results[name][key] = measures - - return {"by_name": detailed_results} - - def assess_states( - self, model_function, model_attribute="power", distribution: dict = None - ): - """ - Calculate overall model error assuming equal distribution of states - """ - # TODO calculate mean power draw for distribution and use it to - # calculate relative error from MAE combination - model_quality = self.assess(model_function) - num_states = len(self.states()) - if distribution is None: - distribution = dict(map(lambda x: [x, 1 / num_states], self.states())) - - if not np.isclose(sum(distribution.values()), 1): - raise ValueError( - "distribution must be a probability distribution with sum 1" - ) - - # total_value = None - # try: - # total_value = sum(map(lambda x: model_function(x, model_attribute) * distribution[x], self.states())) - # except KeyError: - # pass - - total_error = np.sqrt( - sum( - map( - lambda x: np.square( - model_quality["by_name"][x][model_attribute]["mae"] - * distribution[x] - ), - self.states(), - ) - ) - ) - return total_error - - def assess_on_traces(self, model_function): - """ - Calculate MAE, SMAPE, etc. of model_function for each trace known to this PTAModel instance. - - :returns: dict of `duration_by_trace`, `energy_by_trace`, `timeout_by_trace`, `rel_energy_by_trace` and `state_energy_by_trace`. - Each entry holds regression measures for the corresponding measure. Note that the determined model quality heavily depends on the - traces: small-ish absolute errors in states which frequently occur may have more effect than large absolute errors in rarely occuring states - """ - model_energy_list = [] - real_energy_list = [] - model_rel_energy_list = [] - model_state_energy_list = [] - model_duration_list = [] - real_duration_list = [] - model_timeout_list = [] - real_timeout_list = [] - - for trace in self.traces: - if trace["id"] not in self.ignore_trace_indexes: - for rep_id in range(len(trace["trace"][0]["offline"])): - model_energy = 0.0 - real_energy = 0.0 - model_rel_energy = 0.0 - model_state_energy = 0.0 - model_duration = 0.0 - real_duration = 0.0 - model_timeout = 0.0 - real_timeout = 0.0 - for i, trace_part in enumerate(trace["trace"]): - name = trace_part["name"] - prev_name = trace["trace"][i - 1]["name"] - isa = trace_part["isa"] - if name != "UNINITIALIZED": - try: - param = trace_part["offline_aggregates"]["param"][ - rep_id - ] - prev_param = trace["trace"][i - 1][ - "offline_aggregates" - ]["param"][rep_id] - power = trace_part["offline"][rep_id]["uW_mean"] - duration = trace_part["offline"][rep_id]["us"] - prev_duration = trace["trace"][i - 1]["offline"][ - rep_id - ]["us"] - real_energy += power * duration - if isa == "state": - model_energy += ( - model_function(name, "power", param=param) - * duration - ) - else: - model_energy += model_function( - name, "energy", param=param - ) - # If i == 1, the previous state was UNINITIALIZED, for which we do not have model data - if i == 1: - model_rel_energy += model_function( - name, "energy", param=param - ) - else: - model_rel_energy += model_function( - prev_name, "power", param=prev_param - ) * (prev_duration + duration) - model_state_energy += 
model_function( - prev_name, "power", param=prev_param - ) * (prev_duration + duration) - model_rel_energy += model_function( - name, "rel_energy_prev", param=param - ) - real_duration += duration - model_duration += model_function( - name, "duration", param=param - ) - if ( - "plan" in trace_part - and trace_part["plan"]["level"] == "epilogue" - ): - real_timeout += trace_part["offline"][rep_id][ - "timeout" - ] - model_timeout += model_function( - name, "timeout", param=param - ) - except KeyError: - # if states/transitions have been removed via --filter-param, this is harmless - pass - real_energy_list.append(real_energy) - model_energy_list.append(model_energy) - model_rel_energy_list.append(model_rel_energy) - model_state_energy_list.append(model_state_energy) - real_duration_list.append(real_duration) - model_duration_list.append(model_duration) - real_timeout_list.append(real_timeout) - model_timeout_list.append(model_timeout) - - return { - "duration_by_trace": regression_measures( - np.array(model_duration_list), np.array(real_duration_list) - ), - "energy_by_trace": regression_measures( - np.array(model_energy_list), np.array(real_energy_list) - ), - "timeout_by_trace": regression_measures( - np.array(model_timeout_list), np.array(real_timeout_list) - ), - "rel_energy_by_trace": regression_measures( - np.array(model_rel_energy_list), np.array(real_energy_list) - ), - "state_energy_by_trace": regression_measures( - np.array(model_state_energy_list), np.array(real_energy_list) - ), - } - - class EnergyTraceLog: """ EnergyTrace log loader for DFA traces. diff --git a/lib/model.py b/lib/model.py new file mode 100644 index 0000000..d83c12c --- /dev/null +++ b/lib/model.py @@ -0,0 +1,1186 @@ +#!/usr/bin/env python3 + +import logging +import numpy as np +from scipy import optimize +from sklearn.metrics import r2_score +from multiprocessing import Pool +from .functions import analytic +from .functions import AnalyticFunction +from .parameters import ParamStats +from .utils import is_numeric, soft_cast_int, param_slice_eq, remove_index_from_tuple +from .utils import by_name_to_by_param, match_parameter_values + +logger = logging.getLogger(__name__) +arg_support_enabled = True + + +def aggregate_measures(aggregate: float, actual: list) -> dict: + """ + Calculate error measures for model value on data list. + + arguments: + aggregate -- model value (float or int) + actual -- real-world / reference values (list of float or int) + + return value: + See regression_measures + """ + aggregate_array = np.array([aggregate] * len(actual)) + return regression_measures(aggregate_array, np.array(actual)) + + +def regression_measures(predicted: np.ndarray, actual: np.ndarray): + """ + Calculate error measures by comparing model values to reference values. 
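To make the measure definitions below concrete, a small hand-computed example (values chosen by hand, not part of the library):

    import numpy as np

    predicted = np.array([10.0, 12.0, 14.0])
    actual = np.array([11.0, 12.0, 16.0])
    deviations = predicted - actual                # [-1, 0, -2]
    mae = np.mean(np.abs(deviations))              # 1.0
    rmsd = np.sqrt(np.mean(deviations ** 2))       # sqrt(5/3) ~ 1.29
    smape = 100 * np.mean(
        np.abs(deviations) / ((np.abs(predicted) + np.abs(actual)) / 2)
    )                                              # ~ 7.6 %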
+
+    arguments:
+    predicted -- model values (np.ndarray)
+    actual -- real-world / reference values (np.ndarray)
+
+    Returns a dict containing the following measures:
+    mae -- Mean Absolute Error
+    mape -- Mean Absolute Percentage Error,
+            if all items in actual are non-zero (NaN otherwise)
+    smape -- Symmetric Mean Absolute Percentage Error,
+             if no 0,0-pairs are present in actual and predicted (NaN otherwise)
+    msd -- Mean Square Deviation
+    rmsd -- Root Mean Square Deviation
+    ssr -- Sum of Squared Residuals
+    rsq -- R^2 measure, see sklearn.metrics.r2_score
+    count -- Number of values
+    """
+    if type(predicted) != np.ndarray:
+        raise ValueError("first arg must be ndarray, is {}".format(type(predicted)))
+    if type(actual) != np.ndarray:
+        raise ValueError("second arg must be ndarray, is {}".format(type(actual)))
+    deviations = predicted - actual
+    # mean = np.mean(actual)
+    if len(deviations) == 0:
+        return {}
+    measures = {
+        "mae": np.mean(np.abs(deviations), dtype=np.float64),
+        "msd": np.mean(deviations ** 2, dtype=np.float64),
+        "rmsd": np.sqrt(np.mean(deviations ** 2), dtype=np.float64),
+        "ssr": np.sum(deviations ** 2, dtype=np.float64),
+        "rsq": r2_score(actual, predicted),
+        "count": len(actual),
+    }
+
+    # rsq_quotient = np.sum((actual - mean)**2, dtype=np.float64) * np.sum((predicted - mean)**2, dtype=np.float64)
+
+    if np.all(actual != 0):
+        measures["mape"] = np.mean(np.abs(deviations / actual)) * 100  # bad measure
+    else:
+        measures["mape"] = np.nan
+    if np.all(np.abs(predicted) + np.abs(actual) != 0):
+        measures["smape"] = (
+            np.mean(np.abs(deviations) / ((np.abs(predicted) + np.abs(actual)) / 2))
+            * 100
+        )
+    else:
+        measures["smape"] = np.nan
+    # if np.all(rsq_quotient != 0):
+    #     measures['rsq'] = (np.sum((actual - mean) * (predicted - mean), dtype=np.float64)**2) / rsq_quotient
+
+    return measures
+
+
+class ParallelParamFit:
+    """
+    Fit a set of functions on parameterized measurements.
+
+    One parameter is variable, all others are fixed. Reports the best-fitting
+    function type for each parameter.
+    """
+
+    def __init__(self, by_param):
+        """Create a new ParallelParamFit object."""
+        self.fit_queue = []
+        self.by_param = by_param
+
+    def enqueue(
+        self,
+        state_or_tran,
+        attribute,
+        param_index,
+        param_name,
+        safe_functions_enabled=False,
+        param_filter=None,
+    ):
+        """
+        Add state_or_tran/attribute/param_name to fit queue.
+
+        This causes fit() to compute the best-fitting function for this model part.
+        """
+        self.fit_queue.append(
+            {
+                "key": [state_or_tran, attribute, param_name, param_filter],
+                "args": [
+                    self.by_param,
+                    state_or_tran,
+                    attribute,
+                    param_index,
+                    safe_functions_enabled,
+                    param_filter,
+                ],
+            }
+        )
+
+    def fit(self):
+        """
+        Fit functions on previously enqueued data.
+
+        Fitting is done in parallel with one process per core.
+
+        Results can be accessed using the public ParallelParamFit.results object.
+        """
+        with Pool() as pool:
+            self.results = pool.map(_try_fits_parallel, self.fit_queue)
+
+    def get_result(self, name, attribute, param_filter: dict = None):
+        """
+        Parse and sanitize fit results for state/transition/... 'name' and model attribute 'attribute'.
+
+        Filters out results where the best function is worse (or not much better than) static mean/median estimates.
+
+        :param name: state/transition/... name, e.g. 'TX'
+        :param attribute: model attribute, e.g. 'duration'
+        :param param_filter: only consider results obtained with this param_filter (as passed to `enqueue`); None by default
+        :returns: dict with fit result (see `_try_fits`) for each successfully fitted parameter. E.g.
{'param 1': {'best' : 'function name', ...} }
+        """
+        fit_result = dict()
+        for result in self.results:
+            if (
+                result["key"][0] == name
+                and result["key"][1] == attribute
+                and result["key"][3] == param_filter
+                and result["result"]["best"] is not None
+            ):  # probably due to ['best'] != None -> does the fit fail for filtered data?
+                this_result = result["result"]
+                if this_result["best_rmsd"] >= min(
+                    this_result["mean_rmsd"], this_result["median_rmsd"]
+                ):
+                    logger.debug(
+                        "Not modeling {} {} as function of {}: best ({:.0f}) is worse than ref ({:.0f}, {:.0f})".format(
+                            name,
+                            attribute,
+                            result["key"][2],
+                            this_result["best_rmsd"],
+                            this_result["mean_rmsd"],
+                            this_result["median_rmsd"],
+                        )
+                    )
+                # See notes on depends_on_param
+                elif this_result["best_rmsd"] >= 0.8 * min(
+                    this_result["mean_rmsd"], this_result["median_rmsd"]
+                ):
+                    logger.debug(
+                        "Not modeling {} {} as function of {}: best ({:.0f}) is not much better than ref ({:.0f}, {:.0f})".format(
+                            name,
+                            attribute,
+                            result["key"][2],
+                            this_result["best_rmsd"],
+                            this_result["mean_rmsd"],
+                            this_result["median_rmsd"],
+                        )
+                    )
+                else:
+                    fit_result[result["key"][2]] = this_result
+        return fit_result
+
+
+def _try_fits_parallel(arg):
+    """
+    Call _try_fits(*arg['args']) and return arg['key'] and the _try_fits result.
+
+    Must be a global function as it is called from a multiprocessing Pool.
+    """
+    return {"key": arg["key"], "result": _try_fits(*arg["args"])}
+
+
+def _try_fits(
+    by_param,
+    state_or_tran,
+    model_attribute,
+    param_index,
+    safe_functions_enabled=False,
+    param_filter: dict = None,
+):
+    """
+    Determine goodness-of-fit for prediction of `by_param[(state_or_tran, *)][model_attribute]` dependence on `param_index` using various functions.
+
+    This is done by varying `param_index` while keeping all other parameters constant and doing one least squares optimization for each function and for each combination of the remaining parameters.
+    The value of the parameter corresponding to `param_index` (e.g. txpower or packet length) is the sole input to the model function.
+    Only numeric parameter values (as determined by `utils.is_numeric`) are used for fitting, non-numeric values such as None or enum strings are ignored.
+    Fitting is only performed if at least three distinct parameter values exist in `by_param[(state_or_tran, *)]`.
+
+    :returns: a dictionary with the following elements:
+        best -- name of the best-fitting function (see `analytic.functions`). `None` in case of insufficient data.
+        best_rmsd -- mean Root Mean Square Deviation of best-fitting function over all combinations of the remaining parameters
+        mean_rmsd -- mean Root Mean Square Deviation of a reference model using the mean of its respective input data as model value
+        median_rmsd -- mean Root Mean Square Deviation of a reference model using the median of its respective input data as model value
+        results -- mean goodness-of-fit measures for the individual functions. See `analytic.functions` for keys and `aggregate_measures` for values
+
+    :param by_param: measurements partitioned by state/transition/... name and parameter values.
+        Example: `{('foo', (0, 2)): {'bar': [2]}, ('foo', (0, 4)): {'bar': [4]}, ('foo', (0, 6)): {'bar': [6]}}`
+
+    :param state_or_tran: state/transition/... name for which goodness-of-fit will be calculated (first element of by_param key tuple).
+        Example: `'foo'`
+
+    :param model_attribute: attribute for which goodness-of-fit will be calculated.
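The slicing described here is easiest to see on the docstring's toy example, slightly extended (attribute values are hypothetical):

    by_param = {
        ("foo", (0, 2)): {"param": [[0, 2]], "bar": [2.1]},
        ("foo", (0, 4)): {"param": [[0, 4]], "bar": [4.2]},
        ("foo", (0, 6)): {"param": [[0, 6]], "bar": [5.9]},
        ("foo", (1, 2)): {"param": [[1, 2]], "bar": [3.0]},
    }
    # With param_index == 1, the slice ('foo', (0, *)) yields X = [2, 4, 6] and
    # Y = [2.1, 4.2, 5.9] and is fitted; the slice ('foo', (1, *)) has only one
    # distinct parameter value and is skipped (num_valid <= 2).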
+ Example: `'bar'` + + :param param_index: index of the parameter used as model input + :param safe_functions_enabled: Include "safe" variants of functions with limited argument range. + :param param_filter: Only use measurements whose parameters match param_filter for fitting. + """ + + functions = analytic.functions(safe_functions_enabled=safe_functions_enabled) + + for param_key in filter(lambda x: x[0] == state_or_tran, by_param.keys()): + # We might remove elements from 'functions' while iterating over + # its keys. A generator will not allow this, so we need to + # convert to a list. + function_names = list(functions.keys()) + for function_name in function_names: + function_object = functions[function_name] + if is_numeric(param_key[1][param_index]) and not function_object.is_valid( + param_key[1][param_index] + ): + functions.pop(function_name, None) + + raw_results = dict() + raw_results_by_param = dict() + ref_results = {"mean": list(), "median": list()} + results = dict() + results_by_param = dict() + + seen_parameter_combinations = set() + + # for each parameter combination: + for param_key in filter( + lambda x: x[0] == state_or_tran + and remove_index_from_tuple(x[1], param_index) + not in seen_parameter_combinations + and len(by_param[x]["param"]) + and match_parameter_values(by_param[x]["param"][0], param_filter), + by_param.keys(), + ): + X = [] + Y = [] + num_valid = 0 + num_total = 0 + + # Ensure that each parameter combination is only optimized once. Otherwise, with parameters (1, 2, 5), (1, 3, 5), (1, 4, 5) and param_index == 1, + # the parameter combination (1, *, 5) would be optimized three times, both wasting time and biasing results towards more frequently occuring combinations of non-param_index parameters + seen_parameter_combinations.add( + remove_index_from_tuple(param_key[1], param_index) + ) + + # for each value of the parameter denoted by param_index (all other parameters remain the same): + for k, v in filter( + lambda kv: param_slice_eq(kv[0], param_key, param_index), by_param.items() + ): + num_total += 1 + if is_numeric(k[1][param_index]): + num_valid += 1 + X.extend([float(k[1][param_index])] * len(v[model_attribute])) + Y.extend(v[model_attribute]) + + if num_valid > 2: + X = np.array(X) + Y = np.array(Y) + other_parameters = remove_index_from_tuple(k[1], param_index) + raw_results_by_param[other_parameters] = dict() + results_by_param[other_parameters] = dict() + for function_name, param_function in functions.items(): + if function_name not in raw_results: + raw_results[function_name] = dict() + error_function = param_function.error_function + res = optimize.least_squares( + error_function, [0, 1], args=(X, Y), xtol=2e-15 + ) + measures = regression_measures(param_function.eval(res.x, X), Y) + raw_results_by_param[other_parameters][function_name] = measures + for measure, error_rate in measures.items(): + if measure not in raw_results[function_name]: + raw_results[function_name][measure] = list() + raw_results[function_name][measure].append(error_rate) + # print(function_name, res, measures) + mean_measures = aggregate_measures(np.mean(Y), Y) + ref_results["mean"].append(mean_measures["rmsd"]) + raw_results_by_param[other_parameters]["mean"] = mean_measures + median_measures = aggregate_measures(np.median(Y), Y) + ref_results["median"].append(median_measures["rmsd"]) + raw_results_by_param[other_parameters]["median"] = median_measures + + if not len(ref_results["mean"]): + # Insufficient data for fitting + # print('[W] Insufficient data for fitting 
{}/{}/{}'.format(state_or_tran, model_attribute, param_index)) + return {"best": None, "best_rmsd": np.inf, "results": results} + + for ( + other_parameter_combination, + other_parameter_results, + ) in raw_results_by_param.items(): + best_fit_val = np.inf + best_fit_name = None + results = dict() + for function_name, result in other_parameter_results.items(): + if len(result) > 0: + results[function_name] = result + rmsd = result["rmsd"] + if rmsd < best_fit_val: + best_fit_val = rmsd + best_fit_name = function_name + results_by_param[other_parameter_combination] = { + "best": best_fit_name, + "best_rmsd": best_fit_val, + "mean_rmsd": results["mean"]["rmsd"], + "median_rmsd": results["median"]["rmsd"], + "results": results, + } + + best_fit_val = np.inf + best_fit_name = None + results = dict() + for function_name, result in raw_results.items(): + if len(result) > 0: + results[function_name] = {} + for measure in result.keys(): + results[function_name][measure] = np.mean(result[measure]) + rmsd = results[function_name]["rmsd"] + if rmsd < best_fit_val: + best_fit_val = rmsd + best_fit_name = function_name + + return { + "best": best_fit_name, + "best_rmsd": best_fit_val, + "mean_rmsd": np.mean(ref_results["mean"]), + "median_rmsd": np.mean(ref_results["median"]), + "results": results, + "results_by_other_param": results_by_param, + } + + +def _num_args_from_by_name(by_name): + num_args = dict() + for key, value in by_name.items(): + if "args" in value: + num_args[key] = len(value["args"][0]) + return num_args + + +class AnalyticModel: + u""" + Parameter-aware analytic energy/data size/... model. + + Supports both static and parameter-based model attributes, and automatic detection of parameter-dependence. + + These provide measurements aggregated by (function/state/...) name + and (for by_param) parameter values. Layout: + dictionary with one key per name ('send', 'TX', ...) or + one key per name and parameter combination + (('send', (1, 2)), ('send', (2, 3)), ('TX', (1, 2)), ('TX', (2, 3)), ...). + + Parameter values must be ordered corresponding to the lexically sorted parameter names. + + Each element is in turn a dict with the following elements: + - param: list of parameter values in each measurement (-> list of lists) + - attributes: list of keys that should be analyzed, + e.g. ['power', 'duration'] + - for each attribute mentioned in 'attributes': A list with measurements. + All list except for 'attributes' must have the same length. + + For example: + parameters = ['foo_count', 'irrelevant'] + by_name = { + 'foo' : [1, 1, 2], + 'bar' : [5, 6, 7], + 'attributes' : ['foo', 'bar'], + 'param' : [[1, 0], [1, 0], [2, 0]] + } + + methods: + get_static -- return static (parameter-unaware) model. + get_param_lut -- return parameter-aware look-up-table model. Cannot model parameter combinations not present in by_param. + get_fitted -- return parameter-aware model using fitted functions for behaviour prediction. + + variables: + names -- function/state/... names (i.e., the keys of by_name) + parameters -- parameter names + stats -- ParamStats object providing parameter-dependency statistics for each name and attribute + assess -- calculate model quality + """ + + def __init__( + self, + by_name, + parameters, + arg_count=None, + function_override=dict(), + use_corrcoef=False, + ): + """ + Create a new AnalyticModel and compute parameter statistics. + + :param by_name: measurements aggregated by (function/state/...) name. + Layout: dictionary with one key per name ('send', 'TX', ...) 
or + one key per name and parameter combination + (('send', (1, 2)), ('send', (2, 3)), ('TX', (1, 2)), ('TX', (2, 3)), ...). + + Parameter values must be ordered corresponding to the lexically sorted parameter names. + + Each element is in turn a dict with the following elements: + - param: list of parameter values in each measurement (-> list of lists) + - attributes: list of keys that should be analyzed, + e.g. ['power', 'duration'] + - for each attribute mentioned in 'attributes': A list with measurements. + All list except for 'attributes' must have the same length. + + For example: + parameters = ['foo_count', 'irrelevant'] + by_name = { + 'foo' : [1, 1, 2], + 'duration' : [5, 6, 7], + 'attributes' : ['foo', 'duration'], + 'param' : [[1, 0], [1, 0], [2, 0]] + # foo_count-^ ^-irrelevant + } + :param parameters: List of parameter names + :param function_override: dict of overrides for automatic parameter function generation. + If (state or transition name, model attribute) is present in function_override, + the corresponding text string is the function used for analytic (parameter-aware/fitted) + modeling of this attribute. It is passed to AnalyticFunction, see + there for the required format. Note that this happens regardless of + parameter dependency detection: The provided analytic function will be assigned + even if it seems like the model attribute is static / parameter-independent. + :param use_corrcoef: use correlation coefficient instead of stddev comparison to detect whether a model attribute depends on a parameter + """ + self.cache = dict() + self.by_name = by_name + self.by_param = by_name_to_by_param(by_name) + self.names = sorted(by_name.keys()) + self.parameters = sorted(parameters) + self.function_override = function_override.copy() + self._use_corrcoef = use_corrcoef + self._num_args = arg_count + if self._num_args is None: + self._num_args = _num_args_from_by_name(by_name) + + self.stats = ParamStats( + self.by_name, + self.by_param, + self.parameters, + self._num_args, + use_corrcoef=use_corrcoef, + ) + + def _get_model_from_dict(self, model_dict, model_function): + model = {} + for name, elem in model_dict.items(): + model[name] = {} + for key in elem["attributes"]: + try: + model[name][key] = model_function(elem[key]) + except RuntimeWarning: + logger.warning("Got no data for {} {}".format(name, key)) + except FloatingPointError as fpe: + logger.warning("Got no data for {} {}: {}".format(name, key, fpe)) + return model + + def param_index(self, param_name): + if param_name in self.parameters: + return self.parameters.index(param_name) + return len(self.parameters) + int(param_name) + + def param_name(self, param_index): + if param_index < len(self.parameters): + return self.parameters[param_index] + return str(param_index) + + def get_static(self, use_mean=False): + """ + Get static model function: name, attribute -> model value. + + Uses the median of by_name for modeling. + """ + getter_function = np.median + + if use_mean: + getter_function = np.mean + + static_model = self._get_model_from_dict(self.by_name, getter_function) + + def static_model_getter(name, key, **kwargs): + return static_model[name][key] + + return static_model_getter + + def get_param_lut(self, fallback=False): + """ + Get parameter-look-up-table model function: name, attribute, parameter values -> model value. + + The function can only give model values for parameter combinations + present in by_param. By default, it raises KeyError for other values. 
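A quick illustration of why get_static above defaults to the median rather than the mean (hand-picked values with one outlier):

    import numpy as np

    samples = [99.0, 100.0, 101.0, 250.0]
    print(np.median(samples))  # 100.5 -- default static model value
    print(np.mean(samples))    # 137.5 -- with use_mean=True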
+ + arguments: + fallback -- Fall back to the (non-parameter-aware) static model when encountering unknown parameter values + """ + static_model = self._get_model_from_dict(self.by_name, np.median) + lut_model = self._get_model_from_dict(self.by_param, np.median) + + def lut_median_getter(name, key, param, arg=[], **kwargs): + param.extend(map(soft_cast_int, arg)) + try: + return lut_model[(name, tuple(param))][key] + except KeyError: + if fallback: + return static_model[name][key] + raise + + return lut_median_getter + + def get_fitted(self, safe_functions_enabled=False): + """ + Get paramete-aware model function and model information function. + + Returns two functions: + model_function(name, attribute, param=parameter values) -> model value. + model_info(name, attribute) -> {'fit_result' : ..., 'function' : ... } or None + """ + if "fitted_model_getter" in self.cache and "fitted_info_getter" in self.cache: + return self.cache["fitted_model_getter"], self.cache["fitted_info_getter"] + + static_model = self._get_model_from_dict(self.by_name, np.median) + param_model = dict([[name, {}] for name in self.by_name.keys()]) + paramfit = ParallelParamFit(self.by_param) + + for name in self.by_name.keys(): + for attribute in self.by_name[name]["attributes"]: + for param_index, param in enumerate(self.parameters): + if self.stats.depends_on_param(name, attribute, param): + paramfit.enqueue(name, attribute, param_index, param, False) + if arg_support_enabled and name in self._num_args: + for arg_index in range(self._num_args[name]): + if self.stats.depends_on_arg(name, attribute, arg_index): + paramfit.enqueue( + name, + attribute, + len(self.parameters) + arg_index, + arg_index, + False, + ) + + paramfit.fit() + + for name in self.by_name.keys(): + num_args = 0 + if name in self._num_args: + num_args = self._num_args[name] + for attribute in self.by_name[name]["attributes"]: + fit_result = paramfit.get_result(name, attribute) + + if (name, attribute) in self.function_override: + function_str = self.function_override[(name, attribute)] + x = AnalyticFunction(function_str, self.parameters, num_args) + x.fit(self.by_param, name, attribute) + if x.fit_success: + param_model[name][attribute] = { + "fit_result": fit_result, + "function": x, + } + elif len(fit_result.keys()): + x = analytic.function_powerset( + fit_result, self.parameters, num_args + ) + x.fit(self.by_param, name, attribute) + + if x.fit_success: + param_model[name][attribute] = { + "fit_result": fit_result, + "function": x, + } + + def model_getter(name, key, **kwargs): + if "arg" in kwargs and "param" in kwargs: + kwargs["param"].extend(map(soft_cast_int, kwargs["arg"])) + if key in param_model[name]: + param_list = kwargs["param"] + param_function = param_model[name][key]["function"] + if param_function.is_predictable(param_list): + return param_function.eval(param_list) + return static_model[name][key] + + def info_getter(name, key): + if key in param_model[name]: + return param_model[name][key] + return None + + self.cache["fitted_model_getter"] = model_getter + self.cache["fitted_info_getter"] = info_getter + + return model_getter, info_getter + + def assess(self, model_function): + """ + Calculate MAE, SMAPE, etc. of model_function for each by_name entry. + + state/transition/... name and parameter values are fed into model_function. + The by_name entries of this AnalyticModel are used as ground truth and + compared with the values predicted by model_function. 
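+
+        Typical usage (sketch; 'TX' and 'power' are illustrative names):
+
+            fitted_model, fitted_info = model.get_fitted()
+            quality = model.assess(fitted_model)
+            quality['by_name']['TX']['power']['mae']  # mean absolute error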
+ + For proper model assessments, the data used to generate model_function + and the data fed into this AnalyticModel instance must be mutually + exclusive (e.g. by performing cross validation). Otherwise, + overfitting cannot be detected. + """ + detailed_results = {} + for name, elem in sorted(self.by_name.items()): + detailed_results[name] = {} + for attribute in elem["attributes"]: + predicted_data = np.array( + list( + map( + lambda i: model_function( + name, attribute, param=elem["param"][i] + ), + range(len(elem[attribute])), + ) + ) + ) + measures = regression_measures(predicted_data, elem[attribute]) + detailed_results[name][attribute] = measures + + return {"by_name": detailed_results} + + def to_json(self): + # TODO + pass + + +class PTAModel: + u""" + Parameter-aware PTA-based energy model. + + Supports both static and parameter-based model attributes, and automatic detection of parameter-dependence. + + The model heavily relies on two internal data structures: + PTAModel.by_name and PTAModel.by_param. + + These provide measurements aggregated by state/transition name + and (for by_param) parameter values. Layout: + dictionary with one key per state/transition ('send', 'TX', ...) or + one key per state/transition and parameter combination + (('send', (1, 2)), ('send', (2, 3)), ('TX', (1, 2)), ('TX', (2, 3)), ...). + For by_param, parameter values are ordered corresponding to the lexically sorted parameter names. + + Each element is in turn a dict with the following elements: + - isa: 'state' or 'transition' + - power: list of mean power measurements in µW + - duration: list of durations in µs + - power_std: list of stddev of power per state/transition + - energy: consumed energy (power*duration) in pJ + - paramkeys: list of parameter names in each measurement (-> list of lists) + - param: list of parameter values in each measurement (-> list of lists) + - attributes: list of keys that should be analyzed, + e.g. ['power', 'duration'] + additionally, only if isa == 'transition': + - timeout: list of duration of previous state in µs + - rel_energy_prev: transition energy relative to previous state mean power in pJ + - rel_energy_next: transition energy relative to next state mean power in pJ + """ + + def __init__( + self, + by_name, + parameters, + arg_count, + traces=[], + ignore_trace_indexes=[], + discard_outliers=None, + function_override={}, + use_corrcoef=False, + pta=None, + ): + """ + Prepare a new PTA energy model. + + Actual model generation is done on-demand by calling the respective functions. + + arguments: + by_name -- state/transition measurements aggregated by name, as returned by pta_trace_to_aggregate. + parameters -- list of parameter names, as returned by pta_trace_to_aggregate + arg_count -- function arguments, as returned by pta_trace_to_aggregate + traces -- list of preprocessed DFA traces, as returned by RawData.get_preprocessed_data() + ignore_trace_indexes -- list of trace indexes. The corresponding traces will be ignored. + discard_outliers -- currently not supported: threshold for outlier detection and removel (float). + Outlier detection is performed individually for each state/transition in each trace, + so it only works if the benchmark ran several times. + Given "data" (a set of measurements of the same thing, e.g. 
TX duration in the third benchmark trace), + "m" (the median of all attribute measurements with the same parameters, which may include data from other traces), + a data point X is considered an outlier if + | 0.6745 * (X - m) / median(|data - m|) | > discard_outliers . + function_override -- dict of overrides for automatic parameter function generation. + If (state or transition name, model attribute) is present in function_override, + the corresponding text string is the function used for analytic (parameter-aware/fitted) + modeling of this attribute. It is passed to AnalyticFunction, see + there for the required format. Note that this happens regardless of + parameter dependency detection: The provided analytic function will be assigned + even if it seems like the model attribute is static / parameter-independent. + use_corrcoef -- use correlation coefficient instead of stddev comparison + to detect whether a model attribute depends on a parameter + pta -- hardware model as `PTA` object + """ + self.by_name = by_name + self.by_param = by_name_to_by_param(by_name) + self._parameter_names = sorted(parameters) + self._num_args = arg_count + self._use_corrcoef = use_corrcoef + self.traces = traces + self.stats = ParamStats( + self.by_name, + self.by_param, + self._parameter_names, + self._num_args, + self._use_corrcoef, + ) + self.cache = {} + np.seterr("raise") + self._outlier_threshold = discard_outliers + self.function_override = function_override.copy() + self.pta = pta + self.ignore_trace_indexes = ignore_trace_indexes + self._aggregate_to_ndarray(self.by_name) + + def _aggregate_to_ndarray(self, aggregate): + for elem in aggregate.values(): + for key in elem["attributes"]: + elem[key] = np.array(elem[key]) + + # This heuristic is very similar to the "function is not much better than + # median" checks in get_fitted. So far, doing it here as well is mostly + # a performance and not an algorithm quality decision. + # --df, 2018-04-18 + def depends_on_param(self, state_or_trans, key, param): + return self.stats.depends_on_param(state_or_trans, key, param) + + # See notes on depends_on_param + def depends_on_arg(self, state_or_trans, key, param): + return self.stats.depends_on_arg(state_or_trans, key, param) + + def _get_model_from_dict(self, model_dict, model_function): + model = {} + for name, elem in model_dict.items(): + model[name] = {} + for key in elem["attributes"]: + try: + model[name][key] = model_function(elem[key]) + except RuntimeWarning: + logger.warning("Got no data for {} {}".format(name, key)) + except FloatingPointError as fpe: + logger.warning("Got no data for {} {}: {}".format(name, key, fpe)) + return model + + def get_static(self, use_mean=False): + """ + Get static model function: name, attribute -> model value. + + Uses the median of by_name for modeling, unless `use_mean` is set. + """ + getter_function = np.median + + if use_mean: + getter_function = np.mean + + static_model = self._get_model_from_dict(self.by_name, getter_function) + + def static_model_getter(name, key, **kwargs): + return static_model[name][key] + + return static_model_getter + + def get_param_lut(self, fallback=False): + """ + Get parameter-look-up-table model function: name, attribute, parameter values -> model value. + + The function can only give model values for parameter combinations + present in by_param. By default, it raises KeyError for other values. 
+
+        arguments:
+        fallback -- Fall back to the (non-parameter-aware) static model when encountering unknown parameter values
+        """
+        static_model = self._get_model_from_dict(self.by_name, np.median)
+        lut_model = self._get_model_from_dict(self.by_param, np.median)
+
+        def lut_median_getter(name, key, param, arg=[], **kwargs):
+            param.extend(map(soft_cast_int, arg))
+            try:
+                return lut_model[(name, tuple(param))][key]
+            except KeyError:
+                if fallback:
+                    return static_model[name][key]
+                raise
+
+        return lut_median_getter
+
+    def param_index(self, param_name):
+        if param_name in self._parameter_names:
+            return self._parameter_names.index(param_name)
+        return len(self._parameter_names) + int(param_name)
+
+    def param_name(self, param_index):
+        if param_index < len(self._parameter_names):
+            return self._parameter_names[param_index]
+        return str(param_index)
+
+    def get_fitted(self, safe_functions_enabled=False):
+        """
+        Get parameter-aware model function and model information function.
+
+        Returns two functions:
+        model_function(name, attribute, param=parameter values) -> model value.
+        model_info(name, attribute) -> {'fit_result' : ..., 'function' : ... } or None
+        """
+        if "fitted_model_getter" in self.cache and "fitted_info_getter" in self.cache:
+            return self.cache["fitted_model_getter"], self.cache["fitted_info_getter"]
+
+        static_model = self._get_model_from_dict(self.by_name, np.median)
+        param_model = dict(
+            [[state_or_tran, {}] for state_or_tran in self.by_name.keys()]
+        )
+        paramfit = ParallelParamFit(self.by_param)
+        for state_or_tran in self.by_name.keys():
+            for model_attribute in self.by_name[state_or_tran]["attributes"]:
+                fit_results = {}
+                for parameter_index, parameter_name in enumerate(self._parameter_names):
+                    if self.depends_on_param(
+                        state_or_tran, model_attribute, parameter_name
+                    ):
+                        paramfit.enqueue(
+                            state_or_tran,
+                            model_attribute,
+                            parameter_index,
+                            parameter_name,
+                            safe_functions_enabled,
+                        )
+                        for (
+                            codependent_param_dict
+                        ) in self.stats.codependent_parameter_value_dicts(
+                            state_or_tran, model_attribute, parameter_name
+                        ):
+                            paramfit.enqueue(
+                                state_or_tran,
+                                model_attribute,
+                                parameter_index,
+                                parameter_name,
+                                safe_functions_enabled,
+                                codependent_param_dict,
+                            )
+                if (
+                    arg_support_enabled
+                    and self.by_name[state_or_tran]["isa"] == "transition"
+                ):
+                    for arg_index in range(self._num_args[state_or_tran]):
+                        if self.depends_on_arg(
+                            state_or_tran, model_attribute, arg_index
+                        ):
+                            paramfit.enqueue(
+                                state_or_tran,
+                                model_attribute,
+                                len(self._parameter_names) + arg_index,
+                                arg_index,
+                                safe_functions_enabled,
+                            )
+        paramfit.fit()
+
+        for state_or_tran in self.by_name.keys():
+            num_args = 0
+            if (
+                arg_support_enabled
+                and self.by_name[state_or_tran]["isa"] == "transition"
+            ):
+                num_args = self._num_args[state_or_tran]
+            for model_attribute in self.by_name[state_or_tran]["attributes"]:
+                fit_results = paramfit.get_result(state_or_tran, model_attribute)
+
+                for parameter_name in self._parameter_names:
+                    if self.depends_on_param(
+                        state_or_tran, model_attribute, parameter_name
+                    ):
+                        for (
+                            codependent_param_dict
+                        ) in self.stats.codependent_parameter_value_dicts(
+                            state_or_tran, model_attribute, parameter_name
+                        ):
+                            pass
+                            # FIXME paramfit.get_result does not take a parameter as argument at all...
+ + if (state_or_tran, model_attribute) in self.function_override: + function_str = self.function_override[ + (state_or_tran, model_attribute) + ] + x = AnalyticFunction(function_str, self._parameter_names, num_args) + x.fit(self.by_param, state_or_tran, model_attribute) + if x.fit_success: + param_model[state_or_tran][model_attribute] = { + "fit_result": fit_results, + "function": x, + } + elif len(fit_results.keys()): + x = analytic.function_powerset( + fit_results, self._parameter_names, num_args + ) + x.fit(self.by_param, state_or_tran, model_attribute) + if x.fit_success: + param_model[state_or_tran][model_attribute] = { + "fit_result": fit_results, + "function": x, + } + + def model_getter(name, key, **kwargs): + if "arg" in kwargs and "param" in kwargs: + kwargs["param"].extend(map(soft_cast_int, kwargs["arg"])) + if key in param_model[name]: + param_list = kwargs["param"] + param_function = param_model[name][key]["function"] + if param_function.is_predictable(param_list): + return param_function.eval(param_list) + return static_model[name][key] + + def info_getter(name, key): + if key in param_model[name]: + return param_model[name][key] + return None + + self.cache["fitted_model_getter"] = model_getter + self.cache["fitted_info_getter"] = info_getter + + return model_getter, info_getter + + def to_json(self): + static_model = self.get_static() + static_quality = self.assess(static_model) + param_model, param_info = self.get_fitted() + analytic_quality = self.assess(param_model) + self.pta.update( + static_model, + param_info, + static_error=static_quality["by_name"], + analytic_error=analytic_quality["by_name"], + ) + return self.pta.to_json() + + def states(self): + """Return sorted list of state names.""" + return sorted( + list( + filter(lambda k: self.by_name[k]["isa"] == "state", self.by_name.keys()) + ) + ) + + def transitions(self): + """Return sorted list of transition names.""" + return sorted( + list( + filter( + lambda k: self.by_name[k]["isa"] == "transition", + self.by_name.keys(), + ) + ) + ) + + def states_and_transitions(self): + """Return list of states and transition names.""" + ret = self.states() + ret.extend(self.transitions()) + return ret + + def parameters(self): + return self._parameter_names + + def attributes(self, state_or_trans): + return self.by_name[state_or_trans]["attributes"] + + def assess(self, model_function): + """ + Calculate MAE, SMAPE, etc. of model_function for each by_name entry. + + state/transition/... name and parameter values are fed into model_function. + The by_name entries of this PTAModel are used as ground truth and + compared with the values predicted by model_function. + + For proper model assessments, the data used to generate model_function + and the data fed into this AnalyticModel instance must be mutually + exclusive (e.g. by performing cross validation). Otherwise, + overfitting cannot be detected. 
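+
+        A sketch of such a split (by_name_train / by_name_validation are
+        hypothetical; dfatool.validation provides a CrossValidator for this):
+
+            model_train = PTAModel(by_name_train, parameters, arg_count)
+            model_val = PTAModel(by_name_validation, parameters, arg_count)
+            fitted_model, _ = model_train.get_fitted()
+            quality = model_val.assess(fitted_model)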
+ """ + detailed_results = {} + for name, elem in sorted(self.by_name.items()): + detailed_results[name] = {} + for key in elem["attributes"]: + predicted_data = np.array( + list( + map( + lambda i: model_function(name, key, param=elem["param"][i]), + range(len(elem[key])), + ) + ) + ) + measures = regression_measures(predicted_data, elem[key]) + detailed_results[name][key] = measures + + return {"by_name": detailed_results} + + def assess_states( + self, model_function, model_attribute="power", distribution: dict = None + ): + """ + Calculate overall model error assuming equal distribution of states + """ + # TODO calculate mean power draw for distribution and use it to + # calculate relative error from MAE combination + model_quality = self.assess(model_function) + num_states = len(self.states()) + if distribution is None: + distribution = dict(map(lambda x: [x, 1 / num_states], self.states())) + + if not np.isclose(sum(distribution.values()), 1): + raise ValueError( + "distribution must be a probability distribution with sum 1" + ) + + # total_value = None + # try: + # total_value = sum(map(lambda x: model_function(x, model_attribute) * distribution[x], self.states())) + # except KeyError: + # pass + + total_error = np.sqrt( + sum( + map( + lambda x: np.square( + model_quality["by_name"][x][model_attribute]["mae"] + * distribution[x] + ), + self.states(), + ) + ) + ) + return total_error + + def assess_on_traces(self, model_function): + """ + Calculate MAE, SMAPE, etc. of model_function for each trace known to this PTAModel instance. + + :returns: dict of `duration_by_trace`, `energy_by_trace`, `timeout_by_trace`, `rel_energy_by_trace` and `state_energy_by_trace`. + Each entry holds regression measures for the corresponding measure. Note that the determined model quality heavily depends on the + traces: small-ish absolute errors in states which frequently occur may have more effect than large absolute errors in rarely occuring states + """ + model_energy_list = [] + real_energy_list = [] + model_rel_energy_list = [] + model_state_energy_list = [] + model_duration_list = [] + real_duration_list = [] + model_timeout_list = [] + real_timeout_list = [] + + for trace in self.traces: + if trace["id"] not in self.ignore_trace_indexes: + for rep_id in range(len(trace["trace"][0]["offline"])): + model_energy = 0.0 + real_energy = 0.0 + model_rel_energy = 0.0 + model_state_energy = 0.0 + model_duration = 0.0 + real_duration = 0.0 + model_timeout = 0.0 + real_timeout = 0.0 + for i, trace_part in enumerate(trace["trace"]): + name = trace_part["name"] + prev_name = trace["trace"][i - 1]["name"] + isa = trace_part["isa"] + if name != "UNINITIALIZED": + try: + param = trace_part["offline_aggregates"]["param"][ + rep_id + ] + prev_param = trace["trace"][i - 1][ + "offline_aggregates" + ]["param"][rep_id] + power = trace_part["offline"][rep_id]["uW_mean"] + duration = trace_part["offline"][rep_id]["us"] + prev_duration = trace["trace"][i - 1]["offline"][ + rep_id + ]["us"] + real_energy += power * duration + if isa == "state": + model_energy += ( + model_function(name, "power", param=param) + * duration + ) + else: + model_energy += model_function( + name, "energy", param=param + ) + # If i == 1, the previous state was UNINITIALIZED, for which we do not have model data + if i == 1: + model_rel_energy += model_function( + name, "energy", param=param + ) + else: + model_rel_energy += model_function( + prev_name, "power", param=prev_param + ) * (prev_duration + duration) + model_state_energy += 
model_function( + prev_name, "power", param=prev_param + ) * (prev_duration + duration) + model_rel_energy += model_function( + name, "rel_energy_prev", param=param + ) + real_duration += duration + model_duration += model_function( + name, "duration", param=param + ) + if ( + "plan" in trace_part + and trace_part["plan"]["level"] == "epilogue" + ): + real_timeout += trace_part["offline"][rep_id][ + "timeout" + ] + model_timeout += model_function( + name, "timeout", param=param + ) + except KeyError: + # if states/transitions have been removed via --filter-param, this is harmless + pass + real_energy_list.append(real_energy) + model_energy_list.append(model_energy) + model_rel_energy_list.append(model_rel_energy) + model_state_energy_list.append(model_state_energy) + real_duration_list.append(real_duration) + model_duration_list.append(model_duration) + real_timeout_list.append(real_timeout) + model_timeout_list.append(model_timeout) + + return { + "duration_by_trace": regression_measures( + np.array(model_duration_list), np.array(real_duration_list) + ), + "energy_by_trace": regression_measures( + np.array(model_energy_list), np.array(real_energy_list) + ), + "timeout_by_trace": regression_measures( + np.array(model_timeout_list), np.array(real_timeout_list) + ), + "rel_energy_by_trace": regression_measures( + np.array(model_rel_energy_list), np.array(real_energy_list) + ), + "state_energy_by_trace": regression_measures( + np.array(model_state_energy_list), np.array(real_energy_list) + ), + } diff --git a/test/test_parameters.py b/test/test_parameters.py index 22efccf..e36b1a1 100755 --- a/test/test_parameters.py +++ b/test/test_parameters.py @@ -1,9 +1,9 @@ #!/usr/bin/env python3 -from dfatool import dfatool as dt from dfatool import parameters from dfatool.utils import by_name_to_by_param from dfatool.functions import analytic +from dfatool.model import ParallelParamFit import unittest import numpy as np @@ -52,7 +52,7 @@ class TestModels(unittest.TestCase): # Fit individual functions for each parameter (only "p_linear" in this case) - paramfit = dt.ParallelParamFit(by_param) + paramfit = ParallelParamFit(by_param) paramfit.enqueue("TX", "power", 1, "p_linear") paramfit.fit() @@ -133,7 +133,7 @@ class TestModels(unittest.TestCase): self.assertEqual(stats.depends_on_param("someKey", "ll", "log_inv"), True) self.assertEqual(stats.depends_on_param("someKey", "ll", "square_none"), False) - paramfit = dt.ParallelParamFit(by_param) + paramfit = ParallelParamFit(by_param) paramfit.enqueue("someKey", "lls", 0, "lin_lin") paramfit.enqueue("someKey", "lls", 1, "log_inv") paramfit.enqueue("someKey", "lls", 2, "square_none") diff --git a/test/test_ptamodel.py b/test/test_ptamodel.py index 9abe3c0..e153280 100755 --- a/test/test_ptamodel.py +++ b/test/test_ptamodel.py @@ -1,6 +1,7 @@ #!/usr/bin/env python3 -from dfatool.dfatool import PTAModel, RawData, pta_trace_to_aggregate +from dfatool.dfatool import RawData, pta_trace_to_aggregate +from dfatool.model import PTAModel import os import unittest import pytest diff --git a/test/test_timingharness.py b/test/test_timingharness.py index 61cdf4b..cc4b766 100755 --- a/test/test_timingharness.py +++ b/test/test_timingharness.py @@ -1,6 +1,7 @@ #!/usr/bin/env python3 -from dfatool.dfatool import AnalyticModel, TimingData, pta_trace_to_aggregate +from dfatool.dfatool import TimingData, pta_trace_to_aggregate +from dfatool.model import AnalyticModel from dfatool.parameters import prune_dependent_parameters import unittest -- cgit v1.2.3 From 
92030c19d7cde49999648509309c3ac6e8b4ba21 Mon Sep 17 00:00:00 2001 From: Daniel Friesel Date: Mon, 6 Jul 2020 15:32:12 +0200 Subject: Rename dfatool.dfatool to dfatool.loader --- bin/analyze-archive.py | 2 +- bin/analyze-timing.py | 2 +- bin/cal-hist | 2 +- bin/eval-accounting-overhead.py | 2 +- bin/eval-outlier-removal.py | 2 +- bin/eval-rel-energy.py | 2 +- bin/gptest.py | 2 +- bin/gradient | 2 +- bin/mim-vs-keysight.py | 2 +- bin/mimosa-etv | 2 +- bin/mimplot | 2 +- bin/test_corrcoef.py | 2 +- lib/dfatool.py | 2008 --------------------------------------- lib/loader.py | 2008 +++++++++++++++++++++++++++++++++++++++ test/test_ptamodel.py | 2 +- test/test_timingharness.py | 2 +- 16 files changed, 2022 insertions(+), 2022 deletions(-) delete mode 100644 lib/dfatool.py create mode 100644 lib/loader.py (limited to 'test/test_ptamodel.py') diff --git a/bin/analyze-archive.py b/bin/analyze-archive.py index 7cac27a..175570b 100755 --- a/bin/analyze-archive.py +++ b/bin/analyze-archive.py @@ -113,7 +113,7 @@ import random import re import sys from dfatool import plotter -from dfatool.dfatool import RawData, pta_trace_to_aggregate +from dfatool.loader import RawData, pta_trace_to_aggregate from dfatool.functions import gplearn_to_function from dfatool.model import PTAModel from dfatool.validation import CrossValidator diff --git a/bin/analyze-timing.py b/bin/analyze-timing.py index 3503279..ed9c571 100755 --- a/bin/analyze-timing.py +++ b/bin/analyze-timing.py @@ -79,7 +79,7 @@ import logging import re import sys from dfatool import plotter -from dfatool.dfatool import TimingData, pta_trace_to_aggregate +from dfatool.loader import TimingData, pta_trace_to_aggregate from dfatool.functions import gplearn_to_function from dfatool.model import AnalyticModel from dfatool.validation import CrossValidator diff --git a/bin/cal-hist b/bin/cal-hist index ba2ff47..07ab597 100755 --- a/bin/cal-hist +++ b/bin/cal-hist @@ -7,7 +7,7 @@ import struct import sys import tarfile import matplotlib.pyplot as plt -from dfatool.dfatool import MIMOSA +from dfatool.loader import MIMOSA from dfatool.utils import running_mean voltage = float(sys.argv[1]) diff --git a/bin/eval-accounting-overhead.py b/bin/eval-accounting-overhead.py index 7ea0807..1c03bf8 100755 --- a/bin/eval-accounting-overhead.py +++ b/bin/eval-accounting-overhead.py @@ -13,7 +13,7 @@ providing overhead per transition and getEnergy overhead """ -from dfatool.dfatool import AnalyticModel, TimingData, pta_trace_to_aggregate +from dfatool.loader import AnalyticModel, TimingData, pta_trace_to_aggregate import json import sys diff --git a/bin/eval-outlier-removal.py b/bin/eval-outlier-removal.py index b81c33a..c03266d 100755 --- a/bin/eval-outlier-removal.py +++ b/bin/eval-outlier-removal.py @@ -3,7 +3,7 @@ import getopt import re import sys -from dfatool.dfatool import RawData, pta_trace_to_aggregate +from dfatool.loader import RawData, pta_trace_to_aggregate from dfatool.model import PTAModel opt = dict() diff --git a/bin/eval-rel-energy.py b/bin/eval-rel-energy.py index 2af2cff..66c3ae2 100755 --- a/bin/eval-rel-energy.py +++ b/bin/eval-rel-energy.py @@ -3,7 +3,7 @@ import getopt import re import sys -from dfatool.dfatool import RawData, pta_trace_to_aggregate +from dfatool.loader import RawData, pta_trace_to_aggregate from dfatool.model import PTAModel opt = dict() diff --git a/bin/gptest.py b/bin/gptest.py index bcfb7aa..b5012e5 100755 --- a/bin/gptest.py +++ b/bin/gptest.py @@ -2,7 +2,7 @@ import sys import numpy as np -from dfatool.dfatool import ( +from 
dfatool.loader import ( RawData, pta_trace_to_aggregate, ) diff --git a/bin/gradient b/bin/gradient index 8280794..0409c38 100755 --- a/bin/gradient +++ b/bin/gradient @@ -7,7 +7,7 @@ import struct import sys import tarfile import matplotlib.pyplot as plt -from dfatool.dfatool import MIMOSA +from dfatool.loader import MIMOSA from dfatool.utils import running_mean voltage = float(sys.argv[1]) diff --git a/bin/mim-vs-keysight.py b/bin/mim-vs-keysight.py index c214f2f..c9a7249 100755 --- a/bin/mim-vs-keysight.py +++ b/bin/mim-vs-keysight.py @@ -3,7 +3,7 @@ import numpy as np import sys import matplotlib.pyplot as plt -from dfatool.dfatool import MIMOSA, KeysightCSV +from dfatool.loader import MIMOSA, KeysightCSV from dfatool.utils import running_mean voltage = float(sys.argv[1]) diff --git a/bin/mimosa-etv b/bin/mimosa-etv index 431e275..9b6e897 100755 --- a/bin/mimosa-etv +++ b/bin/mimosa-etv @@ -8,7 +8,7 @@ import numpy as np import os import re import sys -from dfatool.dfatool import MIMOSA +from dfatool.loader import MIMOSA from dfatool.model import aggregate_measures from dfatool.utils import running_mean diff --git a/bin/mimplot b/bin/mimplot index 2a888ee..0d4ba0e 100755 --- a/bin/mimplot +++ b/bin/mimplot @@ -9,7 +9,7 @@ import struct import sys import tarfile import matplotlib.pyplot as plt -from dfatool.dfatool import MIMOSA +from dfatool.loader import MIMOSA from dfatool.utils import running_mean opt = dict() diff --git a/bin/test_corrcoef.py b/bin/test_corrcoef.py index fef0b24..b8c8eae 100755 --- a/bin/test_corrcoef.py +++ b/bin/test_corrcoef.py @@ -4,7 +4,7 @@ import getopt import re import sys from dfatool import plotter -from dfatool.dfatool import RawData, pta_trace_to_aggregate +from dfatool.loader import RawData, pta_trace_to_aggregate from dfatool.functions import gplearn_to_function from dfatool.model import PTAModel diff --git a/lib/dfatool.py b/lib/dfatool.py deleted file mode 100644 index e8b5090..0000000 --- a/lib/dfatool.py +++ /dev/null @@ -1,2008 +0,0 @@ -#!/usr/bin/env python3 - -import csv -import io -import json -import logging -import numpy as np -import os -import re -import struct -import tarfile -import hashlib -from multiprocessing import Pool -from .utils import running_mean, soft_cast_int - -logger = logging.getLogger(__name__) - -try: - from .pubcode import Code128 - import zbar - - zbar_available = True -except ImportError: - zbar_available = False - - -arg_support_enabled = True - - -class KeysightCSV: - """Simple loader for Keysight CSV data, as exported by the windows software.""" - - def __init__(self): - """Create a new KeysightCSV object.""" - pass - - def load_data(self, filename: str): - """ - Load log data from filename, return timestamps and currents. - - Returns two one-dimensional NumPy arrays: timestamps and corresponding currents. 
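-
-        Usage sketch (the file name is illustrative):
-
-            timestamps, currents = KeysightCSV().load_data('keysight-export.csv')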
-        """
-        with open(filename) as f:
-            for i, _ in enumerate(f):
-                pass
-        timestamps = np.ndarray((i - 3), dtype=float)
-        currents = np.ndarray((i - 3), dtype=float)
-        # basically seek back to start
-        with open(filename) as f:
-            for _ in range(4):
-                next(f)
-            reader = csv.reader(f, delimiter=",")
-            for i, row in enumerate(reader):
-                timestamps[i] = float(row[0])
-                currents[i] = float(row[2]) * -1
-        return timestamps, currents
-
-
-def _preprocess_mimosa(measurement):
-    setup = measurement["setup"]
-    mim = MIMOSA(
-        float(setup["mimosa_voltage"]),
-        int(setup["mimosa_shunt"]),
-        with_traces=measurement["with_traces"],
-    )
-    try:
-        charges, triggers = mim.load_data(measurement["content"])
-        trigidx = mim.trigger_edges(triggers)
-    except EOFError as e:
-        mim.errors.append("MIMOSA logfile error: {}".format(e))
-        trigidx = list()
-
-    if len(trigidx) == 0:
-        mim.errors.append("MIMOSA log has no triggers")
-        return {
-            "fileno": measurement["fileno"],
-            "info": measurement["info"],
-            "has_datasource_error": len(mim.errors) > 0,
-            "datasource_errors": mim.errors,
-            "expected_trace": measurement["expected_trace"],
-            "repeat_id": measurement["repeat_id"],
-        }
-
-    cal_edges = mim.calibration_edges(
-        running_mean(mim.currents_nocal(charges[0 : trigidx[0]]), 10)
-    )
-    calfunc, caldata = mim.calibration_function(charges, cal_edges)
-    vcalfunc = np.vectorize(calfunc, otypes=[np.float64])
-
-    processed_data = {
-        "fileno": measurement["fileno"],
-        "info": measurement["info"],
-        "triggers": len(trigidx),
-        "first_trig": trigidx[0] * 10,
-        "calibration": caldata,
-        "energy_trace": mim.analyze_states(charges, trigidx, vcalfunc),
-        "has_datasource_error": len(mim.errors) > 0,
-        "datasource_errors": mim.errors,
-    }
-
-    for key in ["expected_trace", "repeat_id"]:
-        if key in measurement:
-            processed_data[key] = measurement[key]
-
-    return processed_data
-
-
-def _preprocess_etlog(measurement):
-    setup = measurement["setup"]
-    etlog = EnergyTraceLog(
-        float(setup["voltage"]),
-        int(setup["state_duration"]),
-        measurement["transition_names"],
-        with_traces=measurement["with_traces"],
-    )
-    try:
-        etlog.load_data(measurement["content"])
-        states_and_transitions = etlog.analyze_states(
-            measurement["expected_trace"], measurement["repeat_id"]
-        )
-    except EOFError as e:
-        etlog.errors.append("EnergyTrace logfile error: {}".format(e))
-
-    processed_data = {
-        "fileno": measurement["fileno"],
-        "repeat_id": measurement["repeat_id"],
-        "info": measurement["info"],
-        "expected_trace": measurement["expected_trace"],
-        "energy_trace": states_and_transitions,
-        "has_datasource_error": len(etlog.errors) > 0,
-        "datasource_errors": etlog.errors,
-    }
-
-    return processed_data
-
-
-class TimingData:
-    """
-    Loader for timing model traces measured with on-board timers using `harness.OnboardTimerHarness`.
-
-    Expects a specific trace format and UART log output (as produced by
-    generate-dfa-benchmark.py). Prunes states from output. (TODO)
-    """
-
-    def __init__(self, filenames):
-        """
-        Create a new TimingData object.
-
-        Each filenames element corresponds to a measurement run.
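-
-        Usage sketch (file names are illustrative):
-
-            data = TimingData(['timing-run-1.json', 'timing-run-2.json'])
-            traces = data.get_preprocessed_data()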
- """ - self.filenames = filenames.copy() - self.traces_by_fileno = [] - self.setup_by_fileno = [] - self.preprocessed = False - self._parameter_names = None - self.version = 0 - - def _concatenate_analyzed_traces(self): - self.traces = [] - for trace_group in self.traces_by_fileno: - for trace in trace_group: - # TimingHarness logs states, but does not aggregate any data for them at the moment -> throw all states away - transitions = list( - filter(lambda x: x["isa"] == "transition", trace["trace"]) - ) - self.traces.append({"id": trace["id"], "trace": transitions}) - for i, trace in enumerate(self.traces): - trace["orig_id"] = trace["id"] - trace["id"] = i - for log_entry in trace["trace"]: - paramkeys = sorted(log_entry["parameter"].keys()) - if "param" not in log_entry["offline_aggregates"]: - log_entry["offline_aggregates"]["param"] = list() - if "duration" in log_entry["offline_aggregates"]: - for i in range(len(log_entry["offline_aggregates"]["duration"])): - paramvalues = list() - for paramkey in paramkeys: - if type(log_entry["parameter"][paramkey]) is list: - paramvalues.append( - soft_cast_int(log_entry["parameter"][paramkey][i]) - ) - else: - paramvalues.append( - soft_cast_int(log_entry["parameter"][paramkey]) - ) - if arg_support_enabled and "args" in log_entry: - paramvalues.extend(map(soft_cast_int, log_entry["args"])) - log_entry["offline_aggregates"]["param"].append(paramvalues) - - def _preprocess_0(self): - for filename in self.filenames: - with open(filename, "r") as f: - log_data = json.load(f) - self.traces_by_fileno.extend(log_data["traces"]) - self._concatenate_analyzed_traces() - - def get_preprocessed_data(self): - """ - Return a list of DFA traces annotated with timing and parameter data. - - Suitable for the PTAModel constructor. - See PTAModel(...) docstring for format details. - """ - if self.preprocessed: - return self.traces - if self.version == 0: - self._preprocess_0() - self.preprocessed = True - return self.traces - - -def sanity_check_aggregate(aggregate): - for key in aggregate: - if "param" not in aggregate[key]: - raise RuntimeError("aggregate[{}][param] does not exist".format(key)) - if "attributes" not in aggregate[key]: - raise RuntimeError("aggregate[{}][attributes] does not exist".format(key)) - for attribute in aggregate[key]["attributes"]: - if attribute not in aggregate[key]: - raise RuntimeError( - "aggregate[{}][{}] does not exist, even though it is contained in aggregate[{}][attributes]".format( - key, attribute, key - ) - ) - param_len = len(aggregate[key]["param"]) - attr_len = len(aggregate[key][attribute]) - if param_len != attr_len: - raise RuntimeError( - "parameter mismatch: len(aggregate[{}][param]) == {} != len(aggregate[{}][{}]) == {}".format( - key, param_len, key, attribute, attr_len - ) - ) - - -class RawData: - """ - Loader for hardware model traces measured with MIMOSA. - - Expects a specific trace format and UART log output (as produced by the - dfatool benchmark generator). Loads data, prunes bogus measurements, and - provides preprocessed data suitable for PTAModel. Results are cached on the - file system, making subsequent loads near-instant. - """ - - def __init__(self, filenames, with_traces=False): - """ - Create a new RawData object. - - Each filename element corresponds to a measurement run. - It must be a tar archive with the following contents: - - Version 0: - - * `setup.json`: measurement setup. 
Must contain the keys `state_duration` (how long each state is active, in ms),
-          `mimosa_voltage` (voltage applied to the DUT, in V), and `mimosa_shunt` (shunt value, in Ohm)
-        * `src/apps/DriverEval/DriverLog.json`: PTA traces and parameters for this benchmark.
-          Layout: List of traces, each trace has an 'id' (numeric, starting with 1) and 'trace' (list of states and transitions) element.
-          Each trace has an even number of elements, starting with the first state (usually `UNINITIALIZED`) and ending with a transition.
-          Each state/transition must have the members `.parameter` (parameter values, empty string or None if unknown), `.isa` ("state" or "transition") and `.name`.
-          Each transition must additionally contain `.plan.level` ("user" or "epilogue").
-          Example: `[ {"id": 1, "trace": [ {"parameter": {...}, "isa": "state", "name": "UNINITIALIZED"}, ...] }, ... ]`
-        * At least one `*.mim` file. Each file corresponds to a single execution of the entire benchmark (i.e., all runs described in DriverLog.json) and starts with a MIMOSA Autocal calibration sequence.
-          MIMOSA files are parsed by the `MIMOSA` class.
-
-        Version 1:
-
-        * `ptalog.json`: measurement setup and traces. Contents:
-          `.opt.sleep`: state duration
-          `.opt.pta`: PTA
-          `.opt.traces`: list of sub-benchmark traces (the benchmark may have been split due to code size limitations). Each item is a list of traces as returned by `harness.traces`:
-            `.opt.traces[]`: List of traces. Each trace has an 'id' (numeric, starting with 1) and 'trace' (list of states and transitions) element.
-            Each state/transition must have the members `.parameter` (dict with normalized parameter values), `.isa` ("state" or "transition") and `.name`
-            Each transition must additionally contain `.args`
-          `.opt.files`: list of corresponding MIMOSA measurements.
-            `.opt.files[]` = ['abc123.mim', ...]
-          `.opt.configs`: ....
-        * MIMOSA log files (`*.mim`) as specified in `.opt.files`
-
-        Version 2:
-
-        * `ptalog.json`: measurement setup and traces. Contents:
-          `.opt.sleep`: state duration
-          `.opt.pta`: PTA
-          `.opt.traces`: list of sub-benchmark traces (the benchmark may have been split due to code size limitations). Each item is a list of traces as returned by `harness.traces`:
-            `.opt.traces[]`: List of traces. Each trace has an 'id' (numeric, starting with 1) and 'trace' (list of states and transitions) element.
-            Each state/transition must have the members `.parameter` (dict with normalized parameter values), `.isa` ("state" or "transition") and `.name`
-            Each transition must additionally contain `.args` and `.duration`
-            * `.duration`: list of durations, one per repetition
-          `.opt.files`: list of corresponding EnergyTrace measurements.
-            `.opt.files[]` = ['abc123.etlog', ...]
-          `.opt.configs`: ....
-        * EnergyTrace log files (`*.etlog`) as specified in `.opt.files`
-
-        If a cached result for a file is available, it is loaded and the file
-        is not preprocessed, unless `with_traces` is set.
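-
-        Usage sketch (the archive name is illustrative):
-
-            raw_data = RawData(['benchmark.tar'])
-            preprocessed_data = raw_data.get_preprocessed_data()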
- - tbd - """ - self.with_traces = with_traces - self.filenames = filenames.copy() - self.traces_by_fileno = [] - self.setup_by_fileno = [] - self.version = 0 - self.preprocessed = False - self._parameter_names = None - self.ignore_clipping = False - self.pta = None - - with tarfile.open(filenames[0]) as tf: - for member in tf.getmembers(): - if member.name == "ptalog.json" and self.version == 0: - self.version = 1 - # might also be version 2 - # depends on whether *.etlog exists or not - elif ".etlog" in member.name: - self.version = 2 - break - - self.set_cache_file() - if not with_traces: - self.load_cache() - - def set_cache_file(self): - cache_key = hashlib.sha256("!".join(self.filenames).encode()).hexdigest() - self.cache_dir = os.path.dirname(self.filenames[0]) + "/cache" - self.cache_file = "{}/{}.json".format(self.cache_dir, cache_key) - - def load_cache(self): - if os.path.exists(self.cache_file): - with open(self.cache_file, "r") as f: - cache_data = json.load(f) - self.filenames = cache_data["filenames"] - self.traces = cache_data["traces"] - self.preprocessing_stats = cache_data["preprocessing_stats"] - if "pta" in cache_data: - self.pta = cache_data["pta"] - self.setup_by_fileno = cache_data["setup_by_fileno"] - self.preprocessed = True - - def save_cache(self): - if self.with_traces: - return - try: - os.mkdir(self.cache_dir) - except FileExistsError: - pass - with open(self.cache_file, "w") as f: - cache_data = { - "filenames": self.filenames, - "traces": self.traces, - "preprocessing_stats": self.preprocessing_stats, - "pta": self.pta, - "setup_by_fileno": self.setup_by_fileno, - } - json.dump(cache_data, f) - - def _state_is_too_short(self, online, offline, state_duration, next_transition): - # We cannot control when an interrupt causes a state to be left - if next_transition["plan"]["level"] == "epilogue": - return False - - # Note: state_duration is stored as ms, not us - return offline["us"] < state_duration * 500 - - def _state_is_too_long(self, online, offline, state_duration, prev_transition): - # If the previous state was left by an interrupt, we may have some - # waiting time left over. So it's okay if the current state is longer - # than expected. - if prev_transition["plan"]["level"] == "epilogue": - return False - # state_duration is stored as ms, not us - return offline["us"] > state_duration * 1500 - - def _measurement_is_valid_2(self, processed_data): - """ - Check if a dfatool v2 measurement is valid. - - processed_data layout: - 'fileno' : measurement['fileno'], - 'info' : measurement['info'], - 'energy_trace' : etlog.analyze_states() - A sequence of unnamed, unparameterized states and transitions with - power and timing data - 'expected_trace' : trace from PTA DFS (with parameter data) - etlog.analyze_states returns a list of (alternating) states and transitions. 
-        Each element is a dict containing:
-          - isa: 'state' or 'transition'
-          - W_mean: mean of the (calibrated) power draw
-          - W_std: standard deviation of the (calibrated) power draw
-          - s: duration
-          if isa == 'transition':
-          - W_mean_delta_prev: difference between W_mean and the previous state's W_mean
-          - W_mean_delta_next: difference between W_mean and the next state's W_mean
-        """
-
-        # Check for low-level parser errors
-        if processed_data["has_datasource_error"]:
-            processed_data["error"] = "; ".join(processed_data["datasource_errors"])
-            return False
-
-        # Note that the low-level parser (EnergyTraceLog) already checks
-        # whether the transition count is correct
-
-        return True
-
-    def _measurement_is_valid_01(self, processed_data):
-        """
-        Check if a dfatool v0 or v1 measurement is valid.
-
-        processed_data layout:
-        'fileno' : measurement['fileno'],
-        'info' : measurement['info'],
-        'triggers' : len(trigidx),
-        'first_trig' : trigidx[0] * 10,
-        'calibration' : caldata,
-        'energy_trace' : mim.analyze_states(charges, trigidx, vcalfunc)
-            A sequence of unnamed, unparameterized states and transitions with
-            power and timing data
-        'expected_trace' : trace from PTA DFS (with parameter data)
-        mim.analyze_states returns a list of (alternating) states and transitions.
-        Each element is a dict containing:
-          - isa: 'state' or 'transition'
-          - clip_rate: range(0..1), share of clipping in the power measurements
-          - raw_mean: mean of the raw values
-          - raw_std: standard deviation of the raw values
-          - uW_mean: mean of the (calibrated) power draw
-          - uW_std: standard deviation of the (calibrated) power draw
-          - us: duration
-          only if isa == 'transition':
-          - timeout: duration of the previous state
-          - uW_mean_delta_prev: difference between uW_mean and the previous state's uW_mean
-          - uW_mean_delta_next: difference between uW_mean and the next state's uW_mean
-        """
-        setup = self.setup_by_fileno[processed_data["fileno"]]
-        if "expected_trace" in processed_data:
-            traces = processed_data["expected_trace"]
-        else:
-            traces = self.traces_by_fileno[processed_data["fileno"]]
-        state_duration = setup["state_duration"]
-
-        # Check MIMOSA error
-        if processed_data["has_datasource_error"]:
-            processed_data["error"] = "; ".join(processed_data["datasource_errors"])
-            return False
-
-        # Check trigger count
-        sched_trigger_count = 0
-        for run in traces:
-            sched_trigger_count += len(run["trace"])
-        if sched_trigger_count != processed_data["triggers"]:
-            processed_data[
-                "error"
-            ] = "got {got:d} trigger edges, expected {exp:d}".format(
-                got=processed_data["triggers"], exp=sched_trigger_count
-            )
-            return False
-        # Check state durations. Very short or long states can indicate a
-        # missed trigger signal which wasn't detected due to duplicate
-        # triggers elsewhere
-        online_datapoints = []
-        for run_idx, run in enumerate(traces):
-            for trace_part_idx in range(len(run["trace"])):
-                online_datapoints.append((run_idx, trace_part_idx))
-        for offline_idx, online_ref in enumerate(online_datapoints):
-            online_run_idx, online_trace_part_idx = online_ref
-            offline_trace_part = processed_data["energy_trace"][offline_idx]
-            online_trace_part = traces[online_run_idx]["trace"][online_trace_part_idx]
-
-            if self._parameter_names is None:
-                self._parameter_names = sorted(online_trace_part["parameter"].keys())
-
-            if sorted(online_trace_part["parameter"].keys()) != self._parameter_names:
-                processed_data[
-                    "error"
-                ] = "Offline #{off_idx:d} (online {on_name:s} @ {on_idx:d}/{on_sub:d}) has inconsistent parameter set: should be {param_want:s}, is {param_is:s}".format(
-                    off_idx=offline_idx,
-                    on_idx=online_run_idx,
-                    on_sub=online_trace_part_idx,
-                    on_name=online_trace_part["name"],
-                    param_want=self._parameter_names,
-                    param_is=sorted(online_trace_part["parameter"].keys()),
-                )
-
-            if online_trace_part["isa"] != offline_trace_part["isa"]:
-                processed_data[
-                    "error"
-                ] = "Offline #{off_idx:d} (online {on_name:s} @ {on_idx:d}/{on_sub:d}) claims to be {off_isa:s}, but should be {on_isa:s}".format(
-                    off_idx=offline_idx,
-                    on_idx=online_run_idx,
-                    on_sub=online_trace_part_idx,
-                    on_name=online_trace_part["name"],
-                    off_isa=offline_trace_part["isa"],
-                    on_isa=online_trace_part["isa"],
-                )
-                return False
-
-            # Clipping in UNINITIALIZED (offline_idx == 0) can happen during
-            # calibration and is handled by MIMOSA
-            if (
-                offline_idx != 0
-                and offline_trace_part["clip_rate"] != 0
-                and not self.ignore_clipping
-            ):
-                processed_data[
-                    "error"
-                ] = "Offline #{off_idx:d} (online {on_name:s} @ {on_idx:d}/{on_sub:d}) was clipping {clip:f}% of the time".format(
-                    off_idx=offline_idx,
-                    on_idx=online_run_idx,
-                    on_sub=online_trace_part_idx,
-                    on_name=online_trace_part["name"],
-                    clip=offline_trace_part["clip_rate"] * 100,
-                )
-                return False
-
-            if (
-                online_trace_part["isa"] == "state"
-                and online_trace_part["name"] != "UNINITIALIZED"
-                and len(traces[online_run_idx]["trace"]) > online_trace_part_idx + 1
-            ):
-                online_prev_transition = traces[online_run_idx]["trace"][
-                    online_trace_part_idx - 1
-                ]
-                online_next_transition = traces[online_run_idx]["trace"][
-                    online_trace_part_idx + 1
-                ]
-                try:
-                    if self._state_is_too_short(
-                        online_trace_part,
-                        offline_trace_part,
-                        state_duration,
-                        online_next_transition,
-                    ):
-                        processed_data[
-                            "error"
-                        ] = "Offline #{off_idx:d} (online {on_name:s} @ {on_idx:d}/{on_sub:d}) is too short (duration = {dur:d} us)".format(
-                            off_idx=offline_idx,
-                            on_idx=online_run_idx,
-                            on_sub=online_trace_part_idx,
-                            on_name=online_trace_part["name"],
-                            dur=offline_trace_part["us"],
-                        )
-                        return False
-                    if self._state_is_too_long(
-                        online_trace_part,
-                        offline_trace_part,
-                        state_duration,
-                        online_prev_transition,
-                    ):
-                        processed_data[
-                            "error"
-                        ] = "Offline #{off_idx:d} (online {on_name:s} @ {on_idx:d}/{on_sub:d}) is too long (duration = {dur:d} us)".format(
-                            off_idx=offline_idx,
-                            on_idx=online_run_idx,
-                            on_sub=online_trace_part_idx,
-                            on_name=online_trace_part["name"],
-                            dur=offline_trace_part["us"],
-                        )
-                        return False
-                except KeyError:
-                    pass
-                    # TODO: some next_transitions have no 'plan' entry
-        return True
-
-    def _merge_online_and_offline(self, measurement):
-        # Edits
self.traces_by_fileno[measurement['fileno']][*]['trace'][*]['offline'] - # and self.traces_by_fileno[measurement['fileno']][*]['trace'][*]['offline_aggregates'] in place - # (appends data from measurement['energy_trace']) - # If measurement['expected_trace'] exists, it is edited in place instead - online_datapoints = [] - if "expected_trace" in measurement: - traces = measurement["expected_trace"] - traces = self.traces_by_fileno[measurement["fileno"]] - else: - traces = self.traces_by_fileno[measurement["fileno"]] - for run_idx, run in enumerate(traces): - for trace_part_idx in range(len(run["trace"])): - online_datapoints.append((run_idx, trace_part_idx)) - for offline_idx, online_ref in enumerate(online_datapoints): - online_run_idx, online_trace_part_idx = online_ref - offline_trace_part = measurement["energy_trace"][offline_idx] - online_trace_part = traces[online_run_idx]["trace"][online_trace_part_idx] - - if "offline" not in online_trace_part: - online_trace_part["offline"] = [offline_trace_part] - else: - online_trace_part["offline"].append(offline_trace_part) - - paramkeys = sorted(online_trace_part["parameter"].keys()) - - paramvalues = list() - - for paramkey in paramkeys: - if type(online_trace_part["parameter"][paramkey]) is list: - paramvalues.append( - soft_cast_int( - online_trace_part["parameter"][paramkey][ - measurement["repeat_id"] - ] - ) - ) - else: - paramvalues.append( - soft_cast_int(online_trace_part["parameter"][paramkey]) - ) - - # NB: Unscheduled transitions do not have an 'args' field set. - # However, they should only be caused by interrupts, and - # interrupts don't have args anyways. - if arg_support_enabled and "args" in online_trace_part: - paramvalues.extend(map(soft_cast_int, online_trace_part["args"])) - - if "offline_aggregates" not in online_trace_part: - online_trace_part["offline_attributes"] = [ - "power", - "duration", - "energy", - ] - online_trace_part["offline_aggregates"] = { - "power": [], - "duration": [], - "power_std": [], - "energy": [], - "paramkeys": [], - "param": [], - } - if online_trace_part["isa"] == "transition": - online_trace_part["offline_attributes"].extend( - ["rel_energy_prev", "rel_energy_next", "timeout"] - ) - online_trace_part["offline_aggregates"]["rel_energy_prev"] = [] - online_trace_part["offline_aggregates"]["rel_energy_next"] = [] - online_trace_part["offline_aggregates"]["timeout"] = [] - - # Note: All state/transitions are 20us "too long" due to injected - # active wait states. These are needed to work around MIMOSA's - # relatively low sample rate of 100 kHz (10us) and removed here. 
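-            # Example with hypothetical numbers: a trace part measured with
-            # us = 1020 and uW_mean = 5000 is stored as duration = 1000 us and
-            # energy = 5000 uW * 1000 us = 5e6 pJ (1 uW * 1 us = 1 pJ).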
- online_trace_part["offline_aggregates"]["power"].append( - offline_trace_part["uW_mean"] - ) - online_trace_part["offline_aggregates"]["duration"].append( - offline_trace_part["us"] - 20 - ) - online_trace_part["offline_aggregates"]["power_std"].append( - offline_trace_part["uW_std"] - ) - online_trace_part["offline_aggregates"]["energy"].append( - offline_trace_part["uW_mean"] * (offline_trace_part["us"] - 20) - ) - online_trace_part["offline_aggregates"]["paramkeys"].append(paramkeys) - online_trace_part["offline_aggregates"]["param"].append(paramvalues) - if online_trace_part["isa"] == "transition": - online_trace_part["offline_aggregates"]["rel_energy_prev"].append( - offline_trace_part["uW_mean_delta_prev"] - * (offline_trace_part["us"] - 20) - ) - online_trace_part["offline_aggregates"]["rel_energy_next"].append( - offline_trace_part["uW_mean_delta_next"] - * (offline_trace_part["us"] - 20) - ) - online_trace_part["offline_aggregates"]["timeout"].append( - offline_trace_part["timeout"] - ) - - def _merge_online_and_etlog(self, measurement): - # Edits self.traces_by_fileno[measurement['fileno']][*]['trace'][*]['offline'] - # and self.traces_by_fileno[measurement['fileno']][*]['trace'][*]['offline_aggregates'] in place - # (appends data from measurement['energy_trace']) - online_datapoints = [] - traces = self.traces_by_fileno[measurement["fileno"]] - for run_idx, run in enumerate(traces): - for trace_part_idx in range(len(run["trace"])): - online_datapoints.append((run_idx, trace_part_idx)) - for offline_idx, online_ref in enumerate(online_datapoints): - online_run_idx, online_trace_part_idx = online_ref - offline_trace_part = measurement["energy_trace"][offline_idx] - online_trace_part = traces[online_run_idx]["trace"][online_trace_part_idx] - - if "offline" not in online_trace_part: - online_trace_part["offline"] = [offline_trace_part] - else: - online_trace_part["offline"].append(offline_trace_part) - - paramkeys = sorted(online_trace_part["parameter"].keys()) - - paramvalues = list() - - for paramkey in paramkeys: - if type(online_trace_part["parameter"][paramkey]) is list: - paramvalues.append( - soft_cast_int( - online_trace_part["parameter"][paramkey][ - measurement["repeat_id"] - ] - ) - ) - else: - paramvalues.append( - soft_cast_int(online_trace_part["parameter"][paramkey]) - ) - - # NB: Unscheduled transitions do not have an 'args' field set. - # However, they should only be caused by interrupts, and - # interrupts don't have args anyways. 
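-            # Illustrative (hypothetical values): with paramvalues == [10, 12]
-            # (datarate, txbytes) and args == ['5'], the extension below yields
-            # paramvalues == [10, 12, 5].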
-            if arg_support_enabled and "args" in online_trace_part:
-                paramvalues.extend(map(soft_cast_int, online_trace_part["args"]))
-
-            if "offline_aggregates" not in online_trace_part:
-                online_trace_part["offline_aggregates"] = {
-                    "offline_attributes": ["power", "duration", "energy"],
-                    "duration": list(),
-                    "power": list(),
-                    "power_std": list(),
-                    "energy": list(),
-                    "paramkeys": list(),
-                    "param": list(),
-                }
-
-            offline_aggregates = online_trace_part["offline_aggregates"]
-
-            # if online_trace_part['isa'] == 'transitions':
-            #    online_trace_part['offline_attributes'].extend(['rel_energy_prev', 'rel_energy_next'])
-            #    offline_aggregates['rel_energy_prev'] = list()
-            #    offline_aggregates['rel_energy_next'] = list()
-
-            offline_aggregates["duration"].append(offline_trace_part["s"] * 1e6)
-            offline_aggregates["power"].append(offline_trace_part["W_mean"] * 1e6)
-            offline_aggregates["power_std"].append(offline_trace_part["W_std"] * 1e6)
-            offline_aggregates["energy"].append(
-                offline_trace_part["W_mean"] * offline_trace_part["s"] * 1e12
-            )
-            offline_aggregates["paramkeys"].append(paramkeys)
-            offline_aggregates["param"].append(paramvalues)
-
-            # if online_trace_part['isa'] == 'transition':
-            #    offline_aggregates['rel_energy_prev'].append(offline_trace_part['W_mean_delta_prev'] * offline_trace_part['s'] * 1e12)
-            #    offline_aggregates['rel_energy_next'].append(offline_trace_part['W_mean_delta_next'] * offline_trace_part['s'] * 1e12)
-
-    def _concatenate_traces(self, list_of_traces):
-        """
-        Concatenate `list_of_traces` (list of lists) into a single trace while adjusting trace IDs.
-
-        :param list_of_traces: List of list of traces.
-        :returns: List of traces with ['id'] in ascending order and ['orig_id'] as previous ['id']
-        """
-
-        trace_output = list()
-        for trace in list_of_traces:
-            trace_output.extend(trace.copy())
-        for i, trace in enumerate(trace_output):
-            trace["orig_id"] = trace["id"]
-            trace["id"] = i
-        return trace_output
-
-    def get_preprocessed_data(self):
-        """
-        Return a list of DFA traces annotated with energy, timing, and parameter data.
-        The list is cached on disk, unless the constructor was called with `with_traces` set.
-
-        Each DFA trace contains the following elements:
-        * `id`: Numeric ID, starting with 1
-        * `total_energy`: Total amount of energy (as measured by MIMOSA) in the entire trace
-        * `orig_id`: Original trace ID. May differ when concatenating multiple (different) benchmarks into one analysis, i.e., when calling RawData() with more than one file argument.
-        * `trace`: List of the individual states and transitions in this trace. Always contains an even number of elements, starting with the first state (typically "UNINITIALIZED") and ending with a transition.
-
-        Each trace element (that is, an entry of the `trace` list mentioned above) contains the following elements:
-        * `isa`: "state" or "transition"
-        * `name`: name
-        * `offline`: List of offline measurements for this state/transition. Each entry contains a result for this state/transition during one benchmark execution.
-          Entry contents:
-          - `clip_rate`: rate of clipped energy measurements, 0 .. 1
-          - `raw_mean`: mean raw MIMOSA value
-          - `raw_std`: standard deviation of raw MIMOSA value
-          - `uW_mean`: mean power draw, uW
-          - `uW_std`: standard deviation of power draw, uW
-          - `us`: state/transition duration, us
-          - `uW_mean_delta_prev`: (only for transitions) difference between uW_mean of this transition and uW_mean of previous state
-          - `uW_mean_delta_next`: (only for transitions) difference between uW_mean of this transition and uW_mean of next state
-          - `timeout`: (only for transitions) duration of previous state, us
-        * `offline_aggregates`: Aggregate of `offline` entries. dict of lists, each list entry has the same length
-          - `duration`: state/transition durations ("us"), us
-          - `energy`: state/transition energy ("us * uW_mean"), pJ
-          - `power`: mean power draw ("uW_mean"), uW
-          - `power_std`: standard deviations of power draw ("uW_std"), uW
-          - `paramkeys`: List of lists, each sub-list contains the parameter names corresponding to the `param` entries
-          - `param`: List of lists, each sub-list contains the parameter values for this measurement. Typically, all sub-lists are the same.
-          - `rel_energy_prev`: (only for transitions) transition energy relative to previous state mean power, pJ
-          - `rel_energy_next`: (only for transitions) transition energy relative to next state mean power, pJ
-          - `timeout`: (only for transitions) duration of previous state, us
-        * `offline_attributes`: List containing the keys of `offline_aggregates` which are meant to be part of the model.
-          This list ultimately decides which hardware/software attributes the model describes.
-          If isa == state, it contains power, duration, energy
-          If isa == transition, it contains power, duration, energy, rel_energy_prev, rel_energy_next, timeout
-        * `online`: List of online estimations for this state/transition. Each entry contains a result for this state/transition during one benchmark execution.
-          Entry contents for isa == state:
-          - `time`: state/transition
-          Entry contents for isa == transition:
-          - `timeout`: Duration of previous state, measured using on-board timers
-        * `parameter`: dictionary describing parameter values for this state/transition. Parameter values refer to the beginning of the state/transition and do not account for changes made by the transition.
-        * `plan`: Dictionary describing expected behaviour according to schedule / offline model.
-          Contents for isa == state: `energy`, `power`, `time`
-          Contents for isa == transition: `energy`, `timeout`, `level`.
-          If level is "user", the transition is part of the regular driver API. If level is "epilogue", it is an interrupt service routine and not called explicitly.
-          Each transition also contains:
-          * `args`: List of arguments the corresponding function call was called with. args entries are strings which are not necessarily numeric
args entries are strings which are not necessarily numeric - * `code`: List of function name (first entry) and arguments (remaining entries) of the corresponding function call - """ - if self.preprocessed: - return self.traces - if self.version == 0: - self._preprocess_012(0) - elif self.version == 1: - self._preprocess_012(1) - elif self.version == 2: - self._preprocess_012(2) - self.preprocessed = True - self.save_cache() - return self.traces - - def _preprocess_012(self, version): - """Load raw MIMOSA data and turn it into measurements which are ready to be analyzed.""" - offline_data = [] - for i, filename in enumerate(self.filenames): - - if version == 0: - - with tarfile.open(filename) as tf: - self.setup_by_fileno.append(json.load(tf.extractfile("setup.json"))) - self.traces_by_fileno.append( - json.load(tf.extractfile("src/apps/DriverEval/DriverLog.json")) - ) - for member in tf.getmembers(): - _, extension = os.path.splitext(member.name) - if extension == ".mim": - offline_data.append( - { - "content": tf.extractfile(member).read(), - "fileno": i, - "info": member, - "setup": self.setup_by_fileno[i], - "with_traces": self.with_traces, - } - ) - - elif version == 1: - - new_filenames = list() - with tarfile.open(filename) as tf: - ptalog = json.load(tf.extractfile(tf.getmember("ptalog.json"))) - self.pta = ptalog["pta"] - - # Benchmark code may be too large to be executed in a single - # run, so benchmarks (a benchmark is basically a list of DFA runs) - # may be split up. To accomodate this, ptalog['traces'] is - # a list of lists: ptalog['traces'][0] corresponds to the - # first benchmark part, ptalog['traces'][1] to the - # second, and so on. ptalog['traces'][0][0] is the first - # trace (a sequence of states and transitions) in the - # first benchmark part, ptalog['traces'][0][1] the second, etc. - # - # As traces are typically repeated to minimize the effect - # of random noise, observations for each benchmark part - # are also lists. In this case, this applies in two - # cases: traces[i][j]['parameter'][some_param] is either - # a value (if the parameter is controlld by software) - # or a list (if the parameter is known a posteriori, e.g. - # "how many retransmissions did this packet take?"). - # - # The second case is the MIMOSA energy measurements, which - # are listed in ptalog['files']. ptalog['files'][0] - # contains a list of files for the first benchmark part, - # ptalog['files'][0][0] is its first iteration/repetition, - # ptalog['files'][0][1] the second, etc. 
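-
-                    # To make that nesting concrete, a minimal sketch
-                    # (file names and trace objects are hypothetical):
-                    #
-                    #   ptalog = {
-                    #       "traces": [[trace_0_0, trace_0_1], [trace_1_0, trace_1_1]],
-                    #       "files": [
-                    #           ["part0_rep0.mim", "part0_rep1.mim"],
-                    #           ["part1_rep0.mim", "part1_rep1.mim"],
-                    #       ],
-                    #   }
-                    #
-                    #   ptalog["traces"][1][0]  # first trace of the second benchmark part
-                    #   ptalog["files"][0][1]   # second repetition of the first benchmark part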
- - for j, traces in enumerate(ptalog["traces"]): - new_filenames.append("{}#{}".format(filename, j)) - self.traces_by_fileno.append(traces) - self.setup_by_fileno.append( - { - "mimosa_voltage": ptalog["configs"][j]["voltage"], - "mimosa_shunt": ptalog["configs"][j]["shunt"], - "state_duration": ptalog["opt"]["sleep"], - } - ) - for repeat_id, mim_file in enumerate(ptalog["files"][j]): - member = tf.getmember(mim_file) - offline_data.append( - { - "content": tf.extractfile(member).read(), - "fileno": j, - "info": member, - "setup": self.setup_by_fileno[j], - "repeat_id": repeat_id, - "expected_trace": ptalog["traces"][j], - "with_traces": self.with_traces, - } - ) - self.filenames = new_filenames - - elif version == 2: - - new_filenames = list() - with tarfile.open(filename) as tf: - ptalog = json.load(tf.extractfile(tf.getmember("ptalog.json"))) - self.pta = ptalog["pta"] - - # Benchmark code may be too large to be executed in a single - # run, so benchmarks (a benchmark is basically a list of DFA runs) - # may be split up. To accomodate this, ptalog['traces'] is - # a list of lists: ptalog['traces'][0] corresponds to the - # first benchmark part, ptalog['traces'][1] to the - # second, and so on. ptalog['traces'][0][0] is the first - # trace (a sequence of states and transitions) in the - # first benchmark part, ptalog['traces'][0][1] the second, etc. - # - # As traces are typically repeated to minimize the effect - # of random noise, observations for each benchmark part - # are also lists. In this case, this applies in two - # cases: traces[i][j]['parameter'][some_param] is either - # a value (if the parameter is controlld by software) - # or a list (if the parameter is known a posteriori, e.g. - # "how many retransmissions did this packet take?"). - # - # The second case is the MIMOSA energy measurements, which - # are listed in ptalog['files']. ptalog['files'][0] - # contains a list of files for the first benchmark part, - # ptalog['files'][0][0] is its first iteration/repetition, - # ptalog['files'][0][1] the second, etc. - - # generate-dfa-benchmark uses TimingHarness to obtain timing data. - # Data is placed in 'offline_aggregates', which is also - # where we are going to store power/energy data. - # In case of invalid measurements, this can lead to a - # mismatch between duration and power/energy data, e.g. - # where duration = [A, B, C], power = [a, b], B belonging - # to an invalid measurement and thus power[b] corresponding - # to duration[C]. At the moment, this is harmless, but in the - # future it might not be. 
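-                    #
-                    # A hypothetical example of that mismatch: with three
-                    # repetitions, of which the second failed to parse,
-                    #
-                    #   duration = [d0, d1, d2]  # from TimingHarness, always complete
-                    #   power    = [p0, p2]      # one entry per valid measurement
-                    #
-                    # so pairing entries by index would match p2 with d1.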
- if "offline_aggregates" in ptalog["traces"][0][0]["trace"][0]: - for trace_group in ptalog["traces"]: - for trace in trace_group: - for state_or_transition in trace["trace"]: - offline_aggregates = state_or_transition.pop( - "offline_aggregates", None - ) - if offline_aggregates: - state_or_transition[ - "online_aggregates" - ] = offline_aggregates - - for j, traces in enumerate(ptalog["traces"]): - new_filenames.append("{}#{}".format(filename, j)) - self.traces_by_fileno.append(traces) - self.setup_by_fileno.append( - { - "voltage": ptalog["configs"][j]["voltage"], - "state_duration": ptalog["opt"]["sleep"], - } - ) - for repeat_id, etlog_file in enumerate(ptalog["files"][j]): - member = tf.getmember(etlog_file) - offline_data.append( - { - "content": tf.extractfile(member).read(), - "fileno": j, - "info": member, - "setup": self.setup_by_fileno[j], - "repeat_id": repeat_id, - "expected_trace": ptalog["traces"][j], - "with_traces": self.with_traces, - "transition_names": list( - map( - lambda x: x["name"], - ptalog["pta"]["transitions"], - ) - ), - } - ) - self.filenames = new_filenames - # TODO remove 'offline_aggregates' from pre-parse data and place - # it under 'online_aggregates' or similar instead. This way, if - # a .etlog file fails to parse, its corresponding duration data - # will not linger in 'offline_aggregates' and confuse the hell - # out of other code paths - - with Pool() as pool: - if self.version <= 1: - measurements = pool.map(_preprocess_mimosa, offline_data) - elif self.version == 2: - measurements = pool.map(_preprocess_etlog, offline_data) - - num_valid = 0 - for measurement in measurements: - - if "energy_trace" not in measurement: - logger.warning( - "Skipping {ar:s}/{m:s}: {e:s}".format( - ar=self.filenames[measurement["fileno"]], - m=measurement["info"].name, - e="; ".join(measurement["datasource_errors"]), - ) - ) - continue - - if version == 0: - # Strip the last state (it is not part of the scheduled measurement) - measurement["energy_trace"].pop() - elif version == 1: - # The first online measurement is the UNINITIALIZED state. In v1, - # it is not part of the expected PTA trace -> remove it. 
- measurement["energy_trace"].pop(0) - - if version == 0 or version == 1: - if self._measurement_is_valid_01(measurement): - self._merge_online_and_offline(measurement) - num_valid += 1 - else: - logger.warning( - "Skipping {ar:s}/{m:s}: {e:s}".format( - ar=self.filenames[measurement["fileno"]], - m=measurement["info"].name, - e=measurement["error"], - ) - ) - elif version == 2: - if self._measurement_is_valid_2(measurement): - self._merge_online_and_etlog(measurement) - num_valid += 1 - else: - logger.warning( - "Skipping {ar:s}/{m:s}: {e:s}".format( - ar=self.filenames[measurement["fileno"]], - m=measurement["info"].name, - e=measurement["error"], - ) - ) - logger.info( - "{num_valid:d}/{num_total:d} measurements are valid".format( - num_valid=num_valid, num_total=len(measurements) - ) - ) - if version == 0: - self.traces = self._concatenate_traces(self.traces_by_fileno) - elif version == 1: - self.traces = self._concatenate_traces( - map(lambda x: x["expected_trace"], measurements) - ) - self.traces = self._concatenate_traces(self.traces_by_fileno) - elif version == 2: - self.traces = self._concatenate_traces(self.traces_by_fileno) - self.preprocessing_stats = { - "num_runs": len(measurements), - "num_valid": num_valid, - } - - -def _add_trace_data_to_aggregate(aggregate, key, element): - # Only cares about element['isa'], element['offline_aggregates'], and - # element['plan']['level'] - if key not in aggregate: - aggregate[key] = {"isa": element["isa"]} - for datakey in element["offline_aggregates"].keys(): - aggregate[key][datakey] = [] - if element["isa"] == "state": - aggregate[key]["attributes"] = ["power"] - else: - # TODO do not hardcode values - aggregate[key]["attributes"] = [ - "duration", - "energy", - "rel_energy_prev", - "rel_energy_next", - ] - # Uncomment this line if you also want to analyze mean transition power - # aggrgate[key]['attributes'].append('power') - if "plan" in element and element["plan"]["level"] == "epilogue": - aggregate[key]["attributes"].insert(0, "timeout") - attributes = aggregate[key]["attributes"].copy() - for attribute in attributes: - if attribute not in element["offline_aggregates"]: - aggregate[key]["attributes"].remove(attribute) - for datakey, dataval in element["offline_aggregates"].items(): - aggregate[key][datakey].extend(dataval) - - -def pta_trace_to_aggregate(traces, ignore_trace_indexes=[]): - u""" - Convert preprocessed DFA traces from peripherals/drivers to by_name aggregate for PTAModel. - - arguments: - traces -- [ ... Liste von einzelnen Läufen (d.h. eine Zustands- und Transitionsfolge UNINITIALIZED -> foo -> FOO -> bar -> BAR -> ...) - Jeder Lauf: - - id: int Nummer des Laufs, beginnend bei 1 - - trace: [ ... Liste von Zuständen und Transitionen - Jeweils: - - name: str Name - - isa: str state // transition - - parameter: { ... globaler Parameter: aktueller wert. null falls noch nicht eingestellt } - - args: [ Funktionsargumente, falls isa == 'transition' ] - - offline_aggregates: - - power: [float(uW)] Mittlere Leistung während Zustand/Transitions - - power_std: [float(uW^2)] Standardabweichung der Leistung - - duration: [int(us)] Dauer - - energy: [float(pJ)] Energieaufnahme des Zustands / der Transition - - clip_rate: [float(0..1)] Clipping - - paramkeys: [[str]] Name der berücksichtigten Parameter - - param: [int // str] Parameterwerte. 
Quasi-Duplikat von 'parameter' oben - Falls isa == 'transition': - - timeout: [int(us)] Dauer des vorherigen Zustands - - rel_energy_prev: [int(pJ)] - - rel_energy_next: [int(pJ)] - ] - ] - ignore_trace_indexes -- list of trace indexes. The corresponding taces will be ignored. - - returns a tuple of three elements: - by_name -- measurements aggregated by state/transition name, annotated with parameter values - parameter_names -- list of parameter names - arg_count -- dict mapping transition names to the number of arguments of their corresponding driver function - - by_name layout: - Dictionary with one key per state/transition ('send', 'TX', ...). - Each element is in turn a dict with the following elements: - - isa: 'state' or 'transition' - - power: list of mean power measurements in µW - - duration: list of durations in µs - - power_std: list of stddev of power per state/transition - - energy: consumed energy (power*duration) in pJ - - paramkeys: list of parameter names in each measurement (-> list of lists) - - param: list of parameter values in each measurement (-> list of lists) - - attributes: list of keys that should be analyzed, - e.g. ['power', 'duration'] - additionally, only if isa == 'transition': - - timeout: list of duration of previous state in µs - - rel_energy_prev: transition energy relative to previous state mean power in pJ - - rel_energy_next: transition energy relative to next state mean power in pJ - """ - arg_count = dict() - by_name = dict() - parameter_names = sorted(traces[0]["trace"][0]["parameter"].keys()) - for run in traces: - if run["id"] not in ignore_trace_indexes: - for elem in run["trace"]: - if ( - elem["isa"] == "transition" - and not elem["name"] in arg_count - and "args" in elem - ): - arg_count[elem["name"]] = len(elem["args"]) - if elem["name"] != "UNINITIALIZED": - _add_trace_data_to_aggregate(by_name, elem["name"], elem) - for elem in by_name.values(): - for key in elem["attributes"]: - elem[key] = np.array(elem[key]) - return by_name, parameter_names, arg_count - - -class EnergyTraceLog: - """ - EnergyTrace log loader for DFA traces. - - Expects an EnergyTrace log file generated via msp430-etv / energytrace-util - and a dfatool-generated benchmark. An EnergyTrace log consits of a series - of measurements. Each measurement has a timestamp, mean current, voltage, - and cumulative energy since start of measurement. Each transition is - preceded by a Code128 barcode embedded into the energy consumption by - toggling a LED. - - Note that the baseline power draw of board and peripherals is not subtracted - at the moment. - """ - - def __init__( - self, - voltage: float, - state_duration: int, - transition_names: list, - with_traces=False, - ): - """ - Create a new EnergyTraceLog object. - - :param voltage: supply voltage [V], usually 3.3 V - :param state_duration: state duration [ms] - :param transition_names: list of transition names in PTA transition order. - Needed to map barcode synchronization numbers to transitions. - """ - self.voltage = voltage - self.state_duration = state_duration * 1e-3 - self.transition_names = transition_names - self.with_traces = with_traces - self.errors = list() - - # TODO auto-detect - self.led_power = 10e-3 - - # multipass/include/object/ptalog.h#startTransition - self.module_duration = 5e-3 - - # multipass/include/object/ptalog.h#startTransition - self.quiet_zone_duration = 60e-3 - - # TODO auto-detect? 
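-        # With the defaults above, the barcode duration bounds computed
-        # below evaluate to 57 * 5 ms + 60 ms = 345 ms and
-        # 68 * 5 ms + 60 ms = 400 ms.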
- # Note that we consider barcode duration after start, so only the - # quiet zone -after- the code is relevant - self.min_barcode_duration = 57 * self.module_duration + self.quiet_zone_duration - self.max_barcode_duration = 68 * self.module_duration + self.quiet_zone_duration - - def load_data(self, log_data): - """ - Load log data (raw energytrace .txt file, one line per event). - - :param log_data: raw energytrace log file in 4-column .txt format - """ - - if not zbar_available: - logger.error("zbar module is not available") - self.errors.append( - 'zbar module is not available. Try "apt install python3-zbar"' - ) - return list() - - lines = log_data.decode("ascii").split("\n") - data_count = sum(map(lambda x: len(x) > 0 and x[0] != "#", lines)) - data_lines = filter(lambda x: len(x) > 0 and x[0] != "#", lines) - - data = np.empty((data_count, 4)) - - for i, line in enumerate(data_lines): - fields = line.split(" ") - if len(fields) == 4: - timestamp, current, voltage, total_energy = map(int, fields) - elif len(fields) == 5: - # cpustate = fields[0] - timestamp, current, voltage, total_energy = map(int, fields[1:]) - else: - raise RuntimeError('cannot parse line "{}"'.format(line)) - data[i] = [timestamp, current, voltage, total_energy] - - self.interval_start_timestamp = data[:-1, 0] * 1e-6 - self.interval_duration = (data[1:, 0] - data[:-1, 0]) * 1e-6 - self.interval_power = ((data[1:, 3] - data[:-1, 3]) * 1e-9) / ( - (data[1:, 0] - data[:-1, 0]) * 1e-6 - ) - - m_duration_us = data[-1, 0] - data[0, 0] - - self.sample_rate = data_count / (m_duration_us * 1e-6) - - logger.debug( - "got {} samples with {} seconds of log data ({} Hz)".format( - data_count, m_duration_us * 1e-6, self.sample_rate - ) - ) - - return ( - self.interval_start_timestamp, - self.interval_duration, - self.interval_power, - ) - - def ts_to_index(self, timestamp): - """ - Convert timestamp in seconds to interval_start_timestamp / interval_duration / interval_power index. - - Returns the index of the interval which timestamp is part of. - """ - return self._ts_to_index(timestamp, 0, len(self.interval_start_timestamp)) - - def _ts_to_index(self, timestamp, left_index, right_index): - if left_index == right_index: - return left_index - if left_index + 1 == right_index: - return left_index - - mid_index = left_index + (right_index - left_index) // 2 - - # I'm feeling lucky - if ( - timestamp > self.interval_start_timestamp[mid_index] - and timestamp - <= self.interval_start_timestamp[mid_index] - + self.interval_duration[mid_index] - ): - return mid_index - - if timestamp <= self.interval_start_timestamp[mid_index]: - return self._ts_to_index(timestamp, left_index, mid_index) - - return self._ts_to_index(timestamp, mid_index, right_index) - - def analyze_states(self, traces, offline_index: int): - u""" - Split log data into states and transitions and return duration, energy, and mean power for each element. - - :param traces: expected traces, needed to synchronize with the measurement. - traces is a list of runs, traces[*]['trace'] is a single run - (i.e. a list of states and transitions, starting with a transition - and ending with a state). 
-        :param offline_index: This function uses traces[*]['trace'][*]['online_aggregates']['duration'][offline_index] to find sync codes
-
-        :returns: list of transitions and states, starting with a transition and ending with a state.
-            May be empty or incomplete if barcode synchronization fails.
-            Each element is a dict containing:
-            * `isa`: 'state' or 'transition'
-            * `W_mean`: mean of the (calibrated) power draw
-            * `W_std`: standard deviation of the (calibrated) power draw
-            * `s`: duration
-            if isa == 'transition', it also contains:
-            * `W_mean_delta_prev`: difference between W_mean and the previous state's W_mean
-            * `W_mean_delta_next`: difference between W_mean and the following state's W_mean
-        """
-
-        first_sync = self.find_first_sync()
-
-        energy_trace = list()
-
-        expected_transitions = list()
-        for trace_number, trace in enumerate(traces):
-            for state_or_transition_number, state_or_transition in enumerate(
-                trace["trace"]
-            ):
-                if state_or_transition["isa"] == "transition":
-                    try:
-                        expected_transitions.append(
-                            (
-                                state_or_transition["name"],
-                                state_or_transition["online_aggregates"]["duration"][
-                                    offline_index
-                                ]
-                                * 1e-6,
-                            )
-                        )
-                    except IndexError:
-                        self.errors.append(
-                            'Entry #{} ("{}") in trace #{} has no duration entry for offline_index/repeat_id {}'.format(
-                                state_or_transition_number,
-                                state_or_transition["name"],
-                                trace_number,
-                                offline_index,
-                            )
-                        )
-                        return energy_trace
-
-        next_barcode = first_sync
-
-        for name, duration in expected_transitions:
-            bc, start, stop, end = self.find_barcode(next_barcode)
-            if bc is None:
-                logger.error('did not find transition "{}"'.format(name))
-                break
-            next_barcode = end + self.state_duration + duration
-            logger.debug(
-                '{} barcode "{}" area: {:0.2f} .. {:0.2f} / {:0.2f} seconds'.format(
-                    offline_index, bc, start, stop, end
-                )
-            )
-            if bc != name:
-                logger.error('mismatch: expected "{}", got "{}"'.format(name, bc))
-            logger.debug(
-                "{} estimated transition area: {:0.3f} .. {:0.3f} seconds".format(
-                    offline_index, end, end + duration
-                )
-            )
-
-            transition_start_index = self.ts_to_index(end)
-            transition_done_index = self.ts_to_index(end + duration) + 1
-            state_start_index = transition_done_index
-            state_done_index = (
-                self.ts_to_index(end + duration + self.state_duration) + 1
-            )
-
-            logger.debug(
-                "{} estimated transition index: {:0.3f} ..
{:0.3f} seconds".format( - offline_index, - transition_start_index / self.sample_rate, - transition_done_index / self.sample_rate, - ) - ) - - transition_power_W = self.interval_power[ - transition_start_index:transition_done_index - ] - - transition = { - "isa": "transition", - "W_mean": np.mean(transition_power_W), - "W_std": np.std(transition_power_W), - "s": duration, - "s_coarse": self.interval_start_timestamp[transition_done_index] - - self.interval_start_timestamp[transition_start_index], - } - - if self.with_traces: - transition["uW"] = transition_power_W * 1e6 - - energy_trace.append(transition) - - if len(energy_trace) > 1: - energy_trace[-1]["W_mean_delta_prev"] = ( - energy_trace[-1]["W_mean"] - energy_trace[-2]["W_mean"] - ) - - state_power_W = self.interval_power[state_start_index:state_done_index] - state = { - "isa": "state", - "W_mean": np.mean(state_power_W), - "W_std": np.std(state_power_W), - "s": self.state_duration, - "s_coarse": self.interval_start_timestamp[state_done_index] - - self.interval_start_timestamp[state_start_index], - } - - if self.with_traces: - state["uW"] = state_power_W * 1e6 - - energy_trace.append(state) - - energy_trace[-2]["W_mean_delta_next"] = ( - energy_trace[-2]["W_mean"] - energy_trace[-1]["W_mean"] - ) - - expected_transition_count = len(expected_transitions) - recovered_transition_ount = len(energy_trace) // 2 - - if expected_transition_count != recovered_transition_ount: - self.errors.append( - "Expected {:d} transitions, got {:d}".format( - expected_transition_count, recovered_transition_ount - ) - ) - - return energy_trace - - def find_first_sync(self): - # LED Power is approx. self.led_power W, use self.led_power/2 W above surrounding median as threshold - sync_threshold_power = ( - np.median(self.interval_power[: int(3 * self.sample_rate)]) - + self.led_power / 3 - ) - for i, ts in enumerate(self.interval_start_timestamp): - if ts > 2 and self.interval_power[i] > sync_threshold_power: - return self.interval_start_timestamp[i - 300] - return None - - def find_barcode(self, start_ts): - """ - Return absolute position and content of the next barcode following `start_ts`. - - :param interval_ts: list of start timestamps (one per measurement interval) [s] - :param interval_power: mean power per measurement interval [W] - :param start_ts: timestamp at which to start looking for a barcode [s] - """ - - for i, ts in enumerate(self.interval_start_timestamp): - if ts >= start_ts: - start_position = i - break - - # Lookaround: 100 ms in both directions - lookaround = int(0.1 * self.sample_rate) - - # LED Power is approx. 
self.led_power W, use self.led_power/2 W above surrounding median as threshold - sync_threshold_power = ( - np.median( - self.interval_power[ - start_position - lookaround : start_position + lookaround - ] - ) - + self.led_power / 3 - ) - - logger.debug( - "looking for barcode starting at {:0.2f} s, threshold is {:0.1f} mW".format( - start_ts, sync_threshold_power * 1e3 - ) - ) - - sync_area_start = None - sync_start_ts = None - sync_area_end = None - sync_end_ts = None - for i, ts in enumerate(self.interval_start_timestamp): - if ( - sync_area_start is None - and ts >= start_ts - and self.interval_power[i] > sync_threshold_power - ): - sync_area_start = i - 300 - sync_start_ts = ts - if ( - sync_area_start is not None - and sync_area_end is None - and ts > sync_start_ts + self.min_barcode_duration - and ( - ts > sync_start_ts + self.max_barcode_duration - or abs(sync_threshold_power - self.interval_power[i]) - > self.led_power - ) - ): - sync_area_end = i - sync_end_ts = ts - break - - barcode_data = self.interval_power[sync_area_start:sync_area_end] - - logger.debug( - "barcode search area: {:0.2f} .. {:0.2f} seconds ({} samples)".format( - sync_start_ts, sync_end_ts, len(barcode_data) - ) - ) - - bc, start, stop, padding_bits = self.find_barcode_in_power_data(barcode_data) - - if bc is None: - return None, None, None, None - - start_ts = self.interval_start_timestamp[sync_area_start + start] - stop_ts = self.interval_start_timestamp[sync_area_start + stop] - - end_ts = ( - stop_ts + self.module_duration * padding_bits + self.quiet_zone_duration - ) - - # barcode content, barcode start timestamp, barcode stop timestamp, barcode end (stop + padding) timestamp - return bc, start_ts, stop_ts, end_ts - - def find_barcode_in_power_data(self, barcode_data): - - min_power = np.min(barcode_data) - max_power = np.max(barcode_data) - - # zbar seems to be confused by measurement (and thus image) noise - # inside of barcodes. As our barcodes are only 1px high, this is - # likely not trivial to fix. - # -> Create a black and white (not grayscale) image to avoid this. - # Unfortunately, this decreases resilience against background noise - # (e.g. a not-exactly-idle peripheral device or CPU interrupts). - image_data = np.around( - 1 - ((barcode_data - min_power) / (max_power - min_power)) - ) - image_data *= 255 - - # zbar only returns the complete barcode position if it is at least - # two pixels high. For a 1px barcode, it only returns its right border. - - width = len(image_data) - height = 2 - - image_data = bytes(map(int, image_data)) * height - - # img = Image.frombytes('L', (width, height), image_data).resize((width, 100)) - # img.save('/tmp/test-{}.png'.format(os.getpid())) - - zbimg = zbar.Image(width, height, "Y800", image_data) - scanner = zbar.ImageScanner() - scanner.parse_config("enable") - - if scanner.scan(zbimg): - (sym,) = zbimg.symbols - content = sym.data - try: - sym_start = sym.location[1][0] - except IndexError: - sym_start = 0 - sym_end = sym.location[0][0] - - match = re.fullmatch(r"T(\d+)", content) - if match: - content = self.transition_names[int(match.group(1))] - - # PTALog barcode generation operates on bytes, so there may be - # additional non-barcode padding (encoded as LED off / image white). - # Calculate the amount of extra bits to determine the offset until - # the transition starts. 
-            padding_bits = len(Code128(sym.data, charset="B").modules) % 8
-
-            # sym_start leaves out the first two bars, but we don't do anything about that here.
-            # sym_end leaves out the last three bars, each of which is one padding bit long.
-            # As a workaround, we unconditionally increment padding_bits by three.
-            padding_bits += 3
-
-            return content, sym_start, sym_end, padding_bits
-        else:
-            logger.warning("unable to find barcode")
-            return None, None, None, None
-
-
-class MIMOSA:
-    """
-    MIMOSA log loader for DFA traces with auto-calibration.
-
-    Expects a MIMOSA log file generated via dfatool and a dfatool-generated
-    benchmark. A MIMOSA log consists of a series of measurements. Each measurement
-    gives the total charge (in pJ) and binary buzzer/trigger value during a 10µs interval.
-
-    There must be a calibration run consisting of at least two seconds with disconnected DUT,
-    two seconds with 1 kOhm (984 Ohm), and two seconds with 100 kOhm (99013 Ohm) resistor at
-    the start. The first ten seconds of data are reserved for calibration and must not contain
-    measurements, as trigger/buzzer signals are ignored in this time range.
-
-    Resulting data is a list of state/transition/state/transition/... measurements.
-    """
-
-    def __init__(self, voltage: float, shunt: int, with_traces=False):
-        """
-        Initialize MIMOSA loader for a specific voltage and shunt setting.
-
-        :param voltage: MIMOSA DUT supply voltage (V)
-        :param shunt: MIMOSA shunt (Ohms)
-        """
-        self.voltage = voltage
-        self.shunt = shunt
-        self.with_traces = with_traces
-        self.r1 = 984  # "1k"
-        self.r2 = 99013  # "100k"
-        self.errors = list()
-
-    def charge_to_current_nocal(self, charge):
-        u"""
-        Convert charge per 10µs (in pJ) to mean currents (in µA) without accounting for calibration.
-
-        :param charge: numpy array of charges (pJ per 10µs) as returned by `load_data` or `load_file`
-
-        :returns: numpy array of mean currents (µA per 10µs)
-        """
-        ua_max = 1.836 / self.shunt * 1000000
-        ua_step = ua_max / 65535
-        return charge * ua_step
-
-    def _load_tf(self, tf):
-        u"""
-        Load MIMOSA log data from an open `tarfile` instance.
-
-        :param tf: `tarfile` instance
-
-        :returns: (numpy array of charges (pJ per 10µs), numpy array of triggers (0/1 int, per 10µs))
-        """
-        num_bytes = tf.getmember("/tmp/mimosa//mimosa_scale_1.tmp").size
-        charges = np.ndarray(shape=(int(num_bytes / 4)), dtype=np.int32)
-        triggers = np.ndarray(shape=(int(num_bytes / 4)), dtype=np.int8)
-        with tf.extractfile("/tmp/mimosa//mimosa_scale_1.tmp") as f:
-            content = f.read()
-            iterator = struct.iter_unpack("<I", content)
-            i = 0
-            for word in iterator:
-                charges[i] = word[0] >> 4
-                triggers[i] = (word[0] & 0x08) >> 3
-                i += 1
-        return charges, triggers
-
-    def load_data(self, raw_data):
-        u"""
-        Load MIMOSA log data from a MIMOSA log file passed as raw byte string
-
-        :param raw_data: MIMOSA log file, passed as raw byte string
-
-        :returns: (numpy array of charges (pJ per 10µs), numpy array of triggers (0/1 int, per 10µs))
-        """
-        with io.BytesIO(raw_data) as data_object:
-            with tarfile.open(fileobj=data_object) as tf:
-                return self._load_tf(tf)
-
-    def load_file(self, filename):
-        u"""
-        Load MIMOSA log data from a MIMOSA log file
-
-        :param filename: MIMOSA log file
-
-        :returns: (numpy array of charges (pJ per 10µs), numpy array of triggers (0/1 int, per 10µs))
-        """
-        with tarfile.open(filename) as tf:
-            return self._load_tf(tf)
-
-    def currents_nocal(self, charges):
-        u"""
-        Convert charges (pJ per 10µs) to mean currents without accounting for calibration.
- - :param charges: numpy array of charges (pJ per 10µs) - - :returns: numpy array of currents (mean µA per 10µs)""" - ua_max = 1.836 / self.shunt * 1000000 - ua_step = ua_max / 65535 - return charges.astype(np.double) * ua_step - - def trigger_edges(self, triggers): - """ - Return indexes of trigger edges (both 0->1 and 1->0) in log data. - - Ignores the first 10 seconds, which are used for calibration and may - contain bogus triggers due to DUT resets. - - :param triggers: trigger array (int, 0/1) as returned by load_data - - :returns: list of int (trigger indices, e.g. [2000000, ...] means the first trigger appears in charges/currents interval 2000000 -> 20s after start of measurements. Keep in mind that each interval is 10µs long, not 1µs, so index values are not µs timestamps) - """ - trigidx = [] - - if len(triggers) < 1000000: - self.errors.append("MIMOSA log is too short") - return trigidx - - prevtrig = triggers[999999] - - # if the first trigger is high (i.e., trigger/buzzer pin is active before the benchmark starts), - # something went wrong and are unable to determine when the first - # transition starts. - if prevtrig != 0: - self.errors.append( - "Unable to find start of first transition (log starts with trigger == {} != 0)".format( - prevtrig - ) - ) - - # if the last trigger is high (i.e., trigger/buzzer pin is active when the benchmark ends), - # it terminated in the middle of a transition -- meaning that it was not - # measured in its entirety. - if triggers[-1] != 0: - self.errors.append("Log ends during a transition".format(prevtrig)) - - # the device is reset for MIMOSA calibration in the first 10s and may - # send bogus interrupts -> bogus triggers - for i in range(1000000, triggers.shape[0]): - trig = triggers[i] - if trig != prevtrig: - # Due to MIMOSA's integrate-read-reset cycle, the charge/current - # interval belonging to this trigger comes two intervals (20µs) later - trigidx.append(i + 2) - prevtrig = trig - return trigidx - - def calibration_edges(self, currents): - u""" - Return start/stop indexes of calibration measurements. - - :param currents: uncalibrated currents as reported by MIMOSA. For best results, - it may help to use a running mean, like so: - `currents = running_mean(currents_nocal(..., 10))` - - :returns: indices of calibration events in MIMOSA data: - (disconnect start, disconnect stop, R1 (1k) start, R1 (1k) stop, R2 (100k) start, R2 (100k) stop) - indices refer to charges/currents arrays, so 0 refers to the first 10µs interval, 1 to the second, and so on. - """ - r1idx = 0 - r2idx = 0 - ua_r1 = self.voltage / self.r1 * 1000000 - # first second may be bogus - for i in range(100000, len(currents)): - if r1idx == 0 and currents[i] > ua_r1 * 0.6: - r1idx = i - elif ( - r1idx != 0 - and r2idx == 0 - and i > (r1idx + 180000) - and currents[i] < ua_r1 * 0.4 - ): - r2idx = i - # 2s disconnected, 2s r1, 2s r2 with r1 < r2 -> ua_r1 > ua_r2 - # allow 5ms buffer in both directions to account for bouncing relais contacts - return ( - r1idx - 180500, - r1idx - 500, - r1idx + 500, - r2idx - 500, - r2idx + 500, - r2idx + 180500, - ) - - def calibration_function(self, charges, cal_edges): - u""" - Calculate calibration function from previously determined calibration edges. - - :param charges: raw charges from MIMOSA - :param cal_edges: calibration edges as returned by calibration_edges - - :returns: (calibration_function, calibration_data): - calibration_function -- charge in pJ (float) -> current in uA (float). 
- Converts the amount of charge in a 10 µs interval to the - mean current during the same interval. - calibration_data -- dict containing the following keys: - edges -- calibration points in the log file, in µs - offset -- ... - offset2 -- ... - slope_low -- ... - slope_high -- ... - add_low -- ... - add_high -- .. - r0_err_uW -- mean error of uncalibrated data at "∞ Ohm" in µW - r0_std_uW -- standard deviation of uncalibrated data at "∞ Ohm" in µW - r1_err_uW -- mean error of uncalibrated data at 1 kOhm - r1_std_uW -- stddev at 1 kOhm - r2_err_uW -- mean error at 100 kOhm - r2_std_uW -- stddev at 100 kOhm - """ - dis_start, dis_end, r1_start, r1_end, r2_start, r2_end = cal_edges - if dis_start < 0: - dis_start = 0 - chg_r0 = charges[dis_start:dis_end] - chg_r1 = charges[r1_start:r1_end] - chg_r2 = charges[r2_start:r2_end] - cal_0_mean = np.mean(chg_r0) - cal_r1_mean = np.mean(chg_r1) - cal_r2_mean = np.mean(chg_r2) - - ua_r1 = self.voltage / self.r1 * 1000000 - ua_r2 = self.voltage / self.r2 * 1000000 - - if cal_r2_mean > cal_0_mean: - b_lower = (ua_r2 - 0) / (cal_r2_mean - cal_0_mean) - else: - logger.warning("0 uA == %.f uA during calibration" % (ua_r2)) - b_lower = 0 - - b_upper = (ua_r1 - ua_r2) / (cal_r1_mean - cal_r2_mean) - - a_lower = -b_lower * cal_0_mean - a_upper = -b_upper * cal_r2_mean - - if self.shunt == 680: - # R1 current is higher than shunt range -> only use R2 for calibration - def calfunc(charge): - if charge < cal_0_mean: - return 0 - else: - return charge * b_lower + a_lower - - else: - - def calfunc(charge): - if charge < cal_0_mean: - return 0 - if charge <= cal_r2_mean: - return charge * b_lower + a_lower - else: - return charge * b_upper + a_upper + ua_r2 - - caldata = { - "edges": [x * 10 for x in cal_edges], - "offset": cal_0_mean, - "offset2": cal_r2_mean, - "slope_low": b_lower, - "slope_high": b_upper, - "add_low": a_lower, - "add_high": a_upper, - "r0_err_uW": np.mean(self.currents_nocal(chg_r0)) * self.voltage, - "r0_std_uW": np.std(self.currents_nocal(chg_r0)) * self.voltage, - "r1_err_uW": (np.mean(self.currents_nocal(chg_r1)) - ua_r1) * self.voltage, - "r1_std_uW": np.std(self.currents_nocal(chg_r1)) * self.voltage, - "r2_err_uW": (np.mean(self.currents_nocal(chg_r2)) - ua_r2) * self.voltage, - "r2_std_uW": np.std(self.currents_nocal(chg_r2)) * self.voltage, - } - - # print("if charge < %f : return 0" % cal_0_mean) - # print("if charge <= %f : return charge * %f + %f" % (cal_r2_mean, b_lower, a_lower)) - # print("else : return charge * %f + %f + %f" % (b_upper, a_upper, ua_r2)) - - return calfunc, caldata - - """ - def calcgrad(self, currents, threshold): - grad = np.gradient(running_mean(currents * self.voltage, 10)) - # len(grad) == len(currents) - 9 - subst = [] - lastgrad = 0 - for i in range(len(grad)): - # minimum substate duration: 10ms - if np.abs(grad[i]) > threshold and i - lastgrad > 50: - # account for skew introduced by running_mean and current - # ramp slope (parasitic capacitors etc.) - subst.append(i+10) - lastgrad = i - if lastgrad != i: - subst.append(i+10) - return subst - - # TODO konfigurierbare min/max threshold und len(gradidx) > X, binaere - # Sache nach noetiger threshold. postprocessing mit - # "zwei benachbarte substates haben sehr aehnliche werte / niedrige stddev" -> mergen - # ... min/max muessen nicht vorgegeben werden, sind ja bekannt (0 / np.max(grad)) - # TODO bei substates / index foo den offset durch running_mean beachten - # TODO ggf. 
clustering der 'abs(grad) > threshold' und bestimmung interessanter
-    # uebergaenge dadurch?
-    def gradfoo(self, currents):
-        gradients = np.abs(np.gradient(running_mean(currents * self.voltage, 10)))
-        gradmin = np.min(gradients)
-        gradmax = np.max(gradients)
-        threshold = np.mean([gradmin, gradmax])
-        gradidx = self.calcgrad(currents, threshold)
-        num_substates = 2
-        while len(gradidx) != num_substates:
-            if gradmax - gradmin < 0.1:
-                # We did our best
-                return threshold, gradidx
-            if len(gradidx) > num_substates:
-                gradmin = threshold
-            else:
-                gradmax = threshold
-            threshold = np.mean([gradmin, gradmax])
-            gradidx = self.calcgrad(currents, threshold)
-        return threshold, gradidx
-    """
-
-    def analyze_states(self, charges, trigidx, ua_func):
-        u"""
-        Split log data into states and transitions and return duration, energy, and mean power for each element.
-
-        :param charges: raw charges (each element describes the charge in pJ transferred during 10 µs)
-        :param trigidx: "charges" indexes corresponding to a trigger edge, see `trigger_edges`
-        :param ua_func: charge(pJ) -> current(µA) function as returned by `calibration_function`
-
-        :returns: list of states and transitions, both starting and ending with a state.
-        Each element is a dict containing:
-         * `isa`: 'state' or 'transition'
-         * `clip_rate`: range(0..1), share of clipped intervals in the energy measurement
-         * `raw_mean`: mean of the raw values
-         * `raw_std`: standard deviation of the raw values
-         * `uW_mean`: mean of the (calibrated) power draw
-         * `uW_std`: standard deviation of the (calibrated) power draw
-         * `us`: duration
-         if isa == 'transition', it also contains:
-         * `timeout`: duration of the previous state
-         * `uW_mean_delta_prev`: difference between uW_mean and the previous state's uW_mean
-         * `uW_mean_delta_next`: difference between uW_mean and the following state's uW_mean
-        """
-        previdx = 0
-        is_state = True
-        iterdata = []
-
-        # The last state (between the last transition and end of file) may also
-        # be important. Pretend it ends when the log ends.
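-        # For example (hypothetical values): with trigidx = [100, 250] and
-        # len(charges) == 400, the slices below are charges[0:100] (state),
-        # charges[100:250] (transition), and charges[250:400] (the final,
-        # artificially terminated state).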
- trigger_indices = trigidx.copy() - trigger_indices.append(len(charges)) - - for idx in trigger_indices: - range_raw = charges[previdx:idx] - range_ua = ua_func(range_raw) - substates = {} - - if previdx != 0 and idx - previdx > 200: - thr, subst = 0, [] # self.gradfoo(range_ua) - if len(subst): - statelist = [] - prevsubidx = 0 - for subidx in subst: - statelist.append( - { - "duration": (subidx - prevsubidx) * 10, - "uW_mean": np.mean( - range_ua[prevsubidx:subidx] * self.voltage - ), - "uW_std": np.std( - range_ua[prevsubidx:subidx] * self.voltage - ), - } - ) - prevsubidx = subidx - substates = {"threshold": thr, "states": statelist} - - isa = "state" - if not is_state: - isa = "transition" - - data = { - "isa": isa, - "clip_rate": np.mean(range_raw == 65535), - "raw_mean": np.mean(range_raw), - "raw_std": np.std(range_raw), - "uW_mean": np.mean(range_ua * self.voltage), - "uW_std": np.std(range_ua * self.voltage), - "us": (idx - previdx) * 10, - } - - if self.with_traces: - data["uW"] = range_ua * self.voltage - - if "states" in substates: - data["substates"] = substates - ssum = np.sum(list(map(lambda x: x["duration"], substates["states"]))) - if ssum != data["us"]: - logger.warning("duration %d vs %d" % (data["us"], ssum)) - - if isa == "transition": - # subtract average power of previous state - # (that is, the state from which this transition originates) - data["uW_mean_delta_prev"] = data["uW_mean"] - iterdata[-1]["uW_mean"] - # placeholder to avoid extra cases in the analysis - data["uW_mean_delta_next"] = data["uW_mean"] - data["timeout"] = iterdata[-1]["us"] - elif len(iterdata) > 0: - # subtract average power of next state - # (the state into which this transition leads) - iterdata[-1]["uW_mean_delta_next"] = ( - iterdata[-1]["uW_mean"] - data["uW_mean"] - ) - - iterdata.append(data) - - previdx = idx - is_state = not is_state - return iterdata diff --git a/lib/loader.py b/lib/loader.py new file mode 100644 index 0000000..e8b5090 --- /dev/null +++ b/lib/loader.py @@ -0,0 +1,2008 @@ +#!/usr/bin/env python3 + +import csv +import io +import json +import logging +import numpy as np +import os +import re +import struct +import tarfile +import hashlib +from multiprocessing import Pool +from .utils import running_mean, soft_cast_int + +logger = logging.getLogger(__name__) + +try: + from .pubcode import Code128 + import zbar + + zbar_available = True +except ImportError: + zbar_available = False + + +arg_support_enabled = True + + +class KeysightCSV: + """Simple loader for Keysight CSV data, as exported by the windows software.""" + + def __init__(self): + """Create a new KeysightCSV object.""" + pass + + def load_data(self, filename: str): + """ + Load log data from filename, return timestamps and currents. + + Returns two one-dimensional NumPy arrays: timestamps and corresponding currents. 
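+
+        Usage sketch (the file name is a placeholder):
+
+            timestamps, currents = KeysightCSV().load_data("measurement.csv")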
+ """ + with open(filename) as f: + for i, _ in enumerate(f): + pass + timestamps = np.ndarray((i - 3), dtype=float) + currents = np.ndarray((i - 3), dtype=float) + # basically seek back to start + with open(filename) as f: + for _ in range(4): + next(f) + reader = csv.reader(f, delimiter=",") + for i, row in enumerate(reader): + timestamps[i] = float(row[0]) + currents[i] = float(row[2]) * -1 + return timestamps, currents + + +def _preprocess_mimosa(measurement): + setup = measurement["setup"] + mim = MIMOSA( + float(setup["mimosa_voltage"]), + int(setup["mimosa_shunt"]), + with_traces=measurement["with_traces"], + ) + try: + charges, triggers = mim.load_data(measurement["content"]) + trigidx = mim.trigger_edges(triggers) + except EOFError as e: + mim.errors.append("MIMOSA logfile error: {}".format(e)) + trigidx = list() + + if len(trigidx) == 0: + mim.errors.append("MIMOSA log has no triggers") + return { + "fileno": measurement["fileno"], + "info": measurement["info"], + "has_datasource_error": len(mim.errors) > 0, + "datasource_errors": mim.errors, + "expected_trace": measurement["expected_trace"], + "repeat_id": measurement["repeat_id"], + } + + cal_edges = mim.calibration_edges( + running_mean(mim.currents_nocal(charges[0 : trigidx[0]]), 10) + ) + calfunc, caldata = mim.calibration_function(charges, cal_edges) + vcalfunc = np.vectorize(calfunc, otypes=[np.float64]) + + processed_data = { + "fileno": measurement["fileno"], + "info": measurement["info"], + "triggers": len(trigidx), + "first_trig": trigidx[0] * 10, + "calibration": caldata, + "energy_trace": mim.analyze_states(charges, trigidx, vcalfunc), + "has_datasource_error": len(mim.errors) > 0, + "datasource_errors": mim.errors, + } + + for key in ["expected_trace", "repeat_id"]: + if key in measurement: + processed_data[key] = measurement[key] + + return processed_data + + +def _preprocess_etlog(measurement): + setup = measurement["setup"] + etlog = EnergyTraceLog( + float(setup["voltage"]), + int(setup["state_duration"]), + measurement["transition_names"], + with_traces=measurement["with_traces"], + ) + try: + etlog.load_data(measurement["content"]) + states_and_transitions = etlog.analyze_states( + measurement["expected_trace"], measurement["repeat_id"] + ) + except EOFError as e: + etlog.errors.append("EnergyTrace logfile error: {}".format(e)) + + processed_data = { + "fileno": measurement["fileno"], + "repeat_id": measurement["repeat_id"], + "info": measurement["info"], + "expected_trace": measurement["expected_trace"], + "energy_trace": states_and_transitions, + "has_datasource_error": len(etlog.errors) > 0, + "datasource_errors": etlog.errors, + } + + return processed_data + + +class TimingData: + """ + Loader for timing model traces measured with on-board timers using `harness.OnboardTimerHarness`. + + Excpets a specific trace format and UART log output (as produced by + generate-dfa-benchmark.py). Prunes states from output. (TODO) + """ + + def __init__(self, filenames): + """ + Create a new TimingData object. + + Each filenames element corresponds to a measurement run. 
+ """ + self.filenames = filenames.copy() + self.traces_by_fileno = [] + self.setup_by_fileno = [] + self.preprocessed = False + self._parameter_names = None + self.version = 0 + + def _concatenate_analyzed_traces(self): + self.traces = [] + for trace_group in self.traces_by_fileno: + for trace in trace_group: + # TimingHarness logs states, but does not aggregate any data for them at the moment -> throw all states away + transitions = list( + filter(lambda x: x["isa"] == "transition", trace["trace"]) + ) + self.traces.append({"id": trace["id"], "trace": transitions}) + for i, trace in enumerate(self.traces): + trace["orig_id"] = trace["id"] + trace["id"] = i + for log_entry in trace["trace"]: + paramkeys = sorted(log_entry["parameter"].keys()) + if "param" not in log_entry["offline_aggregates"]: + log_entry["offline_aggregates"]["param"] = list() + if "duration" in log_entry["offline_aggregates"]: + for i in range(len(log_entry["offline_aggregates"]["duration"])): + paramvalues = list() + for paramkey in paramkeys: + if type(log_entry["parameter"][paramkey]) is list: + paramvalues.append( + soft_cast_int(log_entry["parameter"][paramkey][i]) + ) + else: + paramvalues.append( + soft_cast_int(log_entry["parameter"][paramkey]) + ) + if arg_support_enabled and "args" in log_entry: + paramvalues.extend(map(soft_cast_int, log_entry["args"])) + log_entry["offline_aggregates"]["param"].append(paramvalues) + + def _preprocess_0(self): + for filename in self.filenames: + with open(filename, "r") as f: + log_data = json.load(f) + self.traces_by_fileno.extend(log_data["traces"]) + self._concatenate_analyzed_traces() + + def get_preprocessed_data(self): + """ + Return a list of DFA traces annotated with timing and parameter data. + + Suitable for the PTAModel constructor. + See PTAModel(...) docstring for format details. + """ + if self.preprocessed: + return self.traces + if self.version == 0: + self._preprocess_0() + self.preprocessed = True + return self.traces + + +def sanity_check_aggregate(aggregate): + for key in aggregate: + if "param" not in aggregate[key]: + raise RuntimeError("aggregate[{}][param] does not exist".format(key)) + if "attributes" not in aggregate[key]: + raise RuntimeError("aggregate[{}][attributes] does not exist".format(key)) + for attribute in aggregate[key]["attributes"]: + if attribute not in aggregate[key]: + raise RuntimeError( + "aggregate[{}][{}] does not exist, even though it is contained in aggregate[{}][attributes]".format( + key, attribute, key + ) + ) + param_len = len(aggregate[key]["param"]) + attr_len = len(aggregate[key][attribute]) + if param_len != attr_len: + raise RuntimeError( + "parameter mismatch: len(aggregate[{}][param]) == {} != len(aggregate[{}][{}]) == {}".format( + key, param_len, key, attribute, attr_len + ) + ) + + +class RawData: + """ + Loader for hardware model traces measured with MIMOSA. + + Expects a specific trace format and UART log output (as produced by the + dfatool benchmark generator). Loads data, prunes bogus measurements, and + provides preprocessed data suitable for PTAModel. Results are cached on the + file system, making subsequent loads near-instant. + """ + + def __init__(self, filenames, with_traces=False): + """ + Create a new RawData object. + + Each filename element corresponds to a measurement run. + It must be a tar archive with the following contents: + + Version 0: + + * `setup.json`: measurement setup. 
Must contain the keys `state_duration` (how long each state is active, in ms),
+            `mimosa_voltage` (voltage applied to the DUT, in V), and `mimosa_shunt` (shunt value, in Ohm)
+          * `src/apps/DriverEval/DriverLog.json`: PTA traces and parameters for this benchmark.
+            Layout: List of traces, each trace has an 'id' (numeric, starting with 1) and 'trace' (list of states and transitions) element.
+            Each trace has an even number of elements, starting with the first state (usually `UNINITIALIZED`) and ending with a transition.
+            Each state/transition must have the members `.parameter` (parameter values, empty string or None if unknown), `.isa` ("state" or "transition") and `.name`.
+            Each transition must additionally contain `.plan.level` ("user" or "epilogue").
+            Example: `[ {"id": 1, "trace": [ {"parameter": {...}, "isa": "state", "name": "UNINITIALIZED"}, ...] }, ... ]`
+          * At least one `*.mim` file. Each file corresponds to a single execution of the entire benchmark (i.e., all runs described in DriverLog.json) and starts with a MIMOSA Autocal calibration sequence.
+            MIMOSA files are parsed by the `MIMOSA` class.
+
+        Version 1:
+
+        * `ptalog.json`: measurement setup and traces. Contents:
+          `.opt.sleep`: state duration
+          `.opt.pta`: PTA
+          `.opt.traces`: list of sub-benchmark traces (the benchmark may have been split due to code size limitations). Each item is a list of traces as returned by `harness.traces`:
+            `.opt.traces[]`: List of traces. Each trace has an 'id' (numeric, starting with 1) and 'trace' (list of states and transitions) element.
+            Each state/transition must have the members `.parameter` (dict with normalized parameter values), `.isa` ("state" or "transition") and `.name`
+            Each transition must additionally contain `.args`
+          `.opt.files`: list of corresponding MIMOSA measurements.
+            `.opt.files[]` = ['abc123.mim', ...]
+          `.opt.configs`: ....
+        * MIMOSA log files (`*.mim`) as specified in `.opt.files`
+
+        Version 2:
+
+        * `ptalog.json`: measurement setup and traces. Contents:
+          `.opt.sleep`: state duration
+          `.opt.pta`: PTA
+          `.opt.traces`: list of sub-benchmark traces (the benchmark may have been split due to code size limitations). Each item is a list of traces as returned by `harness.traces`:
+            `.opt.traces[]`: List of traces. Each trace has an 'id' (numeric, starting with 1) and 'trace' (list of states and transitions) element.
+            Each state/transition must have the members `.parameter` (dict with normalized parameter values), `.isa` ("state" or "transition") and `.name`
+            Each transition must additionally contain `.args` and `.duration`
+            * `.duration`: list of durations, one per repetition
+          `.opt.files`: list of corresponding EnergyTrace measurements.
+            `.opt.files[]` = ['abc123.etlog', ...]
+          `.opt.configs`: ....
+        * EnergyTrace log files (`*.etlog`) as specified in `.opt.files`
+
+        If a cached result for a file is available, it is loaded and the file
+        is not preprocessed, unless `with_traces` is set.
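+
+        Usage sketch (the file name is a placeholder):
+
+            raw_data = RawData(["benchmark.tar"])
+            preprocessed_data = raw_data.get_preprocessed_data()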
+ + tbd + """ + self.with_traces = with_traces + self.filenames = filenames.copy() + self.traces_by_fileno = [] + self.setup_by_fileno = [] + self.version = 0 + self.preprocessed = False + self._parameter_names = None + self.ignore_clipping = False + self.pta = None + + with tarfile.open(filenames[0]) as tf: + for member in tf.getmembers(): + if member.name == "ptalog.json" and self.version == 0: + self.version = 1 + # might also be version 2 + # depends on whether *.etlog exists or not + elif ".etlog" in member.name: + self.version = 2 + break + + self.set_cache_file() + if not with_traces: + self.load_cache() + + def set_cache_file(self): + cache_key = hashlib.sha256("!".join(self.filenames).encode()).hexdigest() + self.cache_dir = os.path.dirname(self.filenames[0]) + "/cache" + self.cache_file = "{}/{}.json".format(self.cache_dir, cache_key) + + def load_cache(self): + if os.path.exists(self.cache_file): + with open(self.cache_file, "r") as f: + cache_data = json.load(f) + self.filenames = cache_data["filenames"] + self.traces = cache_data["traces"] + self.preprocessing_stats = cache_data["preprocessing_stats"] + if "pta" in cache_data: + self.pta = cache_data["pta"] + self.setup_by_fileno = cache_data["setup_by_fileno"] + self.preprocessed = True + + def save_cache(self): + if self.with_traces: + return + try: + os.mkdir(self.cache_dir) + except FileExistsError: + pass + with open(self.cache_file, "w") as f: + cache_data = { + "filenames": self.filenames, + "traces": self.traces, + "preprocessing_stats": self.preprocessing_stats, + "pta": self.pta, + "setup_by_fileno": self.setup_by_fileno, + } + json.dump(cache_data, f) + + def _state_is_too_short(self, online, offline, state_duration, next_transition): + # We cannot control when an interrupt causes a state to be left + if next_transition["plan"]["level"] == "epilogue": + return False + + # Note: state_duration is stored as ms, not us + return offline["us"] < state_duration * 500 + + def _state_is_too_long(self, online, offline, state_duration, prev_transition): + # If the previous state was left by an interrupt, we may have some + # waiting time left over. So it's okay if the current state is longer + # than expected. + if prev_transition["plan"]["level"] == "epilogue": + return False + # state_duration is stored as ms, not us + return offline["us"] > state_duration * 1500 + + def _measurement_is_valid_2(self, processed_data): + """ + Check if a dfatool v2 measurement is valid. + + processed_data layout: + 'fileno' : measurement['fileno'], + 'info' : measurement['info'], + 'energy_trace' : etlog.analyze_states() + A sequence of unnamed, unparameterized states and transitions with + power and timing data + 'expected_trace' : trace from PTA DFS (with parameter data) + etlog.analyze_states returns a list of (alternating) states and transitions. 
+            Each element is a dict containing:
+                - isa: 'state' or 'transition'
+                - W_mean: mean of the (calibrated) power draw
+                - W_std: standard deviation of the (calibrated) power draw
+                - s: duration
+
+                if isa == 'transition':
+                - W_mean_delta_prev: difference between W_mean and the previous state's W_mean
+                - W_mean_delta_next: difference between W_mean and the following state's W_mean
+        """
+
+        # Check for low-level parser errors
+        if processed_data["has_datasource_error"]:
+            processed_data["error"] = "; ".join(processed_data["datasource_errors"])
+            return False
+
+        # Note that the low-level parser (EnergyTraceLog) already checks
+        # whether the transition count is correct
+
+        return True
+
+    def _measurement_is_valid_01(self, processed_data):
+        """
+        Check if a dfatool v0 or v1 measurement is valid.
+
+        processed_data layout:
+        'fileno' : measurement['fileno'],
+        'info' : measurement['info'],
+        'triggers' : len(trigidx),
+        'first_trig' : trigidx[0] * 10,
+        'calibration' : caldata,
+        'energy_trace' : mim.analyze_states(charges, trigidx, vcalfunc)
+            A sequence of unnamed, unparameterized states and transitions with
+            power and timing data
+        'expected_trace' : trace from PTA DFS (with parameter data)
+        mim.analyze_states returns a list of (alternating) states and transitions.
+        Each element is a dict containing:
+            - isa: 'state' or 'transition'
+            - clip_rate: range(0..1), share of clipped intervals in the energy measurement
+            - raw_mean: mean of the raw values
+            - raw_std: standard deviation of the raw values
+            - uW_mean: mean of the (calibrated) power draw
+            - uW_std: standard deviation of the (calibrated) power draw
+            - us: duration
+
+            Only if isa == 'transition':
+            - timeout: duration of the previous state
+            - uW_mean_delta_prev: difference between uW_mean and the previous state's uW_mean
+            - uW_mean_delta_next: difference between uW_mean and the following state's uW_mean
+        """
+        setup = self.setup_by_fileno[processed_data["fileno"]]
+        if "expected_trace" in processed_data:
+            traces = processed_data["expected_trace"]
+        else:
+            traces = self.traces_by_fileno[processed_data["fileno"]]
+        state_duration = setup["state_duration"]
+
+        # Check MIMOSA error
+        if processed_data["has_datasource_error"]:
+            processed_data["error"] = "; ".join(processed_data["datasource_errors"])
+            return False
+
+        # Check trigger count
+        sched_trigger_count = 0
+        for run in traces:
+            sched_trigger_count += len(run["trace"])
+        if sched_trigger_count != processed_data["triggers"]:
+            processed_data[
+                "error"
+            ] = "got {got:d} trigger edges, expected {exp:d}".format(
+                got=processed_data["triggers"], exp=sched_trigger_count
+            )
+            return False
+        # Check state durations.
Very short or long states can indicate a + # missed trigger signal which wasn't detected due to duplicate + # triggers elsewhere + online_datapoints = [] + for run_idx, run in enumerate(traces): + for trace_part_idx in range(len(run["trace"])): + online_datapoints.append((run_idx, trace_part_idx)) + for offline_idx, online_ref in enumerate(online_datapoints): + online_run_idx, online_trace_part_idx = online_ref + offline_trace_part = processed_data["energy_trace"][offline_idx] + online_trace_part = traces[online_run_idx]["trace"][online_trace_part_idx] + + if self._parameter_names is None: + self._parameter_names = sorted(online_trace_part["parameter"].keys()) + + if sorted(online_trace_part["parameter"].keys()) != self._parameter_names: + processed_data[ + "error" + ] = "Offline #{off_idx:d} (online {on_name:s} @ {on_idx:d}/{on_sub:d}) has inconsistent parameter set: should be {param_want:s}, is {param_is:s}".format( + off_idx=offline_idx, + on_idx=online_run_idx, + on_sub=online_trace_part_idx, + on_name=online_trace_part["name"], + param_want=self._parameter_names, + param_is=sorted(online_trace_part["parameter"].keys()), + ) + + if online_trace_part["isa"] != offline_trace_part["isa"]: + processed_data[ + "error" + ] = "Offline #{off_idx:d} (online {on_name:s} @ {on_idx:d}/{on_sub:d}) claims to be {off_isa:s}, but should be {on_isa:s}".format( + off_idx=offline_idx, + on_idx=online_run_idx, + on_sub=online_trace_part_idx, + on_name=online_trace_part["name"], + off_isa=offline_trace_part["isa"], + on_isa=online_trace_part["isa"], + ) + return False + + # Clipping in UNINITIALIZED (offline_idx == 0) can happen during + # calibration and is handled by MIMOSA + if ( + offline_idx != 0 + and offline_trace_part["clip_rate"] != 0 + and not self.ignore_clipping + ): + processed_data[ + "error" + ] = "Offline #{off_idx:d} (online {on_name:s} @ {on_idx:d}/{on_sub:d}) was clipping {clip:f}% of the time".format( + off_idx=offline_idx, + on_idx=online_run_idx, + on_sub=online_trace_part_idx, + on_name=online_trace_part["name"], + clip=offline_trace_part["clip_rate"] * 100, + ) + return False + + if ( + online_trace_part["isa"] == "state" + and online_trace_part["name"] != "UNINITIALIZED" + and len(traces[online_run_idx]["trace"]) > online_trace_part_idx + 1 + ): + online_prev_transition = traces[online_run_idx]["trace"][ + online_trace_part_idx - 1 + ] + online_next_transition = traces[online_run_idx]["trace"][ + online_trace_part_idx + 1 + ] + try: + if self._state_is_too_short( + online_trace_part, + offline_trace_part, + state_duration, + online_next_transition, + ): + processed_data[ + "error" + ] = "Offline #{off_idx:d} (online {on_name:s} @ {on_idx:d}/{on_sub:d}) is too short (duration = {dur:d} us)".format( + off_idx=offline_idx, + on_idx=online_run_idx, + on_sub=online_trace_part_idx, + on_name=online_trace_part["name"], + dur=offline_trace_part["us"], + ) + return False + if self._state_is_too_long( + online_trace_part, + offline_trace_part, + state_duration, + online_prev_transition, + ): + processed_data[ + "error" + ] = "Offline #{off_idx:d} (online {on_name:s} @ {on_idx:d}/{on_sub:d}) is too long (duration = {dur:d} us)".format( + off_idx=offline_idx, + on_idx=online_run_idx, + on_sub=online_trace_part_idx, + on_name=online_trace_part["name"], + dur=offline_trace_part["us"], + ) + return False + except KeyError: + pass + # TODO es gibt next_transitions ohne 'plan' + return True + + def _merge_online_and_offline(self, measurement): + # Edits 
self.traces_by_fileno[measurement['fileno']][*]['trace'][*]['offline'] + # and self.traces_by_fileno[measurement['fileno']][*]['trace'][*]['offline_aggregates'] in place + # (appends data from measurement['energy_trace']) + # If measurement['expected_trace'] exists, it is edited in place instead + online_datapoints = [] + if "expected_trace" in measurement: + traces = measurement["expected_trace"] + traces = self.traces_by_fileno[measurement["fileno"]] + else: + traces = self.traces_by_fileno[measurement["fileno"]] + for run_idx, run in enumerate(traces): + for trace_part_idx in range(len(run["trace"])): + online_datapoints.append((run_idx, trace_part_idx)) + for offline_idx, online_ref in enumerate(online_datapoints): + online_run_idx, online_trace_part_idx = online_ref + offline_trace_part = measurement["energy_trace"][offline_idx] + online_trace_part = traces[online_run_idx]["trace"][online_trace_part_idx] + + if "offline" not in online_trace_part: + online_trace_part["offline"] = [offline_trace_part] + else: + online_trace_part["offline"].append(offline_trace_part) + + paramkeys = sorted(online_trace_part["parameter"].keys()) + + paramvalues = list() + + for paramkey in paramkeys: + if type(online_trace_part["parameter"][paramkey]) is list: + paramvalues.append( + soft_cast_int( + online_trace_part["parameter"][paramkey][ + measurement["repeat_id"] + ] + ) + ) + else: + paramvalues.append( + soft_cast_int(online_trace_part["parameter"][paramkey]) + ) + + # NB: Unscheduled transitions do not have an 'args' field set. + # However, they should only be caused by interrupts, and + # interrupts don't have args anyways. + if arg_support_enabled and "args" in online_trace_part: + paramvalues.extend(map(soft_cast_int, online_trace_part["args"])) + + if "offline_aggregates" not in online_trace_part: + online_trace_part["offline_attributes"] = [ + "power", + "duration", + "energy", + ] + online_trace_part["offline_aggregates"] = { + "power": [], + "duration": [], + "power_std": [], + "energy": [], + "paramkeys": [], + "param": [], + } + if online_trace_part["isa"] == "transition": + online_trace_part["offline_attributes"].extend( + ["rel_energy_prev", "rel_energy_next", "timeout"] + ) + online_trace_part["offline_aggregates"]["rel_energy_prev"] = [] + online_trace_part["offline_aggregates"]["rel_energy_next"] = [] + online_trace_part["offline_aggregates"]["timeout"] = [] + + # Note: All state/transitions are 20us "too long" due to injected + # active wait states. These are needed to work around MIMOSA's + # relatively low sample rate of 100 kHz (10us) and removed here. 
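+ # Worked example (illustrative numbers, not part of the patch):
+ # a trace part with uW_mean = 1000 uW and us = 520 us is stored
+ # below as duration = 520 - 20 = 500 us and
+ # energy = 1000 uW * 500 us = 500000 pJ.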
+ online_trace_part["offline_aggregates"]["power"].append( + offline_trace_part["uW_mean"] + ) + online_trace_part["offline_aggregates"]["duration"].append( + offline_trace_part["us"] - 20 + ) + online_trace_part["offline_aggregates"]["power_std"].append( + offline_trace_part["uW_std"] + ) + online_trace_part["offline_aggregates"]["energy"].append( + offline_trace_part["uW_mean"] * (offline_trace_part["us"] - 20) + ) + online_trace_part["offline_aggregates"]["paramkeys"].append(paramkeys) + online_trace_part["offline_aggregates"]["param"].append(paramvalues) + if online_trace_part["isa"] == "transition": + online_trace_part["offline_aggregates"]["rel_energy_prev"].append( + offline_trace_part["uW_mean_delta_prev"] + * (offline_trace_part["us"] - 20) + ) + online_trace_part["offline_aggregates"]["rel_energy_next"].append( + offline_trace_part["uW_mean_delta_next"] + * (offline_trace_part["us"] - 20) + ) + online_trace_part["offline_aggregates"]["timeout"].append( + offline_trace_part["timeout"] + ) + + def _merge_online_and_etlog(self, measurement): + # Edits self.traces_by_fileno[measurement['fileno']][*]['trace'][*]['offline'] + # and self.traces_by_fileno[measurement['fileno']][*]['trace'][*]['offline_aggregates'] in place + # (appends data from measurement['energy_trace']) + online_datapoints = [] + traces = self.traces_by_fileno[measurement["fileno"]] + for run_idx, run in enumerate(traces): + for trace_part_idx in range(len(run["trace"])): + online_datapoints.append((run_idx, trace_part_idx)) + for offline_idx, online_ref in enumerate(online_datapoints): + online_run_idx, online_trace_part_idx = online_ref + offline_trace_part = measurement["energy_trace"][offline_idx] + online_trace_part = traces[online_run_idx]["trace"][online_trace_part_idx] + + if "offline" not in online_trace_part: + online_trace_part["offline"] = [offline_trace_part] + else: + online_trace_part["offline"].append(offline_trace_part) + + paramkeys = sorted(online_trace_part["parameter"].keys()) + + paramvalues = list() + + for paramkey in paramkeys: + if type(online_trace_part["parameter"][paramkey]) is list: + paramvalues.append( + soft_cast_int( + online_trace_part["parameter"][paramkey][ + measurement["repeat_id"] + ] + ) + ) + else: + paramvalues.append( + soft_cast_int(online_trace_part["parameter"][paramkey]) + ) + + # NB: Unscheduled transitions do not have an 'args' field set. + # However, they should only be caused by interrupts, and + # interrupts don't have args anyways. 
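+ # Worked example for the parameter handling above (hypothetical values):
+ # a scalar entry {'txpower': 10} contributes 10 to every repetition,
+ # whereas a list entry {'retries': [0, 2, 1]} contributes 2 for
+ # repeat_id == 1; both pass through soft_cast_int before being
+ # appended to paramvalues.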
+ if arg_support_enabled and "args" in online_trace_part: + paramvalues.extend(map(soft_cast_int, online_trace_part["args"])) + + if "offline_aggregates" not in online_trace_part: + online_trace_part["offline_aggregates"] = { + "offline_attributes": ["power", "duration", "energy"], + "duration": list(), + "power": list(), + "power_std": list(), + "energy": list(), + "paramkeys": list(), + "param": list(), + } + + offline_aggregates = online_trace_part["offline_aggregates"] + + # if online_trace_part['isa'] == 'transitions': + # online_trace_part['offline_attributes'].extend(['rel_energy_prev', 'rel_energy_next']) + # offline_aggregates['rel_energy_prev'] = list() + # offline_aggregates['rel_energy_next'] = list() + + offline_aggregates["duration"].append(offline_trace_part["s"] * 1e6) + offline_aggregates["power"].append(offline_trace_part["W_mean"] * 1e6) + offline_aggregates["power_std"].append(offline_trace_part["W_std"] * 1e6) + offline_aggregates["energy"].append( + offline_trace_part["W_mean"] * offline_trace_part["s"] * 1e12 + ) + offline_aggregates["paramkeys"].append(paramkeys) + offline_aggregates["param"].append(paramvalues) + + # if online_trace_part['isa'] == 'transition': + # offline_aggregates['rel_energy_prev'].append(offline_trace_part['W_mean_delta_prev'] * offline_trace_part['s'] * 1e12) + # offline_aggregates['rel_energy_next'].append(offline_trace_part['W_mean_delta_next'] * offline_trace_part['s'] * 1e12) + + def _concatenate_traces(self, list_of_traces): + """ + Concatenate `list_of_traces` (list of lists) into a single trace while adjusting trace IDs. + + :param list_of_traces: List of list of traces. + :returns: List of traces with ['id'] in ascending order and ['orig_id'] as previous ['id'] + """ + + trace_output = list() + for trace in list_of_traces: + trace_output.extend(trace.copy()) + for i, trace in enumerate(trace_output): + trace["orig_id"] = trace["id"] + trace["id"] = i + return trace_output + + def get_preprocessed_data(self): + """ + Return a list of DFA traces annotated with energy, timing, and parameter data. + The list is cached on disk, unless the constructor was called with `with_traces` set. + + Each DFA trace contains the following elements: + * `id`: Numeric ID, starting with 1 + * `total_energy`: Total amount of energy (as measured by MIMOSA) in the entire trace + * `orig_id`: Original trace ID. May differ when concatenating multiple (different) benchmarks into one analysis, i.e., when calling RawData() with more than one file argument. + * `trace`: List of the individual states and transitions in this trace. Always contains an even number of elements, staring with the first state (typically "UNINITIALIZED") and ending with a transition. + + Each trace element (that is, an entry of the `trace` list mentioned above) contains the following elements: + * `isa`: "state" or "transition" + * `name`: name + * `offline`: List of offline measumerents for this state/transition. Each entry contains a result for this state/transition during one benchmark execution. + Entry contents: + - `clip_rate`: rate of clipped energy measurements, 0 .. 
1
+ - `raw_mean`: mean raw MIMOSA value
+ - `raw_std`: standard deviation of raw MIMOSA value
+ - `uW_mean`: mean power draw, uW
+ - `uW_std`: standard deviation of power draw, uW
+ - `us`: state/transition duration, us
+ - `uW_mean_delta_prev`: (only for transitions) difference between uW_mean of this transition and uW_mean of previous state
+ - `uW_mean_delta_next`: (only for transitions) difference between uW_mean of this transition and uW_mean of next state
+ - `timeout`: (only for transitions) duration of previous state, us
+ * `offline_aggregates`: Aggregate of `offline` entries. dict of lists, each list entry has the same length
+ - `duration`: state/transition durations ("us"), us
+ - `energy`: state/transition energy ("us * uW_mean"), pJ
+ - `power`: mean power draw ("uW_mean"), uW
+ - `power_std`: standard deviations of power draw ("uW_std"), uW
+ - `paramkeys`: List of lists, each sub-list contains the parameter names corresponding to the `param` entries
+ - `param`: List of lists, each sub-list contains the parameter values for this measurement. Typically, all sub-lists are the same.
+ - `rel_energy_prev`: (only for transitions) transition energy relative to previous state mean power, pJ
+ - `rel_energy_next`: (only for transitions) transition energy relative to next state mean power, pJ
+ - `timeout`: (only for transitions) duration of previous state, us
+ * `offline_attributes`: List containing the keys of `offline_aggregates` which are meant to be part of the model.
+ This list ultimately decides which hardware/software attributes the model describes.
+ If isa == state, it contains power, duration, energy
+ If isa == transition, it contains power, duration, energy, rel_energy_prev, rel_energy_next, timeout
+ * `online`: List of online estimations for this state/transition. Each entry contains a result for this state/transition during one benchmark execution.
+ Entry contents for isa == state:
+ - `time`: state/transition duration
+ Entry contents for isa == transition:
+ - `timeout`: Duration of previous state, measured using on-board timers
+ * `parameter`: dictionary describing parameter values for this state/transition. Parameter values refer to the beginning of the state/transition and do not account for changes made by the transition.
+ * `plan`: Dictionary describing expected behaviour according to schedule / offline model.
+ Contents for isa == state: `energy`, `power`, `time`
+ Contents for isa == transition: `energy`, `timeout`, `level`.
+ If level is "user", the transition is part of the regular driver API. If level is "epilogue", it is an interrupt service routine and not called explicitly.
+ Each transition also contains:
+ * `args`: List of arguments the corresponding function call was called with.
args entries are strings which are not necessarily numeric + * `code`: List of function name (first entry) and arguments (remaining entries) of the corresponding function call + """ + if self.preprocessed: + return self.traces + if self.version == 0: + self._preprocess_012(0) + elif self.version == 1: + self._preprocess_012(1) + elif self.version == 2: + self._preprocess_012(2) + self.preprocessed = True + self.save_cache() + return self.traces + + def _preprocess_012(self, version): + """Load raw MIMOSA data and turn it into measurements which are ready to be analyzed.""" + offline_data = [] + for i, filename in enumerate(self.filenames): + + if version == 0: + + with tarfile.open(filename) as tf: + self.setup_by_fileno.append(json.load(tf.extractfile("setup.json"))) + self.traces_by_fileno.append( + json.load(tf.extractfile("src/apps/DriverEval/DriverLog.json")) + ) + for member in tf.getmembers(): + _, extension = os.path.splitext(member.name) + if extension == ".mim": + offline_data.append( + { + "content": tf.extractfile(member).read(), + "fileno": i, + "info": member, + "setup": self.setup_by_fileno[i], + "with_traces": self.with_traces, + } + ) + + elif version == 1: + + new_filenames = list() + with tarfile.open(filename) as tf: + ptalog = json.load(tf.extractfile(tf.getmember("ptalog.json"))) + self.pta = ptalog["pta"] + + # Benchmark code may be too large to be executed in a single + # run, so benchmarks (a benchmark is basically a list of DFA runs) + # may be split up. To accomodate this, ptalog['traces'] is + # a list of lists: ptalog['traces'][0] corresponds to the + # first benchmark part, ptalog['traces'][1] to the + # second, and so on. ptalog['traces'][0][0] is the first + # trace (a sequence of states and transitions) in the + # first benchmark part, ptalog['traces'][0][1] the second, etc. + # + # As traces are typically repeated to minimize the effect + # of random noise, observations for each benchmark part + # are also lists. In this case, this applies in two + # cases: traces[i][j]['parameter'][some_param] is either + # a value (if the parameter is controlld by software) + # or a list (if the parameter is known a posteriori, e.g. + # "how many retransmissions did this packet take?"). + # + # The second case is the MIMOSA energy measurements, which + # are listed in ptalog['files']. ptalog['files'][0] + # contains a list of files for the first benchmark part, + # ptalog['files'][0][0] is its first iteration/repetition, + # ptalog['files'][0][1] the second, etc. 
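+ # For example, with two benchmark parts and three repetitions each
+ # (hypothetical file names, for illustration only):
+ # ptalog['traces'] == [part0_traces, part1_traces]
+ # ptalog['files'] == [['p0_r0.mim', 'p0_r1.mim', 'p0_r2.mim'],
+ # ['p1_r0.mim', 'p1_r1.mim', 'p1_r2.mim']]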
+ + for j, traces in enumerate(ptalog["traces"]): + new_filenames.append("{}#{}".format(filename, j)) + self.traces_by_fileno.append(traces) + self.setup_by_fileno.append( + { + "mimosa_voltage": ptalog["configs"][j]["voltage"], + "mimosa_shunt": ptalog["configs"][j]["shunt"], + "state_duration": ptalog["opt"]["sleep"], + } + ) + for repeat_id, mim_file in enumerate(ptalog["files"][j]): + member = tf.getmember(mim_file) + offline_data.append( + { + "content": tf.extractfile(member).read(), + "fileno": j, + "info": member, + "setup": self.setup_by_fileno[j], + "repeat_id": repeat_id, + "expected_trace": ptalog["traces"][j], + "with_traces": self.with_traces, + } + ) + self.filenames = new_filenames + + elif version == 2: + + new_filenames = list() + with tarfile.open(filename) as tf: + ptalog = json.load(tf.extractfile(tf.getmember("ptalog.json"))) + self.pta = ptalog["pta"] + + # Benchmark code may be too large to be executed in a single + # run, so benchmarks (a benchmark is basically a list of DFA runs) + # may be split up. To accomodate this, ptalog['traces'] is + # a list of lists: ptalog['traces'][0] corresponds to the + # first benchmark part, ptalog['traces'][1] to the + # second, and so on. ptalog['traces'][0][0] is the first + # trace (a sequence of states and transitions) in the + # first benchmark part, ptalog['traces'][0][1] the second, etc. + # + # As traces are typically repeated to minimize the effect + # of random noise, observations for each benchmark part + # are also lists. In this case, this applies in two + # cases: traces[i][j]['parameter'][some_param] is either + # a value (if the parameter is controlld by software) + # or a list (if the parameter is known a posteriori, e.g. + # "how many retransmissions did this packet take?"). + # + # The second case is the MIMOSA energy measurements, which + # are listed in ptalog['files']. ptalog['files'][0] + # contains a list of files for the first benchmark part, + # ptalog['files'][0][0] is its first iteration/repetition, + # ptalog['files'][0][1] the second, etc. + + # generate-dfa-benchmark uses TimingHarness to obtain timing data. + # Data is placed in 'offline_aggregates', which is also + # where we are going to store power/energy data. + # In case of invalid measurements, this can lead to a + # mismatch between duration and power/energy data, e.g. + # where duration = [A, B, C], power = [a, b], B belonging + # to an invalid measurement and thus power[b] corresponding + # to duration[C]. At the moment, this is harmless, but in the + # future it might not be. 
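+ # A possible safeguard (sketch only, not implemented in this patch):
+ # verify that all per-attribute lists are equally long before model
+ # generation, e.g.
+ # assert len(set(map(len, offline_aggregates.values()))) <= 1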
+ if "offline_aggregates" in ptalog["traces"][0][0]["trace"][0]: + for trace_group in ptalog["traces"]: + for trace in trace_group: + for state_or_transition in trace["trace"]: + offline_aggregates = state_or_transition.pop( + "offline_aggregates", None + ) + if offline_aggregates: + state_or_transition[ + "online_aggregates" + ] = offline_aggregates + + for j, traces in enumerate(ptalog["traces"]): + new_filenames.append("{}#{}".format(filename, j)) + self.traces_by_fileno.append(traces) + self.setup_by_fileno.append( + { + "voltage": ptalog["configs"][j]["voltage"], + "state_duration": ptalog["opt"]["sleep"], + } + ) + for repeat_id, etlog_file in enumerate(ptalog["files"][j]): + member = tf.getmember(etlog_file) + offline_data.append( + { + "content": tf.extractfile(member).read(), + "fileno": j, + "info": member, + "setup": self.setup_by_fileno[j], + "repeat_id": repeat_id, + "expected_trace": ptalog["traces"][j], + "with_traces": self.with_traces, + "transition_names": list( + map( + lambda x: x["name"], + ptalog["pta"]["transitions"], + ) + ), + } + ) + self.filenames = new_filenames + # TODO remove 'offline_aggregates' from pre-parse data and place + # it under 'online_aggregates' or similar instead. This way, if + # a .etlog file fails to parse, its corresponding duration data + # will not linger in 'offline_aggregates' and confuse the hell + # out of other code paths + + with Pool() as pool: + if self.version <= 1: + measurements = pool.map(_preprocess_mimosa, offline_data) + elif self.version == 2: + measurements = pool.map(_preprocess_etlog, offline_data) + + num_valid = 0 + for measurement in measurements: + + if "energy_trace" not in measurement: + logger.warning( + "Skipping {ar:s}/{m:s}: {e:s}".format( + ar=self.filenames[measurement["fileno"]], + m=measurement["info"].name, + e="; ".join(measurement["datasource_errors"]), + ) + ) + continue + + if version == 0: + # Strip the last state (it is not part of the scheduled measurement) + measurement["energy_trace"].pop() + elif version == 1: + # The first online measurement is the UNINITIALIZED state. In v1, + # it is not part of the expected PTA trace -> remove it. 
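+ # E.g. an energy trace [UNINITIALIZED, t1, s1, t2, s2, ...] of length
+ # 2n+1 becomes [t1, s1, t2, s2, ...] of length 2n, matching the
+ # expected trace (illustrative sketch of the pop(0) below).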
+ measurement["energy_trace"].pop(0)
+
+ if version == 0 or version == 1:
+ if self._measurement_is_valid_01(measurement):
+ self._merge_online_and_offline(measurement)
+ num_valid += 1
+ else:
+ logger.warning(
+ "Skipping {ar:s}/{m:s}: {e:s}".format(
+ ar=self.filenames[measurement["fileno"]],
+ m=measurement["info"].name,
+ e=measurement["error"],
+ )
+ )
+ elif version == 2:
+ if self._measurement_is_valid_2(measurement):
+ self._merge_online_and_etlog(measurement)
+ num_valid += 1
+ else:
+ logger.warning(
+ "Skipping {ar:s}/{m:s}: {e:s}".format(
+ ar=self.filenames[measurement["fileno"]],
+ m=measurement["info"].name,
+ e=measurement["error"],
+ )
+ )
+ logger.info(
+ "{num_valid:d}/{num_total:d} measurements are valid".format(
+ num_valid=num_valid, num_total=len(measurements)
+ )
+ )
+ if version == 0:
+ self.traces = self._concatenate_traces(self.traces_by_fileno)
+ elif version == 1:
+ self.traces = self._concatenate_traces(self.traces_by_fileno)
+ elif version == 2:
+ self.traces = self._concatenate_traces(self.traces_by_fileno)
+ self.preprocessing_stats = {
+ "num_runs": len(measurements),
+ "num_valid": num_valid,
+ }
+
+
+def _add_trace_data_to_aggregate(aggregate, key, element):
+ # Only cares about element['isa'], element['offline_aggregates'], and
+ # element['plan']['level']
+ if key not in aggregate:
+ aggregate[key] = {"isa": element["isa"]}
+ for datakey in element["offline_aggregates"].keys():
+ aggregate[key][datakey] = []
+ if element["isa"] == "state":
+ aggregate[key]["attributes"] = ["power"]
+ else:
+ # TODO do not hardcode values
+ aggregate[key]["attributes"] = [
+ "duration",
+ "energy",
+ "rel_energy_prev",
+ "rel_energy_next",
+ ]
+ # Uncomment this line if you also want to analyze mean transition power
+ # aggregate[key]['attributes'].append('power')
+ if "plan" in element and element["plan"]["level"] == "epilogue":
+ aggregate[key]["attributes"].insert(0, "timeout")
+ attributes = aggregate[key]["attributes"].copy()
+ for attribute in attributes:
+ if attribute not in element["offline_aggregates"]:
+ aggregate[key]["attributes"].remove(attribute)
+ for datakey, dataval in element["offline_aggregates"].items():
+ aggregate[key][datakey].extend(dataval)
+
+
+def pta_trace_to_aggregate(traces, ignore_trace_indexes=[]):
+ u"""
+ Convert preprocessed DFA traces from peripherals/drivers to by_name aggregate for PTAModel.
+
+ arguments:
+ traces -- [ ... list of individual runs (i.e., a state and transition sequence UNINITIALIZED -> foo -> FOO -> bar -> BAR -> ...)
+ Each run:
+ - id: int number of the run, starting at 1
+ - trace: [ ... list of states and transitions
+ Each entry:
+ - name: str name
+ - isa: str state // transition
+ - parameter: { ... global parameter: current value. null if not yet set }
+ - args: [ function arguments, if isa == 'transition' ]
+ - offline_aggregates:
+ - power: [float(uW)] mean power during the state/transition
+ - power_std: [float(uW)] standard deviation of the power
+ - duration: [int(us)] duration
+ - energy: [float(pJ)] energy consumption of the state/transition
+ - clip_rate: [float(0..1)] clipping
+ - paramkeys: [[str]] names of the parameters taken into account
+ - param: [int // str] parameter values.
Largely a duplicate of 'parameter' above
+ If isa == 'transition':
+ - timeout: [int(us)] duration of the previous state
+ - rel_energy_prev: [int(pJ)]
+ - rel_energy_next: [int(pJ)]
+ ]
+ ]
+ ignore_trace_indexes -- list of trace indexes. The corresponding traces will be ignored.
+
+ returns a tuple of three elements:
+ by_name -- measurements aggregated by state/transition name, annotated with parameter values
+ parameter_names -- list of parameter names
+ arg_count -- dict mapping transition names to the number of arguments of their corresponding driver function
+
+ by_name layout:
+ Dictionary with one key per state/transition ('send', 'TX', ...).
+ Each element is in turn a dict with the following elements:
+ - isa: 'state' or 'transition'
+ - power: list of mean power measurements in µW
+ - duration: list of durations in µs
+ - power_std: list of stddev of power per state/transition
+ - energy: consumed energy (power*duration) in pJ
+ - paramkeys: list of parameter names in each measurement (-> list of lists)
+ - param: list of parameter values in each measurement (-> list of lists)
+ - attributes: list of keys that should be analyzed,
+ e.g. ['power', 'duration']
+ additionally, only if isa == 'transition':
+ - timeout: list of duration of previous state in µs
+ - rel_energy_prev: transition energy relative to previous state mean power in pJ
+ - rel_energy_next: transition energy relative to next state mean power in pJ
+ """
+ arg_count = dict()
+ by_name = dict()
+ parameter_names = sorted(traces[0]["trace"][0]["parameter"].keys())
+ for run in traces:
+ if run["id"] not in ignore_trace_indexes:
+ for elem in run["trace"]:
+ if (
+ elem["isa"] == "transition"
+ and not elem["name"] in arg_count
+ and "args" in elem
+ ):
+ arg_count[elem["name"]] = len(elem["args"])
+ if elem["name"] != "UNINITIALIZED":
+ _add_trace_data_to_aggregate(by_name, elem["name"], elem)
+ for elem in by_name.values():
+ for key in elem["attributes"]:
+ elem[key] = np.array(elem[key])
+ return by_name, parameter_names, arg_count
+
+
+class EnergyTraceLog:
+ """
+ EnergyTrace log loader for DFA traces.
+
+ Expects an EnergyTrace log file generated via msp430-etv / energytrace-util
+ and a dfatool-generated benchmark. An EnergyTrace log consists of a series
+ of measurements. Each measurement has a timestamp, mean current, voltage,
+ and cumulative energy since start of measurement. Each transition is
+ preceded by a Code128 barcode embedded into the energy consumption by
+ toggling a LED.
+
+ Note that the baseline power draw of board and peripherals is not subtracted
+ at the moment.
+ """
+
+ def __init__(
+ self,
+ voltage: float,
+ state_duration: int,
+ transition_names: list,
+ with_traces=False,
+ ):
+ """
+ Create a new EnergyTraceLog object.
+
+ :param voltage: supply voltage [V], usually 3.3 V
+ :param state_duration: state duration [ms]
+ :param transition_names: list of transition names in PTA transition order.
+ Needed to map barcode synchronization numbers to transitions.
+ """
+ self.voltage = voltage
+ self.state_duration = state_duration * 1e-3
+ self.transition_names = transition_names
+ self.with_traces = with_traces
+ self.errors = list()
+
+ # TODO auto-detect
+ self.led_power = 10e-3
+
+ # multipass/include/object/ptalog.h#startTransition
+ self.module_duration = 5e-3
+
+ # multipass/include/object/ptalog.h#startTransition
+ self.quiet_zone_duration = 60e-3
+
+ # TODO auto-detect?
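+ # Worked example with the defaults above (5 ms modules, 60 ms quiet
+ # zone): the bounds computed below work out to
+ # 57 * 5 ms + 60 ms = 345 ms and 68 * 5 ms + 60 ms = 400 ms.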
+ # Note that we consider barcode duration after start, so only the + # quiet zone -after- the code is relevant + self.min_barcode_duration = 57 * self.module_duration + self.quiet_zone_duration + self.max_barcode_duration = 68 * self.module_duration + self.quiet_zone_duration + + def load_data(self, log_data): + """ + Load log data (raw energytrace .txt file, one line per event). + + :param log_data: raw energytrace log file in 4-column .txt format + """ + + if not zbar_available: + logger.error("zbar module is not available") + self.errors.append( + 'zbar module is not available. Try "apt install python3-zbar"' + ) + return list() + + lines = log_data.decode("ascii").split("\n") + data_count = sum(map(lambda x: len(x) > 0 and x[0] != "#", lines)) + data_lines = filter(lambda x: len(x) > 0 and x[0] != "#", lines) + + data = np.empty((data_count, 4)) + + for i, line in enumerate(data_lines): + fields = line.split(" ") + if len(fields) == 4: + timestamp, current, voltage, total_energy = map(int, fields) + elif len(fields) == 5: + # cpustate = fields[0] + timestamp, current, voltage, total_energy = map(int, fields[1:]) + else: + raise RuntimeError('cannot parse line "{}"'.format(line)) + data[i] = [timestamp, current, voltage, total_energy] + + self.interval_start_timestamp = data[:-1, 0] * 1e-6 + self.interval_duration = (data[1:, 0] - data[:-1, 0]) * 1e-6 + self.interval_power = ((data[1:, 3] - data[:-1, 3]) * 1e-9) / ( + (data[1:, 0] - data[:-1, 0]) * 1e-6 + ) + + m_duration_us = data[-1, 0] - data[0, 0] + + self.sample_rate = data_count / (m_duration_us * 1e-6) + + logger.debug( + "got {} samples with {} seconds of log data ({} Hz)".format( + data_count, m_duration_us * 1e-6, self.sample_rate + ) + ) + + return ( + self.interval_start_timestamp, + self.interval_duration, + self.interval_power, + ) + + def ts_to_index(self, timestamp): + """ + Convert timestamp in seconds to interval_start_timestamp / interval_duration / interval_power index. + + Returns the index of the interval which timestamp is part of. + """ + return self._ts_to_index(timestamp, 0, len(self.interval_start_timestamp)) + + def _ts_to_index(self, timestamp, left_index, right_index): + if left_index == right_index: + return left_index + if left_index + 1 == right_index: + return left_index + + mid_index = left_index + (right_index - left_index) // 2 + + # I'm feeling lucky + if ( + timestamp > self.interval_start_timestamp[mid_index] + and timestamp + <= self.interval_start_timestamp[mid_index] + + self.interval_duration[mid_index] + ): + return mid_index + + if timestamp <= self.interval_start_timestamp[mid_index]: + return self._ts_to_index(timestamp, left_index, mid_index) + + return self._ts_to_index(timestamp, mid_index, right_index) + + def analyze_states(self, traces, offline_index: int): + u""" + Split log data into states and transitions and return duration, energy, and mean power for each element. + + :param traces: expected traces, needed to synchronize with the measurement. + traces is a list of runs, traces[*]['trace'] is a single run + (i.e. a list of states and transitions, starting with a transition + and ending with a state). 
+ :param offline_index: This function uses traces[*]['trace'][*]['online_aggregates']['duration'][offline_index] to find sync codes
+
+ :returns: list of states and transitions, both starting and ending with a state.
+ May be incomplete if barcode synchronization fails.
+ Each element is a dict containing:
+ * `isa`: 'state' or 'transition'
+ * `W_mean`: mean (calibrated) power draw
+ * `W_std`: standard deviation of the (calibrated) power draw
+ * `s`: duration
+ if isa == 'transition', it also contains:
+ * `W_mean_delta_prev`: difference between W_mean and the previous state's W_mean
+ * `W_mean_delta_next`: difference between W_mean and the next state's W_mean
+ """
+
+ first_sync = self.find_first_sync()
+
+ energy_trace = list()
+
+ expected_transitions = list()
+ for trace_number, trace in enumerate(traces):
+ for state_or_transition_number, state_or_transition in enumerate(
+ trace["trace"]
+ ):
+ if state_or_transition["isa"] == "transition":
+ try:
+ expected_transitions.append(
+ (
+ state_or_transition["name"],
+ state_or_transition["online_aggregates"]["duration"][
+ offline_index
+ ]
+ * 1e-6,
+ )
+ )
+ except IndexError:
+ self.errors.append(
+ 'Entry #{} ("{}") in trace #{} has no duration entry for offline_index/repeat_id {}'.format(
+ state_or_transition_number,
+ state_or_transition["name"],
+ trace_number,
+ offline_index,
+ )
+ )
+ return energy_trace
+
+ next_barcode = first_sync
+
+ for name, duration in expected_transitions:
+ bc, start, stop, end = self.find_barcode(next_barcode)
+ if bc is None:
+ logger.error('did not find transition "{}"'.format(name))
+ break
+ next_barcode = end + self.state_duration + duration
+ logger.debug(
+ '{} barcode "{}" area: {:0.2f} .. {:0.2f} / {:0.2f} seconds'.format(
+ offline_index, bc, start, stop, end
+ )
+ )
+ if bc != name:
+ logger.error('mismatch: expected "{}", got "{}"'.format(name, bc))
+ logger.debug(
+ "{} estimated transition area: {:0.3f} .. {:0.3f} seconds".format(
+ offline_index, end, end + duration
+ )
+ )
+
+ transition_start_index = self.ts_to_index(end)
+ transition_done_index = self.ts_to_index(end + duration) + 1
+ state_start_index = transition_done_index
+ state_done_index = (
+ self.ts_to_index(end + duration + self.state_duration) + 1
+ )
+
+ logger.debug(
+ "{} estimated transition index: {:0.3f} ..
{:0.3f} seconds".format(
+ offline_index,
+ transition_start_index / self.sample_rate,
+ transition_done_index / self.sample_rate,
+ )
+ )
+
+ transition_power_W = self.interval_power[
+ transition_start_index:transition_done_index
+ ]
+
+ transition = {
+ "isa": "transition",
+ "W_mean": np.mean(transition_power_W),
+ "W_std": np.std(transition_power_W),
+ "s": duration,
+ "s_coarse": self.interval_start_timestamp[transition_done_index]
+ - self.interval_start_timestamp[transition_start_index],
+ }
+
+ if self.with_traces:
+ transition["uW"] = transition_power_W * 1e6
+
+ energy_trace.append(transition)
+
+ if len(energy_trace) > 1:
+ energy_trace[-1]["W_mean_delta_prev"] = (
+ energy_trace[-1]["W_mean"] - energy_trace[-2]["W_mean"]
+ )
+
+ state_power_W = self.interval_power[state_start_index:state_done_index]
+ state = {
+ "isa": "state",
+ "W_mean": np.mean(state_power_W),
+ "W_std": np.std(state_power_W),
+ "s": self.state_duration,
+ "s_coarse": self.interval_start_timestamp[state_done_index]
+ - self.interval_start_timestamp[state_start_index],
+ }
+
+ if self.with_traces:
+ state["uW"] = state_power_W * 1e6
+
+ energy_trace.append(state)
+
+ energy_trace[-2]["W_mean_delta_next"] = (
+ energy_trace[-2]["W_mean"] - energy_trace[-1]["W_mean"]
+ )
+
+ expected_transition_count = len(expected_transitions)
+ recovered_transition_count = len(energy_trace) // 2
+
+ if expected_transition_count != recovered_transition_count:
+ self.errors.append(
+ "Expected {:d} transitions, got {:d}".format(
+ expected_transition_count, recovered_transition_count
+ )
+ )
+
+ return energy_trace
+
+ def find_first_sync(self):
+ # LED power is approx. self.led_power W; use self.led_power/3 W above the surrounding median as threshold
+ sync_threshold_power = (
+ np.median(self.interval_power[: int(3 * self.sample_rate)])
+ + self.led_power / 3
+ )
+ for i, ts in enumerate(self.interval_start_timestamp):
+ if ts > 2 and self.interval_power[i] > sync_threshold_power:
+ return self.interval_start_timestamp[i - 300]
+ return None
+
+ def find_barcode(self, start_ts):
+ """
+ Return absolute position and content of the next barcode following `start_ts`.
+
+ Uses `self.interval_start_timestamp` (one start timestamp per measurement
+ interval, in s) and `self.interval_power` (mean power per measurement
+ interval, in W).
+
+ :param start_ts: timestamp at which to start looking for a barcode [s]
+ """
+
+ for i, ts in enumerate(self.interval_start_timestamp):
+ if ts >= start_ts:
+ start_position = i
+ break
+
+ # Lookaround: 100 ms in both directions
+ lookaround = int(0.1 * self.sample_rate)
+
+ # LED power is approx. self.led_power W; use self.led_power/3 W above the surrounding median as threshold
+ sync_threshold_power = (
+ np.median(
+ self.interval_power[
+ start_position - lookaround : start_position + lookaround
+ ]
+ )
+ + self.led_power / 3
+ )
+
+ logger.debug(
+ "looking for barcode starting at {:0.2f} s, threshold is {:0.1f} mW".format(
+ start_ts, sync_threshold_power * 1e3
+ )
+ )
+
+ sync_area_start = None
+ sync_start_ts = None
+ sync_area_end = None
+ sync_end_ts = None
+ for i, ts in enumerate(self.interval_start_timestamp):
+ if (
+ sync_area_start is None
+ and ts >= start_ts
+ and self.interval_power[i] > sync_threshold_power
+ ):
+ sync_area_start = i - 300
+ sync_start_ts = ts
+ if (
+ sync_area_start is not None
+ and sync_area_end is None
+ and ts > sync_start_ts + self.min_barcode_duration
+ and (
+ ts > sync_start_ts + self.max_barcode_duration
+ or abs(sync_threshold_power - self.interval_power[i])
+ > self.led_power
+ )
+ ):
+ sync_area_end = i
+ sync_end_ts = ts
+ break
+
+ barcode_data = self.interval_power[sync_area_start:sync_area_end]
+
+ logger.debug(
+ "barcode search area: {:0.2f} .. {:0.2f} seconds ({} samples)".format(
+ sync_start_ts, sync_end_ts, len(barcode_data)
+ )
+ )
+
+ bc, start, stop, padding_bits = self.find_barcode_in_power_data(barcode_data)
+
+ if bc is None:
+ return None, None, None, None
+
+ start_ts = self.interval_start_timestamp[sync_area_start + start]
+ stop_ts = self.interval_start_timestamp[sync_area_start + stop]
+
+ end_ts = (
+ stop_ts + self.module_duration * padding_bits + self.quiet_zone_duration
+ )
+
+ # barcode content, barcode start timestamp, barcode stop timestamp, barcode end (stop + padding) timestamp
+ return bc, start_ts, stop_ts, end_ts
+
+ def find_barcode_in_power_data(self, barcode_data):
+
+ min_power = np.min(barcode_data)
+ max_power = np.max(barcode_data)
+
+ # zbar seems to be confused by measurement (and thus image) noise
+ # inside of barcodes. As our barcodes are only 1px high, this is
+ # likely not trivial to fix.
+ # -> Create a black and white (not grayscale) image to avoid this.
+ # Unfortunately, this decreases resilience against background noise
+ # (e.g. a not-exactly-idle peripheral device or CPU interrupts).
+ image_data = np.around(
+ 1 - ((barcode_data - min_power) / (max_power - min_power))
+ )
+ image_data *= 255
+
+ # zbar only returns the complete barcode position if it is at least
+ # two pixels high. For a 1px barcode, it only returns its right border.
+
+ width = len(image_data)
+ height = 2
+
+ image_data = bytes(map(int, image_data)) * height
+
+ # img = Image.frombytes('L', (width, height), image_data).resize((width, 100))
+ # img.save('/tmp/test-{}.png'.format(os.getpid()))
+
+ zbimg = zbar.Image(width, height, "Y800", image_data)
+ scanner = zbar.ImageScanner()
+ scanner.parse_config("enable")
+
+ if scanner.scan(zbimg):
+ (sym,) = zbimg.symbols
+ content = sym.data
+ try:
+ sym_start = sym.location[1][0]
+ except IndexError:
+ sym_start = 0
+ sym_end = sym.location[0][0]
+
+ match = re.fullmatch(r"T(\d+)", content)
+ if match:
+ content = self.transition_names[int(match.group(1))]
+
+ # PTALog barcode generation operates on bytes, so there may be
+ # additional non-barcode padding (encoded as LED off / image white).
+ # Calculate the amount of extra bits to determine the offset until
+ # the transition starts.
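+ # Worked example (illustrative): a code made up of a start symbol,
+ # three payload symbols, and a checksum symbol (11 modules each)
+ # plus a stop pattern (13 modules) is 5 * 11 + 13 = 68 modules wide,
+ # matching the 68-module upper bound used for max_barcode_duration;
+ # 68 % 8 == 4 would be the padding_bits value computed below.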
+ padding_bits = len(Code128(sym.data, charset="B").modules) % 8
+
+ # sym_start leaves out the first two bars, but we don't do anything about that here
+ # sym_end leaves out the last three bars, each of which is one padding bit long.
+ # as a workaround, we unconditionally increment padding_bits by three.
+ padding_bits += 3
+
+ return content, sym_start, sym_end, padding_bits
+ else:
+ logger.warning("unable to find barcode")
+ return None, None, None, None
+
+
+class MIMOSA:
+ """
+ MIMOSA log loader for DFA traces with auto-calibration.
+
+ Expects a MIMOSA log file generated via dfatool and a dfatool-generated
+ benchmark. A MIMOSA log consists of a series of measurements. Each measurement
+ gives the total charge (in pJ) and binary buzzer/trigger value during a 10µs interval.
+
+ There must be a calibration run consisting of at least two seconds with disconnected DUT,
+ two seconds with 1 kOhm (984 Ohm), and two seconds with 100 kOhm (99013 Ohm) resistor at
+ the start. The first ten seconds of data are reserved for calibration and must not contain
+ measurements, as trigger/buzzer signals are ignored in this time range.
+
+ Resulting data is a list of state/transition/state/transition/... measurements.
+ """
+
+ def __init__(self, voltage: float, shunt: int, with_traces=False):
+ """
+ Initialize MIMOSA loader for a specific voltage and shunt setting.
+
+ :param voltage: MIMOSA DUT supply voltage (V)
+ :param shunt: MIMOSA shunt resistor (Ohms)
+ """
+ self.voltage = voltage
+ self.shunt = shunt
+ self.with_traces = with_traces
+ self.r1 = 984 # "1k"
+ self.r2 = 99013 # "100k"
+ self.errors = list()
+
+ def charge_to_current_nocal(self, charge):
+ u"""
+ Convert charge per 10µs (in pJ) to mean currents (in µA) without accounting for calibration.
+
+ :param charge: numpy array of charges (pJ per 10µs) as returned by `load_data` or `load_file`
+
+ :returns: numpy array of mean currents (µA per 10µs)
+ """
+ ua_max = 1.836 / self.shunt * 1000000
+ ua_step = ua_max / 65535
+ return charge * ua_step
+
+ def _load_tf(self, tf):
+ u"""
+ Load MIMOSA log data from an open `tarfile` instance.
+
+ :param tf: `tarfile` instance
+
+ :returns: (numpy array of charges (pJ per 10µs), numpy array of triggers (0/1 int, per 10µs))
+ """
+ num_bytes = tf.getmember("/tmp/mimosa//mimosa_scale_1.tmp").size
+ charges = np.ndarray(shape=(int(num_bytes / 4)), dtype=np.int32)
+ triggers = np.ndarray(shape=(int(num_bytes / 4)), dtype=np.int8)
+ with tf.extractfile("/tmp/mimosa//mimosa_scale_1.tmp") as f:
+ content = f.read()
+ iterator = struct.iter_unpack("<I", content)
+ i = 0
+ for word in iterator:
+ charges[i] = word[0] >> 4
+ triggers[i] = (word[0] & 0x08) >> 3
+ i += 1
+ return charges, triggers
+
+ def load_data(self, raw_data):
+ u"""
+ Load MIMOSA log data from a MIMOSA log file passed as raw byte string
+
+ :param raw_data: MIMOSA log file, passed as raw byte string
+
+ :returns: (numpy array of charges (pJ per 10µs), numpy array of triggers (0/1 int, per 10µs))
+ """
+ with io.BytesIO(raw_data) as data_object:
+ with tarfile.open(fileobj=data_object) as tf:
+ return self._load_tf(tf)
+
+ def load_file(self, filename):
+ u"""
+ Load MIMOSA log data from a MIMOSA log file
+
+ :param filename: MIMOSA log file
+
+ :returns: (numpy array of charges (pJ per 10µs), numpy array of triggers (0/1 int, per 10µs))
+ """
+ with tarfile.open(filename) as tf:
+ return self._load_tf(tf)
+
+ def currents_nocal(self, charges):
+ u"""
+ Convert charges (pJ per 10µs) to mean currents without accounting for calibration.
+ + :param charges: numpy array of charges (pJ per 10µs) + + :returns: numpy array of currents (mean µA per 10µs)""" + ua_max = 1.836 / self.shunt * 1000000 + ua_step = ua_max / 65535 + return charges.astype(np.double) * ua_step + + def trigger_edges(self, triggers): + """ + Return indexes of trigger edges (both 0->1 and 1->0) in log data. + + Ignores the first 10 seconds, which are used for calibration and may + contain bogus triggers due to DUT resets. + + :param triggers: trigger array (int, 0/1) as returned by load_data + + :returns: list of int (trigger indices, e.g. [2000000, ...] means the first trigger appears in charges/currents interval 2000000 -> 20s after start of measurements. Keep in mind that each interval is 10µs long, not 1µs, so index values are not µs timestamps) + """ + trigidx = [] + + if len(triggers) < 1000000: + self.errors.append("MIMOSA log is too short") + return trigidx + + prevtrig = triggers[999999] + + # if the first trigger is high (i.e., trigger/buzzer pin is active before the benchmark starts), + # something went wrong and are unable to determine when the first + # transition starts. + if prevtrig != 0: + self.errors.append( + "Unable to find start of first transition (log starts with trigger == {} != 0)".format( + prevtrig + ) + ) + + # if the last trigger is high (i.e., trigger/buzzer pin is active when the benchmark ends), + # it terminated in the middle of a transition -- meaning that it was not + # measured in its entirety. + if triggers[-1] != 0: + self.errors.append("Log ends during a transition".format(prevtrig)) + + # the device is reset for MIMOSA calibration in the first 10s and may + # send bogus interrupts -> bogus triggers + for i in range(1000000, triggers.shape[0]): + trig = triggers[i] + if trig != prevtrig: + # Due to MIMOSA's integrate-read-reset cycle, the charge/current + # interval belonging to this trigger comes two intervals (20µs) later + trigidx.append(i + 2) + prevtrig = trig + return trigidx + + def calibration_edges(self, currents): + u""" + Return start/stop indexes of calibration measurements. + + :param currents: uncalibrated currents as reported by MIMOSA. For best results, + it may help to use a running mean, like so: + `currents = running_mean(currents_nocal(..., 10))` + + :returns: indices of calibration events in MIMOSA data: + (disconnect start, disconnect stop, R1 (1k) start, R1 (1k) stop, R2 (100k) start, R2 (100k) stop) + indices refer to charges/currents arrays, so 0 refers to the first 10µs interval, 1 to the second, and so on. + """ + r1idx = 0 + r2idx = 0 + ua_r1 = self.voltage / self.r1 * 1000000 + # first second may be bogus + for i in range(100000, len(currents)): + if r1idx == 0 and currents[i] > ua_r1 * 0.6: + r1idx = i + elif ( + r1idx != 0 + and r2idx == 0 + and i > (r1idx + 180000) + and currents[i] < ua_r1 * 0.4 + ): + r2idx = i + # 2s disconnected, 2s r1, 2s r2 with r1 < r2 -> ua_r1 > ua_r2 + # allow 5ms buffer in both directions to account for bouncing relais contacts + return ( + r1idx - 180500, + r1idx - 500, + r1idx + 500, + r2idx - 500, + r2idx + 500, + r2idx + 180500, + ) + + def calibration_function(self, charges, cal_edges): + u""" + Calculate calibration function from previously determined calibration edges. + + :param charges: raw charges from MIMOSA + :param cal_edges: calibration edges as returned by calibration_edges + + :returns: (calibration_function, calibration_data): + calibration_function -- charge in pJ (float) -> current in uA (float). 
+ Converts the amount of charge in a 10 µs interval to the
+ mean current during the same interval.
+ calibration_data -- dict containing the following keys:
+ edges -- calibration points in the log file, in µs
+ offset -- ...
+ offset2 -- ...
+ slope_low -- ...
+ slope_high -- ...
+ add_low -- ...
+ add_high -- ...
+ r0_err_uW -- mean error of uncalibrated data at "∞ Ohm" in µW
+ r0_std_uW -- standard deviation of uncalibrated data at "∞ Ohm" in µW
+ r1_err_uW -- mean error of uncalibrated data at 1 kOhm
+ r1_std_uW -- stddev at 1 kOhm
+ r2_err_uW -- mean error at 100 kOhm
+ r2_std_uW -- stddev at 100 kOhm
+ """
+ dis_start, dis_end, r1_start, r1_end, r2_start, r2_end = cal_edges
+ if dis_start < 0:
+ dis_start = 0
+ chg_r0 = charges[dis_start:dis_end]
+ chg_r1 = charges[r1_start:r1_end]
+ chg_r2 = charges[r2_start:r2_end]
+ cal_0_mean = np.mean(chg_r0)
+ cal_r1_mean = np.mean(chg_r1)
+ cal_r2_mean = np.mean(chg_r2)
+
+ ua_r1 = self.voltage / self.r1 * 1000000
+ ua_r2 = self.voltage / self.r2 * 1000000
+
+ if cal_r2_mean > cal_0_mean:
+ b_lower = (ua_r2 - 0) / (cal_r2_mean - cal_0_mean)
+ else:
+ logger.warning("0 uA == %.f uA during calibration" % (ua_r2))
+ b_lower = 0
+
+ b_upper = (ua_r1 - ua_r2) / (cal_r1_mean - cal_r2_mean)
+
+ a_lower = -b_lower * cal_0_mean
+ a_upper = -b_upper * cal_r2_mean
+
+ if self.shunt == 680:
+ # R1 current is higher than shunt range -> only use R2 for calibration
+ def calfunc(charge):
+ if charge < cal_0_mean:
+ return 0
+ else:
+ return charge * b_lower + a_lower
+
+ else:
+
+ def calfunc(charge):
+ if charge < cal_0_mean:
+ return 0
+ if charge <= cal_r2_mean:
+ return charge * b_lower + a_lower
+ else:
+ return charge * b_upper + a_upper + ua_r2
+
+ caldata = {
+ "edges": [x * 10 for x in cal_edges],
+ "offset": cal_0_mean,
+ "offset2": cal_r2_mean,
+ "slope_low": b_lower,
+ "slope_high": b_upper,
+ "add_low": a_lower,
+ "add_high": a_upper,
+ "r0_err_uW": np.mean(self.currents_nocal(chg_r0)) * self.voltage,
+ "r0_std_uW": np.std(self.currents_nocal(chg_r0)) * self.voltage,
+ "r1_err_uW": (np.mean(self.currents_nocal(chg_r1)) - ua_r1) * self.voltage,
+ "r1_std_uW": np.std(self.currents_nocal(chg_r1)) * self.voltage,
+ "r2_err_uW": (np.mean(self.currents_nocal(chg_r2)) - ua_r2) * self.voltage,
+ "r2_std_uW": np.std(self.currents_nocal(chg_r2)) * self.voltage,
+ }
+
+ # print("if charge < %f : return 0" % cal_0_mean)
+ # print("if charge <= %f : return charge * %f + %f" % (cal_r2_mean, b_lower, a_lower))
+ # print("else : return charge * %f + %f + %f" % (b_upper, a_upper, ua_r2))
+
+ return calfunc, caldata
+
+ """
+ def calcgrad(self, currents, threshold):
+ grad = np.gradient(running_mean(currents * self.voltage, 10))
+ # len(grad) == len(currents) - 9
+ subst = []
+ lastgrad = 0
+ for i in range(len(grad)):
+ # minimum substate duration: 10ms
+ if np.abs(grad[i]) > threshold and i - lastgrad > 50:
+ # account for skew introduced by running_mean and current
+ # ramp slope (parasitic capacitors etc.)
+ subst.append(i+10)
+ lastgrad = i
+ if lastgrad != i:
+ subst.append(i+10)
+ return subst
+
+ # TODO configurable min/max threshold and len(gradidx) > X; binary
+ # search for the required threshold. Post-processing: merge adjacent
+ # substates with very similar values / low stddev
+ # ... min/max need not be specified, they are already known (0 / np.max(grad))
+ # TODO when dealing with substates / indexes, account for the offset introduced by running_mean
+ # TODO possibly cluster the 'abs(grad) > threshold' events and use that
+ # to identify interesting transitions?
+ def gradfoo(self, currents):
+ gradients = np.abs(np.gradient(running_mean(currents * self.voltage, 10)))
+ gradmin = np.min(gradients)
+ gradmax = np.max(gradients)
+ threshold = np.mean([gradmin, gradmax])
+ gradidx = self.calcgrad(currents, threshold)
+ num_substates = 2
+ while len(gradidx) != num_substates:
+ if gradmax - gradmin < 0.1:
+ # We did our best
+ return threshold, gradidx
+ if len(gradidx) > num_substates:
+ gradmin = threshold
+ else:
+ gradmax = threshold
+ threshold = np.mean([gradmin, gradmax])
+ gradidx = self.calcgrad(currents, threshold)
+ return threshold, gradidx
+ """
+
+ def analyze_states(self, charges, trigidx, ua_func):
+ u"""
+ Split log data into states and transitions and return duration, energy, and mean power for each element.
+
+ :param charges: raw charges (each element describes the charge in pJ transferred during 10 µs)
+ :param trigidx: "charges" indexes corresponding to a trigger edge, see `trigger_edges`
+ :param ua_func: charge(pJ) -> current(µA) function as returned by `calibration_function`
+
+ :returns: list of states and transitions, both starting and ending with a state.
+ Each element is a dict containing:
+ * `isa`: 'state' or 'transition'
+ * `clip_rate`: range(0..1), fraction of clipped energy measurements
+ * `raw_mean`: mean of the raw values
+ * `raw_std`: standard deviation of the raw values
+ * `uW_mean`: mean (calibrated) power draw
+ * `uW_std`: standard deviation of the (calibrated) power draw
+ * `us`: duration
+ if isa == 'transition', it also contains:
+ * `timeout`: duration of the previous state
+ * `uW_mean_delta_prev`: difference between uW_mean and the previous state's uW_mean
+ * `uW_mean_delta_next`: difference between uW_mean and the next state's uW_mean
+ """
+ previdx = 0
+ is_state = True
+ iterdata = []
+
+ # The last state (between the last transition and end of file) may also
+ # be important. Pretend it ends when the log ends.
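+ # Sketch of the resulting segmentation (illustrative): trigger indices
+ # [t0, t1, ..., tn] split the charge array into the ranges
+ # [0:t0], [t0:t1], ..., [tn:len(charges)], which are classified
+ # below as state, transition, state, ... in alternating order.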
+ trigger_indices = trigidx.copy() + trigger_indices.append(len(charges)) + + for idx in trigger_indices: + range_raw = charges[previdx:idx] + range_ua = ua_func(range_raw) + substates = {} + + if previdx != 0 and idx - previdx > 200: + thr, subst = 0, [] # self.gradfoo(range_ua) + if len(subst): + statelist = [] + prevsubidx = 0 + for subidx in subst: + statelist.append( + { + "duration": (subidx - prevsubidx) * 10, + "uW_mean": np.mean( + range_ua[prevsubidx:subidx] * self.voltage + ), + "uW_std": np.std( + range_ua[prevsubidx:subidx] * self.voltage + ), + } + ) + prevsubidx = subidx + substates = {"threshold": thr, "states": statelist} + + isa = "state" + if not is_state: + isa = "transition" + + data = { + "isa": isa, + "clip_rate": np.mean(range_raw == 65535), + "raw_mean": np.mean(range_raw), + "raw_std": np.std(range_raw), + "uW_mean": np.mean(range_ua * self.voltage), + "uW_std": np.std(range_ua * self.voltage), + "us": (idx - previdx) * 10, + } + + if self.with_traces: + data["uW"] = range_ua * self.voltage + + if "states" in substates: + data["substates"] = substates + ssum = np.sum(list(map(lambda x: x["duration"], substates["states"]))) + if ssum != data["us"]: + logger.warning("duration %d vs %d" % (data["us"], ssum)) + + if isa == "transition": + # subtract average power of previous state + # (that is, the state from which this transition originates) + data["uW_mean_delta_prev"] = data["uW_mean"] - iterdata[-1]["uW_mean"] + # placeholder to avoid extra cases in the analysis + data["uW_mean_delta_next"] = data["uW_mean"] + data["timeout"] = iterdata[-1]["us"] + elif len(iterdata) > 0: + # subtract average power of next state + # (the state into which this transition leads) + iterdata[-1]["uW_mean_delta_next"] = ( + iterdata[-1]["uW_mean"] - data["uW_mean"] + ) + + iterdata.append(data) + + previdx = idx + is_state = not is_state + return iterdata diff --git a/test/test_ptamodel.py b/test/test_ptamodel.py index e153280..94ee842 100755 --- a/test/test_ptamodel.py +++ b/test/test_ptamodel.py @@ -1,6 +1,6 @@ #!/usr/bin/env python3 -from dfatool.dfatool import RawData, pta_trace_to_aggregate +from dfatool.loader import RawData, pta_trace_to_aggregate from dfatool.model import PTAModel import os import unittest diff --git a/test/test_timingharness.py b/test/test_timingharness.py index cc4b766..917e4e2 100755 --- a/test/test_timingharness.py +++ b/test/test_timingharness.py @@ -1,6 +1,6 @@ #!/usr/bin/env python3 -from dfatool.dfatool import TimingData, pta_trace_to_aggregate +from dfatool.loader import TimingData, pta_trace_to_aggregate from dfatool.model import AnalyticModel from dfatool.parameters import prune_dependent_parameters import unittest -- cgit v1.2.3 From 3061bf6dab2aed9746a43f3c838bea31c6c1a270 Mon Sep 17 00:00:00 2001 From: Daniel Friesel Date: Wed, 15 Jul 2020 11:25:49 +0200 Subject: Add PTAModel validation and crossvalidation test --- test/test_ptamodel.py | 465 +++++++++++++++++++++++++++++++++++++++++++++++++- 1 file changed, 458 insertions(+), 7 deletions(-) (limited to 'test/test_ptamodel.py') diff --git a/test/test_ptamodel.py b/test/test_ptamodel.py index 94ee842..e8905b1 100755 --- a/test/test_ptamodel.py +++ b/test/test_ptamodel.py @@ -2,13 +2,464 @@ from dfatool.loader import RawData, pta_trace_to_aggregate from dfatool.model import PTAModel +from dfatool.utils import by_name_to_by_param +from dfatool.validation import CrossValidator import os import unittest import pytest +import numpy as np -class TestModels(unittest.TestCase): - def 
test_model_singlefile_rf24(self): + +class TestSynthetic(unittest.TestCase): + def test_model_validation(self): + # rng = np.random.default_rng(seed=1312) # requiresy NumPy >= 1.17 + np.random.seed(1312) + X = np.arange(500) % 50 + parameter_names = ["p_mod5", "p_linear"] + + s1_duration_base = 70 + s1_duration_scale = 2 + s1_power_base = 50 + s1_power_scale = 7 + s2_duration_base = 700 + s2_duration_scale = 1 + s2_power_base = 1500 + s2_power_scale = 10 + + by_name = { + "raw_state_1": { + "isa": "state", + "param": [(x % 5, x) for x in X], + "duration": s1_duration_base + + np.random.normal(size=X.size, scale=s1_duration_scale), + "power": s1_power_base + + X + + np.random.normal(size=X.size, scale=s1_power_scale), + "attributes": ["duration", "power"], + }, + "raw_state_2": { + "isa": "state", + "param": [(x % 5, x) for x in X], + "duration": s2_duration_base + - 2 * X + + np.random.normal(size=X.size, scale=s2_duration_scale), + "power": s2_power_base + + X + + np.random.normal(size=X.size, scale=s2_power_scale), + "attributes": ["duration", "power"], + }, + } + by_param = by_name_to_by_param(by_name) + model = PTAModel(by_name, parameter_names, dict()) + static_model = model.get_static() + + # x ∈ [0, 50] -> mean(X) is 25 + self.assertAlmostEqual( + static_model("raw_state_1", "duration"), s1_duration_base, places=0 + ) + self.assertAlmostEqual( + static_model("raw_state_1", "power"), s1_power_base + 25, delta=7 + ) + self.assertAlmostEqual( + static_model("raw_state_2", "duration"), s2_duration_base - 2 * 25, delta=2 + ) + self.assertAlmostEqual( + static_model("raw_state_2", "power"), s2_power_base + 25, delta=7 + ) + + param_model, param_info = model.get_fitted() + + self.assertAlmostEqual( + param_model("raw_state_1", "duration", param=[0, 10]), + s1_duration_base, + places=0, + ) + self.assertAlmostEqual( + param_model("raw_state_1", "duration", param=[0, 50]), + s1_duration_base, + places=0, + ) + self.assertAlmostEqual( + param_model("raw_state_1", "duration", param=[0, 70]), + s1_duration_base, + places=0, + ) + + self.assertAlmostEqual( + param_model("raw_state_1", "power", param=[0, 10]), + s1_power_base + 10, + places=0, + ) + self.assertAlmostEqual( + param_model("raw_state_1", "power", param=[0, 50]), + s1_power_base + 50, + places=0, + ) + self.assertAlmostEqual( + param_model("raw_state_1", "power", param=[0, 70]), + s1_power_base + 70, + places=0, + ) + + self.assertAlmostEqual( + param_model("raw_state_2", "duration", param=[0, 10]), + s2_duration_base - 2 * 10, + places=0, + ) + self.assertAlmostEqual( + param_model("raw_state_2", "duration", param=[0, 50]), + s2_duration_base - 2 * 50, + places=0, + ) + self.assertAlmostEqual( + param_model("raw_state_2", "duration", param=[0, 70]), + s2_duration_base - 2 * 70, + places=0, + ) + + self.assertAlmostEqual( + param_model("raw_state_2", "power", param=[0, 10]), + s2_power_base + 10, + delta=50, + ) + self.assertAlmostEqual( + param_model("raw_state_2", "power", param=[0, 50]), + s2_power_base + 50, + delta=50, + ) + self.assertAlmostEqual( + param_model("raw_state_2", "power", param=[0, 70]), + s2_power_base + 70, + delta=50, + ) + + static_quality = model.assess(static_model) + param_quality = model.assess(param_model) + + # static quality reflects normal distribution scale for non-parameterized data + + # the Root Mean Square Deviation must not be greater the scale (i.e., standard deviation) of the normal distribution + # Low Mean Absolute Error (< 2) + 
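+ # (Definitions, for reference: MAE = mean(|measured - predicted|),
+ # RMSD = sqrt(mean((measured - predicted)^2)); MAPE and SMAPE express
+ # the same deviation as a percentage of the measured value.)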
self.assertTrue(static_quality["by_name"]["raw_state_1"]["duration"]["mae"] < 2) + # Low Root Mean Square Deviation (< scale == 2) + self.assertTrue( + static_quality["by_name"]["raw_state_1"]["duration"]["rmsd"] < 2 + ) + # Relatively low error percentage (~~ MAE * 100% / s1_duration_base) + self.assertAlmostEqual( + static_quality["by_name"]["raw_state_1"]["duration"]["mape"], + static_quality["by_name"]["raw_state_1"]["duration"]["mae"] + * 100 + / s1_duration_base, + places=1, + ) + self.assertAlmostEqual( + static_quality["by_name"]["raw_state_1"]["duration"]["smape"], + static_quality["by_name"]["raw_state_1"]["duration"]["mae"] + * 100 + / s1_duration_base, + places=1, + ) + + # static error is high for parameterized data + + # MAE == mean(abs(actual value - model value)) + # parameter range is [0, 50) -> mean 25, deviation range is [0, 25) -> mean deviation is 12.5 ± gauss scale + self.assertAlmostEqual( + static_quality["by_name"]["raw_state_1"]["power"]["mae"], 12.5, delta=1 + ) + self.assertAlmostEqual( + static_quality["by_name"]["raw_state_1"]["power"]["rmsd"], 16, delta=2 + ) + # high percentage error due to low s1_power_base + self.assertAlmostEqual( + static_quality["by_name"]["raw_state_1"]["power"]["mape"], 19, delta=2 + ) + self.assertAlmostEqual( + static_quality["by_name"]["raw_state_1"]["power"]["smape"], 19, delta=2 + ) + + # parameter range is [0, 100) -> mean deviation is 25 ± gauss scale + self.assertAlmostEqual( + static_quality["by_name"]["raw_state_2"]["duration"]["mae"], 25, delta=2 + ) + self.assertAlmostEqual( + static_quality["by_name"]["raw_state_2"]["duration"]["rmsd"], 30, delta=2 + ) + + # low percentage error due to high s2_duration_base (~~ 3.5 %) + self.assertAlmostEqual( + static_quality["by_name"]["raw_state_2"]["duration"]["mape"], + 25 * 100 / s2_duration_base, + delta=1, + ) + self.assertAlmostEqual( + static_quality["by_name"]["raw_state_2"]["duration"]["smape"], + 25 * 100 / s2_duration_base, + delta=1, + ) + + self.assertAlmostEqual( + static_quality["by_name"]["raw_state_2"]["power"]["mae"], 12.5, delta=2 + ) + self.assertAlmostEqual( + static_quality["by_name"]["raw_state_2"]["power"]["rmsd"], 17, delta=2 + ) + + # low percentage error due to high s2_power_base (~~ 1.7 %) + self.assertAlmostEqual( + static_quality["by_name"]["raw_state_2"]["power"]["mape"], + 25 * 100 / s2_power_base, + delta=1, + ) + self.assertAlmostEqual( + static_quality["by_name"]["raw_state_2"]["power"]["smape"], + 25 * 100 / s2_power_base, + delta=1, + ) + + # raw_state_1/duration does not depend on parameters and delegates to the static model + self.assertAlmostEqual( + param_quality["by_name"]["raw_state_1"]["duration"]["mae"], + static_quality["by_name"]["raw_state_1"]["duration"]["mae"], + ) + self.assertAlmostEqual( + param_quality["by_name"]["raw_state_1"]["duration"]["rmsd"], + static_quality["by_name"]["raw_state_1"]["duration"]["rmsd"], + ) + self.assertAlmostEqual( + param_quality["by_name"]["raw_state_1"]["duration"]["mape"], + static_quality["by_name"]["raw_state_1"]["duration"]["mape"], + ) + self.assertAlmostEqual( + param_quality["by_name"]["raw_state_1"]["duration"]["smape"], + static_quality["by_name"]["raw_state_1"]["duration"]["smape"], + ) + + # fitted param-model quality reflects normal distribution scale for all data + self.assertAlmostEqual( + param_quality["by_name"]["raw_state_2"]["power"]["mape"], 0.9, places=1 + ) + self.assertAlmostEqual( + param_quality["by_name"]["raw_state_2"]["power"]["smape"], 0.9, places=1 + ) + + self.assertTrue( + 
+        self.assertTrue(
+            param_quality["by_name"]["raw_state_1"]["power"]["mae"] < s1_power_scale
+        )
+        self.assertTrue(
+            param_quality["by_name"]["raw_state_1"]["power"]["rmsd"] < s1_power_scale
+        )
+        self.assertAlmostEqual(
+            param_quality["by_name"]["raw_state_1"]["power"]["mape"], 7.5, delta=1
+        )
+        self.assertAlmostEqual(
+            param_quality["by_name"]["raw_state_1"]["power"]["smape"], 7.5, delta=1
+        )
+
+        self.assertAlmostEqual(
+            param_quality["by_name"]["raw_state_2"]["duration"]["mae"],
+            s2_duration_scale,
+            delta=0.2,
+        )
+        self.assertAlmostEqual(
+            param_quality["by_name"]["raw_state_2"]["duration"]["rmsd"],
+            s2_duration_scale,
+            delta=0.2,
+        )
+        self.assertAlmostEqual(
+            param_quality["by_name"]["raw_state_2"]["duration"]["mape"],
+            0.12,
+            delta=0.01,
+        )
+        self.assertAlmostEqual(
+            param_quality["by_name"]["raw_state_2"]["duration"]["smape"],
+            0.12,
+            delta=0.01,
+        )
+
+        # ... unless the signal-to-noise ratio (parameter range = [0 .. 50] vs. scale = 10) is bad, leading to
+        # increased regression errors
+        self.assertTrue(param_quality["by_name"]["raw_state_2"]["power"]["mae"] < 15)
+        self.assertTrue(param_quality["by_name"]["raw_state_2"]["power"]["rmsd"] < 18)
+
+        # still: low percentage error due to high s2_power_base
+        self.assertAlmostEqual(
+            param_quality["by_name"]["raw_state_2"]["power"]["mape"], 0.9, places=1
+        )
+        self.assertAlmostEqual(
+            param_quality["by_name"]["raw_state_2"]["power"]["smape"], 0.9, places=1
+        )
+
+    def test_model_crossvalidation_10fold(self):
+        # rng = np.random.default_rng(seed=1312)  # requires NumPy >= 1.17
+        np.random.seed(1312)
+        X = np.arange(500) % 50
+        parameter_names = ["p_mod5", "p_linear"]
+
+        s1_duration_base = 70
+        s1_duration_scale = 2
+        s1_power_base = 50
+        s1_power_scale = 7
+        s2_duration_base = 700
+        s2_duration_scale = 1
+        s2_power_base = 1500
+        s2_power_scale = 10
+
+        by_name = {
+            "raw_state_1": {
+                "isa": "state",
+                "param": [(x % 5, x) for x in X],
+                "duration": s1_duration_base
+                + np.random.normal(size=X.size, scale=s1_duration_scale),
+                "power": s1_power_base
+                + X
+                + np.random.normal(size=X.size, scale=s1_power_scale),
+                "attributes": ["duration", "power"],
+            },
+            "raw_state_2": {
+                "isa": "state",
+                "param": [(x % 5, x) for x in X],
+                "duration": s2_duration_base
+                - 2 * X
+                + np.random.normal(size=X.size, scale=s2_duration_scale),
+                "power": s2_power_base
+                + X
+                + np.random.normal(size=X.size, scale=s2_power_scale),
+                "attributes": ["duration", "power"],
+            },
+        }
+        by_param = by_name_to_by_param(by_name)
+        arg_count = dict()
+        model = PTAModel(by_name, parameter_names, arg_count)
+        validator = CrossValidator(PTAModel, by_name, parameter_names, arg_count)
+
+        static_quality = validator.kfold(lambda m: m.get_static(), 10)
+        param_quality = validator.kfold(lambda m: m.get_fitted()[0], 10)
+
+        print(static_quality)
+
+        # static quality reflects normal distribution scale for non-parameterized data
+
+        # the Root Mean Square Deviation must not be greater than the scale (i.e., standard deviation) of the normal distribution
+        # Low Mean Absolute Error (< 2)
+        self.assertTrue(static_quality["by_name"]["raw_state_1"]["duration"]["mae"] < 2)
+        # Low Root Mean Square Deviation (< scale == 2)
+        self.assertTrue(
+            static_quality["by_name"]["raw_state_1"]["duration"]["rmsd"] < 2
+        )
+        # Relatively low error percentage (~~ MAE * 100% / s1_duration_base)
+        self.assertAlmostEqual(
+            static_quality["by_name"]["raw_state_1"]["duration"]["smape"],
+            static_quality["by_name"]["raw_state_1"]["duration"]["mae"]
+            * 100
+            / s1_duration_base,
+            places=1,
+        )
+
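The mape and smape comparisons above lean on the standard definitions of both metrics. dfatool's exact implementation is not shown in this patch; as a reference sketch (assumed textbook formulas, not verbatim library code):

    import numpy as np

    def mape(actual, model):
        # Mean Absolute Percentage Error
        return np.mean(np.abs(actual - model) / np.abs(actual)) * 100

    def smape(actual, model):
        # Symmetric Mean Absolute Percentage Error (one common variant)
        return np.mean(2 * np.abs(actual - model) / (np.abs(actual) + np.abs(model))) * 100

When actual and model values both sit close to a large base value, both denominators are approximately that base, so MAPE ~ SMAPE ~ MAE * 100 / base, which is exactly the relation the places=1 assertions check.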
+        # static error is high for parameterized data
+
+        # MAE == mean(abs(actual value - model value))
+        # parameter range is [0, 50) -> mean 25, deviation range is [0, 25) -> mean deviation is 12.5 ± gauss scale
+        self.assertAlmostEqual(
+            static_quality["by_name"]["raw_state_1"]["power"]["mae"], 12.5, delta=1
+        )
+        self.assertAlmostEqual(
+            static_quality["by_name"]["raw_state_1"]["power"]["rmsd"], 16, delta=2
+        )
+        # high percentage error due to low s1_power_base
+        self.assertAlmostEqual(
+            static_quality["by_name"]["raw_state_1"]["power"]["smape"], 19, delta=2
+        )
+
+        # parameter range is [0, 100) -> mean deviation is 25 ± gauss scale
+        self.assertAlmostEqual(
+            static_quality["by_name"]["raw_state_2"]["duration"]["mae"], 25, delta=2
+        )
+        self.assertAlmostEqual(
+            static_quality["by_name"]["raw_state_2"]["duration"]["rmsd"], 30, delta=2
+        )
+
+        # low percentage error due to high s2_duration_base (~~ 3.5 %)
+        self.assertAlmostEqual(
+            static_quality["by_name"]["raw_state_2"]["duration"]["smape"],
+            25 * 100 / s2_duration_base,
+            delta=1,
+        )
+
+        self.assertAlmostEqual(
+            static_quality["by_name"]["raw_state_2"]["power"]["mae"], 12.5, delta=2
+        )
+        self.assertAlmostEqual(
+            static_quality["by_name"]["raw_state_2"]["power"]["rmsd"], 17, delta=2
+        )
+
+        # low percentage error due to high s2_power_base (~~ 1.7 %)
+        self.assertAlmostEqual(
+            static_quality["by_name"]["raw_state_2"]["power"]["smape"],
+            25 * 100 / s2_power_base,
+            delta=1,
+        )
+
+        # raw_state_1/duration does not depend on parameters and delegates to the static model
+        self.assertAlmostEqual(
+            param_quality["by_name"]["raw_state_1"]["duration"]["mae"],
+            static_quality["by_name"]["raw_state_1"]["duration"]["mae"],
+        )
+        self.assertAlmostEqual(
+            param_quality["by_name"]["raw_state_1"]["duration"]["rmsd"],
+            static_quality["by_name"]["raw_state_1"]["duration"]["rmsd"],
+        )
+        self.assertAlmostEqual(
+            param_quality["by_name"]["raw_state_1"]["duration"]["smape"],
+            static_quality["by_name"]["raw_state_1"]["duration"]["smape"],
+        )
+
+        # fitted param-model quality reflects normal distribution scale for all data
+        self.assertAlmostEqual(
+            param_quality["by_name"]["raw_state_2"]["power"]["smape"], 0.9, places=1
+        )
+
+        self.assertTrue(
+            param_quality["by_name"]["raw_state_1"]["power"]["mae"] < s1_power_scale
+        )
+        self.assertTrue(
+            param_quality["by_name"]["raw_state_1"]["power"]["rmsd"] < s1_power_scale
+        )
+        self.assertAlmostEqual(
+            param_quality["by_name"]["raw_state_1"]["power"]["smape"], 7.5, delta=1
+        )
+
+        self.assertAlmostEqual(
+            param_quality["by_name"]["raw_state_2"]["duration"]["mae"],
+            s2_duration_scale,
+            delta=0.2,
+        )
+        self.assertAlmostEqual(
+            param_quality["by_name"]["raw_state_2"]["duration"]["rmsd"],
+            s2_duration_scale,
+            delta=0.2,
+        )
+        self.assertAlmostEqual(
+            param_quality["by_name"]["raw_state_2"]["duration"]["smape"],
+            0.12,
+            delta=0.01,
+        )
+
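For context on validator.kfold: k-fold cross-validation partitions the measurements into k disjoint folds, fits a model on k-1 of them, computes the error metrics on the held-out fold, and aggregates over all k rounds. A generic sketch of the index splitting, assuming NumPy; this is an illustration of the technique, not dfatool's CrossValidator internals:

    import numpy as np

    def kfold_indices(n, k=10, seed=1312):
        # yield (train, test) index arrays for k-fold cross-validation
        rng = np.random.RandomState(seed)
        idx = rng.permutation(n)
        for test in np.array_split(idx, k):
            train = np.setdiff1d(idx, test)
            yield train, test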
+        # ... unless the signal-to-noise ratio (parameter range = [0 .. 50] vs. scale = 10) is bad, leading to
+        # increased regression errors
+        self.assertTrue(param_quality["by_name"]["raw_state_2"]["power"]["mae"] < 15)
+        self.assertTrue(param_quality["by_name"]["raw_state_2"]["power"]["rmsd"] < 18)
+
+        # still: low percentage error due to high s2_power_base
+        self.assertAlmostEqual(
+            param_quality["by_name"]["raw_state_2"]["power"]["smape"], 0.9, places=1
+        )
+
+
+class TestFromFile(unittest.TestCase):
+    def test_singlefile_rf24(self):
         raw_data = RawData(["test-data/20170220_164723_RF24_int_A.tar"])
         preprocessed_data = raw_data.get_preprocessed_data()
         by_name, parameters, arg_count = pta_trace_to_aggregate(preprocessed_data)
@@ -162,7 +613,7 @@ class TestModels(unittest.TestCase):
             param_model("RX", "power", param=[1, None, None]), 48647, places=-1
         )
 
-    def test_model_singlefile_mmparam(self):
+    def test_singlefile_mmparam(self):
         raw_data = RawData(["test-data/20161221_123347_mmparam.tar"])
         preprocessed_data = raw_data.get_preprocessed_data()
         by_name, parameters, arg_count = pta_trace_to_aggregate(preprocessed_data)
@@ -201,7 +652,7 @@ class TestModels(unittest.TestCase):
             param_lut_model("ON", "power", param=[None, None]), 17866, places=0
         )
 
-    def test_model_multifile_lm75x(self):
+    def test_multifile_lm75x(self):
         testfiles = [
             "test-data/20170116_124500_LM75x.tar",
             "test-data/20170116_131306_LM75x.tar",
@@ -243,7 +694,7 @@ class TestModels(unittest.TestCase):
         self.assertAlmostEqual(static_model("shutdown", "duration"), 6980, places=0)
         self.assertAlmostEqual(static_model("start", "duration"), 6980, places=0)
 
-    def test_model_multifile_sharp(self):
+    def test_multifile_sharp(self):
         testfiles = [
             "test-data/20170116_145420_sharpLS013B4DN.tar",
             "test-data/20170116_151348_sharpLS013B4DN.tar",
@@ -285,7 +736,7 @@ class TestModels(unittest.TestCase):
         self.assertAlmostEqual(static_model("sendLine", "duration"), 180, places=0)
         self.assertAlmostEqual(static_model("toggleVCOM", "duration"), 30, places=0)
 
-    def test_model_multifile_mmstatic(self):
+    def test_multifile_mmstatic(self):
         testfiles = [
             "test-data/20170116_143516_mmstatic.tar",
             "test-data/20170116_142654_mmstatic.tar",
@@ -325,7 +776,7 @@ class TestModels(unittest.TestCase):
     @pytest.mark.skipif(
         "TEST_SLOW" not in os.environ, reason="slow test, set TEST_SLOW=1 to run"
     )
-    def test_model_multifile_cc1200(self):
+    def test_multifile_cc1200(self):
         testfiles = [
             "test-data/20170125_125433_cc1200.tar",
            "test-data/20170125_142420_cc1200.tar",
-- cgit v1.2.3
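As the skipif reason string above spells out, the cc1200 multi-file test is skipped unless TEST_SLOW is set in the environment; a typical invocation is TEST_SLOW=1 python -m pytest test/test_ptamodel.py.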