summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorDaniel Friesel <derf@finalrewind.org>2019-03-28 08:04:41 +0100
committerDaniel Friesel <derf@finalrewind.org>2019-03-28 08:04:41 +0100
commit6fd0d5f178903ba59e636ae9532d6e218a550ce8 (patch)
tree84d394d943bd7b003130f000bce03ccc7caafba8
parent2d0742f7a41a570b76a73d26b755ff8804f1373b (diff)
add shorten_call function from protocolmodeling/analyze-param.py
-rwxr-xr-xlib/protocol_benchmarks.py53
1 files changed, 53 insertions, 0 deletions
diff --git a/lib/protocol_benchmarks.py b/lib/protocol_benchmarks.py
index 35e90c6..593740d 100755
--- a/lib/protocol_benchmarks.py
+++ b/lib/protocol_benchmarks.py
@@ -5,6 +5,7 @@ import msgpack
import ubjson
import os
+import re
import time
from filelock import FileLock
@@ -1314,3 +1315,55 @@ def codegen_for_lib(library, library_options, data):
return XDR(data)
raise ValueError('Unsupported library: {}'.format(library))
+
+def shorten_call(snippet, lib = ''):
+ """
+ Remove literal arguments and variable names from ProtoBench function calls.
+
+ This provides some generalization when modeling individual function
+ calls, thus avoiding overfitting in AnalyticModel and the likes.
+ """
+ # The following adjustments are protobench-specific
+ # "xdrstream << (uint16_t)123" -> "xdrstream << (uint16_t"
+ if 'xdrstream << (' in snippet:
+ snippet = snippet.split(')')[0]
+ # "xdrstream << variable << ..." -> "xdrstream << variable"
+ elif 'xdrstream << variable' in snippet:
+ snippet = '<<'.join(snippet.split('<<')[0:2])
+ elif 'xdrstream.setNextArrayLen(' in snippet:
+ snippet = 'xdrstream.setNextArrayLen'
+ elif 'ubjw' in snippet:
+ snippet = re.sub('ubjw_write_key\(ctx, [^)]+\)', 'ubjw_write_key(ctx, ?)', snippet)
+ snippet = re.sub('ubjw_write_([^(]+)\(ctx, [^)]+\)', 'ubjw_write_\\1(ctx, ?)', snippet)
+ # mpack_write(&writer, (type)value) -> mpack_write(&writer, (type
+ elif 'mpack_write(' in snippet:
+ snippet = snippet.split(')')[0]
+ # mpack_write_cstr(&writer, "foo") -> mpack_write_cstr(&writer,
+ # same for mpack_write_cstr_or_nil
+ elif 'mpack_write_cstr' in snippet:
+ snippet = snippet.split('"')[0]
+ # mpack_start_map(&writer, x) -> mpack_start_map(&writer
+ # mpack_start_array(&writer, x) -> mpack_start_array(&writer
+ elif 'mpack_start_' in snippet:
+ snippet = snippet.split(',')[0]
+ elif 'bout <<' in snippet:
+ snippet = 'bout'
+ elif 'msg.' in snippet:
+ snippet = re.sub('msg.(?:[^[]+)(?:\[.*?\])? = .*', 'msg.? = ?', snippet)
+ elif lib == 'arduinojson:':
+ snippet = re.sub('ArduinoJson::JsonObject& [^ ]+ = [^.]+.createNestedObject\([^)]*\);', 'ArduinoJson::JsonObject& ? = ?.createNestedObject(?);', snippet)
+ snippet = re.sub('ArduinoJson::JsonArray& [^ ]+ = [^.]+.createNestedArray\([^)]*\);', 'ArduinoJson::JsonArray& ? = ?.createNestedArray(?);', snippet)
+ snippet = re.sub('root[^[]*\["[^"]*"\] = [^;]+', 'root?["?"] = ?', snippet)
+ snippet = re.sub('rootl.add\([^)]*\)', 'rootl.add(?)', snippet)
+
+ snippet = re.sub('^dec_[^ ]*', 'dec_?', snippet)
+ if lib == 'arduinojson:':
+ snippet = re.sub('root[^. ]+\.as', 'root[?].as', snippet)
+ elif 'nanopb:' in lib:
+ snippet = re.sub('= msg\.[^;]+;', '= msg.?;', snippet)
+ elif lib == 'mpack:':
+ snippet = re.sub('mpack_expect_([^_]+)_max\(&reader, [^)]+\)', 'mpack_expect_\\1_max(&reader, ?)', snippet)
+ elif lib == 'ubjson:':
+ snippet = re.sub('[^_ ]+_values[^.]+\.', '?_values[?].', snippet)
+
+ return snippet