sh_commands.py 44.5 KB
Newer Older
Y
yejianwu 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14
# Copyright 2018 Xiaomi, Inc.  All rights reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

Y
yejianwu 已提交
15 16
import falcon_cli
import filelock
Y
yejianwu 已提交
17
import glob
L
liuqi 已提交
18
import logging
Y
yejianwu 已提交
19
import os
20
import re
Y
yejianwu 已提交
21
import sh
Y
yejianwu 已提交
22
import subprocess
23
import sys
24
import time
W
wuchenghui 已提交
25
import urllib
26

L
liuqi 已提交
27
import common
L
Liangliang He 已提交
28

29 30 31 32 33 34 35
sys.path.insert(0, "mace/python/tools")
try:
    from encrypt_opencl_codegen import encrypt_opencl_codegen
    from opencl_codegen import opencl_codegen
    from binary_codegen import tuning_param_codegen
    from generate_data import generate_input_data
    from validate import validate
36
    from mace_engine_factory_codegen import gen_mace_engine_factory
Y
yejianwu 已提交
37 38
except Exception as e:
    print("Import error:\n%s" % e)
39 40
    exit(1)

41 42 43
################################
# common
################################
L
liuqi 已提交
44 45 46
logger = logging.getLogger('MACE')


47
def strip_invalid_utf8(str):
    """Invoke ``iconv -c -t UTF-8`` with ``str`` and return sh's result.

    ``-c`` asks iconv to omit characters it cannot convert.  The parameter
    name shadows the builtin ``str``; it is kept unchanged so that existing
    keyword callers continue to work.
    """
    return sh.iconv(str, "-c", "-t", "UTF-8")

50 51

def make_output_processor(buff):
    """Return a per-line callback that echoes output and records it.

    The returned callable prints each line with trailing whitespace removed
    and appends the unmodified line to ``buff``.
    """
    def process_output(line):
        print(line.rstrip())
        buff.append(line)

    return process_output

58

59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74
def device_lock_path(serialno):
    """Return the lock-file path used for the device ``serialno``."""
    lock_file_template = "/tmp/device-lock-%s"
    return lock_file_template % serialno


def device_lock(serialno, timeout=3600):
    """Return a ``filelock.FileLock`` on the lock file of ``serialno``.

    ``timeout`` is forwarded unchanged to ``FileLock``.
    """
    lock_file = device_lock_path(serialno)
    return filelock.FileLock(lock_file, timeout=timeout)


def is_device_locked(serialno):
    """Report whether the lock for ``serialno`` could not be acquired.

    The lock is attempted with a near-zero timeout; a ``filelock.Timeout``
    means the lock was not obtained and yields ``True``.  When the lock is
    obtained it is released again on leaving the ``with`` block.
    """
    try:
        with device_lock(serialno, timeout=0.000001):
            locked = False
    except filelock.Timeout:
        locked = True
    return locked


Y
yejianwu 已提交
75 76 77
################################
# clear data
################################
78 79 80 81 82
def clear_phone_data_dir(serialno, phone_data_dir):
    """Run ``rm -rf <phone_data_dir>`` on device ``serialno`` via adb shell."""
    remove_cmd = "rm -rf %s" % phone_data_dir
    sh.adb("-s", serialno, "shell", remove_cmd)
83 84 85


def clear_model_codegen(model_codegen_dir="mace/codegen/models"):
    """Delete ``model_codegen_dir`` recursively if it exists."""
    if os.path.exists(model_codegen_dir):
        sh.rm("-rf", model_codegen_dir)


90 91 92 93
################################
# adb commands
################################
def adb_split_stdout(stdout_str):
    """Split command output into stripped, non-empty lines.

    The text is first passed through ``strip_invalid_utf8``, then split on
    newlines; lines that are empty after stripping (such as the trailing
    one) are dropped.
    """
    cleaned = strip_invalid_utf8(stdout_str)
    stripped_lines = (line.strip() for line in cleaned.split('\n'))
    return [line for line in stripped_lines if line]

98

W
wuchenghui 已提交
99 100
def adb_devices():
    """Return the serial numbers that ``adb devices`` lists as ``device``.

    A line is accepted when it starts with a run of word characters followed
    by whitespace and the word ``device``.
    NOTE: ``\\w+`` does not match characters such as ``-``, ``.`` or ``:``,
    so serials containing them are not reported by this function.
    """
    serialnos = []
    p = re.compile(r'(\w+)\s+device')
    for line in adb_split_stdout(sh.adb("devices")):
        m = p.match(line)
        if m:
            serialnos.append(m.group(1))

    return serialnos


def get_soc_serialnos_map():
    """Group the connected devices' serial numbers by ``ro.board.platform``.

    Returns a dict mapping each platform value to the list of serials that
    report it.  A device without that property raises ``KeyError``.
    """
    grouped = {}
    for serial in adb_devices():
        platform = adb_getprop_by_serialno(serial)["ro.board.platform"]
        if platform not in grouped:
            grouped[platform] = []
        grouped[platform].append(serial)

    return grouped


def get_target_socs_serialnos(target_socs=None):
    """Return the serial numbers of devices whose SoC is in ``target_socs``.

    With ``target_socs`` left as ``None`` every SoC found by
    ``get_soc_serialnos_map`` is used.  A requested SoC that is absent from
    that map raises ``KeyError``.
    """
    by_soc = get_soc_serialnos_map()
    wanted = by_soc.keys() if target_socs is None else target_socs
    collected = []
    for soc in wanted:
        collected += by_soc[soc]
    return collected
L
Liangliang He 已提交
129

130 131

def adb_getprop_by_serialno(serialno):
    """Return the ``getprop`` output of device ``serialno`` as a dict.

    Only lines of the form ``[key]: [value]`` are kept.  Both groups use
    ``.+``, so a property whose value is empty is not included.
    """
    outputs = sh.adb("-s", serialno, "shell", "getprop")
    prop_pattern = re.compile(r'\[(.+)\]: \[(.+)\]')
    props = {}
    for raw_prop in adb_split_stdout(outputs):
        matched = prop_pattern.match(raw_prop)
        if matched:
            props[matched.group(1)] = matched.group(2)
    return props

142

W
wuchenghui 已提交
143 144 145 146 147
def adb_get_device_name_by_serialno(serialno):
    """Return the device's ``ro.product.model`` property, or ``""`` if unset."""
    return adb_getprop_by_serialno(serialno).get("ro.product.model", "")


148
def adb_supported_abis(serialno):
    """Return the ABIs listed in the device's ``ro.product.cpu.abilist``.

    The property is split on commas and each entry is stripped.  Raises
    ``KeyError`` when the property is missing.
    """
    props = adb_getprop_by_serialno(serialno)
    abilist_str = props["ro.product.cpu.abilist"]
    return [abi.strip() for abi in abilist_str.split(',')]

154

155
def adb_get_all_socs():
    """Return the set of ``ro.board.platform`` values of connected devices."""
    return set(adb_getprop_by_serialno(serialno)["ro.board.platform"]
               for serialno in adb_devices())
161

L
Liangliang He 已提交
162

Y
yejianwu 已提交
163 164 165 166 167 168 169 170 171 172 173 174 175
def adb_push(src_path, dst_path, serialno):
    """Log and run ``adb -s <serialno> push <src_path> <dst_path>``."""
    message = "Push %s to %s" % (src_path, dst_path)
    print(message)
    push_args = ("-s", serialno, "push", src_path, dst_path)
    sh.adb(*push_args)


def adb_pull(src_path, dst_path, serialno):
    """Log and run ``adb -s <serialno> pull <src_path> <dst_path>``.

    A failure is reported on stdout and otherwise ignored (best effort).
    """
    print("Pull %s to %s" % (src_path, dst_path))
    try:
        sh.adb("-s", serialno, "pull", src_path, dst_path)
    except Exception as e:
        # Not every exception carries ``stderr``; fall back to the exception
        # itself so the handler cannot raise AttributeError and hide the
        # real failure.
        print("Error msg: %s" % getattr(e, "stderr", e))


L
Liangliang He 已提交
176 177 178
def adb_run(serialno,
            host_bin_path,
            bin_name,
            args="",
            opencl_profiling=1,
            vlog_level=0,
            device_bin_path="/data/local/tmp/mace",
            out_of_range_check=1):
    """Push a binary to a device, run it, and return its combined output.

    While holding the device lock this removes and recreates
    ``device_bin_path``, pushes ``host_bin_path/bin_name`` into it and runs
    the binary through ``adb shell`` with the MACE_* environment variables
    set from the arguments.  Output is echoed as it arrives; stderr is
    merged into stdout.
    """
    host_bin_full_path = "%s/%s" % (host_bin_path, bin_name)
    device_bin_full_path = "%s/%s" % (device_bin_path, bin_name)
    props = adb_getprop_by_serialno(serialno)
    print(
        "====================================================================="
    )
    print("Trying to lock device %s" % serialno)
    with device_lock(serialno):
        print("Run on device: %s, %s, %s" %
              (serialno, props["ro.board.platform"],
               props["ro.product.model"]))
        sh.adb("-s", serialno, "shell", "rm -rf %s" % device_bin_path)
        sh.adb("-s", serialno, "shell", "mkdir -p %s" % device_bin_path)
        adb_push(host_bin_full_path, device_bin_full_path, serialno)
        print("Run %s" % device_bin_full_path)
        stdout_buff = []
        process_output = make_output_processor(stdout_buff)
        p = sh.adb(
            "-s",
            serialno,
            "shell",
            "MACE_OUT_OF_RANGE_CHECK=%d MACE_OPENCL_PROFILING=%d "
            "MACE_CPP_MIN_VLOG_LEVEL=%d %s %s" %
            (out_of_range_check, opencl_profiling, vlog_level,
             device_bin_full_path, args),
            _out=process_output,
            _bg=True,
            _err_to_out=True)
        p.wait()
        return "".join(stdout_buff)
214 215


216 217 218
def adb_run_valgrind(serialno,
                     host_bin_path,
                     bin_name,
                     valgrind_path="/data/local/tmp/valgrind",
                     valgrind_args="",
                     args="",
                     opencl_profiling=1,
                     vlog_level=0,
                     device_bin_path="/data/local/tmp/mace",
                     out_of_range_check=1):
    """Push a binary to a device and run it under valgrind.

    While holding the device lock this first lists ``valgrind_path`` on the
    device; if the listing output starts with ``ls:`` a hint is printed and
    that output is returned without running anything.  Otherwise
    ``device_bin_path`` is recreated, the binary is pushed and executed as
    ``<valgrind_path>/bin/valgrind <valgrind_args> <binary> <args>`` with
    ``VALGRIND_LIB`` and the MACE_* environment variables set.  Returns the
    combined stdout/stderr text.
    """
    valgrind_lib = valgrind_path + "/lib/valgrind"
    valgrind_bin = valgrind_path + "/bin/valgrind"
    host_bin_full_path = "%s/%s" % (host_bin_path, bin_name)
    device_bin_full_path = "%s/%s" % (device_bin_path, bin_name)
    props = adb_getprop_by_serialno(serialno)
    print(
        "====================================================================="
    )
    print("Trying to lock device %s" % serialno)
    with device_lock(serialno):
        print("Run on device: %s, %s, %s" %
              (serialno, props["ro.board.platform"],
               props["ro.product.model"]))
        result = sh.adb("-s", serialno, "shell", "ls %s" % valgrind_path)
        if result.startswith("ls:"):
            print("Please install valgrind to %s manually." % valgrind_path)
            return result
        sh.adb("-s", serialno, "shell", "rm -rf %s" % device_bin_path)
        sh.adb("-s", serialno, "shell", "mkdir -p %s" % device_bin_path)
        adb_push(host_bin_full_path, device_bin_full_path, serialno)
        print("Run %s" % device_bin_full_path)
        stdout_buff = []
        process_output = make_output_processor(stdout_buff)
        p = sh.adb(
            "-s",
            serialno,
            "shell",
            "MACE_OUT_OF_RANGE_CHECK=%d MACE_OPENCL_PROFILING=%d "
            "MACE_CPP_MIN_VLOG_LEVEL=%d VALGRIND_LIB=%s %s %s %s %s " %
            (out_of_range_check, opencl_profiling, vlog_level,
             valgrind_lib, valgrind_bin, valgrind_args,
             device_bin_full_path, args),
            _out=process_output,
            _bg=True,
            _err_to_out=True)
        p.wait()
        return "".join(stdout_buff)


265 266 267
################################
# bazel commands
################################
Y
yejianwu 已提交
268 269 270 271 272
def bazel_build(target,
                strip="always",
                abi="armeabi-v7a",
                production_mode=False,
                hexagon_mode=False,
                disable_no_tuning_warning=False,
                debug=False,
                enable_openmp=True):
    """Build ``target`` with bazel and return the captured build output.

    ``abi == "host"`` builds with the default toolchain; any other value is
    passed as ``--cpu`` together with the Android crosstool options.
    ``hexagon_mode``, ``disable_no_tuning_warning`` and ``debug`` only
    affect non-host builds.  Output is echoed while the build runs.
    """
    print("* Build %s with ABI %s" % (target, abi))
    stdout_buff = []
    process_output = make_output_processor(stdout_buff)

    openmp_define = "openmp=%s" % str(enable_openmp).lower()
    production_define = "production=%s" % str(production_mode).lower()

    # Arguments common to both kinds of build.
    bazel_args = (
        "build",
        "-c",
        "opt",
        "--strip",
        strip,
        "--verbose_failures",
        target,
    )
    if abi == "host":
        bazel_args += (
            "--copt=-std=c++11",
            "--copt=-D_GLIBCXX_USE_C99_MATH_TR1",
            "--copt=-Wextra",
            "--copt=-Wno-missing-field-initializers",
            "--copt=-O3",
            "--define",
            openmp_define,
            "--define",
            production_define,
        )
    else:
        bazel_args += (
            "--crosstool_top=//external:android/crosstool",
            "--host_crosstool_top=@bazel_tools//tools/cpp:toolchain",
            "--cpu=%s" % abi,
            "--copt=-std=c++11",
            "--copt=-D_GLIBCXX_USE_C99_MATH_TR1",
            "--copt=-Wextra",
            "--copt=-Wno-missing-field-initializers",
            "--copt=-DMACE_OBFUSCATE_LITERALS",
            "--copt=-O3",
            "--define",
            "neon=true",
            "--define",
            openmp_define,
            "--define",
            production_define,
            "--define",
            "hexagon=%s" % str(hexagon_mode).lower(),
        )
        if disable_no_tuning_warning:
            bazel_args += ("--copt=-DMACE_DISABLE_NO_TUNING_WARNING",)
        if debug:
            bazel_args += ("--copt=-g",)

    p = sh.bazel(
        *bazel_args,
        _out=process_output,
        _bg=True,
        _err_to_out=True)
    p.wait()
    print("Building done!\n")
    return "".join(stdout_buff)


def bazel_build_common(target, build_args=""):
    """Run ``bazel build <target> [build_args...]`` and return its output.

    ``build_args`` is a shell-style string of extra options.  It is split
    into separate arguments; concatenating it onto ``target`` would hand
    bazel a single malformed argument whenever it is non-empty.
    """
    import shlex

    extra_args = shlex.split(build_args) if build_args else []
    stdout_buff = []
    process_output = make_output_processor(stdout_buff)
    p = sh.bazel(
        "build",
        target,
        *extra_args,
        _out=process_output,
        _bg=True,
        _err_to_out=True)
    p.wait()
    return "".join(stdout_buff)

356 357

def bazel_target_to_bin(target):
    """Map a bazel label to ``(bazel-bin directory, binary name)``.

    For example ``//mace/a/b:c`` becomes ``("bazel-bin/mace/a/b", "c")``.
    ``target`` must contain exactly one ``:``; otherwise the unpacking
    raises ``ValueError``.
    """
    package, bin_name = target.split(':')
    package = package.replace('//', '/')
    if package.startswith('/'):
        package = package[1:]
    return "bazel-bin/%s" % package, bin_name

366 367 368 369 370

################################
# mace commands
################################
def gen_encrypted_opencl_source(codegen_path="mace/codegen"):
    """Generate ``<codegen_path>/opencl/opencl_encrypt_program.cc``.

    The output directory is created first.  The output file is placed under
    ``codegen_path`` so that it lands in the directory that was just
    created, rather than always under ``mace/codegen``.
    """
    opencl_dir = "%s/opencl" % codegen_path
    sh.mkdir("-p", opencl_dir)
    encrypt_opencl_codegen("./mace/kernels/opencl/cl/",
                           "%s/opencl_encrypt_program.cc" % opencl_dir)
L
Liangliang He 已提交
374

375

Y
yejianwu 已提交
376 377
def gen_mace_engine_factory_source(model_tags,
                                   codegen_path="mace/codegen"):
    """Regenerate the engine factory source under ``<codegen_path>/engine``.

    The target directory is removed and recreated, then
    ``gen_mace_engine_factory`` is called with ``model_tags``, the template
    directory ``mace/python/tools`` and the target directory.
    """
    print("* Genearte mace engine creator source")
    codegen_tools_dir = "%s/engine" % codegen_path
    sh.rm("-rf", codegen_tools_dir)
    sh.mkdir("-p", codegen_tools_dir)
    gen_mace_engine_factory(
        model_tags,
        "mace/python/tools",
        codegen_tools_dir)
    print("Genearte mace engine creator source done!\n")


def pull_binaries(abi, serialno, model_output_dirs,
                  cl_built_kernel_file_name,
                  cl_platform_info_file_name):
    """Recreate each model's ``opencl_bin`` dir and pull device artifacts.

    For every entry of ``model_output_dirs`` the ``opencl_bin``
    sub-directory is removed and recreated.  Unless ``abi`` is ``"host"``,
    the built-kernel file, the platform-info file and ``mace_run.config``
    are then pulled from the device into it.

    Each directory is handled on its own: joining them with commas and
    using the result as one filesystem path only works for a single entry.
    """
    compiled_opencl_dir = "/data/local/tmp/mace_run/interior/"
    mace_run_param_file = "mace_run.config"
    device_files = (
        compiled_opencl_dir + cl_built_kernel_file_name,
        compiled_opencl_dir + cl_platform_info_file_name,
        "/data/local/tmp/mace_run/%s" % mace_run_param_file,
    )

    for model_output_dir in model_output_dirs:
        cl_bin_dir = os.path.join(model_output_dir, "opencl_bin")
        if os.path.exists(cl_bin_dir):
            sh.rm("-rf", cl_bin_dir)
        sh.mkdir("-p", cl_bin_dir)
        if abi != "host":
            for device_file in device_files:
                adb_pull(device_file, cl_bin_dir, serialno)


W
wuchenghui 已提交
413
def gen_opencl_binary_code(model_output_dirs,
                           cl_built_kernel_file_name,
                           cl_platform_info_file_name,
                           codegen_path="mace/codegen"):
    """Generate ``<codegen_path>/opencl/opencl_compiled_program.cc``.

    ``opencl_codegen`` receives the output file, the ``opencl_bin``
    sub-directories of ``model_output_dirs`` joined by commas, and the two
    file names.
    """
    opencl_codegen_file = "%s/opencl/opencl_compiled_program.cc" % codegen_path

    cl_bin_dirs_str = ",".join(
        os.path.join(d, "opencl_bin") for d in model_output_dirs)
    opencl_codegen(opencl_codegen_file,
                   cl_bin_dirs_str,
                   cl_built_kernel_file_name,
                   cl_platform_info_file_name)
Y
yejianwu 已提交
427 428


W
wuchenghui 已提交
429
def gen_tuning_param_code(model_output_dirs,
                          codegen_path="mace/codegen"):
    """Generate the tuning-parameter source under ``<codegen_path>/tuning/``.

    The directory is created when missing.  ``tuning_param_codegen``
    receives the comma-joined ``opencl_bin`` sub-directories of
    ``model_output_dirs``, the parameter file name ``mace_run.config``, the
    output path and the variable name ``kTuningParamsData``.
    """
    mace_run_param_file = "mace_run.config"
    cl_bin_dirs_str = ",".join(
        os.path.join(d, "opencl_bin") for d in model_output_dirs)

    tuning_codegen_dir = "%s/tuning/" % codegen_path
    if not os.path.exists(tuning_codegen_dir):
        sh.mkdir("-p", tuning_codegen_dir)

    tuning_param_variable_name = "kTuningParamsData"
    tuning_param_codegen(cl_bin_dirs_str,
                         mace_run_param_file,
                         "%s/tuning_params.cc" % tuning_codegen_dir,
                         tuning_param_variable_name)
Y
yejianwu 已提交
446 447


448
def gen_mace_version(codegen_path="mace/codegen"):
    """Create ``<codegen_path>/version`` and generate ``version.cc`` in it.

    The file is produced by running
    ``mace/tools/git/gen_version_source.sh`` with the output path.
    """
    version_dir = "%s/version" % codegen_path
    sh.mkdir("-p", version_dir)
    sh.bash("mace/tools/git/gen_version_source.sh",
            "%s/version.cc" % version_dir)

453

L
liuqi 已提交
454
def gen_compiled_opencl_source(codegen_path="mace/codegen"):
    """Create ``<codegen_path>/opencl`` and run ``opencl_codegen`` there.

    ``opencl_codegen`` is called with only the output file
    ``opencl_compiled_program.cc``.
    """
    opencl_codegen_file = "%s/opencl/opencl_compiled_program.cc" % codegen_path
    sh.mkdir("-p", "%s/opencl" % codegen_path)
    opencl_codegen(opencl_codegen_file)
L
Liangliang He 已提交
458

L
liuqi 已提交
459

Y
yejianwu 已提交
460 461 462 463 464 465 466 467 468 469 470 471 472
def gen_model_code(model_codegen_dir,
                   platform,
                   model_file_path,
                   weight_file_path,
                   model_sha256_checksum,
                   input_nodes,
                   output_nodes,
                   runtime,
                   model_tag,
                   input_shapes,
                   dsp_mode,
                   embed_model_data,
                   fast_conv,
                   obfuscate,
                   model_output_dir,
                   model_load_type):
    """Build the converter tool and run it to generate the model code.

    ``model_codegen_dir`` is removed and recreated.  The converter is then
    run with one command-line flag per argument and writes
    ``<model_codegen_dir>/model.cc`` and
    ``<model_output_dir>/<model_tag>.pb``.  Converter output is echoed while
    it runs; nothing is returned.
    """
    print("* Genearte model code")
    bazel_build_common("//mace/python/tools:converter")

    if os.path.exists(model_codegen_dir):
        sh.rm("-rf", model_codegen_dir)
    sh.mkdir("-p", model_codegen_dir)

    stdout_buff = []
    process_output = make_output_processor(stdout_buff)
    p = sh.python("bazel-bin/mace/python/tools/converter",
                  "-u",
                  "--platform=%s" % platform,
                  "--model_file=%s" % model_file_path,
                  "--weight_file=%s" % weight_file_path,
                  "--model_checksum=%s" % model_sha256_checksum,
                  "--input_node=%s" % input_nodes,
                  "--output_node=%s" % output_nodes,
                  "--runtime=%s" % runtime,
                  "--template=%s" % "mace/python/tools",
                  "--model_tag=%s" % model_tag,
                  "--input_shape=%s" % input_shapes,
                  "--dsp_mode=%s" % dsp_mode,
                  "--embed_model_data=%s" % embed_model_data,
                  "--winograd=%s" % fast_conv,
                  "--obfuscate=%s" % obfuscate,
                  "--codegen_output=%s/model.cc" % model_codegen_dir,
                  "--pb_output=%s/%s.pb" % (model_output_dir, model_tag),
                  "--model_load_type=%s" % model_load_type,
                  _out=process_output,
                  _bg=True,
                  _err_to_out=True)
    p.wait()
    print("Model code gen done!\n")


def gen_random_input(model_output_dir,
                     input_nodes,
                     input_shapes,
                     input_files,
                     input_file_name="model_input"):
    """Generate model input files, then overlay user-supplied ones.

    Existing per-node input files in ``model_output_dir`` are removed and
    ``generate_input_data`` is called to produce new ones.  Afterwards each
    non-``None`` entry of ``input_files`` replaces the file of the input
    node at the same position: ``http(s)://`` entries are downloaded,
    anything else is copied.

    Raises:
        Exception: if the number of input files differs from the number of
            input nodes.
    """
    for input_name in input_nodes:
        stale_path = "%s/%s" % (
            model_output_dir,
            common.formatted_file_name(input_file_name, input_name))
        if os.path.exists(stale_path):
            sh.rm(stale_path)
    generate_input_data("%s/%s" % (model_output_dir, input_file_name),
                        ",".join(input_nodes),
                        ":".join(input_shapes))

    # A single non-list value (including None) is treated as one entry.
    if isinstance(input_files, list):
        input_file_list = list(input_files)
    else:
        input_file_list = [input_files]
    if not input_file_list:
        return

    if isinstance(input_nodes, list):
        input_name_list = list(input_nodes)
    else:
        input_name_list = [input_nodes]
    if len(input_file_list) != len(input_name_list):
        raise Exception('If input_files set, the input files should '
                        'match the input names.')

    for input_file, input_name in zip(input_file_list, input_name_list):
        if input_file is None:
            continue
        dst_input_file = model_output_dir + '/' + \
            common.formatted_file_name(input_file_name, input_name)
        if input_file.startswith(("http://", "https://")):
            # NOTE: Python 2 API; Python 3 moved this function to
            # urllib.request.urlretrieve.
            urllib.urlretrieve(input_file, dst_input_file)
        else:
            sh.cp("-f", input_file, dst_input_file)
Y
yejianwu 已提交
551 552 553 554


def update_mace_run_lib(model_output_dir,
                        model_tag,
                        embed_model_data):
    """Copy the built ``mace_run`` and model artifacts to ``model_output_dir``.

    Any existing ``mace_run`` in the output directory is removed first.  The
    model's ``.data`` file is copied only when ``embed_model_data == 0``;
    the model's ``.h`` file is always copied.
    """
    mace_run_filepath = model_output_dir + "/mace_run"
    if os.path.exists(mace_run_filepath):
        sh.rm("-rf", mace_run_filepath)
    sh.cp("-f", "bazel-bin/mace/tools/validation/mace_run", model_output_dir)

    if embed_model_data == 0:
        sh.cp("-f", "mace/codegen/models/%s/%s.data" % (model_tag, model_tag),
              model_output_dir)

    sh.cp("-f", "mace/codegen/models/%s/%s.h" % (model_tag, model_tag),
          model_output_dir)


569 570 571 572
def create_internal_storage_dir(serialno, phone_data_dir):
    """Create ``<phone_data_dir>/interior/`` on the device and return it."""
    interior_dir = "%s/interior/" % phone_data_dir
    mkdir_args = ("-s", serialno, "shell", "mkdir", "-p", interior_dir)
    sh.adb(*mkdir_args)
    return interior_dir
573 574


W
wuchenghui 已提交
575 576
def tuning_run(abi,
               serialno,
               vlog_level,
               embed_model_data,
               model_output_dir,
               input_nodes,
               output_nodes,
               input_shapes,
               output_shapes,
               mace_model_dir,
               model_tag,
               device_type,
               running_round,
               restart_round,
               limit_opencl_kernel_time,
               tuning,
               out_of_range_check,
               phone_data_dir,
               omp_num_threads=-1,
               cpu_affinity_policy=1,
               gpu_perf_hint=3,
               gpu_priority_hint=3,
               valgrind=False,
               valgrind_path="/data/local/tmp/valgrind",
               valgrind_args="",
               input_file_name="model_input",
               output_file_name="model_out"):
    """Run ``mace_run`` for a model on the host or on an Android device.

    With ``abi == "host"`` the binary in ``model_output_dir`` is started
    through ``env`` as a subprocess; the return value is its stderr
    followed by its stdout.

    Otherwise the input files, ``mace_run``, the optional ``.data`` and
    ``.pb`` files and ``libhexagon_controller.so`` are pushed to
    ``phone_data_dir`` and the binary is executed through ``adb shell``
    (under valgrind when ``valgrind`` is true); the return value is the
    combined output that was echoed while it ran.
    """
    print("* Run '%s' with round=%s, restart_round=%s, tuning=%s, "
          "out_of_range_check=%s, omp_num_threads=%s, cpu_affinity_policy=%s, "
          "gpu_perf_hint=%s, gpu_priority_hint=%s" %
          (model_tag, running_round, restart_round, str(tuning),
           str(out_of_range_check), omp_num_threads, cpu_affinity_policy,
           gpu_perf_hint, gpu_priority_hint))

    def mace_run_command(work_dir, mace_model_path):
        # mace_run binary plus its flags; files are resolved in work_dir.
        return [
            "%s/mace_run" % work_dir,
            "--model_name=%s" % model_tag,
            "--input_node=%s" % ",".join(input_nodes),
            "--output_node=%s" % ",".join(output_nodes),
            "--input_shape=%s" % ":".join(input_shapes),
            "--output_shape=%s" % ":".join(output_shapes),
            "--input_file=%s/%s" % (work_dir, input_file_name),
            "--output_file=%s/%s" % (work_dir, output_file_name),
            "--model_data_file=%s/%s.data" % (work_dir, model_tag),
            "--device=%s" % device_type,
            "--round=%s" % running_round,
            "--restart_round=%s" % restart_round,
            "--omp_num_threads=%s" % omp_num_threads,
            "--cpu_affinity_policy=%s" % cpu_affinity_policy,
            "--gpu_perf_hint=%s" % gpu_perf_hint,
            "--gpu_priority_hint=%s" % gpu_priority_hint,
            "--model_file=%s" % mace_model_path,
        ]

    if abi == "host":
        if mace_model_dir:
            mace_model_path = "%s/%s.pb" % (mace_model_dir, model_tag)
        else:
            mace_model_path = ""
        host_cmd = [
            "env",
            "MACE_CPP_MIN_VLOG_LEVEL=%s" % vlog_level,
        ] + mace_run_command(model_output_dir, mace_model_path)
        p = subprocess.Popen(
            host_cmd,
            stderr=subprocess.PIPE,
            stdout=subprocess.PIPE)
        out, err = p.communicate()
        stdout = err + out
        # Function-call form, as used by every other print in this file.
        print(stdout)
        print("Running finished!\n")
        return stdout

    sh.adb("-s", serialno, "shell", "mkdir", "-p", phone_data_dir)
    internal_storage_dir = create_internal_storage_dir(
        serialno, phone_data_dir)

    for input_name in input_nodes:
        formatted_name = common.formatted_file_name(input_file_name,
                                                    input_name)
        adb_push("%s/%s" % (model_output_dir, formatted_name),
                 phone_data_dir, serialno)
    adb_push("%s/mace_run" % model_output_dir, phone_data_dir,
             serialno)
    if not embed_model_data:
        adb_push("%s/%s.data" % (model_output_dir, model_tag),
                 phone_data_dir, serialno)
    adb_push("mace/third_party/nnlib/libhexagon_controller.so",
             phone_data_dir, serialno)

    if mace_model_dir:
        mace_model_path = "%s/%s.pb" % (phone_data_dir, model_tag)
        adb_push("%s/%s.pb" % (mace_model_dir, model_tag),
                 mace_model_path,
                 serialno)
    else:
        mace_model_path = ""

    stdout_buff = []
    process_output = make_output_processor(stdout_buff)
    # Environment assignments that prefix the device-side command line.
    adb_cmd = [
        "LD_LIBRARY_PATH=%s" % phone_data_dir,
        "MACE_TUNING=%s" % int(tuning),
        "MACE_OUT_OF_RANGE_CHECK=%s" % int(out_of_range_check),
        "MACE_CPP_MIN_VLOG_LEVEL=%s" % vlog_level,
        "MACE_RUN_PARAMETER_PATH=%s/mace_run.config" % phone_data_dir,
        "MACE_INTERNAL_STORAGE_PATH=%s" % internal_storage_dir,
        "MACE_LIMIT_OPENCL_KERNEL_TIME=%s" % limit_opencl_kernel_time,
    ]
    if valgrind:
        adb_cmd.extend([
            "VALGRIND_LIB=%s" % valgrind_path + "/lib/valgrind",
            valgrind_path + "/bin/valgrind",
            valgrind_args
        ])
    adb_cmd.extend(mace_run_command(phone_data_dir, mace_model_path))
    adb_cmd = ' '.join(adb_cmd)
    p = sh.adb(
        "-s",
        serialno,
        "shell",
        adb_cmd,
        _out=process_output,
        _bg=True,
        _err_to_out=True)
    p.wait()
    print("Running finished!\n")
    return "".join(stdout_buff)
Y
yejianwu 已提交
716 717


W
wuchenghui 已提交
718 719
def validate_model(abi,
                   serialno,
                   model_file_path,
                   weight_file_path,
                   platform,
                   device_type,
                   input_nodes,
                   output_nodes,
                   input_shapes,
                   output_shapes,
                   model_output_dir,
                   phone_data_dir,
                   caffe_env,
                   input_file_name="model_input",
                   output_file_name="model_out"):
    """Compare the MACE outputs against the original framework's outputs.

    For any ``abi`` other than "host", every output file is first pulled
    from ``phone_data_dir`` on device ``serialno`` into
    ``model_output_dir`` (a stale local copy is removed beforehand).

    Validation then depends on ``platform``:
      * "tensorflow": ``validate`` is called in-process with an empty
        weight file path.
      * "caffe" with ``caffe_env`` LOCAL: ``validate`` is called
        in-process with ``weight_file_path``; a missing ``caffe`` module
        is only logged, the call is still attempted.
      * "caffe" with ``caffe_env`` DOCKER: inputs, outputs, model files
        and the validation scripts are copied into the
        "mace_caffe_validator" container and ``validate.py`` runs there.
    Any other ``platform`` value performs no validation.

    Node lists are joined with "," and shape lists with ":" before being
    handed to the validator.
    """
    print("* Validate with %s" % platform)

    def validate_in_process(weights):
        # Run the validator inside the current interpreter.
        validate(platform, model_file_path, weights,
                 "%s/%s" % (model_output_dir, input_file_name),
                 "%s/%s" % (model_output_dir, output_file_name),
                 device_type,
                 ":".join(input_shapes), ":".join(output_shapes),
                 ",".join(input_nodes), ",".join(output_nodes))

    def validate_in_docker():
        # Run the validator inside the caffe docker container, building
        # the image / (re)creating the container when required.
        image = "mace-caffe:latest"
        container = "mace_caffe_validator"
        container_dest = "%s:/mace" % container
        name_filter = "name=%s" % container

        if not sh.docker("images", "-q", image):
            print("Build caffe docker")
            sh.docker("build", "-t", image, "mace/third_party/caffe")

        container_id = sh.docker("ps", "-qa", "-f", name_filter)
        # A container that exists but is not running is discarded so that
        # a fresh one gets started below.
        if container_id and not sh.docker("ps", "-qa", "--filter",
                                          "status=running", "-f",
                                          name_filter):
            sh.docker("rm", "-f", container)
            container_id = ""
        if not container_id:
            print("Run caffe container")
            sh.docker("run", "-d", "-it", "--name", container, image,
                      "/bin/bash")

        for node in input_nodes:
            input_file = common.formatted_file_name(input_file_name, node)
            sh.docker("cp", "%s/%s" % (model_output_dir, input_file),
                      container_dest)

        for node in output_nodes:
            output_file = common.formatted_file_name(output_file_name, node)
            sh.docker("cp", "%s/%s" % (model_output_dir, output_file),
                      container_dest)

        model_file_name = os.path.basename(model_file_path)
        weight_file_name = os.path.basename(weight_file_path)
        for source in ("tools/common.py", "tools/validate.py",
                       model_file_path, weight_file_path):
            sh.docker("cp", source, container_dest)

        captured = []
        running = sh.docker(
            "exec",
            container,
            "python",
            "-u",
            "/mace/validate.py",
            "--platform=caffe",
            "--model_file=/mace/%s" % model_file_name,
            "--weight_file=/mace/%s" % weight_file_name,
            "--input_file=/mace/%s" % input_file_name,
            "--mace_out_file=/mace/%s" % output_file_name,
            "--device_type=%s" % device_type,
            "--input_node=%s" % ",".join(input_nodes),
            "--output_node=%s" % ",".join(output_nodes),
            "--input_shape=%s" % ":".join(input_shapes),
            "--output_shape=%s" % ":".join(output_shapes),
            _out=make_output_processor(captured),
            _bg=True,
            _err_to_out=True)
        running.wait()

    if abi != "host":
        # Fetch the outputs produced on the device.
        for node in output_nodes:
            pulled_name = common.formatted_file_name(output_file_name, node)
            local_copy = "%s/%s" % (model_output_dir, pulled_name)
            if os.path.exists(local_copy):
                sh.rm("-rf", local_copy)
            adb_pull("%s/%s" % (phone_data_dir, pulled_name),
                     model_output_dir, serialno)

    if platform == "tensorflow":
        validate_in_process("")
    elif platform == "caffe":
        if caffe_env == common.CaffeEnvType.LOCAL:
            import imp
            try:
                imp.find_module('caffe')
            except ImportError:
                logger.error('There is no caffe python module.')
            validate_in_process(weight_file_path)
        elif caffe_env == common.CaffeEnvType.DOCKER:
            validate_in_docker()

    print("Validation done!\n")


def build_production_code(abi):
    """Build the generated-code Bazel targets for ``abi``.

    The OpenCL and tuning-parameter targets are always built; the
    generated-models target is built in addition when ``abi`` is 'host'.
    """
    targets = [
        "//mace/codegen:generated_opencl",
        "//mace/codegen:generated_tuning_params",
    ]
    if abi == 'host':
        targets.append("//mace/codegen:generated_models")
    for target in targets:
        bazel_build(target, abi=abi)
Y
yejianwu 已提交
847 848 849 850 851 852 853


def merge_libs(target_soc,
               abi,
               project_name,
               libmace_output_dir,
               model_output_dirs,
               mace_model_dirs_kv,
               hexagon_mode,
               embed_model_data):
    """Collect headers/data and merge the static libs into one archive.

    Under ``<libmace_output_dir>/<project_name>`` this creates (when
    missing) the ``<abi>/``, ``include/mace/public`` and ``data``
    directories, copies the public and engine headers, the per-model
    headers, the ``*.data`` files (only when ``embed_model_data`` is
    false), the ``<model_name>.pb`` files listed in
    ``mace_model_dirs_kv`` and, when ``hexagon_mode`` is set, the hexagon
    controller library.

    The archive itself is produced by feeding an MRI script to the
    NDK's aarch64 ``ar -M``. For the "host" abi it is named
    ``libmace_<project_name>.a`` and contains the ``.pic.a`` codegen
    libraries; otherwise it is named
    ``libmace_<project_name>.<target_soc>.a`` and also contains the
    core, kernels, utils and ops libraries.

    Requires the ``ANDROID_NDK_HOME`` environment variable (``KeyError``
    otherwise).
    """
    print("* Merge mace lib")
    project_output_dir = "%s/%s" % (libmace_output_dir, project_name)
    header_dir = "%s/include/mace/public" % project_output_dir
    data_dir = "%s/data" % project_output_dir
    bin_dir = "%s/%s/" % (project_output_dir, abi)

    def ensure_dir(path):
        # Create ``path`` (and parents) unless it already exists.
        if not os.path.exists(path):
            sh.mkdir("-p", path)

    ensure_dir(bin_dir)
    ensure_dir(header_dir)
    sh.cp("-f", glob.glob("mace/public/*.h"), header_dir)
    ensure_dir(data_dir)
    if hexagon_mode:
        sh.cp("-f", "mace/third_party/nnlib/libhexagon_controller.so",
              bin_dir)

    sh.cp("-f", glob.glob("mace/codegen/engine/*.h"), header_dir)

    # Pick the archive name and the member libraries for the MRI script.
    if abi == "host":
        archive = "%s/libmace_%s.a" % (bin_dir, project_name)
        members = [
            "bazel-bin/mace/codegen/libgenerated_opencl.pic.a",
            "bazel-bin/mace/codegen/libgenerated_tuning_params.pic.a",
            "bazel-bin/mace/codegen/libgenerated_models.pic.a",
        ]
    else:
        archive = "%s/libmace_%s.%s.a" % (bin_dir, project_name, target_soc)
        members = [
            "bazel-bin/mace/codegen/libgenerated_opencl.a",
            "bazel-bin/mace/codegen/libgenerated_tuning_params.a",
            "bazel-bin/mace/codegen/libgenerated_version.a",
            "bazel-bin/mace/codegen/libgenerated_models.a",
            "bazel-bin/mace/core/libcore.a",
            "bazel-bin/mace/kernels/libkernels.a",
            "bazel-bin/mace/utils/libutils.a",
            "bazel-bin/mace/utils/libutils_prod.a",
            "bazel-bin/mace/ops/libops.lo",
        ]
    script_lines = ["create %s" % archive]
    script_lines.extend("addlib %s" % member for member in members)

    for output_dir in model_output_dirs:
        if not embed_model_data:
            sh.cp("-f", glob.glob("%s/*.data" % output_dir), data_dir)
        sh.cp("-f", glob.glob("%s/*.h" % output_dir), header_dir)

    for model_name in mace_model_dirs_kv:
        sh.cp("-f", "%s/%s.pb" % (mace_model_dirs_kv[model_name], model_name),
              data_dir)

    script_lines.extend(["save", "end"])
    # Every MRI command, including the last one, is newline-terminated.
    mri_stream = "\n".join(script_lines) + "\n"

    ar_path = ("%s/toolchains/aarch64-linux-android-4.9/prebuilt/"
               "linux-x86_64/bin/aarch64-linux-android-ar"
               % os.environ["ANDROID_NDK_HOME"])
    sh.Command(ar_path)("-M", _in=mri_stream)

    print("Libs merged!\n")


def packaging_lib(libmace_output_dir, project_name):
    """Pack a project's output directory into ``libmace_<project>.tar.gz``.

    The archive is written to
    ``<libmace_output_dir>/<project_name>/libmace_<project_name>.tar.gz``
    and replaces any previous one. Every non-hidden entry of the project
    directory is added recursively, except entries whose name contains
    "build" or ".tar.gz". Members are stored under the project directory
    path (leading "/" stripped), as ``tar`` would store them.

    The previous implementation piped ``ls`` through ``xargs -I {} tar
    cvzf``, which runs ``tar`` once per entry and therefore recreated the
    archive each time, keeping only the last entry; it also failed when
    the filter left nothing to pack. All entries now go into one archive.

    Args:
        libmace_output_dir: directory that contains the project directory.
        project_name: name of the project directory / archive suffix.
    """
    # Local imports: the stdlib modules below are only needed here.
    import shutil
    import tarfile

    print("* Package libs for %s" % project_name)
    tar_package_name = "libmace_%s.tar.gz" % project_name
    project_dir = "%s/%s" % (libmace_output_dir, project_name)
    tar_package_path = "%s/%s" % (project_dir, tar_package_name)
    # Equivalent of ``rm -rf``: drop whatever currently occupies the path.
    if os.path.isdir(tar_package_path) and \
            not os.path.islink(tar_package_path):
        shutil.rmtree(tar_package_path)
    elif os.path.lexists(tar_package_path):
        os.remove(tar_package_path)

    print("Start packaging '%s' libs into %s" % (project_name,
                                                 tar_package_path))
    # Listed before the archive is created, so it can never contain itself.
    entries = sorted(
        name for name in os.listdir(project_dir)
        if not name.startswith(".")
        and "build" not in name
        and ".tar.gz" not in name)
    with tarfile.open(tar_package_path, "w:gz") as archive:
        for name in entries:
            archive.add("%s/%s" % (project_dir, name))
    print("Packaging Done!\n")


969 970 971 972 973 974 975 976 977 978 979 980 981 982 983 984 985 986 987 988 989 990
def build_benchmark_model(abi,
                          embed_model_data,
                          model_output_dir,
                          model_tag,
                          hexagon_mode):
    """Build ``benchmark_model`` with Bazel and copy it to the output dir.

    A previously built binary in ``model_output_dir`` is removed first.
    When ``embed_model_data`` is false the model's ``.data`` file is
    copied from ``mace/codegen/models/<model_tag>/`` next to the binary.
    """
    stale_binary = "%s/benchmark_model" % model_output_dir
    if os.path.exists(stale_binary):
        sh.rm("-rf", stale_binary)

    if not embed_model_data:
        model_data = "mace/codegen/models/%s/%s.data" % (model_tag, model_tag)
        sh.cp("-f", model_data, model_output_dir)

    target = "//mace/benchmark:benchmark_model"
    bazel_build(target,
                abi=abi,
                production_mode=True,
                hexagon_mode=hexagon_mode)

    built_binary = "/".join(bazel_target_to_bin(target))
    sh.cp("-f", built_binary, model_output_dir)


W
wuchenghui 已提交
991 992
def benchmark_model(abi,
                    serialno,
                    vlog_level,
                    embed_model_data,
                    model_output_dir,
                    mace_model_dir,
                    input_nodes,
                    output_nodes,
                    input_shapes,
                    output_shapes,
                    model_tag,
                    device_type,
                    phone_data_dir,
                    omp_num_threads=-1,
                    cpu_affinity_policy=1,
                    gpu_perf_hint=3,
                    gpu_priority_hint=3,
                    input_file_name="model_input"):
    """Run the ``benchmark_model`` binary on the host or on a device.

    With ``abi == "host"`` the binary in ``model_output_dir`` is started
    through ``subprocess``; its output is not captured, so the returned
    string is empty in that case.

    Otherwise the inputs, the binary, the ``.data`` file (unless
    ``embed_model_data``) and the ``.pb`` model (when ``mace_model_dir``
    is set) are pushed to ``phone_data_dir`` on device ``serialno`` and
    the binary is run via ``adb shell``. Each output line is printed and
    collected.

    Returns:
        The collected output of the device run as one string ("" for a
        host run).
    """
    print("* Benchmark for %s" % model_tag)

    captured = []
    on_output = make_output_processor(captured)

    def benchmark_flags(data_dir, model_file):
        # Command-line flags shared by the host and the device run; only
        # the directory holding input/data files and the model path vary.
        return [
            "--model_name=%s" % model_tag,
            "--input_node=%s" % ",".join(input_nodes),
            "--output_node=%s" % ",".join(output_nodes),
            "--input_shape=%s" % ":".join(input_shapes),
            "--output_shape=%s" % ":".join(output_shapes),
            "--input_file=%s/%s" % (data_dir, input_file_name),
            "--model_data_file=%s/%s.data" % (data_dir, model_tag),
            "--device=%s" % device_type,
            "--omp_num_threads=%s" % omp_num_threads,
            "--cpu_affinity_policy=%s" % cpu_affinity_policy,
            "--gpu_perf_hint=%s" % gpu_perf_hint,
            "--gpu_priority_hint=%s" % gpu_priority_hint,
            "--model_file=%s" % model_file,
        ]

    if abi == "host":
        mace_model_path = ""
        if mace_model_dir:
            mace_model_path = "%s/%s.pb" % (mace_model_dir, model_tag)
        host_cmd = [
            "env",
            "MACE_CPP_MIN_VLOG_LEVEL=%s" % vlog_level,
            "%s/benchmark_model" % model_output_dir,
        ]
        host_cmd += benchmark_flags(model_output_dir, mace_model_path)
        proc = subprocess.Popen(host_cmd)
        proc.wait()
    else:
        sh.adb("-s", serialno, "shell", "mkdir", "-p", phone_data_dir)
        internal_storage_dir = create_internal_storage_dir(
            serialno, phone_data_dir)

        for node in input_nodes:
            input_file = common.formatted_file_name(input_file_name, node)
            adb_push("%s/%s" % (model_output_dir, input_file),
                     phone_data_dir, serialno)
        adb_push("%s/benchmark_model" % model_output_dir, phone_data_dir,
                 serialno)
        if not embed_model_data:
            adb_push("%s/%s.data" % (model_output_dir, model_tag),
                     phone_data_dir, serialno)

        mace_model_path = ""
        if mace_model_dir:
            mace_model_path = "%s/%s.pb" % (phone_data_dir, model_tag)
            adb_push("%s/%s.pb" % (mace_model_dir, model_tag),
                     mace_model_path,
                     serialno)

        adb_args = [
            "-s",
            serialno,
            "shell",
            "LD_LIBRARY_PATH=%s" % phone_data_dir,
            "MACE_CPP_MIN_VLOG_LEVEL=%s" % vlog_level,
            "MACE_RUN_PARAMETER_PATH=%s/mace_run.config" % phone_data_dir,
            "MACE_INTERNAL_STORAGE_PATH=%s" % internal_storage_dir,
            "MACE_OPENCL_PROFILING=1",
            "%s/benchmark_model" % phone_data_dir,
        ]
        adb_args += benchmark_flags(phone_data_dir, mace_model_path)
        proc = sh.adb(*adb_args,
                      _out=on_output,
                      _bg=True,
                      _err_to_out=True)
        proc.wait()

    print("Benchmark done!\n")
    return "".join(captured)


W
wuchenghui 已提交
1094 1095
def build_run_throughput_test(abi,
                              serialno,
                              vlog_level,
                              run_seconds,
                              merged_lib_file,
                              model_input_dir,
                              embed_model_data,
                              input_nodes,
                              output_nodes,
                              input_shapes,
                              output_shapes,
                              cpu_model_tag,
                              gpu_model_tag,
                              dsp_model_tag,
                              phone_data_dir,
                              strip="always",
                              input_file_name="model_input"):
    """Build ``model_throughput_test`` and run it on a device.

    ``merged_lib_file`` is temporarily copied to
    ``mace/benchmark/libmace_merged.a`` for the Bazel build and removed
    afterwards (also when the build fails). The input file, the test
    binary, the model ``.data`` files (unless ``embed_model_data``) and
    the hexagon controller library are pushed to ``phone_data_dir`` on
    device ``serialno`` before the test is started via ``adb shell``.

    Fixes over the previous version:
      * the ``.data`` path format string had two placeholders but one
        argument and always raised ``TypeError``;
      * each ``--copt`` model-tag flag is now its own bazel argument
        instead of one space-joined string (or an empty argument);
      * ``.data`` files are pushed only for the model tags that are set.

    Args:
        cpu_model_tag, gpu_model_tag, dsp_model_tag: model tags; a falsy
            tag adds no build flag and pushes no data file.
        strip: value passed to bazel's ``--strip`` option.
        run_seconds: forwarded as ``--run_seconds``.
    """
    print("* Build and run throughput_test")

    model_tags = (
        ("CPU", cpu_model_tag),
        ("GPU", gpu_model_tag),
        ("DSP", dsp_model_tag),
    )
    # One argv entry per define; sh passes every argument to bazel
    # verbatim, so flags must not be glued together with spaces.
    model_tag_build_flags = [
        "--copt=-DMACE_%s_MODEL_TAG=%s" % (device, tag)
        for device, tag in model_tags if tag
    ]

    stdout_buff = []
    process_output = make_output_processor(stdout_buff)
    bazel_args = [
        "build",
        "-c",
        "opt",
        "--strip",
        strip,
        "--verbose_failures",
        "//mace/benchmark:model_throughput_test",
        "--crosstool_top=//external:android/crosstool",
        "--host_crosstool_top=@bazel_tools//tools/cpp:toolchain",
        "--cpu=%s" % abi,
        "--copt=-std=c++11",
        "--copt=-D_GLIBCXX_USE_C99_MATH_TR1",
        "--copt=-Werror=return-type",
        "--copt=-O3",
        "--define",
        "neon=true",
        "--define",
        "openmp=true",
    ] + model_tag_build_flags

    merged_lib_copy = "mace/benchmark/libmace_merged.a"
    sh.cp("-f", merged_lib_file, merged_lib_copy)
    try:
        p = sh.bazel(*bazel_args,
                     _out=process_output,
                     _bg=True,
                     _err_to_out=True)
        p.wait()
    finally:
        # Do not leave the temporary copy in the source tree on failure.
        sh.rm(merged_lib_copy)

    sh.adb("-s",
           serialno,
           "shell",
           "mkdir",
           "-p",
           phone_data_dir)
    # NOTE(review): other runners in this file name input files with
    # common.formatted_file_name() per input node; this one joins all
    # node names with "," - confirm which naming the generator produces.
    adb_push("%s/%s_%s" % (model_input_dir, input_file_name,
                           ",".join(input_nodes)),
             phone_data_dir,
             serialno)
    adb_push("bazel-bin/mace/benchmark/model_throughput_test",
             phone_data_dir,
             serialno)
    if not embed_model_data:
        # Same location build_benchmark_model() copies .data files from.
        for _, tag in model_tags:
            if tag:
                adb_push("mace/codegen/models/%s/%s.data" % (tag, tag),
                         phone_data_dir,
                         serialno)
    adb_push("mace/third_party/nnlib/libhexagon_controller.so",
             phone_data_dir,
             serialno)

    p = sh.adb(
        "-s",
        serialno,
        "shell",
        "LD_LIBRARY_PATH=%s" % phone_data_dir,
        "MACE_CPP_MIN_VLOG_LEVEL=%s" % vlog_level,
        "MACE_RUN_PARAMETER_PATH=%s/mace_run.config" % phone_data_dir,
        "%s/model_throughput_test" % phone_data_dir,
        "--input_node=%s" % ",".join(input_nodes),
        "--output_node=%s" % ",".join(output_nodes),
        "--input_shape=%s" % ":".join(input_shapes),
        "--output_shape=%s" % ":".join(output_shapes),
        "--input_file=%s/%s" % (phone_data_dir, input_file_name),
        "--cpu_model_data_file=%s/%s.data" % (phone_data_dir,
                                              cpu_model_tag),
        "--gpu_model_data_file=%s/%s.data" % (phone_data_dir,
                                              gpu_model_tag),
        "--dsp_model_data_file=%s/%s.data" % (phone_data_dir,
                                              dsp_model_tag),
        "--run_seconds=%s" % run_seconds,
        _out=process_output,
        _bg=True,
        _err_to_out=True)
    p.wait()

    print("throughput_test done!\n")


################################
# falcon
################################
def falcon_tags(tags_dict):
    """Format ``tags_dict`` as a falcon tag string.

    Each item becomes ``key=value`` and the items are joined with ","
    in the dict's iteration order; an empty dict gives "".

    Uses ``items()`` rather than the Python 2 only ``iteritems()`` so the
    helper works on both Python 2 and Python 3.
    """
    return ",".join("%s=%s" % (k, v) for k, v in tags_dict.items())
L
Liangliang He 已提交
1220

1221

L
Liangliang He 已提交
1222 1223 1224 1225 1226 1227 1228 1229 1230 1231
def falcon_push_metrics(metrics, endpoint="mace_dev", tags=None):
    """Send ``metrics`` to the falcon transfer server as GAUGE counters.

    Args:
        metrics: mapping of metric name to value; one falcon record is
            sent per item.
        endpoint: falcon endpoint the records are reported under.
        tags: optional mapping of tag name to value, attached to every
            record; ``None`` (the default) means no tags.

    All records share one timestamp (taken once, in whole seconds) and a
    step of 600.
    """
    cli = falcon_cli.FalconCli.connect(
        server="transfer.falcon.miliao.srv", port=8433, debug=False)
    ts = int(time.time())
    # The tag string is identical for every record; format it once.
    tag_string = falcon_tags(tags or {})
    # items() instead of the Python 2 only iteritems().
    falcon_metrics = [{
        "endpoint": endpoint,
        "metric": key,
        "tags": tag_string,
        "timestamp": ts,
        "value": value,
        "step": 600,
        "counterType": "GAUGE"
    } for key, value in metrics.items()]
    cli.update(falcon_metrics)