There is a config function registered in the C++ thread-pool runtime:
// if excluding worker 0 and using master to run task 0
#ifndef _LIBCPP_SGX_CONFIG
bool exclude_worker0_{true};
#else
bool exclude_worker0_{false};
#endif
std::vector<std::unique_ptr<SpscTaskQueue> > queues_;
std::unique_ptr<tvm::runtime::threading::ThreadGroup> threads_;
};
// Packed function "runtime.config_threadpool": reconfigures the worker
// thread pool of the current thread's ThreadPool instance.
//   args[0]: affinity mode, cast to ThreadGroup::AffinityMode
//            (per the Python examples below, 1 selects big cores and
//            -1 selects small cores — confirm against AffinityMode enum).
//   args[1]: number of worker threads to use.
// Returns nothing; *rv is left untouched.
TVM_REGISTER_GLOBAL("runtime.config_threadpool")
.set_body([](TVMArgs args, TVMRetValue* rv) {
  // Two-step cast: TVMArgValue converts to int, then to the enum.
  // (No backslash line-continuations needed outside of a macro body.)
  threading::ThreadGroup::AffinityMode mode =
      static_cast<threading::ThreadGroup::AffinityMode>(static_cast<int>(args[0]));
  int nthreads = args[1];
  ThreadPool::ThreadLocal()->UpdateWorkerConfiguration(mode, nthreads);
});
} // namespace runtime
From the Python side, we can set this as follows:
# Connect to the RPC tracker and request a session on the target device.
tracker_conn = tvm.rpc.connect_tracker(args.host, args.port)
session = tracker_conn.request(args.rpc_key)
# Look up the thread-pool configuration function registered on the remote.
config_func = session.get_function('runtime.config_threadpool')
# First argument: affinity mode (1 = big cores, -1 = small cores).
# Second argument: number of worker threads.
config_func(1, 1)   # use 1 big core
config_func(1, 2)   # use 2 big cores
config_func(-1, 1)  # use 1 small core
config_func(-1, 2)  # use 2 small cores
For auto-tuning, there is currently no built-in interface for this; you can add the following code after this line.
ref_input: List of numpy array
Reference input for correctness check
ref_output: List of numpy array
Reference output for correctness check
Returns
-------
results: List of MeasureResult
The results for input_pack
"""
remote = request_remote(key, (host, port), priority, session_timeout)
res = _measure_common(input_pack, build_func, build_kwargs, number, repeat,
ref_input, ref_output,
remote)
return res
fmeasure.pack_size = pack_size
fmeasure.rpc_info = {"key": key, "host": host, "port": port}
return fmeasure
3 Likes