Skip to content

Commit

Permalink
[Hexagon] Initial support for Hexagon codegen (apache#6261)
Browse files Browse the repository at this point in the history
* [Hexagon] Initial support for Hexagon codegen

This commit does not support parallel execution or prefetch.
LLVM 7 or later is required.

* Set native_vector_bits_ based on target features

* Initialize hvx_bytes

* Remove commented out line
  • Loading branch information
Krzysztof Parzyszek authored and Trevor Morris committed Sep 2, 2020
1 parent 8636845 commit 11e23f9
Show file tree
Hide file tree
Showing 8 changed files with 1,225 additions and 8 deletions.
211 changes: 211 additions & 0 deletions python/tvm/contrib/hexagon.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,211 @@
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.

'''Utility for Hexagon backend'''

import functools as ft
import os
import tvm
import tvm.ir
import tvm.contrib.cc as cc
from .._ffi.registry import register_func


# Linking Hexagon shared libraries.
#
# link_shared(name-of-shared-library, list-of-objects, kw-args)
#
# To use a custom linker, define a function that returns the path to the
# linker, and pass it to 'register_linker':
#
# def custom_linker_path():
# return '/path/to/hexagon/linker'
#
# register_linker(custom_linker_path)
#
# Subsequent calls to 'link_shared' will use the newly registered linker.

hexagon_toolchain_root = os.environ.get('HEXAGON_TOOLCHAIN') or '' # pylint: disable=invalid-name
hexagon_link_master = os.path.join( # pylint: disable=invalid-name
hexagon_toolchain_root, 'bin', 'hexagon-link')

def register_linker(f):
"""Register a function that will return the path to the Hexagon linker."""
return register_func('tvm.contrib.hexagon.hexagon_link', f, True)

@register_func('tvm.contrib.hexagon.hexagon_link')
def hexagon_link():
"""Return path to the Hexagon linker."""
return hexagon_link_master

@register_func('tvm.contrib.hexagon.link_shared')
def link_shared(so_name, objs, **kwargs):
"""Link shared library on Hexagon using the registered Hexagon linker.
Parameters
----------
so_name : str
Name of the shared library file.
objs : list[str,StringImm]
kwargs : additional arguments:
'verbose' - print additional information
Returns
-------
ret_val : int
This function returns 0 at the moment.
"""
# The list of object files can be passed as built-in Python strings,
# or as tvm.tir.StringImm's.
def to_str(s):
if isinstance(s, tvm.tir.StringImm):
return s.value
assert isinstance(s, str), 'argument "' + str(s) + '" should be a string or StrImm'
return s
objs = [to_str(s) for s in objs]

linker = tvm.get_global_func('tvm.contrib.hexagon.hexagon_link')()
if kwargs.get('verbose'):
print('tvm.contrib.hexagon.link_shared:')
print(' Using linker:', linker)
print(' Library name:', so_name)
print(' Object files:', objs)
if not os.access(linker, os.X_OK):
message = 'The linker "' + linker + '" does not exist or is not executable.'
if not os.environ.get('HEXAGON_TOOLCHAIN'):
message += ' The environment variable HEXAGON_TOOLCHAIN is unset. Please export ' + \
'HEXAGON_TOOLCHAIN in your environment, so that ${HEXAGON_TOOLCHAIN}/bin/' + \
'hexagon-link exists.'
else:
message += ' Please verify the value of the HEXAGON_LINKER environment variable ' + \
'(currently set to "' + hexagon_toolchain_root + '").'
raise Exception(message)

libpath = os.path.join(
hexagon_toolchain_root, 'target', 'hexagon', 'lib', 'v66', 'G0')
cc.create_shared(
so_name, objs,
# pylint: disable=bad-whitespace
options = ['-Bdynamic', '-shared', '-export-dynamic',
os.path.join(libpath, 'pic', 'libgcc.so')],
cc = linker)
return 0


### VTCM

vtcm_size = 4*1024*1024 # pylint: disable=invalid-name
@register_func('tvm.info.mem.local.vtcm')
def mem_info_vtcm():
# pylint: disable=bad-whitespace
return tvm.ir.make_node('MemoryInfo',
unit_bits = 8,
max_num_bits = vtcm_size*8,
max_simd_bits = 128*8,
head_address = tvm.runtime.const(100, 'uint32'))

def lower_vtcm_(get_alloc, get_free, def_align, func, mod, ctx): # pylint: disable=unused-argument
"""Generic VTCM allocation
Parameters
----------
get_alloc : function: tir.Allocate, int -> tir.expr (dtype='handle')
The VTCM allocation function. It takes an Allocate statement, and the required
alignment, and returns a pointer to the allocated VTCM buffer.
get_free : function: tir.expr (dtype='handle') -> None
The VTCM deallocation function. It takes the address of the allocated buffer
and frees it. It returns no value.
def_align : int
The default alignment that will be passed to the allocation function, if the
program does not specify the alignment via a 'storage_alignment' attribute.
func : tir.PrimFunc
mod : tvm.IRModule
ctx : transform.PassContext
Returns
-------
stmt : tvm.stmt
Transformed function body.
"""

vtcm_buffers = []
alignments = {}

def buf_align(var):
"""Determine the alignment of the buffer with variable 'var'."""
if var in alignments and alignments[var]:
return alignments[var][-1]
return def_align

def visit(stmt):
"""Collect information about VTCM buffers and their alignments."""
if isinstance(stmt, tvm.tir.AttrStmt):
if stmt.attr_key == 'storage_scope' and stmt.value == 'local.vtcm':
vtcm_buffers.append(stmt.node)
elif stmt.attr_key == 'storage_alignment':
if not stmt.node in alignments:
alignments[stmt.node] = []
alignments[stmt.node].append(stmt.value)

def mutate(stmt):
"""Insert calls to VTCM allocation and deallocation routines."""
if isinstance(stmt, tvm.tir.AttrStmt):
if stmt.attr_key == 'storage_scope' and stmt.value == 'local.vtcm':
vtcm_buffers.pop()
elif stmt.attr_key == 'storage_alignment':
alignments[stmt.node].pop()
return stmt
if isinstance(stmt, tvm.tir.Allocate):
var = stmt.buffer_var
if var in vtcm_buffers:
is_null = tvm.tir.call_intrin('bool', tvm.ir.Op.get('tir.isnullptr'), var)
throw_error = \
tvm.tir.call_intrin('int32', tvm.ir.Op.get('tir.tvm_throw_last_error'))
body_w_free = tvm.tir.SeqStmt([stmt.body, tvm.tir.Evaluate(get_free(var))])
body_w_check = \
tvm.tir.IfThenElse(is_null, tvm.tir.Evaluate(throw_error), body_w_free)
return tvm.tir.LetStmt(stmt.buffer_var, get_alloc(stmt, buf_align(var)),
body_w_check)
return stmt
raise ValueError("Wrong argument type (" + type(stmt) + ") to 'mutate'")

f = func.with_body(tvm.tir.stmt_functor.ir_transform(func.body, visit, mutate,
['tir.Allocate', 'tir.AttrStmt']))
return f


def ir_lower_vtcm():
"""Create a VTCM lowering pass.
VTCM memory has to be allocated using special functions.
"""
def get_alloc(stmt, align):
assert isinstance(stmt, tvm.tir.Allocate)
return tvm.tir.call_extern('handle', 'HexagonBackendAllocateVTCM',
ft.reduce(lambda x, y: x*y, stmt.extents, 1), align)
def get_free(var):
return tvm.tir.call_extern('handle', 'HexagonBackendFreeVTCM', var)

# pylint: disable=bad-whitespace
@tvm.tir.transform.prim_func_pass(opt_level = 0, name = "Lower VTCM pass")
def transform(func, mod, ctx):
return lower_vtcm_(get_alloc, get_free, 2048, func, mod, ctx)

return transform

def ir_lower_vtcm_pass():
return [(3, ir_lower_vtcm())]
22 changes: 18 additions & 4 deletions python/tvm/target/target.py
Original file line number Diff line number Diff line change
Expand Up @@ -236,7 +236,7 @@ def bifrost(model='unknown', options=None):
return _ffi_api.TargetCreate("opencl", *opts)


def hexagon(cpu_ver='v66', sim_args=None, hvx=128):
def hexagon(cpu_ver='v66', sim_args=None, llvm_args=None, hvx=128):
"""Returns a Hexagon target.
Parameters
Expand All @@ -249,6 +249,8 @@ def hexagon(cpu_ver='v66', sim_args=None, hvx=128):
Otherwise, separate versions are used for codegen and sim. Not
all allowed cpu strings will be valid, simulator will throw an
error if invalid. Does not affect codegen.
llvm_args : str or list of str
User defined compiler arguments.
hvx : int
Size of hvx register. Value of 0 indicates disabled hvx.
"""
Expand All @@ -274,7 +276,7 @@ def create_target(cpu_ver):
# HVX enable
if hvx:
mattr = ' -mattr=+hvx' + cpu_ver + ',+hvx-length' + str(hvx) + 'b'
return 'llvm' + target + mcpu + mattr
return target + mcpu + mattr

# Simulator string
def create_sim(cpu_ver, sim_args):
Expand Down Expand Up @@ -325,12 +327,24 @@ def validate_hvx_length(codegen_hvx, sim_args):

return sim_cpu + ' ' + validate_hvx_length(hvx, sim_args)

# LLVM string
def create_llvm(llvm_args):
# TVM's option parser doesn't allow '=' in values, but '=' can
# appear in LLVM flags. Replace it with '@', since it's unlikely
# that '@' will be used in another context.
if llvm_args is None or len(llvm_args.replace(' ', '')) == 0:
return ''
args = [s.replace('=', '@') for s in llvm_args.split()]
return '--llvm-options=' + ','.join(args)

# Sim args
os.environ['HEXAGON_SIM_ARGS'] = create_sim(cpu_ver, sim_args)

target_str = create_target(cpu_ver)
args_list = target_str.split()
return _ffi_api.TargetCreate("hexagon", *args_list)
llvm_str = create_llvm(llvm_args)
args_list = target_str.split() + llvm_str.split()

return _ffi_api.TargetCreate('hexagon', *args_list)


def create(target_str):
Expand Down
22 changes: 18 additions & 4 deletions src/runtime/hexagon/hexagon_module.cc
Original file line number Diff line number Diff line change
Expand Up @@ -195,24 +195,25 @@ class HexagonModuleNode final : public runtime::ModuleNode {
std::unordered_map<std::string, FunctionInfo> fmap, std::string asm_str,
std::string obj_str, std::string ir_str, std::string bc_str,
const std::set<std::string>& packed_c_abi)
: hexagon_device_(hexagon::Device::Global()),
: hexagon_device_(),
dl_handle_(nullptr),
data_(data),
fmt_(fmt),
fmap_(fmap),
asm_(asm_str),
obj_(obj_str),
ir_(ir_str),
bc_(bc_str),
packed_c_abi_funcs_(packed_c_abi) {
dl_handle_ = hexagon_device_->Load(data, fmt);
}
packed_c_abi_funcs_(packed_c_abi) {}

~HexagonModuleNode() {
if (dl_handle_) {
hexagon_device_->Unload(dl_handle_);
}
}

PackedFunc GetFunction(const std::string& name, const ObjectPtr<Object>& sptr_to_self) final;
std::string GetSource(const std::string& format) final;

const char* type_key() const final { return "hexagon"; }

Expand Down Expand Up @@ -333,6 +334,9 @@ PackedFunc HexagonModuleNode::GetFunction(const std::string& name,
auto f = fmap_.find(name);
if (f == fmap_.end()) return PackedFunc(nullptr);

if (!hexagon_device_) hexagon_device_ = hexagon::Device::Global();
if (!dl_handle_) dl_handle_ = hexagon_device_->Load(data_, fmt_);

// Get function pointer from device.
void* pf = hexagon_device_->Resolve(name);
// The cast result and the original share ownership. Do the cast here
Expand All @@ -355,6 +359,16 @@ PackedFunc HexagonModuleNode::GetFunction(const std::string& name,
}
}

std::string HexagonModuleNode::GetSource(const std::string& format) {
if (format == "s" || format == "asm") {
return asm_;
}
if (format == "ll") {
return ir_;
}
return "";
}

void HexagonModuleNode::RemapArgs(const TVMArgs& args, std::vector<TVMValue>& values,
std::vector<int>& type_codes,
std::vector<void*>& remote_tensors) const {
Expand Down
2 changes: 2 additions & 0 deletions src/runtime/module.cc
Original file line number Diff line number Diff line change
Expand Up @@ -138,6 +138,8 @@ bool RuntimeEnabled(const std::string& target) {
f_name = "device_api.rpc";
} else if (target == "micro_dev") {
f_name = "device_api.micro_dev";
} else if (target == "hexagon") {
f_name = "device_api.hexagon";
} else if (target.length() >= 5 && target.substr(0, 5) == "nvptx") {
f_name = "device_api.gpu";
} else if (target.length() >= 4 && target.substr(0, 4) == "rocm") {
Expand Down
Loading

0 comments on commit 11e23f9

Please sign in to comment.