# blob: 41ac844eeaa3538555a990996e77df6fa4069266 [file] [log] [blame]
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.
import pytest
import tvm
from tvm.target import _ffi_api, codegen, Target
from tvm.target.codegen import target_has_features
# Major LLVM version as reported by codegen.llvm_version_major(); the test below
# compares it against each case's min_llvm_version.
LLVM_VERSION = codegen.llvm_version_major()
# Parameter table for test_x86_target_features. Each entry is a tuple of
#   (min_llvm_version, tvm_target, x86_feature, is_supported)
# * min_llvm_version: the with-target checks are bypassed when LLVM_VERSION is
#   lower than this value; -1 is used where no minimum applies
#   (assumes LLVM_VERSION is never negative -- TODO confirm).
# * tvm_target: target string handed to Target(...).
# * x86_feature: a single feature name, or a list/tuple of feature names.
# * is_supported: expected answer of the feature query for that target.
# NOTE(review): presumably tvm.testing.parameters turns every tuple into one
# parametrized test case -- confirm against the tvm.testing documentation.
min_llvm_version, tvm_target, x86_feature, is_supported = tvm.testing.parameters(
# sse4 family (sse4a / sse4.1 / sse4.2)
(-1, "llvm -mtriple=x86_64-- -mcpu=btver2", "sse4a", True),
(-1, "llvm -mtriple=x86_64-- -mcpu=penryn", "sse4.1", True),
(-1, "llvm -mtriple=x86_64-- -mcpu=silvermont", "sse4.2", True),
(11, "llvm -mtriple=x86_64-- -mcpu=slm", "sse4.2", True),
(-1, "llvm -mtriple=x86_64-- -mcpu=goldmont", "sse4.2", True),
(-1, "llvm -mtriple=x86_64-- -mcpu=goldmont-plus", "sse4.2", True),
(-1, "llvm -mtriple=x86_64-- -mcpu=tremont", "sse4.2", True),
(-1, "llvm -mtriple=x86_64-- -mcpu=nehalem", "sse4.2", True),
(11, "llvm -mtriple=x86_64-- -mcpu=corei7", "sse4.2", True),
(-1, "llvm -mtriple=x86_64-- -mcpu=westmere", "sse4.2", True),
(-1, "llvm -mtriple=x86_64-- -mcpu=bdver1", "sse4.2", True),
(-1, "llvm -mtriple=x86_64-- -mcpu=bdver2", "sse4.2", True),
(-1, "llvm -mtriple=x86_64-- -mcpu=bdver3", "sse4.2", True),
(11, "llvm -mtriple=x86_64-- -mcpu=x86-64-v2", "sse4.2", True),
# avx
(-1, "llvm -mtriple=x86_64-- -mcpu=sandybridge", "avx", True),
(11, "llvm -mtriple=x86_64-- -mcpu=corei7-avx", "avx", True),
(-1, "llvm -mtriple=x86_64-- -mcpu=ivybridge", "avx", True),
(11, "llvm -mtriple=x86_64-- -mcpu=core-avx-i", "avx", True),
# avx2
(-1, "llvm -mtriple=x86_64-- -mcpu=haswell", "avx2", True),
(11, "llvm -mtriple=x86_64-- -mcpu=core-avx2", "avx2", True),
(-1, "llvm -mtriple=x86_64-- -mcpu=broadwell", "avx2", True),
(-1, "llvm -mtriple=x86_64-- -mcpu=skylake", "avx2", True),
(-1, "llvm -mtriple=x86_64-- -mcpu=bdver4", "avx2", True),
(-1, "llvm -mtriple=x86_64-- -mcpu=znver1", "avx2", True),
(-1, "llvm -mtriple=x86_64-- -mcpu=znver2", "avx2", True),
(11, "llvm -mtriple=x86_64-- -mcpu=znver3", "avx2", True),
(11, "llvm -mtriple=x86_64-- -mcpu=x86-64-v3", "avx2", True),
# avx512bw (the knl / knm entries also cover avx512f, avx512cd, avx512er, avx512pf)
(-1, "llvm -mtriple=x86_64-- -mcpu=skylake-avx512", "avx512bw", True),
(11, "llvm -mtriple=x86_64-- -mcpu=skx", "avx512bw", True),
(11, "llvm -mtriple=x86_64-- -mcpu=knl", "avx512bw", False),
(-1, "llvm -mtriple=x86_64-- -mcpu=knl", "avx512f", True),
# list/tuple entries: expected False as soon as one listed feature is missing
(11, "llvm -mtriple=x86_64-- -mcpu=knl", ["avx512bw", "avx512f"], False),
(11, "llvm -mtriple=x86_64-- -mcpu=knl", ("avx512bw", "avx512f"), False),
(-1, "llvm -mtriple=x86_64-- -mcpu=knl", "avx512cd", True),
(11, "llvm -mtriple=x86_64-- -mcpu=knl", ["avx512cd", "avx512f"], True),
(11, "llvm -mtriple=x86_64-- -mcpu=knl", ("avx512cd", "avx512f"), True),
(-1, "llvm -mtriple=x86_64-- -mcpu=knl", "avx512er", True),
(-1, "llvm -mtriple=x86_64-- -mcpu=knl", "avx512pf", True),
(11, "llvm -mtriple=x86_64-- -mcpu=knm", "avx512bw", False),
(-1, "llvm -mtriple=x86_64-- -mcpu=knm", "avx512f", True),
(-1, "llvm -mtriple=x86_64-- -mcpu=knm", "avx512cd", True),
(-1, "llvm -mtriple=x86_64-- -mcpu=knm", "avx512er", True),
(-1, "llvm -mtriple=x86_64-- -mcpu=knm", "avx512pf", True),
(11, "llvm -mtriple=x86_64-- -mcpu=x86-64-v4", "avx512bw", True),
(-1, "llvm -mtriple=x86_64-- -mcpu=cannonlake", "avx512bw", True),
# explicit enumeration of VNNI-capable CPUs due to collision with alderlake
# (alderlake is expected to report avxvnni, but neither avx512bw nor avx512vnni)
(11, "llvm -mtriple=x86_64-- -mcpu=alderlake", "avx512bw", False),
(-1, "llvm -mtriple=x86_64-- -mcpu=cascadelake", "avx512bw", True),
(-1, "llvm -mtriple=x86_64-- -mcpu=icelake-client", "avx512bw", True),
(-1, "llvm -mtriple=x86_64-- -mcpu=icelake-server", "avx512bw", True),
(11, "llvm -mtriple=x86_64-- -mcpu=rocketlake", "avx512bw", True),
(-1, "llvm -mtriple=x86_64-- -mcpu=tigerlake", "avx512bw", True),
(-1, "llvm -mtriple=x86_64-- -mcpu=cooperlake", "avx512bw", True),
(11, "llvm -mtriple=x86_64-- -mcpu=sapphirerapids", "avx512bw", True),
# avx512vnni
(11, "llvm -mtriple=x86_64-- -mcpu=alderlake", "avx512vnni", False),
(11, "llvm -mtriple=x86_64-- -mcpu=alderlake", "avxvnni", True),
(-1, "llvm -mtriple=x86_64-- -mcpu=cascadelake", "avx512vnni", True),
(-1, "llvm -mtriple=x86_64-- -mcpu=icelake-client", "avx512vnni", True),
(-1, "llvm -mtriple=x86_64-- -mcpu=icelake-server", "avx512vnni", True),
(11, "llvm -mtriple=x86_64-- -mcpu=rocketlake", "avx512vnni", True),
(-1, "llvm -mtriple=x86_64-- -mcpu=tigerlake", "avx512vnni", True),
(-1, "llvm -mtriple=x86_64-- -mcpu=cooperlake", "avx512vnni", True),
(11, "llvm -mtriple=x86_64-- -mcpu=sapphirerapids", "avx512vnni", True),
# amx-int8
(11, "llvm -mtriple=x86_64-- -mcpu=sapphirerapids", "amx-int8", True),
# generic CPU (no features) but with extra -mattr
(-1, "llvm -mtriple=x86_64-- -mcpu=x86-64 -mattr=+sse4.1,+avx2", "avx2", True),
(-1, "llvm -mtriple=x86_64-- -mcpu=x86-64 -mattr=+sse4.1,+avx2", "sse4.1", True),
# enabling +sse4.1 implies ssse3 presence in LLVM
(-1, "llvm -mtriple=x86_64-- -mcpu=x86-64 -mattr=+sse4.1,+avx2", "ssse3", True),
# explicitly disabling a feature with -mattr=-<feature> removes it from the CPU's set
(-1, "llvm -mtriple=x86_64-- -mcpu=ivybridge -mattr=-ssse3", "ssse3", False),
# disabling avx512f (foundation) also disables avx512bw
(-1, "llvm -mtriple=x86_64-- -mcpu=cascadelake -mattr=-avx512f", "avx512bw", False),
)
def test_x86_target_features(min_llvm_version, tvm_target, x86_feature, is_supported):
    """Test X86 features support for different targets.

    The feature query is exercised three ways: with neither an explicit nor a
    context target (must fail), with an explicit target, and inside a target
    context.

    Parameters
    ----------
    min_llvm_version : int
        Minimal LLVM version; the target-dependent checks are skipped when the
        detected LLVM major version is lower.

    tvm_target : str
        TVM target.

    x86_feature : str or list/tuple of str
        X86 CPU feature, or several of them. The parameter table expects a
        sequence to be supported only when every listed feature is.

    is_supported : bool
        Expected result.
    """
    no_context_msg = "Check failed: (allow_not_defined) is false: Target context required"
    # the raw ffi entry point is called with exactly one feature name at a time
    single_feature = isinstance(x86_feature, str)

    ##
    ## no context
    ##

    # check for feature via the python api (no explicit target, no context target)
    with pytest.raises(tvm.error.InternalError) as excinfo:
        target_has_features(x86_feature)
    assert no_context_msg in str(excinfo.value)

    if single_feature:
        # check for feature via the ffi llvm api (no explicit target, no context target)
        with pytest.raises(tvm.error.InternalError) as excinfo:
            _ffi_api.target_has_feature(x86_feature, None)
        assert no_context_msg in str(excinfo.value)

    # skip test on llvm_version (reported as skipped rather than silently passing)
    if LLVM_VERSION < min_llvm_version:
        pytest.skip(f"requires LLVM >= {min_llvm_version}, found LLVM {LLVM_VERSION}")

    # check for feature via the python api (with explicit target, no context target)
    assert target_has_features(x86_feature, Target(tvm_target)) == is_supported

    if single_feature:
        # check for feature via the ffi llvm api (with explicit target, no context target)
        assert _ffi_api.target_has_feature(x86_feature, Target(tvm_target)) == is_supported

    ##
    ## with context
    ##

    with Target(tvm_target):
        # check for feature via the python api (current context target)
        assert target_has_features(x86_feature) == is_supported
        # check for feature via the python api (with explicit target)
        assert target_has_features(x86_feature, Target(tvm_target)) == is_supported
        # check for feature via the ffi llvm api (current context target);
        # wrap a lone name in a list so the loop never walks a string's characters
        features = [x86_feature] if single_feature else list(x86_feature)
        assert all(_ffi_api.target_has_feature(feat, None) for feat in features) == is_supported
        # check for feature in target's llvm full x86 CPU feature list
        # (only when no -mattr overrides are present on the target)
        if single_feature and not Target(tvm_target).mattr:
            assert (x86_feature in codegen.llvm_get_cpu_features()) == is_supported