Blame - verif/checker/tosa_result_checker.py - tosa/reference_model

2021-12-15 17:14:56 +0000

[diff] [blame]

1

"""TOSA result checker script."""

Jeremy Johnson

2023-09-14 17:02:09 +0100

[diff] [blame]

2

Jeremy Johnson

2021-12-15 17:14:56 +0000

[diff] [blame]

3

# SPDX-License-Identifier: Apache-2.0

4

import argparse

Jeremy Johnson

2023-09-14 17:02:09 +0100

[diff] [blame]

5

import json

Jeremy Johnson

2021-12-15 17:14:56 +0000

[diff] [blame]

6

from enum import IntEnum

7

from enum import unique

8

from pathlib import Path

9

10

import numpy as np

Jeremy Johnson

2023-09-14 17:02:09 +0100

[diff] [blame]

11

from checker.color_print import LogColors

12

from checker.color_print import print_color

13

from checker.verifier import VerifierError

14

from checker.verifier import VerifierLibrary

James Ward

2022-10-19 12:20:31 +0100

[diff] [blame]

15

from generator.tosa_utils import float32_is_valid_bfloat16

Jeremy Johnson

2023-09-14 17:02:09 +0100

[diff] [blame]

16

from schemavalidation.schemavalidation import TestDescSchemaValidator

Jeremy Johnson

2021-12-15 17:14:56 +0000

[diff] [blame]

@unique
class TestResult(IntEnum):
    """Outcome codes produced by the result checker.

    The members are integers so that they can be used directly as a
    process return value.
    """

    # PASS has to stay 0: a zero return means success on the command line
    PASS = 0
    # A required file (or required detail) could not be found
    MISSING_FILE = 1
    # A file or description was found but could not be understood
    INCORRECT_FORMAT = 2
    # The results were compared and found to differ
    MISMATCH = 3
    # The checker itself could not do its job
    INTERNAL_ERROR = 4

# Short descriptions of each outcome; the position of every entry matches the
# integer value of the corresponding TestResult member.
TestResultErrorStr = [
    "",  # PASS
    "Missing file",  # MISSING_FILE
    "Incorrect format",  # INCORRECT_FORMAT
    "Mismatch",  # MISMATCH
    "Internal error",  # INTERNAL_ERROR
]

##################################

39

Jeremy Johnson

2022-09-15 10:38:17 +0100

[diff] [blame]

40

# Tolerance used for floating point comparisons when the caller gives none
DEFAULT_FP_TOLERANCE = 1e-3

# Module-wide switch consulted by _print_result(); change it through
# set_print_result() rather than assigning to it directly
result_printing = True

42

43

44

def set_print_result(enabled):
    """Turn the printing of result messages on or off.

    The value of `enabled` is stored in the module-level `result_printing`
    flag, which `_print_result` reads before printing anything.
    """
    global result_printing
    result_printing = enabled

48

49

50

def _print_result(color, msg):
    """Print `msg` in the given `color`, unless result printing is disabled."""
    # Reading a module-level name needs no `global` declaration
    if not result_printing:
        return
    print_color(color, msg)

55

56

57

def compliance_check(
    imp_result_path,
    ref_result_path,
    bnd_result_path,
    test_name,
    compliance_config,
    ofm_name,
    verify_lib_path,
):
    """Check an implementation result for compliance via the verifier library.

    The library is loaded from `verify_lib_path` and asked to verify the
    output called `ofm_name` using `compliance_config` together with the
    implementation, reference and bounds results.

    NOTE(review): despite the `*_path` parameter names, test_check() passes
    the arrays it has already loaded for the first three arguments - confirm
    which form VerifierLibrary.verify_data() expects.

    Returns a tuple of (TestResult, tolerance, message); the tolerance is
    always 0.0 for this kind of check.
    """
    # Work out whether a usable verifier library is available
    load_error = None
    if verify_lib_path is None:
        load_error = "Please supply --verify-lib-path"
    else:
        try:
            vlib = VerifierLibrary(verify_lib_path)
        except VerifierError as e:
            load_error = str(e)

    if load_error is not None:
        _print_result(LogColors.RED, f"INTERNAL ERROR {test_name}")
        return (
            TestResult.INTERNAL_ERROR,
            0.0,
            f"Could not load verfier library: {load_error}",
        )

    compliant = vlib.verify_data(
        ofm_name, compliance_config, imp_result_path, ref_result_path, bnd_result_path
    )
    if not compliant:
        _print_result(LogColors.RED, f"Results NON-COMPLIANT {test_name}")
        return (TestResult.MISMATCH, 0.0, "Non-compliance results found")

    _print_result(LogColors.GREEN, f"Compliance Results PASS {test_name}")
    return (TestResult.PASS, 0.0, "")

Jeremy Johnson

2022-09-15 10:38:17 +0100

[diff] [blame]

89

Jeremy Johnson

2021-12-15 17:14:56 +0000

[diff] [blame]

90

91

def test_check(
    ref_result_path,
    imp_result_path,
    test_name=None,
    quantize_tolerance=0,
    float_tolerance=DEFAULT_FP_TOLERANCE,
    misc_checks=None,
    test_desc=None,
    bnd_result_path=None,
    ofm_name=None,
    verify_lib_path=None,
):
    """Check if the result is the same as the expected reference.

    Args:
        ref_result_path: path object of the reference result numpy file.
        imp_result_path: path object of the implementation result numpy file.
        test_name: name used in the printed messages, defaults to "test".
        quantize_tolerance: largest absolute difference accepted for integer
            results.
        float_tolerance: absolute tolerance accepted for float results.
        misc_checks: optional collection of extra check names; "bf16" makes
            sure every value of both results is a valid bfloat16.
        test_desc: optional test description (contents of desc.json). When it
            has a "compliance" entry under "meta" the check is handed over to
            compliance_check().
        bnd_result_path: optional path object of the bounds result numpy file.
        ofm_name: name of the output to check in compliance mode, defaults to
            the only "ofm_name" listed in `test_desc`.
        verify_lib_path: location of the verifier library, only needed in
            compliance mode.

    Returns:
        A tuple of (TestResult, tolerance, message). The message is empty on
        a PASS and describes the problem otherwise.

    Note:
        On a value mismatch this changes NumPy's global print options to keep
        the arrays in the message short.
    """
    # Avoid a shared mutable default for the optional list of checks
    if misc_checks is None:
        misc_checks = []

    # Settle the name first so that every message below can rely on it
    if test_name is None:
        test_name = "test"

    if test_desc:
        # New compliance method - first get test details
        try:
            TestDescSchemaValidator().validate_config(test_desc)
        except Exception as e:
            _print_result(LogColors.RED, f"Test INCORRECT FORMAT {test_name}")
            msg = f"Incorrect test format: {e}"
            return (TestResult.INCORRECT_FORMAT, 0.0, msg)

    paths = [imp_result_path, ref_result_path, bnd_result_path]
    names = ["Implementation", "Reference", "Bounds"]
    arrays = [None, None, None]

    # Check the files exist and are in the right format
    for idx, (name, path) in enumerate(zip(names, paths)):
        if path is None and name == "Bounds":
            # Bounds can be None - skip it
            continue
        if not path.is_file():
            _print_result(LogColors.RED, f"{name} MISSING FILE {test_name}")
            msg = f"Missing {name} file: {str(path)}"
            return (TestResult.MISSING_FILE, 0.0, msg)
        try:
            arrays[idx] = np.load(path)
        except Exception as e:
            _print_result(LogColors.RED, f"{name} INCORRECT FORMAT {test_name}")
            msg = f"Incorrect numpy format of {str(path)}\nnumpy.load exception: {e}"
            return (TestResult.INCORRECT_FORMAT, 0.0, msg)

    if test_desc and "meta" in test_desc and "compliance" in test_desc["meta"]:
        # Switch to using the verifier library for full compliance
        if ofm_name is None:
            ofm_name = test_desc["ofm_name"][0]
            if len(test_desc["ofm_name"]) > 1:
                _print_result(LogColors.RED, f"Output Name MISSING FILE {test_name}")
                msg = "Must specify output name (ofm_name) to check as multiple found in desc.json"
                return (TestResult.MISSING_FILE, 0.0, msg)

        compliance_json = test_desc["meta"]["compliance"]

        return compliance_check(
            *arrays,
            test_name,
            compliance_json,
            ofm_name,
            verify_lib_path,
        )

    # Else continue with original checking method
    test_result, reference_result, _ = arrays

    # Type comparison
    if test_result.dtype != reference_result.dtype:
        _print_result(LogColors.RED, "Results TYPE MISMATCH {}".format(test_name))
        msg = "Mismatch results type: Expected {}, got {}".format(
            reference_result.dtype, test_result.dtype
        )
        return (TestResult.MISMATCH, 0.0, msg)

    # Size comparison
    # Size = 1 tensors can be equivalently represented as having rank 0 or rank
    # >= 0, allow that special case
    test_result = np.squeeze(test_result)
    reference_result = np.squeeze(reference_result)
    difference = None

    if np.shape(test_result) != np.shape(reference_result):
        _print_result(LogColors.RED, "Results MISCOMPARE {}".format(test_name))
        # The reference shape goes first to agree with the "Reference" label
        msg = "Shapes mismatch: Reference {} vs {}".format(
            np.shape(reference_result), np.shape(test_result)
        )
        return (TestResult.MISMATCH, 0.0, msg)

    # Perform miscellaneous checks
    if "bf16" in misc_checks:
        # Ensure floats are valid bfloat16 values
        test_res_is_bf16 = all(float32_is_valid_bfloat16(f) for f in test_result.flat)
        ref_res_is_bf16 = all(
            float32_is_valid_bfloat16(f) for f in reference_result.flat
        )
        if not (test_res_is_bf16 and ref_res_is_bf16):
            # Must be an f-string, otherwise the placeholders are shown as-is
            msg = (
                "All output values must be valid bfloat16. "
                f"reference_result: {ref_res_is_bf16}; test_result: {test_res_is_bf16}"
            )
            return (TestResult.INCORRECT_FORMAT, 0.0, msg)

    # for quantized test, allow +-(quantize_tolerance) error
    if reference_result.dtype in (
        np.int8,
        np.int16,
        np.int32,
        np.int64,
        np.uint8,
        np.uint16,
    ):
        # Subtract in int64: in the narrow or unsigned result types the
        # subtraction wraps around (uint8 0 - 1 gives 255) and would report
        # differences that are not there
        int_difference = reference_result.astype(np.int64) - test_result.astype(
            np.int64
        )
        abs_difference = np.absolute(int_difference)

        if np.all(abs_difference <= quantize_tolerance):
            _print_result(LogColors.GREEN, "Results PASS {}".format(test_name))
            return (TestResult.PASS, 0.0, "")

        # Find the smallest tolerance (capped just above 10) that would have
        # passed, comparing against the growing candidate on every step
        tolerance = quantize_tolerance + 1
        while not np.all(abs_difference <= tolerance):
            tolerance = tolerance + 1
            if tolerance > 10:
                break

        if tolerance > 10:
            msg = "Integer result does not match and is greater than 10 difference"
        else:
            msg = "Integer result does not match but is within {} difference".format(
                tolerance
            )
        # Fall-through to below to add failure values
        difference = int_difference

    elif reference_result.dtype == bool:
        # Both results are known to be bool here as the types already matched.
        # All boolean values must match
        if np.array_equal(reference_result, test_result):
            _print_result(LogColors.GREEN, "Results PASS {}".format(test_name))
            return (TestResult.PASS, 0.0, "")
        msg = "Boolean result does not match"
        tolerance = 0.0
        difference = None
        # Fall-through to below to add failure values

    # TODO: update for fp16 tolerance
    elif reference_result.dtype == np.float32 or reference_result.dtype == np.float16:
        tolerance = float_tolerance
        if np.allclose(reference_result, test_result, atol=tolerance, equal_nan=True):
            _print_result(LogColors.GREEN, "Results PASS {}".format(test_name))
            return (TestResult.PASS, tolerance, "")
        msg = "Float result does not match within tolerance of {}".format(tolerance)
        difference = reference_result - test_result
        # Fall-through to below to add failure values

    else:
        _print_result(LogColors.RED, "Results UNSUPPORTED TYPE {}".format(test_name))
        msg = "Unsupported results type: {}".format(reference_result.dtype)
        return (TestResult.MISMATCH, 0.0, msg)

    # Fall-through for mismatch failure to add values to msg
    _print_result(LogColors.RED, "Results MISCOMPARE {}".format(test_name))
    # Keep large arrays abbreviated in the message
    np.set_printoptions(threshold=128, edgeitems=2)

    if difference is not None:
        tolerance_needed = np.amax(np.absolute(difference))
        msg = "{}\n-- tolerance_needed: {}".format(msg, tolerance_needed)

    msg = "{}\n>> reference_result: {}\n{}".format(
        msg, reference_result.shape, reference_result
    )
    msg = "{}\n<< test_result: {}\n{}".format(msg, test_result.shape, test_result)

    if difference is not None:
        msg = "{}\n!! difference_result: \n{}".format(msg, difference)
    return (TestResult.MISMATCH, tolerance, msg)

270

271

272

def main(argv=None):

Jeremy Johnson

2022-09-15 10:38:17 +0100

[diff] [blame]

273

"""Check that the supplied reference and result files have the same contents."""

Jeremy Johnson

2021-12-15 17:14:56 +0000

[diff] [blame]

274

parser = argparse.ArgumentParser()

275

parser.add_argument(

Jeremy Johnson

2023-09-14 17:02:09 +0100

[diff] [blame]

276

"ref_result_path",

277

type=Path,

278

help="path to the reference model result file to check",

Jeremy Johnson

2021-12-15 17:14:56 +0000

[diff] [blame]

279

)

280

parser.add_argument(

Jeremy Johnson

2023-09-14 17:02:09 +0100

[diff] [blame]

281

"imp_result_path",

282

type=Path,

283

help="path to the implementation result file to check",

Jeremy Johnson

2021-12-15 17:14:56 +0000

[diff] [blame]

284

)

Jeremy Johnson

2022-09-15 10:38:17 +0100

[diff] [blame]

285

parser.add_argument(

286

"--fp-tolerance", type=float, default=DEFAULT_FP_TOLERANCE, help="FP tolerance"

287

)

Jeremy Johnson

2023-09-14 17:02:09 +0100

[diff] [blame]

288

parser.add_argument(

Jeremy Johnson

2023-11-27 15:02:04 +0000

[diff] [blame^]

289

"--test-path", type=Path, help="path to the test that produced the results"

Jeremy Johnson

2023-09-14 17:02:09 +0100

[diff] [blame]

290

)

Jeremy Johnson

2023-11-27 15:02:04 +0000

[diff] [blame^]

291

# Deprecate the incorrectly formatted option by hiding it

292

parser.add_argument("--test_path", type=Path, help=argparse.SUPPRESS)

Jeremy Johnson

2023-09-14 17:02:09 +0100

[diff] [blame]

parser.add_argument(

"--bnd-result-path",

type=Path,

help="path to the reference model bounds result file for the dot product compliance check",

)

parser.add_argument(

"--ofm-name",

type=str,

help="name of the output tensor to check, defaults to the first ofm_name listed in the test",

)

parser.add_argument(

"--verify-lib-path",

type=Path,

help="path to TOSA verify library",

307

)

Jeremy Johnson

2021-12-15 17:14:56 +0000

[diff] [blame]

308

args = parser.parse_args(argv)

Jeremy Johnson

2021-12-15 17:14:56 +0000

[diff] [blame]

309

Jeremy Johnson

2023-09-14 17:02:09 +0100

[diff] [blame]

310

if args.test_path:

311

# Get details from the test path

312

test_desc_path = args.test_path / "desc.json"

313

if not args.test_path.is_dir() or not test_desc_path.is_file():

314

print(f"Invalid test directory {str(args.test_path)}")

315

return TestResult.MISSING_FILE

316

317

try:

318

with test_desc_path.open("r") as fd:

319

test_desc = json.load(fd)

320

except Exception as e:

321

print(f"Invalid test description file {str(test_desc_path)}: {e}")

322

return TestResult.INCORRECT_FORMAT

323

test_name = args.test_path.name

else:

test_desc = None

test_name = None

Jeremy Johnson

2022-09-15 10:38:17 +0100

[diff] [blame]

328

result, tolerance, msg = test_check(

Jeremy Johnson

2023-09-14 17:02:09 +0100

[diff] [blame]

329

args.ref_result_path,

330

args.imp_result_path,

331

float_tolerance=args.fp_tolerance,

332

test_name=test_name,

333

test_desc=test_desc,

334

bnd_result_path=args.bnd_result_path,

335

ofm_name=args.ofm_name,

336

verify_lib_path=args.verify_lib_path,

Jeremy Johnson

2022-09-15 10:38:17 +0100

[diff] [blame]

337

)

Jeremy Johnson