Blame - verif/checker/tosa_result_checker.py - tosa/reference_model

2021-12-15 17:14:56 +0000

[diff] [blame]

1

"""TOSA result checker script."""

Jeremy Johnson

2024-01-18 16:57:28 +0000

[diff] [blame^]

2

Jeremy Johnson

2021-12-15 17:14:56 +0000

[diff] [blame]

3

# SPDX-License-Identifier: Apache-2.0

4

import argparse

Jeremy Johnson

2023-09-14 17:02:09 +0100

[diff] [blame]

5

import json

Jeremy Johnson

2021-12-15 17:14:56 +0000

[diff] [blame]

6

from enum import IntEnum

7

from enum import unique

8

from pathlib import Path

9

10

import numpy as np

Jeremy Johnson

2023-09-14 17:02:09 +0100

[diff] [blame]

11

from checker.color_print import LogColors

12

from checker.color_print import print_color

13

from checker.verifier import VerifierError

14

from checker.verifier import VerifierLibrary

James Ward

2022-10-19 12:20:31 +0100

[diff] [blame]

15

from generator.tosa_utils import float32_is_valid_bfloat16

Jeremy Johnson

2023-09-14 17:02:09 +0100

[diff] [blame]

16

from schemavalidation.schemavalidation import TestDescSchemaValidator

Jeremy Johnson

2021-12-15 17:14:56 +0000

[diff] [blame]

@unique
class TestResult(IntEnum):
    """Outcome codes produced by the result checker.

    The members are plain integers so that a result can be handed straight
    back to the command line as the return status.
    """

    # Note: PASS must be 0 for command line return success
    PASS = 0
    MISSING_FILE = 1
    INCORRECT_FORMAT = 2
    MISMATCH = 3
    INTERNAL_ERROR = 4

# Short description for each result; entries are listed in the same order as
# the TestResult values (PASS has no error text)
TestResultErrorStr = [
    "",
    "Missing file",
    "Incorrect format",
    "Mismatch",
    "Internal error",
]
##################################

# Tolerance used for floating point comparisons when none is supplied
DEFAULT_FP_TOLERANCE = 1e-3

# Module-wide flag read by _print_result() before anything is printed
result_printing = True

42

43

44

def set_print_result(enabled):
    """Turn printing of check results on or off for this module.

    Args:
        enabled: value stored in the module-level ``result_printing`` flag;
            a truthy value lets results be printed, a falsy one silences them
    """
    global result_printing
    result_printing = enabled

48

49

50

def _print_result(color, msg):

51

"""Print out result."""

52

global result_printing

53

if result_printing:

54

print_color(color, msg)

55

56

57

def compliance_check(
    imp_result_data,
    ref_result_data,
    bnd_result_data,
    test_name,
    compliance_config,
    ofm_name,
    verify_lib_path,
):
    """Verify implementation results using the verifier library.

    Args:
        imp_result_data: implementation result data to verify
        ref_result_data: reference result data to verify against
        bnd_result_data: bounds result data, passed on to the verifier as is
        test_name: test name used in the printed status line
        compliance_config: compliance configuration handed to the verifier
        ofm_name: name of the output being verified
        verify_lib_path: location of the verifier library, or None

    Returns:
        Tuple of (TestResult, 0.0, message); the message is empty on a pass.
    """
    verifier = None
    load_failure = None

    # Without a library path there is nothing to load, otherwise a failed
    # load is reported through the same internal error route
    if verify_lib_path is None:
        load_failure = "Please supply --verify-lib-path"
    else:
        try:
            verifier = VerifierLibrary(verify_lib_path)
        except VerifierError as exc:
            load_failure = str(exc)

    if load_failure is not None:
        _print_result(LogColors.RED, f"INTERNAL ERROR {test_name}")
        return (
            TestResult.INTERNAL_ERROR,
            0.0,
            f"Could not load verfier library: {load_failure}",
        )

    compliant = verifier.verify_data(
        ofm_name, compliance_config, imp_result_data, ref_result_data, bnd_result_data
    )

    if not compliant:
        _print_result(LogColors.RED, f"Results NON-COMPLIANT {test_name}")
        return (
            TestResult.MISMATCH,
            0.0,
            f"Non-compliance results found for {ofm_name}",
        )

    _print_result(LogColors.GREEN, f"Compliance Results PASS {test_name}")
    return (TestResult.PASS, 0.0, "")

Jeremy Johnson

2022-09-15 10:38:17 +0100

[diff] [blame]

93

Jeremy Johnson

2021-12-15 17:14:56 +0000

[diff] [blame]

94

95

def test_check(
    ref_result_path,
    imp_result_path,
    test_name=None,
    quantize_tolerance=0,
    float_tolerance=DEFAULT_FP_TOLERANCE,
    misc_checks=(),
    test_desc=None,
    bnd_result_path=None,
    ofm_name=None,
    verify_lib_path=None,
):
    """Check if the result is the same as the expected reference.

    Args:
        ref_result_path: path object (needs ``is_file()``) of the reference
            result numpy file
        imp_result_path: path object of the implementation result numpy file
        test_name: name used in printed status lines, defaults to "test"
        quantize_tolerance: largest absolute difference accepted for integer
            results
        float_tolerance: absolute tolerance used for float16/float32 results
        misc_checks: collection of extra check names; "bf16" requires every
            value of both results to be a valid bfloat16
        test_desc: test description dictionary; when it holds a
            "meta"/"compliance" entry the verifier library is used instead of
            the direct comparison
        bnd_result_path: optional path object of the bounds result numpy file
        ofm_name: output name to verify in compliance mode; defaults to the
            only "ofm_name" entry of the test description
        verify_lib_path: verifier library location passed to compliance_check

    Returns:
        Tuple of (TestResult, tolerance, message); the message is empty on a
        pass and describes the failure otherwise.
    """
    if test_desc:
        # New compliance method - first get test details
        try:
            TestDescSchemaValidator().validate_config(test_desc)
        except Exception as e:
            _print_result(LogColors.RED, f"Test INCORRECT FORMAT {test_name}")
            msg = f"Incorrect test format: {e}"
            return (TestResult.INCORRECT_FORMAT, 0.0, msg)

    if test_name is None:
        test_name = "test"

    paths = [imp_result_path, ref_result_path, bnd_result_path]
    names = ["Implementation", "Reference", "Bounds"]
    arrays = [None, None, None]

    # Check the files exist and are in the right format
    for idx, (name, path) in enumerate(zip(names, paths)):
        if path is None and name == "Bounds":
            # Bounds can be None - skip it
            continue
        if not path.is_file():
            _print_result(LogColors.RED, f"{name} MISSING FILE {test_name}")
            msg = f"Missing {name} file: {str(path)}"
            return (TestResult.MISSING_FILE, 0.0, msg)
        try:
            arrays[idx] = np.load(path)
        except Exception as e:
            _print_result(LogColors.RED, f"{name} INCORRECT FORMAT {test_name}")
            msg = f"Incorrect numpy format of {str(path)}\nnumpy.load exception: {e}"
            return (TestResult.INCORRECT_FORMAT, 0.0, msg)

    if test_desc and "meta" in test_desc and "compliance" in test_desc["meta"]:
        # Switch to using the verifier library for full compliance
        if ofm_name is None:
            ofm_name = test_desc["ofm_name"][0]
            if len(test_desc["ofm_name"]) > 1:
                _print_result(LogColors.RED, f"Output Name MISSING FILE {test_name}")
                msg = (
                    "Must specify output name (ofm_name) to check as multiple "
                    "found in desc.json"
                )
                return (TestResult.MISSING_FILE, 0.0, msg)

        compliance_json = test_desc["meta"]["compliance"]

        return compliance_check(
            *arrays,
            test_name,
            compliance_json,
            ofm_name,
            verify_lib_path,
        )

    # Else continue with original checking method
    test_result, reference_result, _ = arrays

    # Type comparison
    if test_result.dtype != reference_result.dtype:
        _print_result(LogColors.RED, f"Results TYPE MISMATCH {test_name}")
        msg = "Mismatch results type: Expected {}, got {}".format(
            reference_result.dtype, test_result.dtype
        )
        return (TestResult.MISMATCH, 0.0, msg)

    # Size comparison
    # Size = 1 tensors can be equivalently represented as having rank 0 or rank
    # >= 0, allow that special case
    test_result = np.squeeze(test_result)
    reference_result = np.squeeze(reference_result)
    difference = None

    if np.shape(test_result) != np.shape(reference_result):
        _print_result(LogColors.RED, f"Results MISCOMPARE {test_name}")
        # Report the reference shape first so it lines up with the label
        msg = "Shapes mismatch: Reference {} vs {}".format(
            np.shape(reference_result), np.shape(test_result)
        )
        return (TestResult.MISMATCH, 0.0, msg)

    # Perform miscellaneous checks
    if "bf16" in misc_checks:
        # Ensure floats are valid bfloat16 values
        test_res_is_bf16 = all(float32_is_valid_bfloat16(f) for f in test_result.flat)
        ref_res_is_bf16 = all(
            float32_is_valid_bfloat16(f) for f in reference_result.flat
        )
        if not (test_res_is_bf16 and ref_res_is_bf16):
            msg = (
                "All output values must be valid bfloat16. "
                f"reference_result: {ref_res_is_bf16}; "
                f"test_result: {test_res_is_bf16}"
            )
            return (TestResult.INCORRECT_FORMAT, 0.0, msg)

    # for quantized test, allow +-(quantize_tolerance) error
    if reference_result.dtype in (
        np.int8,
        np.int16,
        np.int32,
        np.int64,
        np.uint8,
        np.uint16,
    ):
        # Subtract in int64 so that narrow or unsigned types cannot wrap
        # around (e.g. uint8 0 - 1 would otherwise give 255)
        difference = reference_result.astype(np.int64) - test_result.astype(np.int64)
        abs_difference = np.absolute(difference)

        if np.all(abs_difference <= quantize_tolerance):
            _print_result(LogColors.GREEN, f"Results PASS {test_name}")
            return (TestResult.PASS, 0.0, "")

        # Search for the smallest tolerance (up to 10) that would have passed
        tolerance = quantize_tolerance + 1
        while tolerance <= 10 and not np.all(abs_difference <= tolerance):
            tolerance = tolerance + 1

        if tolerance > 10:
            msg = "Integer result does not match and is greater than 10 difference"
        else:
            msg = "Integer result does not match but is within {} difference".format(
                tolerance
            )
        # Fall-through to below to add failure values

    elif reference_result.dtype == bool:
        # The type comparison above already guarantees test_result is bool
        # All boolean values must match
        if np.array_equal(reference_result, test_result):
            _print_result(LogColors.GREEN, f"Results PASS {test_name}")
            return (TestResult.PASS, 0.0, "")
        msg = "Boolean result does not match"
        tolerance = 0.0
        difference = None
        # Fall-through to below to add failure values

    # TODO: update for fp16 tolerance
    elif reference_result.dtype in (np.float32, np.float16):
        tolerance = float_tolerance
        if np.allclose(reference_result, test_result, atol=tolerance, equal_nan=True):
            _print_result(LogColors.GREEN, f"Results PASS {test_name}")
            return (TestResult.PASS, tolerance, "")
        msg = f"Float result does not match within tolerance of {tolerance}"
        difference = reference_result - test_result
        # Fall-through to below to add failure values

    else:
        _print_result(LogColors.RED, f"Results UNSUPPORTED TYPE {test_name}")
        msg = f"Unsupported results type: {reference_result.dtype}"
        return (TestResult.MISMATCH, 0.0, msg)

    # Fall-through for mismatch failure to add values to msg
    _print_result(LogColors.RED, f"Results MISCOMPARE {test_name}")
    # Keep the arrays embedded in the message short
    np.set_printoptions(threshold=128, edgeitems=2)

    if difference is not None:
        tolerance_needed = np.amax(np.absolute(difference))
        msg = f"{msg}\n-- tolerance_needed: {tolerance_needed}"

    msg = "{}\n>> reference_result: {}\n{}".format(
        msg, reference_result.shape, reference_result
    )
    msg = "{}\n<< test_result: {}\n{}".format(msg, test_result.shape, test_result)

    if difference is not None:
        msg = f"{msg}\n!! difference_result: \n{difference}"
    return (TestResult.MISMATCH, tolerance, msg)

274

275

276

def main(argv=None):

Jeremy Johnson

2022-09-15 10:38:17 +0100

[diff] [blame]

277

"""Check that the supplied reference and result files have the same contents."""

Jeremy Johnson

2021-12-15 17:14:56 +0000

[diff] [blame]

278

parser = argparse.ArgumentParser()

279

parser.add_argument(

Jeremy Johnson

2023-09-14 17:02:09 +0100

[diff] [blame]

280

"ref_result_path",

281

type=Path,

282

help="path to the reference model result file to check",

Jeremy Johnson

2021-12-15 17:14:56 +0000

[diff] [blame]

283

)

284

parser.add_argument(

Jeremy Johnson

2023-09-14 17:02:09 +0100

[diff] [blame]

285

"imp_result_path",

286

type=Path,

287

help="path to the implementation result file to check",

Jeremy Johnson

2021-12-15 17:14:56 +0000

[diff] [blame]

288

)

Jeremy Johnson

2022-09-15 10:38:17 +0100

[diff] [blame]

289

parser.add_argument(

290

"--fp-tolerance", type=float, default=DEFAULT_FP_TOLERANCE, help="FP tolerance"

291

)

Jeremy Johnson

2023-09-14 17:02:09 +0100

[diff] [blame]

292

parser.add_argument(

Jeremy Johnson

2023-11-27 15:02:04 +0000

[diff] [blame]

293

"--test-path", type=Path, help="path to the test that produced the results"

Jeremy Johnson

2023-09-14 17:02:09 +0100

[diff] [blame]

294

)

Jeremy Johnson

2023-11-27 15:02:04 +0000

[diff] [blame]

295

# Deprecate the incorrectly formatted option by hiding it

296

parser.add_argument("--test_path", type=Path, help=argparse.SUPPRESS)

Jeremy Johnson

2023-09-14 17:02:09 +0100

[diff] [blame]

parser.add_argument(

"--bnd-result-path",

type=Path,

help="path to the reference model bounds result file for the dot product compliance check",

)

parser.add_argument(

"--ofm-name",

type=str,

help="name of the output tensor to check, defaults to the first ofm_name listed in the test",

)

parser.add_argument(

"--verify-lib-path",

type=Path,

help="path to TOSA verify library",

311

)

Jeremy Johnson

2021-12-15 17:14:56 +0000

[diff] [blame]

312

args = parser.parse_args(argv)

Jeremy Johnson

2021-12-15 17:14:56 +0000

[diff] [blame]

313

Jeremy Johnson

2023-09-14 17:02:09 +0100

[diff] [blame]

314

if args.test_path:

315

# Get details from the test path

316

test_desc_path = args.test_path / "desc.json"

317

if not args.test_path.is_dir() or not test_desc_path.is_file():

318

print(f"Invalid test directory {str(args.test_path)}")

319

return TestResult.MISSING_FILE

320

321

try:

322

with test_desc_path.open("r") as fd:

323

test_desc = json.load(fd)

324

except Exception as e:

325

print(f"Invalid test description file {str(test_desc_path)}: {e}")

326

return TestResult.INCORRECT_FORMAT

327

test_name = args.test_path.name

else:

test_desc = None

test_name = None

Jeremy Johnson

2022-09-15 10:38:17 +0100

[diff] [blame]

332

result, tolerance, msg = test_check(

Jeremy Johnson

2023-09-14 17:02:09 +0100

[diff] [blame]

333

args.ref_result_path,

334

args.imp_result_path,

335

float_tolerance=args.fp_tolerance,

336

test_name=test_name,

337

test_desc=test_desc,

338

bnd_result_path=args.bnd_result_path,

339

ofm_name=args.ofm_name,

340

verify_lib_path=args.verify_lib_path,

Jeremy Johnson

2022-09-15 10:38:17 +0100

[diff] [blame]

341

)

Jeremy Johnson