summaryrefslogtreecommitdiffstats
path: root/third_party/jpeg-xl/lib/jxl/base/iaca.h
blob: e5732dae5c81c76a8803c3855bc5aaf212d940a5 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
// Copyright (c) the JPEG XL Project Authors. All rights reserved.
//
// Use of this source code is governed by a BSD-style
// license that can be found in the LICENSE file.

#ifndef LIB_JXL_BASE_IACA_H_
#define LIB_JXL_BASE_IACA_H_

#include "lib/jxl/base/compiler_specific.h"

// IACA (Intel's Code Analyzer) analyzes instruction latencies, but only for
// code between special markers. These functions embed such markers in an
// executable, but only for reading via IACA - they deliberately trigger a
// crash if executed to ensure they are removed in normal builds.

#ifndef JXL_IACA_ENABLED
#define JXL_IACA_ENABLED 0
#endif

namespace jxl {

// Call before the region of interest.
static JXL_INLINE void BeginIACA() {
#if JXL_IACA_ENABLED && (JXL_COMPILER_GCC || JXL_COMPILER_CLANG)
  asm volatile(
      // UD2 "instruction" raises an invalid opcode exception.
      ".byte 0x0F, 0x0B\n\t"
      // Magic sequence recognized by IACA (MOV + addr32 fs:NOP). This actually
      // clobbers EBX, but we don't care because the code won't be run, and we
      // want IACA to observe the same code the compiler would have generated
      // without this marker.
      "movl $111, %%ebx\n\t"
      ".byte 0x64, 0x67, 0x90\n\t"
      :
      :
      // (Allegedly) clobbering memory may prevent reordering.
      : "memory");
#endif
}

// Call after the region of interest.
static JXL_INLINE void EndIACA() {
#if JXL_IACA_ENABLED && (JXL_COMPILER_GCC || JXL_COMPILER_CLANG)
  asm volatile(
      // See above.
      "movl $222, %%ebx\n\t"
      ".byte 0x64, 0x67, 0x90\n\t"
      // UD2
      ".byte 0x0F, 0x0B\n\t"
      :
      :
      // (Allegedly) clobbering memory may prevent reordering.
      : "memory");
#endif
}

// Add to a scope to mark a region.
struct ScopeIACA {
  JXL_INLINE ScopeIACA() { BeginIACA(); }
  JXL_INLINE ~ScopeIACA() { EndIACA(); }
};

}  // namespace jxl

#endif  // LIB_JXL_BASE_IACA_H_