aboutsummaryrefslogtreecommitdiffstats
path: root/contrib/libs/crcutil/crc32c_sse4_intrin.h
blob: 5338d21d290e97dca9023baf4a1286d32c0f1b4a (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
// Copyright 2010 Google Inc.  All rights reserved. 
// 
// Licensed under the Apache License, Version 2.0 (the "License"); 
// you may not use this file except in compliance with the License. 
// You may obtain a copy of the License at 
// 
//      http://www.apache.org/licenses/LICENSE-2.0 
// 
// Unless required by applicable law or agreed to in writing, software 
// distributed under the License is distributed on an "AS IS" BASIS, 
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 
// See the License for the specific language governing permissions and 
// limitations under the License. 
 
// Provides _mm_crc32_u64/32/8 intrinsics. 
 
#ifndef CRCUTIL_CRC32C_SSE4_INTRIN_H_ 
#define CRCUTIL_CRC32C_SSE4_INTRIN_H_ 
 
#include "platform.h" 
#include "base_types.h" 
 
#if CRCUTIL_USE_MM_CRC32 && (HAVE_I386 || HAVE_AMD64) 
 
#if defined(_MSC_VER) || defined(__SSE4_2__) 
 
#if defined(_MSC_VER) 
#pragma warning(push) 
// '_M_IA64' is not defined as a preprocessor macro 
#pragma warning(disable: 4668) 
#endif  // defined(_MSC_VER) 
 
#include <nmmintrin.h> 
 
#if defined(_MSC_VER) 
#pragma warning(pop) 
#endif  // defined(_MSC_VER) 
 
#elif GCC_VERSION_AVAILABLE(4, 5) && !defined(CRCUTIL_FORCE_ASM_CRC32C) 
// Allow the use of _mm_crc32_u* intrinsic when CRCUTIL_USE_MM_CRC32 
// is set irrespective of "-msse*" settings. This way, the sources 
// may be compiled with "-msse2 -mcrc32" and work on older CPUs, 
// while taking full advantage of "crc32" instruction on newer 
// CPUs (requires dynamic CPU detection). See "interface.cc". 
// 
// If neither -msse4 or -mcrc32 is provided and CRCUTIL_USE_MM_CRC32 is set 
// and CRCUTIL_FORCE_ASM_CRC32 is not set, compile-time error will happen. 
// Why? Becuase GCC disables __builtin_ia32_crc32* intrinsics when compiled 
// without -msse4 or -mcrc32. -msse4 could be detected at run time by checking 
// whether __SSE4_2__ is defined, but there is no way to tell whether the 
// sources are compiled with -mcrc32. 
 
extern __inline unsigned int __attribute__(( 
    __gnu_inline__, __always_inline__, __artificial__)) 
_mm_crc32_u8(unsigned int __C, unsigned char __V) { 
  return __builtin_ia32_crc32qi(__C, __V); 
} 
#ifdef __x86_64__ 
extern __inline unsigned long long __attribute__(( 
    __gnu_inline__, __always_inline__, __artificial__)) 
_mm_crc32_u64(unsigned long long __C, unsigned long long __V) { 
  return __builtin_ia32_crc32di(__C, __V); 
} 
#else 
extern __inline unsigned int __attribute__(( 
    __gnu_inline__, __always_inline__, __artificial__)) 
_mm_crc32_u32(unsigned int __C, unsigned int __V) { 
  return __builtin_ia32_crc32si (__C, __V); 
} 
#endif  // __x86_64__ 
 
#else 
 
// GCC 4.4.x and earlier: use inline asm. 
 
namespace crcutil { 
 
__forceinline uint64 _mm_crc32_u64(uint64 crc, uint64 value) { 
  asm("crc32q %[value], %[crc]\n" : [crc] "+r" (crc) : [value] "rm" (value)); 
  return crc; 
} 
 
__forceinline uint32 _mm_crc32_u32(uint32 crc, uint64 value) { 
  asm("crc32l %[value], %[crc]\n" : [crc] "+r" (crc) : [value] "rm" (value)); 
  return crc; 
} 
 
__forceinline uint32 _mm_crc32_u8(uint32 crc, uint8 value) { 
  asm("crc32b %[value], %[crc]\n" : [crc] "+r" (crc) : [value] "rm" (value)); 
  return crc; 
} 
 
}  // namespace crcutil 
 
#endif 
 
#endif  // CRCUTIL_USE_MM_CRC32 && (HAVE_I386 || HAVE_AMD64) 
 
#endif  // CRCUTIL_CRC32C_SSE4_INTRIN_H_