VirtualBox

source: vbox/trunk/src/VBox/Runtime/testcase/tstRTInlineAsm.cpp@ 50603

Last change on this file since 50603 was 49281, checked in by vboxsync, 11 years ago

cpuid experiment.

  • Property svn:eol-style set to native
  • Property svn:keywords set to Id Revision
File size: 61.3 KB
Line 
1/* $Id: tstRTInlineAsm.cpp 49281 2013-10-24 19:36:28Z vboxsync $ */
2/** @file
3 * IPRT Testcase - inline assembly.
4 */
5
6/*
7 * Copyright (C) 2006-2013 Oracle Corporation
8 *
9 * This file is part of VirtualBox Open Source Edition (OSE), as
10 * available from http://www.virtualbox.org. This file is free software;
11 * you can redistribute it and/or modify it under the terms of the GNU
12 * General Public License (GPL) as published by the Free Software
13 * Foundation, in version 2 as it comes in the "COPYING" file of the
14 * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
15 * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
16 *
17 * The contents of this file may alternatively be used under the terms
18 * of the Common Development and Distribution License Version 1.0
19 * (CDDL) only, as it comes in the "COPYING.CDDL" file of the
20 * VirtualBox OSE distribution, in which case the provisions of the
21 * CDDL are applicable instead of those of the GPL.
22 *
23 * You may elect to license modified versions of this file under the
24 * terms and conditions of either the GPL or the CDDL or both.
25 */
26
27/*******************************************************************************
28* Header Files *
29*******************************************************************************/
30#include <iprt/asm.h>
31#include <iprt/asm-math.h>
32
33/* See http://gcc.gnu.org/bugzilla/show_bug.cgi?id=44018. Only gcc version 4.4
34 * is affected. No harm for the VBox code: If the cpuid code compiles, it works
35 * fine. */
36#if defined(__GNUC__) && defined(RT_ARCH_X86) && defined(__PIC__)
37# if __GNUC__ == 4 && __GNUC_MINOR__ == 4
38# define GCC44_32BIT_PIC
39# endif
40#endif
41
42#if !defined(GCC44_32BIT_PIC) && (defined(RT_ARCH_AMD64) || defined(RT_ARCH_X86))
43# include <iprt/asm-amd64-x86.h>
44#else
45# include <iprt/time.h>
46#endif
47#include <iprt/stream.h>
48#include <iprt/string.h>
49#include <iprt/param.h>
50#include <iprt/thread.h>
51#include <iprt/test.h>
52#include <iprt/time.h>
53
54
55
56/*******************************************************************************
57* Defined Constants And Macros *
58*******************************************************************************/
59#define CHECKVAL(val, expect, fmt) \
60 do \
61 { \
62 if ((val) != (expect)) \
63 { \
64 RTTestFailed(g_hTest, "%s, %d: " #val ": expected " fmt " got " fmt "\n", __FUNCTION__, __LINE__, (expect), (val)); \
65 } \
66 } while (0)
67
68#define CHECKOP(op, expect, fmt, type) \
69 do \
70 { \
71 type val = op; \
72 if (val != (type)(expect)) \
73 { \
74 RTTestFailed(g_hTest, "%s, %d: " #op ": expected " fmt " got " fmt "\n", __FUNCTION__, __LINE__, (type)(expect), val); \
75 } \
76 } while (0)
77
78/**
79 * Calls a worker function with different worker variable storage types.
80 */
81#define DO_SIMPLE_TEST(name, type) \
82 do \
83 { \
84 RTTestISub(#name); \
85 type StackVar; \
86 tst ## name ## Worker(&StackVar); \
87 \
88 type *pVar = (type *)RTTestGuardedAllocHead(g_hTest, sizeof(type)); \
89 RTTEST_CHECK_BREAK(g_hTest, pVar); \
90 tst ## name ## Worker(pVar); \
91 RTTestGuardedFree(g_hTest, pVar); \
92 \
93 pVar = (type *)RTTestGuardedAllocTail(g_hTest, sizeof(type)); \
94 RTTEST_CHECK_BREAK(g_hTest, pVar); \
95 tst ## name ## Worker(pVar); \
96 RTTestGuardedFree(g_hTest, pVar); \
97 } while (0)
98
99
100/*******************************************************************************
101* Global Variables *
102*******************************************************************************/
103/** The test instance. */
104static RTTEST g_hTest;
105
106
107
108#if !defined(GCC44_32BIT_PIC) && (defined(RT_ARCH_AMD64) || defined(RT_ARCH_X86))
109
110const char *getCacheAss(unsigned u)
111{
112 if (u == 0)
113 return "res0 ";
114 if (u == 1)
115 return "direct";
116 if (u >= 256)
117 return "???";
118
119 char *pszRet;
120 RTStrAPrintf(&pszRet, "%d way", u); /* intentional leak! */
121 return pszRet;
122}
123
124
125const char *getL2CacheAss(unsigned u)
126{
127 switch (u)
128 {
129 case 0: return "off ";
130 case 1: return "direct";
131 case 2: return "2 way ";
132 case 3: return "res3 ";
133 case 4: return "4 way ";
134 case 5: return "res5 ";
135 case 6: return "8 way ";
136 case 7: return "res7 ";
137 case 8: return "16 way";
138 case 9: return "res9 ";
139 case 10: return "res10 ";
140 case 11: return "res11 ";
141 case 12: return "res12 ";
142 case 13: return "res13 ";
143 case 14: return "res14 ";
144 case 15: return "fully ";
145 default:
146 return "????";
147 }
148}
149
150
151/**
152 * Test and dump all possible info from the CPUID instruction.
153 *
154 * @remark Bits shared with the libc cpuid.c program. This all written by me, so no worries.
155 * @todo transform the dumping into a generic runtime function. We'll need it for logging!
156 */
157void tstASMCpuId(void)
158{
159 RTTestISub("ASMCpuId");
160
161 unsigned iBit;
162 struct
163 {
164 uint32_t uEBX, uEAX, uEDX, uECX;
165 } s;
166 if (!ASMHasCpuId())
167 {
168 RTTestIPrintf(RTTESTLVL_ALWAYS, "warning! CPU doesn't support CPUID\n");
169 return;
170 }
171
172 /*
173 * Try the 0 function and use that for checking the ASMCpuId_* variants.
174 */
175 ASMCpuId(0, &s.uEAX, &s.uEBX, &s.uECX, &s.uEDX);
176
177 uint32_t u32;
178
179 u32 = ASMCpuId_EAX(0);
180 CHECKVAL(u32, s.uEAX, "%x");
181 u32 = ASMCpuId_EBX(0);
182 CHECKVAL(u32, s.uEBX, "%x");
183 u32 = ASMCpuId_ECX(0);
184 CHECKVAL(u32, s.uECX, "%x");
185 u32 = ASMCpuId_EDX(0);
186 CHECKVAL(u32, s.uEDX, "%x");
187
188 uint32_t uECX2 = s.uECX - 1;
189 uint32_t uEDX2 = s.uEDX - 1;
190 ASMCpuId_ECX_EDX(0, &uECX2, &uEDX2);
191 CHECKVAL(uECX2, s.uECX, "%x");
192 CHECKVAL(uEDX2, s.uEDX, "%x");
193
194 uint32_t uEAX2 = s.uEAX - 1;
195 uint32_t uEBX2 = s.uEBX - 1;
196 uECX2 = s.uECX - 1;
197 uEDX2 = s.uEDX - 1;
198 ASMCpuIdExSlow(0, 0, 0, 0, &uEAX2, &uEBX2, &uECX2, &uEDX2);
199 CHECKVAL(uEAX2, s.uEAX, "%x");
200 CHECKVAL(uEBX2, s.uEBX, "%x");
201 CHECKVAL(uECX2, s.uECX, "%x");
202 CHECKVAL(uEDX2, s.uEDX, "%x");
203
204 /*
205 * Done testing, dump the information.
206 */
207 RTTestIPrintf(RTTESTLVL_ALWAYS, "CPUID Dump\n");
208 ASMCpuId(0, &s.uEAX, &s.uEBX, &s.uECX, &s.uEDX);
209 const uint32_t cFunctions = s.uEAX;
210
211 /* raw dump */
212 RTTestIPrintf(RTTESTLVL_ALWAYS,
213 "\n"
214 " RAW Standard CPUIDs\n"
215 "Function eax ebx ecx edx\n");
216 for (unsigned iStd = 0; iStd <= cFunctions + 3; iStd++)
217 {
218 ASMCpuId_Idx_ECX(iStd, 0, &s.uEAX, &s.uEBX, &s.uECX, &s.uEDX);
219 RTTestIPrintf(RTTESTLVL_ALWAYS, "%08x %08x %08x %08x %08x%s\n",
220 iStd, s.uEAX, s.uEBX, s.uECX, s.uEDX, iStd <= cFunctions ? "" : "*");
221
222 /* Leaf 04 and leaf 0d output depend on the initial value of ECX
223 * The same seems to apply to invalid standard functions */
224 if (iStd > cFunctions)
225 continue;
226 if (iStd != 0x04 && iStd != 0x0b && iStd != 0x0d)
227 {
228 u32 = ASMCpuId_EAX(iStd);
229 CHECKVAL(u32, s.uEAX, "%x");
230
231 uint32_t u32EbxMask = UINT32_MAX;
232 if (iStd == 1)
233 u32EbxMask = UINT32_C(0x00ffffff); /* Omit the local apic ID in case we're rescheduled. */
234 u32 = ASMCpuId_EBX(iStd);
235 CHECKVAL(u32 & u32EbxMask, s.uEBX & u32EbxMask, "%x");
236
237 u32 = ASMCpuId_ECX(iStd);
238 CHECKVAL(u32, s.uECX, "%x");
239 u32 = ASMCpuId_EDX(iStd);
240 CHECKVAL(u32, s.uEDX, "%x");
241
242 uECX2 = s.uECX - 1;
243 uEDX2 = s.uEDX - 1;
244 ASMCpuId_ECX_EDX(iStd, &uECX2, &uEDX2);
245 CHECKVAL(uECX2, s.uECX, "%x");
246 CHECKVAL(uEDX2, s.uEDX, "%x");
247 }
248
249 if (iStd == 0x04)
250 for (uint32_t uECX = 1; s.uEAX & 0x1f; uECX++)
251 {
252 ASMCpuId_Idx_ECX(iStd, uECX, &s.uEAX, &s.uEBX, &s.uECX, &s.uEDX);
253 RTTestIPrintf(RTTESTLVL_ALWAYS, " [%02x] %08x %08x %08x %08x\n", uECX, s.uEAX, s.uEBX, s.uECX, s.uEDX);
254 RTTESTI_CHECK_BREAK(uECX < 128);
255 }
256 else if (iStd == 0x0b)
257 for (uint32_t uECX = 1; (s.uEAX & 0x1f) && (s.uEBX & 0xffff); uECX++)
258 {
259 ASMCpuId_Idx_ECX(iStd, uECX, &s.uEAX, &s.uEBX, &s.uECX, &s.uEDX);
260 RTTestIPrintf(RTTESTLVL_ALWAYS, " [%02x] %08x %08x %08x %08x\n", uECX, s.uEAX, s.uEBX, s.uECX, s.uEDX);
261 RTTESTI_CHECK_BREAK(uECX < 128);
262 }
263 else if (iStd == 0x0d)
264 for (uint32_t uECX = 1; s.uEAX != 0 || s.uEBX != 0 || s.uECX != 0 || s.uEDX != 0; uECX++)
265 {
266 ASMCpuId_Idx_ECX(iStd, uECX, &s.uEAX, &s.uEBX, &s.uECX, &s.uEDX);
267 RTTestIPrintf(RTTESTLVL_ALWAYS, " [%02x] %08x %08x %08x %08x\n", uECX, s.uEAX, s.uEBX, s.uECX, s.uEDX);
268 RTTESTI_CHECK_BREAK(uECX < 128);
269 }
270 }
271
272 /*
273 * Understandable output
274 */
275 ASMCpuId(0, &s.uEAX, &s.uEBX, &s.uECX, &s.uEDX);
276 RTTestIPrintf(RTTESTLVL_ALWAYS,
277 "Name: %.04s%.04s%.04s\n"
278 "Support: 0-%u\n",
279 &s.uEBX, &s.uEDX, &s.uECX, s.uEAX);
280 bool const fIntel = ASMIsIntelCpuEx(s.uEBX, s.uECX, s.uEDX);
281
282 /*
283 * Get Features.
284 */
285 if (cFunctions >= 1)
286 {
287 static const char * const s_apszTypes[4] = { "primary", "overdrive", "MP", "reserved" };
288 ASMCpuId(1, &s.uEAX, &s.uEBX, &s.uECX, &s.uEDX);
289 RTTestIPrintf(RTTESTLVL_ALWAYS,
290 "Family: %#x \tExtended: %#x \tEffective: %#x\n"
291 "Model: %#x \tExtended: %#x \tEffective: %#x\n"
292 "Stepping: %d\n"
293 "Type: %d (%s)\n"
294 "APIC ID: %#04x\n"
295 "Logical CPUs: %d\n"
296 "CLFLUSH Size: %d\n"
297 "Brand ID: %#04x\n",
298 (s.uEAX >> 8) & 0xf, (s.uEAX >> 20) & 0x7f, ASMGetCpuFamily(s.uEAX),
299 (s.uEAX >> 4) & 0xf, (s.uEAX >> 16) & 0x0f, ASMGetCpuModel(s.uEAX, fIntel),
300 ASMGetCpuStepping(s.uEAX),
301 (s.uEAX >> 12) & 0x3, s_apszTypes[(s.uEAX >> 12) & 0x3],
302 (s.uEBX >> 24) & 0xff,
303 (s.uEBX >> 16) & 0xff,
304 (s.uEBX >> 8) & 0xff,
305 (s.uEBX >> 0) & 0xff);
306
307 RTTestIPrintf(RTTESTLVL_ALWAYS, "Features EDX: ");
308 if (s.uEDX & RT_BIT(0)) RTTestIPrintf(RTTESTLVL_ALWAYS, " FPU");
309 if (s.uEDX & RT_BIT(1)) RTTestIPrintf(RTTESTLVL_ALWAYS, " VME");
310 if (s.uEDX & RT_BIT(2)) RTTestIPrintf(RTTESTLVL_ALWAYS, " DE");
311 if (s.uEDX & RT_BIT(3)) RTTestIPrintf(RTTESTLVL_ALWAYS, " PSE");
312 if (s.uEDX & RT_BIT(4)) RTTestIPrintf(RTTESTLVL_ALWAYS, " TSC");
313 if (s.uEDX & RT_BIT(5)) RTTestIPrintf(RTTESTLVL_ALWAYS, " MSR");
314 if (s.uEDX & RT_BIT(6)) RTTestIPrintf(RTTESTLVL_ALWAYS, " PAE");
315 if (s.uEDX & RT_BIT(7)) RTTestIPrintf(RTTESTLVL_ALWAYS, " MCE");
316 if (s.uEDX & RT_BIT(8)) RTTestIPrintf(RTTESTLVL_ALWAYS, " CX8");
317 if (s.uEDX & RT_BIT(9)) RTTestIPrintf(RTTESTLVL_ALWAYS, " APIC");
318 if (s.uEDX & RT_BIT(10)) RTTestIPrintf(RTTESTLVL_ALWAYS, " 10");
319 if (s.uEDX & RT_BIT(11)) RTTestIPrintf(RTTESTLVL_ALWAYS, " SEP");
320 if (s.uEDX & RT_BIT(12)) RTTestIPrintf(RTTESTLVL_ALWAYS, " MTRR");
321 if (s.uEDX & RT_BIT(13)) RTTestIPrintf(RTTESTLVL_ALWAYS, " PGE");
322 if (s.uEDX & RT_BIT(14)) RTTestIPrintf(RTTESTLVL_ALWAYS, " MCA");
323 if (s.uEDX & RT_BIT(15)) RTTestIPrintf(RTTESTLVL_ALWAYS, " CMOV");
324 if (s.uEDX & RT_BIT(16)) RTTestIPrintf(RTTESTLVL_ALWAYS, " PAT");
325 if (s.uEDX & RT_BIT(17)) RTTestIPrintf(RTTESTLVL_ALWAYS, " PSE36");
326 if (s.uEDX & RT_BIT(18)) RTTestIPrintf(RTTESTLVL_ALWAYS, " PSN");
327 if (s.uEDX & RT_BIT(19)) RTTestIPrintf(RTTESTLVL_ALWAYS, " CLFSH");
328 if (s.uEDX & RT_BIT(20)) RTTestIPrintf(RTTESTLVL_ALWAYS, " 20");
329 if (s.uEDX & RT_BIT(21)) RTTestIPrintf(RTTESTLVL_ALWAYS, " DS");
330 if (s.uEDX & RT_BIT(22)) RTTestIPrintf(RTTESTLVL_ALWAYS, " ACPI");
331 if (s.uEDX & RT_BIT(23)) RTTestIPrintf(RTTESTLVL_ALWAYS, " MMX");
332 if (s.uEDX & RT_BIT(24)) RTTestIPrintf(RTTESTLVL_ALWAYS, " FXSR");
333 if (s.uEDX & RT_BIT(25)) RTTestIPrintf(RTTESTLVL_ALWAYS, " SSE");
334 if (s.uEDX & RT_BIT(26)) RTTestIPrintf(RTTESTLVL_ALWAYS, " SSE2");
335 if (s.uEDX & RT_BIT(27)) RTTestIPrintf(RTTESTLVL_ALWAYS, " SS");
336 if (s.uEDX & RT_BIT(28)) RTTestIPrintf(RTTESTLVL_ALWAYS, " HTT");
337 if (s.uEDX & RT_BIT(29)) RTTestIPrintf(RTTESTLVL_ALWAYS, " 29");
338 if (s.uEDX & RT_BIT(30)) RTTestIPrintf(RTTESTLVL_ALWAYS, " 30");
339 if (s.uEDX & RT_BIT(31)) RTTestIPrintf(RTTESTLVL_ALWAYS, " 31");
340 RTTestIPrintf(RTTESTLVL_ALWAYS, "\n");
341
342 /** @todo check intel docs. */
343 RTTestIPrintf(RTTESTLVL_ALWAYS, "Features ECX: ");
344 if (s.uECX & RT_BIT(0)) RTTestIPrintf(RTTESTLVL_ALWAYS, " SSE3");
345 for (iBit = 1; iBit < 13; iBit++)
346 if (s.uECX & RT_BIT(iBit))
347 RTTestIPrintf(RTTESTLVL_ALWAYS, " %d", iBit);
348 if (s.uECX & RT_BIT(13)) RTTestIPrintf(RTTESTLVL_ALWAYS, " CX16");
349 for (iBit = 14; iBit < 32; iBit++)
350 if (s.uECX & RT_BIT(iBit))
351 RTTestIPrintf(RTTESTLVL_ALWAYS, " %d", iBit);
352 RTTestIPrintf(RTTESTLVL_ALWAYS, "\n");
353 }
354
355 /*
356 * Extended.
357 * Implemented after AMD specs.
358 */
359 /** @todo check out the intel specs. */
360 ASMCpuId(0x80000000, &s.uEAX, &s.uEBX, &s.uECX, &s.uEDX);
361 if (!s.uEAX && !s.uEBX && !s.uECX && !s.uEDX)
362 {
363 RTTestIPrintf(RTTESTLVL_ALWAYS, "No extended CPUID info? Check the manual on how to detect this...\n");
364 return;
365 }
366 const uint32_t cExtFunctions = s.uEAX | 0x80000000;
367
368 /* raw dump */
369 RTTestIPrintf(RTTESTLVL_ALWAYS,
370 "\n"
371 " RAW Extended CPUIDs\n"
372 "Function eax ebx ecx edx\n");
373 for (unsigned iExt = 0x80000000; iExt <= cExtFunctions + 3; iExt++)
374 {
375 ASMCpuId(iExt, &s.uEAX, &s.uEBX, &s.uECX, &s.uEDX);
376 RTTestIPrintf(RTTESTLVL_ALWAYS, "%08x %08x %08x %08x %08x%s\n",
377 iExt, s.uEAX, s.uEBX, s.uECX, s.uEDX, iExt <= cExtFunctions ? "" : "*");
378
379 if (iExt > cExtFunctions)
380 continue; /* Invalid extended functions seems change the value if ECX changes */
381 if (iExt == 0x8000001d)
382 continue; /* Takes cache level in ecx. */
383
384 u32 = ASMCpuId_EAX(iExt);
385 CHECKVAL(u32, s.uEAX, "%x");
386 u32 = ASMCpuId_EBX(iExt);
387 CHECKVAL(u32, s.uEBX, "%x");
388 u32 = ASMCpuId_ECX(iExt);
389 CHECKVAL(u32, s.uECX, "%x");
390 u32 = ASMCpuId_EDX(iExt);
391 CHECKVAL(u32, s.uEDX, "%x");
392
393 uECX2 = s.uECX - 1;
394 uEDX2 = s.uEDX - 1;
395 ASMCpuId_ECX_EDX(iExt, &uECX2, &uEDX2);
396 CHECKVAL(uECX2, s.uECX, "%x");
397 CHECKVAL(uEDX2, s.uEDX, "%x");
398 }
399
400 /*
401 * Understandable output
402 */
403 ASMCpuId(0x80000000, &s.uEAX, &s.uEBX, &s.uECX, &s.uEDX);
404 RTTestIPrintf(RTTESTLVL_ALWAYS,
405 "Ext Name: %.4s%.4s%.4s\n"
406 "Ext Supports: 0x80000000-%#010x\n",
407 &s.uEBX, &s.uEDX, &s.uECX, s.uEAX);
408
409 if (cExtFunctions >= 0x80000001)
410 {
411 ASMCpuId(0x80000001, &s.uEAX, &s.uEBX, &s.uECX, &s.uEDX);
412 RTTestIPrintf(RTTESTLVL_ALWAYS,
413 "Family: %#x \tExtended: %#x \tEffective: %#x\n"
414 "Model: %#x \tExtended: %#x \tEffective: %#x\n"
415 "Stepping: %d\n"
416 "Brand ID: %#05x\n",
417 (s.uEAX >> 8) & 0xf, (s.uEAX >> 20) & 0x7f, ASMGetCpuFamily(s.uEAX),
418 (s.uEAX >> 4) & 0xf, (s.uEAX >> 16) & 0x0f, ASMGetCpuModel(s.uEAX, fIntel),
419 ASMGetCpuStepping(s.uEAX),
420 s.uEBX & 0xfff);
421
422 RTTestIPrintf(RTTESTLVL_ALWAYS, "Features EDX: ");
423 if (s.uEDX & RT_BIT(0)) RTTestIPrintf(RTTESTLVL_ALWAYS, " FPU");
424 if (s.uEDX & RT_BIT(1)) RTTestIPrintf(RTTESTLVL_ALWAYS, " VME");
425 if (s.uEDX & RT_BIT(2)) RTTestIPrintf(RTTESTLVL_ALWAYS, " DE");
426 if (s.uEDX & RT_BIT(3)) RTTestIPrintf(RTTESTLVL_ALWAYS, " PSE");
427 if (s.uEDX & RT_BIT(4)) RTTestIPrintf(RTTESTLVL_ALWAYS, " TSC");
428 if (s.uEDX & RT_BIT(5)) RTTestIPrintf(RTTESTLVL_ALWAYS, " MSR");
429 if (s.uEDX & RT_BIT(6)) RTTestIPrintf(RTTESTLVL_ALWAYS, " PAE");
430 if (s.uEDX & RT_BIT(7)) RTTestIPrintf(RTTESTLVL_ALWAYS, " MCE");
431 if (s.uEDX & RT_BIT(8)) RTTestIPrintf(RTTESTLVL_ALWAYS, " CMPXCHG8B");
432 if (s.uEDX & RT_BIT(9)) RTTestIPrintf(RTTESTLVL_ALWAYS, " APIC");
433 if (s.uEDX & RT_BIT(10)) RTTestIPrintf(RTTESTLVL_ALWAYS, " 10");
434 if (s.uEDX & RT_BIT(11)) RTTestIPrintf(RTTESTLVL_ALWAYS, " SysCallSysRet");
435 if (s.uEDX & RT_BIT(12)) RTTestIPrintf(RTTESTLVL_ALWAYS, " MTRR");
436 if (s.uEDX & RT_BIT(13)) RTTestIPrintf(RTTESTLVL_ALWAYS, " PGE");
437 if (s.uEDX & RT_BIT(14)) RTTestIPrintf(RTTESTLVL_ALWAYS, " MCA");
438 if (s.uEDX & RT_BIT(15)) RTTestIPrintf(RTTESTLVL_ALWAYS, " CMOV");
439 if (s.uEDX & RT_BIT(16)) RTTestIPrintf(RTTESTLVL_ALWAYS, " PAT");
440 if (s.uEDX & RT_BIT(17)) RTTestIPrintf(RTTESTLVL_ALWAYS, " PSE36");
441 if (s.uEDX & RT_BIT(18)) RTTestIPrintf(RTTESTLVL_ALWAYS, " 18");
442 if (s.uEDX & RT_BIT(19)) RTTestIPrintf(RTTESTLVL_ALWAYS, " 19");
443 if (s.uEDX & RT_BIT(20)) RTTestIPrintf(RTTESTLVL_ALWAYS, " NX");
444 if (s.uEDX & RT_BIT(21)) RTTestIPrintf(RTTESTLVL_ALWAYS, " 21");
445 if (s.uEDX & RT_BIT(22)) RTTestIPrintf(RTTESTLVL_ALWAYS, " MmxExt");
446 if (s.uEDX & RT_BIT(23)) RTTestIPrintf(RTTESTLVL_ALWAYS, " MMX");
447 if (s.uEDX & RT_BIT(24)) RTTestIPrintf(RTTESTLVL_ALWAYS, " FXSR");
448 if (s.uEDX & RT_BIT(25)) RTTestIPrintf(RTTESTLVL_ALWAYS, " FastFXSR");
449 if (s.uEDX & RT_BIT(26)) RTTestIPrintf(RTTESTLVL_ALWAYS, " 26");
450 if (s.uEDX & RT_BIT(27)) RTTestIPrintf(RTTESTLVL_ALWAYS, " RDTSCP");
451 if (s.uEDX & RT_BIT(28)) RTTestIPrintf(RTTESTLVL_ALWAYS, " 28");
452 if (s.uEDX & RT_BIT(29)) RTTestIPrintf(RTTESTLVL_ALWAYS, " LongMode");
453 if (s.uEDX & RT_BIT(30)) RTTestIPrintf(RTTESTLVL_ALWAYS, " 3DNowExt");
454 if (s.uEDX & RT_BIT(31)) RTTestIPrintf(RTTESTLVL_ALWAYS, " 3DNow");
455 RTTestIPrintf(RTTESTLVL_ALWAYS, "\n");
456
457 RTTestIPrintf(RTTESTLVL_ALWAYS, "Features ECX: ");
458 if (s.uECX & RT_BIT(0)) RTTestIPrintf(RTTESTLVL_ALWAYS, " LahfSahf");
459 if (s.uECX & RT_BIT(1)) RTTestIPrintf(RTTESTLVL_ALWAYS, " CmpLegacy");
460 if (s.uECX & RT_BIT(2)) RTTestIPrintf(RTTESTLVL_ALWAYS, " SVM");
461 if (s.uECX & RT_BIT(3)) RTTestIPrintf(RTTESTLVL_ALWAYS, " 3");
462 if (s.uECX & RT_BIT(4)) RTTestIPrintf(RTTESTLVL_ALWAYS, " AltMovCr8");
463 for (iBit = 5; iBit < 32; iBit++)
464 if (s.uECX & RT_BIT(iBit))
465 RTTestIPrintf(RTTESTLVL_ALWAYS, " %d", iBit);
466 RTTestIPrintf(RTTESTLVL_ALWAYS, "\n");
467 }
468
469 char szString[4*4*3+1] = {0};
470 if (cExtFunctions >= 0x80000002)
471 ASMCpuId(0x80000002, &szString[0 + 0], &szString[0 + 4], &szString[0 + 8], &szString[0 + 12]);
472 if (cExtFunctions >= 0x80000003)
473 ASMCpuId(0x80000003, &szString[16 + 0], &szString[16 + 4], &szString[16 + 8], &szString[16 + 12]);
474 if (cExtFunctions >= 0x80000004)
475 ASMCpuId(0x80000004, &szString[32 + 0], &szString[32 + 4], &szString[32 + 8], &szString[32 + 12]);
476 if (cExtFunctions >= 0x80000002)
477 RTTestIPrintf(RTTESTLVL_ALWAYS, "Full Name: %s\n", szString);
478
479 if (cExtFunctions >= 0x80000005)
480 {
481 ASMCpuId(0x80000005, &s.uEAX, &s.uEBX, &s.uECX, &s.uEDX);
482 RTTestIPrintf(RTTESTLVL_ALWAYS,
483 "TLB 2/4M Instr/Uni: %s %3d entries\n"
484 "TLB 2/4M Data: %s %3d entries\n",
485 getCacheAss((s.uEAX >> 8) & 0xff), (s.uEAX >> 0) & 0xff,
486 getCacheAss((s.uEAX >> 24) & 0xff), (s.uEAX >> 16) & 0xff);
487 RTTestIPrintf(RTTESTLVL_ALWAYS,
488 "TLB 4K Instr/Uni: %s %3d entries\n"
489 "TLB 4K Data: %s %3d entries\n",
490 getCacheAss((s.uEBX >> 8) & 0xff), (s.uEBX >> 0) & 0xff,
491 getCacheAss((s.uEBX >> 24) & 0xff), (s.uEBX >> 16) & 0xff);
492 RTTestIPrintf(RTTESTLVL_ALWAYS,
493 "L1 Instr Cache Line Size: %d bytes\n"
494 "L1 Instr Cache Lines Per Tag: %d\n"
495 "L1 Instr Cache Associativity: %s\n"
496 "L1 Instr Cache Size: %d KB\n",
497 (s.uEDX >> 0) & 0xff,
498 (s.uEDX >> 8) & 0xff,
499 getCacheAss((s.uEDX >> 16) & 0xff),
500 (s.uEDX >> 24) & 0xff);
501 RTTestIPrintf(RTTESTLVL_ALWAYS,
502 "L1 Data Cache Line Size: %d bytes\n"
503 "L1 Data Cache Lines Per Tag: %d\n"
504 "L1 Data Cache Associativity: %s\n"
505 "L1 Data Cache Size: %d KB\n",
506 (s.uECX >> 0) & 0xff,
507 (s.uECX >> 8) & 0xff,
508 getCacheAss((s.uECX >> 16) & 0xff),
509 (s.uECX >> 24) & 0xff);
510 }
511
512 if (cExtFunctions >= 0x80000006)
513 {
514 ASMCpuId(0x80000006, &s.uEAX, &s.uEBX, &s.uECX, &s.uEDX);
515 RTTestIPrintf(RTTESTLVL_ALWAYS,
516 "L2 TLB 2/4M Instr/Uni: %s %4d entries\n"
517 "L2 TLB 2/4M Data: %s %4d entries\n",
518 getL2CacheAss((s.uEAX >> 12) & 0xf), (s.uEAX >> 0) & 0xfff,
519 getL2CacheAss((s.uEAX >> 28) & 0xf), (s.uEAX >> 16) & 0xfff);
520 RTTestIPrintf(RTTESTLVL_ALWAYS,
521 "L2 TLB 4K Instr/Uni: %s %4d entries\n"
522 "L2 TLB 4K Data: %s %4d entries\n",
523 getL2CacheAss((s.uEBX >> 12) & 0xf), (s.uEBX >> 0) & 0xfff,
524 getL2CacheAss((s.uEBX >> 28) & 0xf), (s.uEBX >> 16) & 0xfff);
525 RTTestIPrintf(RTTESTLVL_ALWAYS,
526 "L2 Cache Line Size: %d bytes\n"
527 "L2 Cache Lines Per Tag: %d\n"
528 "L2 Cache Associativity: %s\n"
529 "L2 Cache Size: %d KB\n",
530 (s.uEDX >> 0) & 0xff,
531 (s.uEDX >> 8) & 0xf,
532 getL2CacheAss((s.uEDX >> 12) & 0xf),
533 (s.uEDX >> 16) & 0xffff);
534 }
535
536 if (cExtFunctions >= 0x80000007)
537 {
538 ASMCpuId(0x80000007, &s.uEAX, &s.uEBX, &s.uECX, &s.uEDX);
539 RTTestIPrintf(RTTESTLVL_ALWAYS, "APM Features: ");
540 if (s.uEDX & RT_BIT(0)) RTTestIPrintf(RTTESTLVL_ALWAYS, " TS");
541 if (s.uEDX & RT_BIT(1)) RTTestIPrintf(RTTESTLVL_ALWAYS, " FID");
542 if (s.uEDX & RT_BIT(2)) RTTestIPrintf(RTTESTLVL_ALWAYS, " VID");
543 if (s.uEDX & RT_BIT(3)) RTTestIPrintf(RTTESTLVL_ALWAYS, " TTP");
544 if (s.uEDX & RT_BIT(4)) RTTestIPrintf(RTTESTLVL_ALWAYS, " TM");
545 if (s.uEDX & RT_BIT(5)) RTTestIPrintf(RTTESTLVL_ALWAYS, " STC");
546 if (s.uEDX & RT_BIT(6)) RTTestIPrintf(RTTESTLVL_ALWAYS, " 6");
547 if (s.uEDX & RT_BIT(7)) RTTestIPrintf(RTTESTLVL_ALWAYS, " 7");
548 if (s.uEDX & RT_BIT(8)) RTTestIPrintf(RTTESTLVL_ALWAYS, " TscInvariant");
549 for (iBit = 9; iBit < 32; iBit++)
550 if (s.uEDX & RT_BIT(iBit))
551 RTTestIPrintf(RTTESTLVL_ALWAYS, " %d", iBit);
552 RTTestIPrintf(RTTESTLVL_ALWAYS, "\n");
553 }
554
555 if (cExtFunctions >= 0x80000008)
556 {
557 ASMCpuId(0x80000008, &s.uEAX, &s.uEBX, &s.uECX, &s.uEDX);
558 RTTestIPrintf(RTTESTLVL_ALWAYS,
559 "Physical Address Width: %d bits\n"
560 "Virtual Address Width: %d bits\n"
561 "Guest Physical Address Width: %d bits\n",
562 (s.uEAX >> 0) & 0xff,
563 (s.uEAX >> 8) & 0xff,
564 (s.uEAX >> 16) & 0xff);
565 RTTestIPrintf(RTTESTLVL_ALWAYS,
566 "Physical Core Count: %d\n",
567 ((s.uECX >> 0) & 0xff) + 1);
568 if ((s.uECX >> 12) & 0xf)
569 RTTestIPrintf(RTTESTLVL_ALWAYS, "ApicIdCoreIdSize: %d bits\n", (s.uECX >> 12) & 0xf);
570 }
571
572 if (cExtFunctions >= 0x8000000a)
573 {
574 ASMCpuId(0x8000000a, &s.uEAX, &s.uEBX, &s.uECX, &s.uEDX);
575 RTTestIPrintf(RTTESTLVL_ALWAYS,
576 "SVM Revision: %d (%#x)\n"
577 "Number of Address Space IDs: %d (%#x)\n",
578 s.uEAX & 0xff, s.uEAX & 0xff,
579 s.uEBX, s.uEBX);
580 }
581}
582
583# if 0
584static void bruteForceCpuId(void)
585{
586 RTTestISub("brute force CPUID leafs");
587 uint32_t auPrevValues[4] = { 0, 0, 0, 0};
588 uint32_t uLeaf = 0;
589 do
590 {
591 uint32_t auValues[4];
592 ASMCpuIdExSlow(uLeaf, 0, 0, 0, &auValues[0], &auValues[1], &auValues[2], &auValues[3]);
593 if ( (auValues[0] != auPrevValues[0] && auValues[0] != uLeaf)
594 || (auValues[1] != auPrevValues[1] && auValues[1] != 0)
595 || (auValues[2] != auPrevValues[2] && auValues[2] != 0)
596 || (auValues[3] != auPrevValues[3] && auValues[3] != 0)
597 || (uLeaf & (UINT32_C(0x08000000) - UINT32_C(1))) == 0)
598 {
599 RTTestIPrintf(RTTESTLVL_ALWAYS,
600 "%08x: %08x %08x %08x %08x\n", uLeaf,
601 auValues[0], auValues[1], auValues[2], auValues[3]);
602 }
603 auPrevValues[0] = auValues[0];
604 auPrevValues[1] = auValues[1];
605 auPrevValues[2] = auValues[2];
606 auPrevValues[3] = auValues[3];
607
608 //uint32_t uSubLeaf = 0;
609 //do
610 //{
611 //
612 //
613 //} while (false);
614 } while (uLeaf++ < UINT32_MAX);
615}
616# endif
617
618#endif /* AMD64 || X86 */
619
620DECLINLINE(void) tstASMAtomicXchgU8Worker(uint8_t volatile *pu8)
621{
622 *pu8 = 0;
623 CHECKOP(ASMAtomicXchgU8(pu8, 1), 0, "%#x", uint8_t);
624 CHECKVAL(*pu8, 1, "%#x");
625
626 CHECKOP(ASMAtomicXchgU8(pu8, 0), 1, "%#x", uint8_t);
627 CHECKVAL(*pu8, 0, "%#x");
628
629 CHECKOP(ASMAtomicXchgU8(pu8, 0xff), 0, "%#x", uint8_t);
630 CHECKVAL(*pu8, 0xff, "%#x");
631
632 CHECKOP(ASMAtomicXchgU8(pu8, 0x87), 0xffff, "%#x", uint8_t);
633 CHECKVAL(*pu8, 0x87, "%#x");
634}
635
636
637static void tstASMAtomicXchgU8(void)
638{
639 DO_SIMPLE_TEST(ASMAtomicXchgU8, uint8_t);
640}
641
642
643DECLINLINE(void) tstASMAtomicXchgU16Worker(uint16_t volatile *pu16)
644{
645 *pu16 = 0;
646
647 CHECKOP(ASMAtomicXchgU16(pu16, 1), 0, "%#x", uint16_t);
648 CHECKVAL(*pu16, 1, "%#x");
649
650 CHECKOP(ASMAtomicXchgU16(pu16, 0), 1, "%#x", uint16_t);
651 CHECKVAL(*pu16, 0, "%#x");
652
653 CHECKOP(ASMAtomicXchgU16(pu16, 0xffff), 0, "%#x", uint16_t);
654 CHECKVAL(*pu16, 0xffff, "%#x");
655
656 CHECKOP(ASMAtomicXchgU16(pu16, 0x8765), 0xffff, "%#x", uint16_t);
657 CHECKVAL(*pu16, 0x8765, "%#x");
658}
659
660
661static void tstASMAtomicXchgU16(void)
662{
663 DO_SIMPLE_TEST(ASMAtomicXchgU16, uint16_t);
664}
665
666
667DECLINLINE(void) tstASMAtomicXchgU32Worker(uint32_t volatile *pu32)
668{
669 *pu32 = 0;
670
671 CHECKOP(ASMAtomicXchgU32(pu32, 1), 0, "%#x", uint32_t);
672 CHECKVAL(*pu32, 1, "%#x");
673
674 CHECKOP(ASMAtomicXchgU32(pu32, 0), 1, "%#x", uint32_t);
675 CHECKVAL(*pu32, 0, "%#x");
676
677 CHECKOP(ASMAtomicXchgU32(pu32, ~UINT32_C(0)), 0, "%#x", uint32_t);
678 CHECKVAL(*pu32, ~UINT32_C(0), "%#x");
679
680 CHECKOP(ASMAtomicXchgU32(pu32, 0x87654321), ~UINT32_C(0), "%#x", uint32_t);
681 CHECKVAL(*pu32, 0x87654321, "%#x");
682}
683
684
685static void tstASMAtomicXchgU32(void)
686{
687 DO_SIMPLE_TEST(ASMAtomicXchgU32, uint32_t);
688}
689
690
691DECLINLINE(void) tstASMAtomicXchgU64Worker(uint64_t volatile *pu64)
692{
693 *pu64 = 0;
694
695 CHECKOP(ASMAtomicXchgU64(pu64, 1), UINT64_C(0), "%#llx", uint64_t);
696 CHECKVAL(*pu64, UINT64_C(1), "%#llx");
697
698 CHECKOP(ASMAtomicXchgU64(pu64, 0), UINT64_C(1), "%#llx", uint64_t);
699 CHECKVAL(*pu64, UINT64_C(0), "%#llx");
700
701 CHECKOP(ASMAtomicXchgU64(pu64, ~UINT64_C(0)), UINT64_C(0), "%#llx", uint64_t);
702 CHECKVAL(*pu64, ~UINT64_C(0), "%#llx");
703
704 CHECKOP(ASMAtomicXchgU64(pu64, UINT64_C(0xfedcba0987654321)), ~UINT64_C(0), "%#llx", uint64_t);
705 CHECKVAL(*pu64, UINT64_C(0xfedcba0987654321), "%#llx");
706}
707
708
709static void tstASMAtomicXchgU64(void)
710{
711 DO_SIMPLE_TEST(ASMAtomicXchgU64, uint64_t);
712}
713
714
715DECLINLINE(void) tstASMAtomicXchgPtrWorker(void * volatile *ppv)
716{
717 *ppv = NULL;
718
719 CHECKOP(ASMAtomicXchgPtr(ppv, (void *)(~(uintptr_t)0)), NULL, "%p", void *);
720 CHECKVAL(*ppv, (void *)(~(uintptr_t)0), "%p");
721
722 CHECKOP(ASMAtomicXchgPtr(ppv, (void *)0x87654321), (void *)(~(uintptr_t)0), "%p", void *);
723 CHECKVAL(*ppv, (void *)0x87654321, "%p");
724
725 CHECKOP(ASMAtomicXchgPtr(ppv, NULL), (void *)0x87654321, "%p", void *);
726 CHECKVAL(*ppv, NULL, "%p");
727}
728
729
730static void tstASMAtomicXchgPtr(void)
731{
732 DO_SIMPLE_TEST(ASMAtomicXchgPtr, void *);
733}
734
735
736DECLINLINE(void) tstASMAtomicCmpXchgU8Worker(uint8_t volatile *pu8)
737{
738 *pu8 = 0xff;
739
740 CHECKOP(ASMAtomicCmpXchgU8(pu8, 0, 0), false, "%d", bool);
741 CHECKVAL(*pu8, 0xff, "%x");
742
743 CHECKOP(ASMAtomicCmpXchgU8(pu8, 0, 0xff), true, "%d", bool);
744 CHECKVAL(*pu8, 0, "%x");
745
746 CHECKOP(ASMAtomicCmpXchgU8(pu8, 0x79, 0xff), false, "%d", bool);
747 CHECKVAL(*pu8, 0, "%x");
748
749 CHECKOP(ASMAtomicCmpXchgU8(pu8, 0x97, 0), true, "%d", bool);
750 CHECKVAL(*pu8, 0x97, "%x");
751}
752
753
754static void tstASMAtomicCmpXchgU8(void)
755{
756 DO_SIMPLE_TEST(ASMAtomicCmpXchgU8, uint8_t);
757}
758
759
760DECLINLINE(void) tstASMAtomicCmpXchgU32Worker(uint32_t volatile *pu32)
761{
762 *pu32 = UINT32_C(0xffffffff);
763
764 CHECKOP(ASMAtomicCmpXchgU32(pu32, 0, 0), false, "%d", bool);
765 CHECKVAL(*pu32, UINT32_C(0xffffffff), "%x");
766
767 CHECKOP(ASMAtomicCmpXchgU32(pu32, 0, UINT32_C(0xffffffff)), true, "%d", bool);
768 CHECKVAL(*pu32, 0, "%x");
769
770 CHECKOP(ASMAtomicCmpXchgU32(pu32, UINT32_C(0x8008efd), UINT32_C(0xffffffff)), false, "%d", bool);
771 CHECKVAL(*pu32, 0, "%x");
772
773 CHECKOP(ASMAtomicCmpXchgU32(pu32, UINT32_C(0x8008efd), 0), true, "%d", bool);
774 CHECKVAL(*pu32, UINT32_C(0x8008efd), "%x");
775}
776
777
778static void tstASMAtomicCmpXchgU32(void)
779{
780 DO_SIMPLE_TEST(ASMAtomicCmpXchgU32, uint32_t);
781}
782
783
784
785DECLINLINE(void) tstASMAtomicCmpXchgU64Worker(uint64_t volatile *pu64)
786{
787 *pu64 = UINT64_C(0xffffffffffffff);
788
789 CHECKOP(ASMAtomicCmpXchgU64(pu64, 0, 0), false, "%d", bool);
790 CHECKVAL(*pu64, UINT64_C(0xffffffffffffff), "%#llx");
791
792 CHECKOP(ASMAtomicCmpXchgU64(pu64, 0, UINT64_C(0xffffffffffffff)), true, "%d", bool);
793 CHECKVAL(*pu64, 0, "%x");
794
795 CHECKOP(ASMAtomicCmpXchgU64(pu64, UINT64_C(0x80040008008efd), UINT64_C(0xffffffff)), false, "%d", bool);
796 CHECKVAL(*pu64, 0, "%x");
797
798 CHECKOP(ASMAtomicCmpXchgU64(pu64, UINT64_C(0x80040008008efd), UINT64_C(0xffffffff00000000)), false, "%d", bool);
799 CHECKVAL(*pu64, 0, "%x");
800
801 CHECKOP(ASMAtomicCmpXchgU64(pu64, UINT64_C(0x80040008008efd), 0), true, "%d", bool);
802 CHECKVAL(*pu64, UINT64_C(0x80040008008efd), "%#llx");
803}
804
805
806static void tstASMAtomicCmpXchgU64(void)
807{
808 DO_SIMPLE_TEST(ASMAtomicCmpXchgU64, uint64_t);
809}
810
811
812DECLINLINE(void) tstASMAtomicCmpXchgExU32Worker(uint32_t volatile *pu32)
813{
814 *pu32 = UINT32_C(0xffffffff);
815 uint32_t u32Old = UINT32_C(0x80005111);
816
817 CHECKOP(ASMAtomicCmpXchgExU32(pu32, 0, 0, &u32Old), false, "%d", bool);
818 CHECKVAL(*pu32, UINT32_C(0xffffffff), "%x");
819 CHECKVAL(u32Old, UINT32_C(0xffffffff), "%x");
820
821 CHECKOP(ASMAtomicCmpXchgExU32(pu32, 0, UINT32_C(0xffffffff), &u32Old), true, "%d", bool);
822 CHECKVAL(*pu32, 0, "%x");
823 CHECKVAL(u32Old, UINT32_C(0xffffffff), "%x");
824
825 CHECKOP(ASMAtomicCmpXchgExU32(pu32, UINT32_C(0x8008efd), UINT32_C(0xffffffff), &u32Old), false, "%d", bool);
826 CHECKVAL(*pu32, 0, "%x");
827 CHECKVAL(u32Old, 0, "%x");
828
829 CHECKOP(ASMAtomicCmpXchgExU32(pu32, UINT32_C(0x8008efd), 0, &u32Old), true, "%d", bool);
830 CHECKVAL(*pu32, UINT32_C(0x8008efd), "%x");
831 CHECKVAL(u32Old, 0, "%x");
832
833 CHECKOP(ASMAtomicCmpXchgExU32(pu32, 0, UINT32_C(0x8008efd), &u32Old), true, "%d", bool);
834 CHECKVAL(*pu32, 0, "%x");
835 CHECKVAL(u32Old, UINT32_C(0x8008efd), "%x");
836}
837
838
839static void tstASMAtomicCmpXchgExU32(void)
840{
841 DO_SIMPLE_TEST(ASMAtomicCmpXchgExU32, uint32_t);
842}
843
844
845DECLINLINE(void) tstASMAtomicCmpXchgExU64Worker(uint64_t volatile *pu64)
846{
847 *pu64 = UINT64_C(0xffffffffffffffff);
848 uint64_t u64Old = UINT64_C(0x8000000051111111);
849
850 CHECKOP(ASMAtomicCmpXchgExU64(pu64, 0, 0, &u64Old), false, "%d", bool);
851 CHECKVAL(*pu64, UINT64_C(0xffffffffffffffff), "%llx");
852 CHECKVAL(u64Old, UINT64_C(0xffffffffffffffff), "%llx");
853
854 CHECKOP(ASMAtomicCmpXchgExU64(pu64, 0, UINT64_C(0xffffffffffffffff), &u64Old), true, "%d", bool);
855 CHECKVAL(*pu64, UINT64_C(0), "%llx");
856 CHECKVAL(u64Old, UINT64_C(0xffffffffffffffff), "%llx");
857
858 CHECKOP(ASMAtomicCmpXchgExU64(pu64, UINT64_C(0x80040008008efd), 0xffffffff, &u64Old), false, "%d", bool);
859 CHECKVAL(*pu64, UINT64_C(0), "%llx");
860 CHECKVAL(u64Old, UINT64_C(0), "%llx");
861
862 CHECKOP(ASMAtomicCmpXchgExU64(pu64, UINT64_C(0x80040008008efd), UINT64_C(0xffffffff00000000), &u64Old), false, "%d", bool);
863 CHECKVAL(*pu64, UINT64_C(0), "%llx");
864 CHECKVAL(u64Old, UINT64_C(0), "%llx");
865
866 CHECKOP(ASMAtomicCmpXchgExU64(pu64, UINT64_C(0x80040008008efd), 0, &u64Old), true, "%d", bool);
867 CHECKVAL(*pu64, UINT64_C(0x80040008008efd), "%llx");
868 CHECKVAL(u64Old, UINT64_C(0), "%llx");
869
870 CHECKOP(ASMAtomicCmpXchgExU64(pu64, 0, UINT64_C(0x80040008008efd), &u64Old), true, "%d", bool);
871 CHECKVAL(*pu64, UINT64_C(0), "%llx");
872 CHECKVAL(u64Old, UINT64_C(0x80040008008efd), "%llx");
873}
874
875
876static void tstASMAtomicCmpXchgExU64(void)
877{
878 DO_SIMPLE_TEST(ASMAtomicCmpXchgExU64, uint64_t);
879}
880
881
882DECLINLINE(void) tstASMAtomicReadU64Worker(uint64_t volatile *pu64)
883{
884 *pu64 = 0;
885
886 CHECKOP(ASMAtomicReadU64(pu64), UINT64_C(0), "%#llx", uint64_t);
887 CHECKVAL(*pu64, UINT64_C(0), "%#llx");
888
889 *pu64 = ~UINT64_C(0);
890 CHECKOP(ASMAtomicReadU64(pu64), ~UINT64_C(0), "%#llx", uint64_t);
891 CHECKVAL(*pu64, ~UINT64_C(0), "%#llx");
892
893 *pu64 = UINT64_C(0xfedcba0987654321);
894 CHECKOP(ASMAtomicReadU64(pu64), UINT64_C(0xfedcba0987654321), "%#llx", uint64_t);
895 CHECKVAL(*pu64, UINT64_C(0xfedcba0987654321), "%#llx");
896}
897
898
899static void tstASMAtomicReadU64(void)
900{
901 DO_SIMPLE_TEST(ASMAtomicReadU64, uint64_t);
902}
903
904
905DECLINLINE(void) tstASMAtomicUoReadU64Worker(uint64_t volatile *pu64)
906{
907 *pu64 = 0;
908
909 CHECKOP(ASMAtomicUoReadU64(pu64), UINT64_C(0), "%#llx", uint64_t);
910 CHECKVAL(*pu64, UINT64_C(0), "%#llx");
911
912 *pu64 = ~UINT64_C(0);
913 CHECKOP(ASMAtomicUoReadU64(pu64), ~UINT64_C(0), "%#llx", uint64_t);
914 CHECKVAL(*pu64, ~UINT64_C(0), "%#llx");
915
916 *pu64 = UINT64_C(0xfedcba0987654321);
917 CHECKOP(ASMAtomicUoReadU64(pu64), UINT64_C(0xfedcba0987654321), "%#llx", uint64_t);
918 CHECKVAL(*pu64, UINT64_C(0xfedcba0987654321), "%#llx");
919}
920
921
922static void tstASMAtomicUoReadU64(void)
923{
924 DO_SIMPLE_TEST(ASMAtomicUoReadU64, uint64_t);
925}
926
927
928DECLINLINE(void) tstASMAtomicAddS32Worker(int32_t *pi32)
929{
930 int32_t i32Rc;
931 *pi32 = 10;
932#define MYCHECK(op, rc, val) \
933 do { \
934 i32Rc = op; \
935 if (i32Rc != (rc)) \
936 RTTestFailed(g_hTest, "%s, %d: FAILURE: %s -> %d expected %d\n", __FUNCTION__, __LINE__, #op, i32Rc, rc); \
937 if (*pi32 != (val)) \
938 RTTestFailed(g_hTest, "%s, %d: FAILURE: %s => *pi32=%d expected %d\n", __FUNCTION__, __LINE__, #op, *pi32, val); \
939 } while (0)
940 MYCHECK(ASMAtomicAddS32(pi32, 1), 10, 11);
941 MYCHECK(ASMAtomicAddS32(pi32, -2), 11, 9);
942 MYCHECK(ASMAtomicAddS32(pi32, -9), 9, 0);
943 MYCHECK(ASMAtomicAddS32(pi32, -0x7fffffff), 0, -0x7fffffff);
944 MYCHECK(ASMAtomicAddS32(pi32, 0), -0x7fffffff, -0x7fffffff);
945 MYCHECK(ASMAtomicAddS32(pi32, 0x7fffffff), -0x7fffffff, 0);
946 MYCHECK(ASMAtomicAddS32(pi32, 0), 0, 0);
947#undef MYCHECK
948}
949
950static void tstASMAtomicAddS32(void)
951{
952 DO_SIMPLE_TEST(ASMAtomicAddS32, int32_t);
953}
954
955
956DECLINLINE(void) tstASMAtomicAddS64Worker(int64_t volatile *pi64)
957{
958 int64_t i64Rc;
959 *pi64 = 10;
960#define MYCHECK(op, rc, val) \
961 do { \
962 i64Rc = op; \
963 if (i64Rc != (rc)) \
964 RTTestFailed(g_hTest, "%s, %d: FAILURE: %s -> %llx expected %llx\n", __FUNCTION__, __LINE__, #op, i64Rc, (int64_t)rc); \
965 if (*pi64 != (val)) \
966 RTTestFailed(g_hTest, "%s, %d: FAILURE: %s => *pi64=%llx expected %llx\n", __FUNCTION__, __LINE__, #op, *pi64, (int64_t)(val)); \
967 } while (0)
968 MYCHECK(ASMAtomicAddS64(pi64, 1), 10, 11);
969 MYCHECK(ASMAtomicAddS64(pi64, -2), 11, 9);
970 MYCHECK(ASMAtomicAddS64(pi64, -9), 9, 0);
971 MYCHECK(ASMAtomicAddS64(pi64, -INT64_MAX), 0, -INT64_MAX);
972 MYCHECK(ASMAtomicAddS64(pi64, 0), -INT64_MAX, -INT64_MAX);
973 MYCHECK(ASMAtomicAddS64(pi64, -1), -INT64_MAX, INT64_MIN);
974 MYCHECK(ASMAtomicAddS64(pi64, INT64_MAX), INT64_MIN, -1);
975 MYCHECK(ASMAtomicAddS64(pi64, 1), -1, 0);
976 MYCHECK(ASMAtomicAddS64(pi64, 0), 0, 0);
977#undef MYCHECK
978}
979
980
981static void tstASMAtomicAddS64(void)
982{
983 DO_SIMPLE_TEST(ASMAtomicAddS64, int64_t);
984}
985
986
987DECLINLINE(void) tstASMAtomicDecIncS32Worker(int32_t volatile *pi32)
988{
989 int32_t i32Rc;
990 *pi32 = 10;
991#define MYCHECK(op, rc) \
992 do { \
993 i32Rc = op; \
994 if (i32Rc != (rc)) \
995 RTTestFailed(g_hTest, "%s, %d: FAILURE: %s -> %d expected %d\n", __FUNCTION__, __LINE__, #op, i32Rc, rc); \
996 if (*pi32 != (rc)) \
997 RTTestFailed(g_hTest, "%s, %d: FAILURE: %s => *pi32=%d expected %d\n", __FUNCTION__, __LINE__, #op, *pi32, rc); \
998 } while (0)
999 MYCHECK(ASMAtomicDecS32(pi32), 9);
1000 MYCHECK(ASMAtomicDecS32(pi32), 8);
1001 MYCHECK(ASMAtomicDecS32(pi32), 7);
1002 MYCHECK(ASMAtomicDecS32(pi32), 6);
1003 MYCHECK(ASMAtomicDecS32(pi32), 5);
1004 MYCHECK(ASMAtomicDecS32(pi32), 4);
1005 MYCHECK(ASMAtomicDecS32(pi32), 3);
1006 MYCHECK(ASMAtomicDecS32(pi32), 2);
1007 MYCHECK(ASMAtomicDecS32(pi32), 1);
1008 MYCHECK(ASMAtomicDecS32(pi32), 0);
1009 MYCHECK(ASMAtomicDecS32(pi32), -1);
1010 MYCHECK(ASMAtomicDecS32(pi32), -2);
1011 MYCHECK(ASMAtomicIncS32(pi32), -1);
1012 MYCHECK(ASMAtomicIncS32(pi32), 0);
1013 MYCHECK(ASMAtomicIncS32(pi32), 1);
1014 MYCHECK(ASMAtomicIncS32(pi32), 2);
1015 MYCHECK(ASMAtomicIncS32(pi32), 3);
1016 MYCHECK(ASMAtomicDecS32(pi32), 2);
1017 MYCHECK(ASMAtomicIncS32(pi32), 3);
1018 MYCHECK(ASMAtomicDecS32(pi32), 2);
1019 MYCHECK(ASMAtomicIncS32(pi32), 3);
1020#undef MYCHECK
1021}
1022
1023
1024static void tstASMAtomicDecIncS32(void)
1025{
1026 DO_SIMPLE_TEST(ASMAtomicDecIncS32, int32_t);
1027}
1028
1029
1030DECLINLINE(void) tstASMAtomicDecIncS64Worker(int64_t volatile *pi64)
1031{
1032 int64_t i64Rc;
1033 *pi64 = 10;
1034#define MYCHECK(op, rc) \
1035 do { \
1036 i64Rc = op; \
1037 if (i64Rc != (rc)) \
1038 RTTestFailed(g_hTest, "%s, %d: FAILURE: %s -> %lld expected %lld\n", __FUNCTION__, __LINE__, #op, i64Rc, rc); \
1039 if (*pi64 != (rc)) \
1040 RTTestFailed(g_hTest, "%s, %d: FAILURE: %s => *pi64=%lld expected %lld\n", __FUNCTION__, __LINE__, #op, *pi64, rc); \
1041 } while (0)
1042 MYCHECK(ASMAtomicDecS64(pi64), 9);
1043 MYCHECK(ASMAtomicDecS64(pi64), 8);
1044 MYCHECK(ASMAtomicDecS64(pi64), 7);
1045 MYCHECK(ASMAtomicDecS64(pi64), 6);
1046 MYCHECK(ASMAtomicDecS64(pi64), 5);
1047 MYCHECK(ASMAtomicDecS64(pi64), 4);
1048 MYCHECK(ASMAtomicDecS64(pi64), 3);
1049 MYCHECK(ASMAtomicDecS64(pi64), 2);
1050 MYCHECK(ASMAtomicDecS64(pi64), 1);
1051 MYCHECK(ASMAtomicDecS64(pi64), 0);
1052 MYCHECK(ASMAtomicDecS64(pi64), -1);
1053 MYCHECK(ASMAtomicDecS64(pi64), -2);
1054 MYCHECK(ASMAtomicIncS64(pi64), -1);
1055 MYCHECK(ASMAtomicIncS64(pi64), 0);
1056 MYCHECK(ASMAtomicIncS64(pi64), 1);
1057 MYCHECK(ASMAtomicIncS64(pi64), 2);
1058 MYCHECK(ASMAtomicIncS64(pi64), 3);
1059 MYCHECK(ASMAtomicDecS64(pi64), 2);
1060 MYCHECK(ASMAtomicIncS64(pi64), 3);
1061 MYCHECK(ASMAtomicDecS64(pi64), 2);
1062 MYCHECK(ASMAtomicIncS64(pi64), 3);
1063#undef MYCHECK
1064}
1065
1066
1067static void tstASMAtomicDecIncS64(void)
1068{
1069 DO_SIMPLE_TEST(ASMAtomicDecIncS64, int64_t);
1070}
1071
1072
1073DECLINLINE(void) tstASMAtomicAndOrU32Worker(uint32_t volatile *pu32)
1074{
1075 *pu32 = UINT32_C(0xffffffff);
1076
1077 ASMAtomicOrU32(pu32, UINT32_C(0xffffffff));
1078 CHECKVAL(*pu32, UINT32_C(0xffffffff), "%x");
1079
1080 ASMAtomicAndU32(pu32, UINT32_C(0xffffffff));
1081 CHECKVAL(*pu32, UINT32_C(0xffffffff), "%x");
1082
1083 ASMAtomicAndU32(pu32, UINT32_C(0x8f8f8f8f));
1084 CHECKVAL(*pu32, UINT32_C(0x8f8f8f8f), "%x");
1085
1086 ASMAtomicOrU32(pu32, UINT32_C(0x70707070));
1087 CHECKVAL(*pu32, UINT32_C(0xffffffff), "%x");
1088
1089 ASMAtomicAndU32(pu32, UINT32_C(1));
1090 CHECKVAL(*pu32, UINT32_C(1), "%x");
1091
1092 ASMAtomicOrU32(pu32, UINT32_C(0x80000000));
1093 CHECKVAL(*pu32, UINT32_C(0x80000001), "%x");
1094
1095 ASMAtomicAndU32(pu32, UINT32_C(0x80000000));
1096 CHECKVAL(*pu32, UINT32_C(0x80000000), "%x");
1097
1098 ASMAtomicAndU32(pu32, UINT32_C(0));
1099 CHECKVAL(*pu32, UINT32_C(0), "%x");
1100
1101 ASMAtomicOrU32(pu32, UINT32_C(0x42424242));
1102 CHECKVAL(*pu32, UINT32_C(0x42424242), "%x");
1103}
1104
1105
1106static void tstASMAtomicAndOrU32(void)
1107{
1108 DO_SIMPLE_TEST(ASMAtomicAndOrU32, uint32_t);
1109}
1110
1111
1112DECLINLINE(void) tstASMAtomicAndOrU64Worker(uint64_t volatile *pu64)
1113{
1114 *pu64 = UINT64_C(0xffffffff);
1115
1116 ASMAtomicOrU64(pu64, UINT64_C(0xffffffff));
1117 CHECKVAL(*pu64, UINT64_C(0xffffffff), "%x");
1118
1119 ASMAtomicAndU64(pu64, UINT64_C(0xffffffff));
1120 CHECKVAL(*pu64, UINT64_C(0xffffffff), "%x");
1121
1122 ASMAtomicAndU64(pu64, UINT64_C(0x8f8f8f8f));
1123 CHECKVAL(*pu64, UINT64_C(0x8f8f8f8f), "%x");
1124
1125 ASMAtomicOrU64(pu64, UINT64_C(0x70707070));
1126 CHECKVAL(*pu64, UINT64_C(0xffffffff), "%x");
1127
1128 ASMAtomicAndU64(pu64, UINT64_C(1));
1129 CHECKVAL(*pu64, UINT64_C(1), "%x");
1130
1131 ASMAtomicOrU64(pu64, UINT64_C(0x80000000));
1132 CHECKVAL(*pu64, UINT64_C(0x80000001), "%x");
1133
1134 ASMAtomicAndU64(pu64, UINT64_C(0x80000000));
1135 CHECKVAL(*pu64, UINT64_C(0x80000000), "%x");
1136
1137 ASMAtomicAndU64(pu64, UINT64_C(0));
1138 CHECKVAL(*pu64, UINT64_C(0), "%x");
1139
1140 ASMAtomicOrU64(pu64, UINT64_C(0x42424242));
1141 CHECKVAL(*pu64, UINT64_C(0x42424242), "%x");
1142
1143 // Same as above, but now 64-bit wide.
1144 ASMAtomicAndU64(pu64, UINT64_C(0));
1145 CHECKVAL(*pu64, UINT64_C(0), "%x");
1146
1147 ASMAtomicOrU64(pu64, UINT64_C(0xffffffffffffffff));
1148 CHECKVAL(*pu64, UINT64_C(0xffffffffffffffff), "%x");
1149
1150 ASMAtomicAndU64(pu64, UINT64_C(0xffffffffffffffff));
1151 CHECKVAL(*pu64, UINT64_C(0xffffffffffffffff), "%x");
1152
1153 ASMAtomicAndU64(pu64, UINT64_C(0x8f8f8f8f8f8f8f8f));
1154 CHECKVAL(*pu64, UINT64_C(0x8f8f8f8f8f8f8f8f), "%x");
1155
1156 ASMAtomicOrU64(pu64, UINT64_C(0x7070707070707070));
1157 CHECKVAL(*pu64, UINT64_C(0xffffffffffffffff), "%x");
1158
1159 ASMAtomicAndU64(pu64, UINT64_C(1));
1160 CHECKVAL(*pu64, UINT64_C(1), "%x");
1161
1162 ASMAtomicOrU64(pu64, UINT64_C(0x8000000000000000));
1163 CHECKVAL(*pu64, UINT64_C(0x8000000000000001), "%x");
1164
1165 ASMAtomicAndU64(pu64, UINT64_C(0x8000000000000000));
1166 CHECKVAL(*pu64, UINT64_C(0x8000000000000000), "%x");
1167
1168 ASMAtomicAndU64(pu64, UINT64_C(0));
1169 CHECKVAL(*pu64, UINT64_C(0), "%x");
1170
1171 ASMAtomicOrU64(pu64, UINT64_C(0x4242424242424242));
1172 CHECKVAL(*pu64, UINT64_C(0x4242424242424242), "%x");
1173}
1174
1175
1176static void tstASMAtomicAndOrU64(void)
1177{
1178 DO_SIMPLE_TEST(ASMAtomicAndOrU64, uint64_t);
1179}
1180
1181
1182typedef struct
1183{
1184 uint8_t ab[PAGE_SIZE];
1185} TSTPAGE;
1186
1187
1188DECLINLINE(void) tstASMMemZeroPageWorker(TSTPAGE *pPage)
1189{
1190 for (unsigned j = 0; j < 16; j++)
1191 {
1192 memset(pPage, 0x11 * j, sizeof(*pPage));
1193 ASMMemZeroPage(pPage);
1194 for (unsigned i = 0; i < sizeof(pPage->ab); i++)
1195 if (pPage->ab[i])
1196 RTTestFailed(g_hTest, "ASMMemZeroPage didn't clear byte at offset %#x!\n", i);
1197 }
1198}
1199
1200
1201static void tstASMMemZeroPage(void)
1202{
1203 DO_SIMPLE_TEST(ASMMemZeroPage, TSTPAGE);
1204}
1205
1206
1207void tstASMMemIsZeroPage(RTTEST hTest)
1208{
1209 RTTestSub(hTest, "ASMMemIsZeroPage");
1210
1211 void *pvPage1 = RTTestGuardedAllocHead(hTest, PAGE_SIZE);
1212 void *pvPage2 = RTTestGuardedAllocTail(hTest, PAGE_SIZE);
1213 RTTESTI_CHECK_RETV(pvPage1 && pvPage2);
1214
1215 memset(pvPage1, 0, PAGE_SIZE);
1216 memset(pvPage2, 0, PAGE_SIZE);
1217 RTTESTI_CHECK(ASMMemIsZeroPage(pvPage1));
1218 RTTESTI_CHECK(ASMMemIsZeroPage(pvPage2));
1219
1220 memset(pvPage1, 0xff, PAGE_SIZE);
1221 memset(pvPage2, 0xff, PAGE_SIZE);
1222 RTTESTI_CHECK(!ASMMemIsZeroPage(pvPage1));
1223 RTTESTI_CHECK(!ASMMemIsZeroPage(pvPage2));
1224
1225 memset(pvPage1, 0, PAGE_SIZE);
1226 memset(pvPage2, 0, PAGE_SIZE);
1227 for (unsigned off = 0; off < PAGE_SIZE; off++)
1228 {
1229 ((uint8_t *)pvPage1)[off] = 1;
1230 RTTESTI_CHECK(!ASMMemIsZeroPage(pvPage1));
1231 ((uint8_t *)pvPage1)[off] = 0;
1232
1233 ((uint8_t *)pvPage2)[off] = 0x80;
1234 RTTESTI_CHECK(!ASMMemIsZeroPage(pvPage2));
1235 ((uint8_t *)pvPage2)[off] = 0;
1236 }
1237
1238 RTTestSubDone(hTest);
1239}
1240
1241
1242void tstASMMemZero32(void)
1243{
1244 RTTestSub(g_hTest, "ASMMemFill32");
1245
1246 struct
1247 {
1248 uint64_t u64Magic1;
1249 uint8_t abPage[PAGE_SIZE - 32];
1250 uint64_t u64Magic2;
1251 } Buf1, Buf2, Buf3;
1252
1253 Buf1.u64Magic1 = UINT64_C(0xffffffffffffffff);
1254 memset(Buf1.abPage, 0x55, sizeof(Buf1.abPage));
1255 Buf1.u64Magic2 = UINT64_C(0xffffffffffffffff);
1256 Buf2.u64Magic1 = UINT64_C(0xffffffffffffffff);
1257 memset(Buf2.abPage, 0x77, sizeof(Buf2.abPage));
1258 Buf2.u64Magic2 = UINT64_C(0xffffffffffffffff);
1259 Buf3.u64Magic1 = UINT64_C(0xffffffffffffffff);
1260 memset(Buf3.abPage, 0x99, sizeof(Buf3.abPage));
1261 Buf3.u64Magic2 = UINT64_C(0xffffffffffffffff);
1262 ASMMemZero32(Buf1.abPage, sizeof(Buf1.abPage));
1263 ASMMemZero32(Buf2.abPage, sizeof(Buf2.abPage));
1264 ASMMemZero32(Buf3.abPage, sizeof(Buf3.abPage));
1265 if ( Buf1.u64Magic1 != UINT64_C(0xffffffffffffffff)
1266 || Buf1.u64Magic2 != UINT64_C(0xffffffffffffffff)
1267 || Buf2.u64Magic1 != UINT64_C(0xffffffffffffffff)
1268 || Buf2.u64Magic2 != UINT64_C(0xffffffffffffffff)
1269 || Buf3.u64Magic1 != UINT64_C(0xffffffffffffffff)
1270 || Buf3.u64Magic2 != UINT64_C(0xffffffffffffffff))
1271 {
1272 RTTestFailed(g_hTest, "ASMMemZero32 violated one/both magic(s)!\n");
1273 }
1274 for (unsigned i = 0; i < RT_ELEMENTS(Buf1.abPage); i++)
1275 if (Buf1.abPage[i])
1276 RTTestFailed(g_hTest, "ASMMemZero32 didn't clear byte at offset %#x!\n", i);
1277 for (unsigned i = 0; i < RT_ELEMENTS(Buf2.abPage); i++)
1278 if (Buf2.abPage[i])
1279 RTTestFailed(g_hTest, "ASMMemZero32 didn't clear byte at offset %#x!\n", i);
1280 for (unsigned i = 0; i < RT_ELEMENTS(Buf3.abPage); i++)
1281 if (Buf3.abPage[i])
1282 RTTestFailed(g_hTest, "ASMMemZero32 didn't clear byte at offset %#x!\n", i);
1283}
1284
1285
1286void tstASMMemFill32(void)
1287{
1288 RTTestSub(g_hTest, "ASMMemFill32");
1289
1290 struct
1291 {
1292 uint64_t u64Magic1;
1293 uint32_t au32Page[PAGE_SIZE / 4];
1294 uint64_t u64Magic2;
1295 } Buf1;
1296 struct
1297 {
1298 uint64_t u64Magic1;
1299 uint32_t au32Page[(PAGE_SIZE / 4) - 3];
1300 uint64_t u64Magic2;
1301 } Buf2;
1302 struct
1303 {
1304 uint64_t u64Magic1;
1305 uint32_t au32Page[(PAGE_SIZE / 4) - 1];
1306 uint64_t u64Magic2;
1307 } Buf3;
1308
1309 Buf1.u64Magic1 = UINT64_C(0xffffffffffffffff);
1310 memset(Buf1.au32Page, 0x55, sizeof(Buf1.au32Page));
1311 Buf1.u64Magic2 = UINT64_C(0xffffffffffffffff);
1312 Buf2.u64Magic1 = UINT64_C(0xffffffffffffffff);
1313 memset(Buf2.au32Page, 0x77, sizeof(Buf2.au32Page));
1314 Buf2.u64Magic2 = UINT64_C(0xffffffffffffffff);
1315 Buf3.u64Magic1 = UINT64_C(0xffffffffffffffff);
1316 memset(Buf3.au32Page, 0x99, sizeof(Buf3.au32Page));
1317 Buf3.u64Magic2 = UINT64_C(0xffffffffffffffff);
1318 ASMMemFill32(Buf1.au32Page, sizeof(Buf1.au32Page), 0xdeadbeef);
1319 ASMMemFill32(Buf2.au32Page, sizeof(Buf2.au32Page), 0xcafeff01);
1320 ASMMemFill32(Buf3.au32Page, sizeof(Buf3.au32Page), 0xf00dd00f);
1321 if ( Buf1.u64Magic1 != UINT64_C(0xffffffffffffffff)
1322 || Buf1.u64Magic2 != UINT64_C(0xffffffffffffffff)
1323 || Buf2.u64Magic1 != UINT64_C(0xffffffffffffffff)
1324 || Buf2.u64Magic2 != UINT64_C(0xffffffffffffffff)
1325 || Buf3.u64Magic1 != UINT64_C(0xffffffffffffffff)
1326 || Buf3.u64Magic2 != UINT64_C(0xffffffffffffffff))
1327 RTTestFailed(g_hTest, "ASMMemFill32 violated one/both magic(s)!\n");
1328 for (unsigned i = 0; i < RT_ELEMENTS(Buf1.au32Page); i++)
1329 if (Buf1.au32Page[i] != 0xdeadbeef)
1330 RTTestFailed(g_hTest, "ASMMemFill32 %#x: %#x exepcted %#x\n", i, Buf1.au32Page[i], 0xdeadbeef);
1331 for (unsigned i = 0; i < RT_ELEMENTS(Buf2.au32Page); i++)
1332 if (Buf2.au32Page[i] != 0xcafeff01)
1333 RTTestFailed(g_hTest, "ASMMemFill32 %#x: %#x exepcted %#x\n", i, Buf2.au32Page[i], 0xcafeff01);
1334 for (unsigned i = 0; i < RT_ELEMENTS(Buf3.au32Page); i++)
1335 if (Buf3.au32Page[i] != 0xf00dd00f)
1336 RTTestFailed(g_hTest, "ASMMemFill32 %#x: %#x exepcted %#x\n", i, Buf3.au32Page[i], 0xf00dd00f);
1337}
1338
1339
1340
1341void tstASMMath(void)
1342{
1343 RTTestSub(g_hTest, "Math");
1344
1345 uint64_t u64 = ASMMult2xU32RetU64(UINT32_C(0x80000000), UINT32_C(0x10000000));
1346 CHECKVAL(u64, UINT64_C(0x0800000000000000), "%#018RX64");
1347
1348 uint32_t u32 = ASMDivU64ByU32RetU32(UINT64_C(0x0800000000000000), UINT32_C(0x10000000));
1349 CHECKVAL(u32, UINT32_C(0x80000000), "%#010RX32");
1350
1351#if defined(RT_ARCH_AMD64) || defined(RT_ARCH_X86)
1352 u64 = ASMMultU64ByU32DivByU32(UINT64_C(0x0000000000000001), UINT32_C(0x00000001), UINT32_C(0x00000001));
1353 CHECKVAL(u64, UINT64_C(0x0000000000000001), "%#018RX64");
1354 u64 = ASMMultU64ByU32DivByU32(UINT64_C(0x0000000100000000), UINT32_C(0x80000000), UINT32_C(0x00000002));
1355 CHECKVAL(u64, UINT64_C(0x4000000000000000), "%#018RX64");
1356 u64 = ASMMultU64ByU32DivByU32(UINT64_C(0xfedcba9876543210), UINT32_C(0xffffffff), UINT32_C(0xffffffff));
1357 CHECKVAL(u64, UINT64_C(0xfedcba9876543210), "%#018RX64");
1358 u64 = ASMMultU64ByU32DivByU32(UINT64_C(0xffffffffffffffff), UINT32_C(0xffffffff), UINT32_C(0xffffffff));
1359 CHECKVAL(u64, UINT64_C(0xffffffffffffffff), "%#018RX64");
1360 u64 = ASMMultU64ByU32DivByU32(UINT64_C(0xffffffffffffffff), UINT32_C(0xfffffff0), UINT32_C(0xffffffff));
1361 CHECKVAL(u64, UINT64_C(0xfffffff0fffffff0), "%#018RX64");
1362 u64 = ASMMultU64ByU32DivByU32(UINT64_C(0x3415934810359583), UINT32_C(0x58734981), UINT32_C(0xf8694045));
1363 CHECKVAL(u64, UINT64_C(0x128b9c3d43184763), "%#018RX64");
1364 u64 = ASMMultU64ByU32DivByU32(UINT64_C(0x3415934810359583), UINT32_C(0xf8694045), UINT32_C(0x58734981));
1365 CHECKVAL(u64, UINT64_C(0x924719355cd35a27), "%#018RX64");
1366
1367# if 0 /* bird: question is whether this should trap or not:
1368 *
1369 * frank: Of course it must trap:
1370 *
1371 * 0xfffffff8 * 0x77d7daf8 = 0x77d7daf441412840
1372 *
1373 * During the following division, the quotient must fit into a 32-bit register.
1374 * Therefore the smallest valid divisor is
1375 *
1376 * (0x77d7daf441412840 >> 32) + 1 = 0x77d7daf5
1377 *
1378 * which is definitely greater than 0x3b9aca00.
1379 *
1380 * bird: No, the C version does *not* crash. So, the question is whether there's any
1381 * code depending on it not crashing.
1382 *
1383 * Of course the assembly versions of the code crash right now for the reasons you've
1384 * given, but the 32-bit MSC version does not crash.
1385 *
1386 * frank: The C version does not crash but delivers incorrect results for this case.
1387 * The reason is
1388 *
1389 * u.s.Hi = (unsigned long)(u64Hi / u32C);
1390 *
1391 * Here the division is actually 64-bit by 64-bit but the 64-bit result is truncated
1392 * to 32 bit. If using this (optimized and fast) function we should just be sure that
1393 * the operands are in a valid range.
1394 */
1395 u64 = ASMMultU64ByU32DivByU32(UINT64_C(0xfffffff8c65d6731), UINT32_C(0x77d7daf8), UINT32_C(0x3b9aca00));
1396 CHECKVAL(u64, UINT64_C(0x02b8f9a2aa74e3dc), "%#018RX64");
1397# endif
1398#endif /* AMD64 || X86 */
1399
1400 u32 = ASMModU64ByU32RetU32(UINT64_C(0x0ffffff8c65d6731), UINT32_C(0x77d7daf8));
1401 CHECKVAL(u32, UINT32_C(0x3B642451), "%#010RX32");
1402
1403 int32_t i32;
1404 i32 = ASMModS64ByS32RetS32(INT64_C(-11), INT32_C(-2));
1405 CHECKVAL(i32, INT32_C(-1), "%010RI32");
1406 i32 = ASMModS64ByS32RetS32(INT64_C(-11), INT32_C(2));
1407 CHECKVAL(i32, INT32_C(-1), "%010RI32");
1408 i32 = ASMModS64ByS32RetS32(INT64_C(11), INT32_C(-2));
1409 CHECKVAL(i32, INT32_C(1), "%010RI32");
1410
1411 i32 = ASMModS64ByS32RetS32(INT64_C(92233720368547758), INT32_C(2147483647));
1412 CHECKVAL(i32, INT32_C(2104533974), "%010RI32");
1413 i32 = ASMModS64ByS32RetS32(INT64_C(-92233720368547758), INT32_C(2147483647));
1414 CHECKVAL(i32, INT32_C(-2104533974), "%010RI32");
1415}
1416
1417
1418void tstASMByteSwap(void)
1419{
1420 RTTestSub(g_hTest, "ASMByteSwap*");
1421
1422 uint64_t u64In = UINT64_C(0x0011223344556677);
1423 uint64_t u64Out = ASMByteSwapU64(u64In);
1424 CHECKVAL(u64In, UINT64_C(0x0011223344556677), "%#018RX64");
1425 CHECKVAL(u64Out, UINT64_C(0x7766554433221100), "%#018RX64");
1426 u64Out = ASMByteSwapU64(u64Out);
1427 CHECKVAL(u64Out, u64In, "%#018RX64");
1428 u64In = UINT64_C(0x0123456789abcdef);
1429 u64Out = ASMByteSwapU64(u64In);
1430 CHECKVAL(u64In, UINT64_C(0x0123456789abcdef), "%#018RX64");
1431 CHECKVAL(u64Out, UINT64_C(0xefcdab8967452301), "%#018RX64");
1432 u64Out = ASMByteSwapU64(u64Out);
1433 CHECKVAL(u64Out, u64In, "%#018RX64");
1434 u64In = 0;
1435 u64Out = ASMByteSwapU64(u64In);
1436 CHECKVAL(u64Out, u64In, "%#018RX64");
1437 u64In = ~(uint64_t)0;
1438 u64Out = ASMByteSwapU64(u64In);
1439 CHECKVAL(u64Out, u64In, "%#018RX64");
1440
1441 uint32_t u32In = UINT32_C(0x00112233);
1442 uint32_t u32Out = ASMByteSwapU32(u32In);
1443 CHECKVAL(u32In, UINT32_C(0x00112233), "%#010RX32");
1444 CHECKVAL(u32Out, UINT32_C(0x33221100), "%#010RX32");
1445 u32Out = ASMByteSwapU32(u32Out);
1446 CHECKVAL(u32Out, u32In, "%#010RX32");
1447 u32In = UINT32_C(0x12345678);
1448 u32Out = ASMByteSwapU32(u32In);
1449 CHECKVAL(u32In, UINT32_C(0x12345678), "%#010RX32");
1450 CHECKVAL(u32Out, UINT32_C(0x78563412), "%#010RX32");
1451 u32Out = ASMByteSwapU32(u32Out);
1452 CHECKVAL(u32Out, u32In, "%#010RX32");
1453 u32In = 0;
1454 u32Out = ASMByteSwapU32(u32In);
1455 CHECKVAL(u32Out, u32In, "%#010RX32");
1456 u32In = ~(uint32_t)0;
1457 u32Out = ASMByteSwapU32(u32In);
1458 CHECKVAL(u32Out, u32In, "%#010RX32");
1459
1460 uint16_t u16In = UINT16_C(0x0011);
1461 uint16_t u16Out = ASMByteSwapU16(u16In);
1462 CHECKVAL(u16In, UINT16_C(0x0011), "%#06RX16");
1463 CHECKVAL(u16Out, UINT16_C(0x1100), "%#06RX16");
1464 u16Out = ASMByteSwapU16(u16Out);
1465 CHECKVAL(u16Out, u16In, "%#06RX16");
1466 u16In = UINT16_C(0x1234);
1467 u16Out = ASMByteSwapU16(u16In);
1468 CHECKVAL(u16In, UINT16_C(0x1234), "%#06RX16");
1469 CHECKVAL(u16Out, UINT16_C(0x3412), "%#06RX16");
1470 u16Out = ASMByteSwapU16(u16Out);
1471 CHECKVAL(u16Out, u16In, "%#06RX16");
1472 u16In = 0;
1473 u16Out = ASMByteSwapU16(u16In);
1474 CHECKVAL(u16Out, u16In, "%#06RX16");
1475 u16In = ~(uint16_t)0;
1476 u16Out = ASMByteSwapU16(u16In);
1477 CHECKVAL(u16Out, u16In, "%#06RX16");
1478}
1479
1480
1481void tstASMBench(void)
1482{
1483 /*
1484 * Make this static. We don't want to have this located on the stack.
1485 */
1486 static uint8_t volatile s_u8;
1487 static int8_t volatile s_i8;
1488 static uint16_t volatile s_u16;
1489 static int16_t volatile s_i16;
1490 static uint32_t volatile s_u32;
1491 static int32_t volatile s_i32;
1492 static uint64_t volatile s_u64;
1493 static int64_t volatile s_i64;
1494 register unsigned i;
1495 const unsigned cRounds = _2M;
1496 register uint64_t u64Elapsed;
1497
1498 RTTestSub(g_hTest, "Benchmarking");
1499
1500#if 0 && !defined(GCC44_32BIT_PIC) && (defined(RT_ARCH_AMD64) || defined(RT_ARCH_X86))
1501# define BENCH(op, str) \
1502 do { \
1503 RTThreadYield(); \
1504 u64Elapsed = ASMReadTSC(); \
1505 for (i = cRounds; i > 0; i--) \
1506 op; \
1507 u64Elapsed = ASMReadTSC() - u64Elapsed; \
1508 RTTestValue(g_hTest, str, u64Elapsed / cRounds, RTTESTUNIT_TICKS_PER_CALL); \
1509 } while (0)
1510#else
1511# define BENCH(op, str) \
1512 do { \
1513 RTThreadYield(); \
1514 u64Elapsed = RTTimeNanoTS(); \
1515 for (i = cRounds; i > 0; i--) \
1516 op; \
1517 u64Elapsed = RTTimeNanoTS() - u64Elapsed; \
1518 RTTestValue(g_hTest, str, u64Elapsed / cRounds, RTTESTUNIT_NS_PER_CALL); \
1519 } while (0)
1520#endif
1521
1522 BENCH(s_u32 = 0, "s_u32 = 0");
1523 BENCH(ASMAtomicUoReadU8(&s_u8), "ASMAtomicUoReadU8");
1524 BENCH(ASMAtomicUoReadS8(&s_i8), "ASMAtomicUoReadS8");
1525 BENCH(ASMAtomicUoReadU16(&s_u16), "ASMAtomicUoReadU16");
1526 BENCH(ASMAtomicUoReadS16(&s_i16), "ASMAtomicUoReadS16");
1527 BENCH(ASMAtomicUoReadU32(&s_u32), "ASMAtomicUoReadU32");
1528 BENCH(ASMAtomicUoReadS32(&s_i32), "ASMAtomicUoReadS32");
1529 BENCH(ASMAtomicUoReadU64(&s_u64), "ASMAtomicUoReadU64");
1530 BENCH(ASMAtomicUoReadS64(&s_i64), "ASMAtomicUoReadS64");
1531 BENCH(ASMAtomicReadU8(&s_u8), "ASMAtomicReadU8");
1532 BENCH(ASMAtomicReadS8(&s_i8), "ASMAtomicReadS8");
1533 BENCH(ASMAtomicReadU16(&s_u16), "ASMAtomicReadU16");
1534 BENCH(ASMAtomicReadS16(&s_i16), "ASMAtomicReadS16");
1535 BENCH(ASMAtomicReadU32(&s_u32), "ASMAtomicReadU32");
1536 BENCH(ASMAtomicReadS32(&s_i32), "ASMAtomicReadS32");
1537 BENCH(ASMAtomicReadU64(&s_u64), "ASMAtomicReadU64");
1538 BENCH(ASMAtomicReadS64(&s_i64), "ASMAtomicReadS64");
1539 BENCH(ASMAtomicUoWriteU8(&s_u8, 0), "ASMAtomicUoWriteU8");
1540 BENCH(ASMAtomicUoWriteS8(&s_i8, 0), "ASMAtomicUoWriteS8");
1541 BENCH(ASMAtomicUoWriteU16(&s_u16, 0), "ASMAtomicUoWriteU16");
1542 BENCH(ASMAtomicUoWriteS16(&s_i16, 0), "ASMAtomicUoWriteS16");
1543 BENCH(ASMAtomicUoWriteU32(&s_u32, 0), "ASMAtomicUoWriteU32");
1544 BENCH(ASMAtomicUoWriteS32(&s_i32, 0), "ASMAtomicUoWriteS32");
1545 BENCH(ASMAtomicUoWriteU64(&s_u64, 0), "ASMAtomicUoWriteU64");
1546 BENCH(ASMAtomicUoWriteS64(&s_i64, 0), "ASMAtomicUoWriteS64");
1547 BENCH(ASMAtomicWriteU8(&s_u8, 0), "ASMAtomicWriteU8");
1548 BENCH(ASMAtomicWriteS8(&s_i8, 0), "ASMAtomicWriteS8");
1549 BENCH(ASMAtomicWriteU16(&s_u16, 0), "ASMAtomicWriteU16");
1550 BENCH(ASMAtomicWriteS16(&s_i16, 0), "ASMAtomicWriteS16");
1551 BENCH(ASMAtomicWriteU32(&s_u32, 0), "ASMAtomicWriteU32");
1552 BENCH(ASMAtomicWriteS32(&s_i32, 0), "ASMAtomicWriteS32");
1553 BENCH(ASMAtomicWriteU64(&s_u64, 0), "ASMAtomicWriteU64");
1554 BENCH(ASMAtomicWriteS64(&s_i64, 0), "ASMAtomicWriteS64");
1555 BENCH(ASMAtomicXchgU8(&s_u8, 0), "ASMAtomicXchgU8");
1556 BENCH(ASMAtomicXchgS8(&s_i8, 0), "ASMAtomicXchgS8");
1557 BENCH(ASMAtomicXchgU16(&s_u16, 0), "ASMAtomicXchgU16");
1558 BENCH(ASMAtomicXchgS16(&s_i16, 0), "ASMAtomicXchgS16");
1559 BENCH(ASMAtomicXchgU32(&s_u32, 0), "ASMAtomicXchgU32");
1560 BENCH(ASMAtomicXchgS32(&s_i32, 0), "ASMAtomicXchgS32");
1561 BENCH(ASMAtomicXchgU64(&s_u64, 0), "ASMAtomicXchgU64");
1562 BENCH(ASMAtomicXchgS64(&s_i64, 0), "ASMAtomicXchgS64");
1563 BENCH(ASMAtomicCmpXchgU32(&s_u32, 0, 0), "ASMAtomicCmpXchgU32");
1564 BENCH(ASMAtomicCmpXchgS32(&s_i32, 0, 0), "ASMAtomicCmpXchgS32");
1565 BENCH(ASMAtomicCmpXchgU64(&s_u64, 0, 0), "ASMAtomicCmpXchgU64");
1566 BENCH(ASMAtomicCmpXchgS64(&s_i64, 0, 0), "ASMAtomicCmpXchgS64");
1567 BENCH(ASMAtomicCmpXchgU32(&s_u32, 0, 1), "ASMAtomicCmpXchgU32/neg");
1568 BENCH(ASMAtomicCmpXchgS32(&s_i32, 0, 1), "ASMAtomicCmpXchgS32/neg");
1569 BENCH(ASMAtomicCmpXchgU64(&s_u64, 0, 1), "ASMAtomicCmpXchgU64/neg");
1570 BENCH(ASMAtomicCmpXchgS64(&s_i64, 0, 1), "ASMAtomicCmpXchgS64/neg");
1571 BENCH(ASMAtomicIncU32(&s_u32), "ASMAtomicIncU32");
1572 BENCH(ASMAtomicIncS32(&s_i32), "ASMAtomicIncS32");
1573 BENCH(ASMAtomicDecU32(&s_u32), "ASMAtomicDecU32");
1574 BENCH(ASMAtomicDecS32(&s_i32), "ASMAtomicDecS32");
1575 BENCH(ASMAtomicAddU32(&s_u32, 5), "ASMAtomicAddU32");
1576 BENCH(ASMAtomicAddS32(&s_i32, 5), "ASMAtomicAddS32");
1577 /* The Darwin gcc does not like this ... */
1578#if !defined(RT_OS_DARWIN) && !defined(GCC44_32BIT_PIC) && (defined(RT_ARCH_AMD64) || defined(RT_ARCH_X86))
1579 BENCH(s_u8 = ASMGetApicId(), "ASMGetApicId");
1580#endif
1581
1582#undef BENCH
1583}
1584
1585
1586int main(int argc, char *argv[])
1587{
1588 int rc = RTTestInitAndCreate("tstRTInlineAsm", &g_hTest);
1589 if (rc)
1590 return rc;
1591 RTTestBanner(g_hTest);
1592
1593 /*
1594 * Execute the tests.
1595 */
1596#if !defined(GCC44_32BIT_PIC) && (defined(RT_ARCH_AMD64) || defined(RT_ARCH_X86))
1597 tstASMCpuId();
1598 //bruteForceCpuId();
1599#endif
1600#if 1
1601 tstASMAtomicXchgU8();
1602 tstASMAtomicXchgU16();
1603 tstASMAtomicXchgU32();
1604 tstASMAtomicXchgU64();
1605 tstASMAtomicXchgPtr();
1606 tstASMAtomicCmpXchgU8();
1607 tstASMAtomicCmpXchgU32();
1608 tstASMAtomicCmpXchgU64();
1609 tstASMAtomicCmpXchgExU32();
1610 tstASMAtomicCmpXchgExU64();
1611 tstASMAtomicReadU64();
1612 tstASMAtomicUoReadU64();
1613
1614 tstASMAtomicAddS32();
1615 tstASMAtomicAddS64();
1616 tstASMAtomicDecIncS32();
1617 tstASMAtomicDecIncS64();
1618 tstASMAtomicAndOrU32();
1619 tstASMAtomicAndOrU64();
1620
1621 tstASMMemZeroPage();
1622 tstASMMemIsZeroPage(g_hTest);
1623 tstASMMemZero32();
1624 tstASMMemFill32();
1625
1626 tstASMMath();
1627
1628 tstASMByteSwap();
1629
1630 tstASMBench();
1631#endif
1632
1633 /*
1634 * Show the result.
1635 */
1636 return RTTestSummaryAndDestroy(g_hTest);
1637}
1638
Note: See TracBrowser for help on using the repository browser.

© 2024 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette