amx_test.c 9.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341
  1. // SPDX-License-Identifier: GPL-2.0-only
  2. /*
  3. * amx tests
  4. *
  5. * Copyright (C) 2021, Intel, Inc.
  6. *
  7. * Tests for amx #NM exception and save/restore.
  8. */
  9. #include <fcntl.h>
  10. #include <stdio.h>
  11. #include <stdlib.h>
  12. #include <string.h>
  13. #include <sys/ioctl.h>
  14. #include <sys/syscall.h>
  15. #include "test_util.h"
  16. #include "kvm_util.h"
  17. #include "processor.h"
  18. #include "vmx.h"
  19. #ifndef __x86_64__
  20. # error This test is 64-bit only
  21. #endif
  22. #define NUM_TILES 8
  23. #define TILE_SIZE 1024
  24. #define XSAVE_SIZE ((NUM_TILES * TILE_SIZE) + PAGE_SIZE)
  25. /* Tile configuration associated: */
  26. #define PALETTE_TABLE_INDEX 1
  27. #define MAX_TILES 16
  28. #define RESERVED_BYTES 14
  29. #define XSAVE_HDR_OFFSET 512
  30. struct tile_config {
  31. u8 palette_id;
  32. u8 start_row;
  33. u8 reserved[RESERVED_BYTES];
  34. u16 colsb[MAX_TILES];
  35. u8 rows[MAX_TILES];
  36. };
  37. struct tile_data {
  38. u8 data[NUM_TILES * TILE_SIZE];
  39. };
  40. struct xtile_info {
  41. u16 bytes_per_tile;
  42. u16 bytes_per_row;
  43. u16 max_names;
  44. u16 max_rows;
  45. u32 xsave_offset;
  46. u32 xsave_size;
  47. };
  48. static struct xtile_info xtile;
  49. static inline void __ldtilecfg(void *cfg)
  50. {
  51. asm volatile(".byte 0xc4,0xe2,0x78,0x49,0x00"
  52. : : "a"(cfg));
  53. }
  54. static inline void __tileloadd(void *tile)
  55. {
  56. asm volatile(".byte 0xc4,0xe2,0x7b,0x4b,0x04,0x10"
  57. : : "a"(tile), "d"(0));
  58. }
  59. static inline int tileloadd_safe(void *tile)
  60. {
  61. return kvm_asm_safe(".byte 0xc4,0xe2,0x7b,0x4b,0x04,0x10",
  62. "a"(tile), "d"(0));
  63. }
  64. static inline void __tilerelease(void)
  65. {
  66. asm volatile(".byte 0xc4, 0xe2, 0x78, 0x49, 0xc0" ::);
  67. }
  68. static inline void __xsavec(struct xstate *xstate, uint64_t rfbm)
  69. {
  70. uint32_t rfbm_lo = rfbm;
  71. uint32_t rfbm_hi = rfbm >> 32;
  72. asm volatile("xsavec (%%rdi)"
  73. : : "D" (xstate), "a" (rfbm_lo), "d" (rfbm_hi)
  74. : "memory");
  75. }
  76. static void check_xtile_info(void)
  77. {
  78. GUEST_ASSERT((xgetbv(0) & XFEATURE_MASK_XTILE) == XFEATURE_MASK_XTILE);
  79. GUEST_ASSERT(this_cpu_has_p(X86_PROPERTY_XSTATE_MAX_SIZE_XCR0));
  80. GUEST_ASSERT(this_cpu_property(X86_PROPERTY_XSTATE_MAX_SIZE_XCR0) <= XSAVE_SIZE);
  81. xtile.xsave_offset = this_cpu_property(X86_PROPERTY_XSTATE_TILE_OFFSET);
  82. GUEST_ASSERT(xtile.xsave_offset == 2816);
  83. xtile.xsave_size = this_cpu_property(X86_PROPERTY_XSTATE_TILE_SIZE);
  84. GUEST_ASSERT(xtile.xsave_size == 8192);
  85. GUEST_ASSERT(sizeof(struct tile_data) >= xtile.xsave_size);
  86. GUEST_ASSERT(this_cpu_has_p(X86_PROPERTY_AMX_MAX_PALETTE_TABLES));
  87. GUEST_ASSERT(this_cpu_property(X86_PROPERTY_AMX_MAX_PALETTE_TABLES) >=
  88. PALETTE_TABLE_INDEX);
  89. GUEST_ASSERT(this_cpu_has_p(X86_PROPERTY_AMX_NR_TILE_REGS));
  90. xtile.max_names = this_cpu_property(X86_PROPERTY_AMX_NR_TILE_REGS);
  91. GUEST_ASSERT(xtile.max_names == 8);
  92. xtile.bytes_per_tile = this_cpu_property(X86_PROPERTY_AMX_BYTES_PER_TILE);
  93. GUEST_ASSERT(xtile.bytes_per_tile == 1024);
  94. xtile.bytes_per_row = this_cpu_property(X86_PROPERTY_AMX_BYTES_PER_ROW);
  95. GUEST_ASSERT(xtile.bytes_per_row == 64);
  96. xtile.max_rows = this_cpu_property(X86_PROPERTY_AMX_MAX_ROWS);
  97. GUEST_ASSERT(xtile.max_rows == 16);
  98. }
  99. static void set_tilecfg(struct tile_config *cfg)
  100. {
  101. int i;
  102. /* Only palette id 1 */
  103. cfg->palette_id = 1;
  104. for (i = 0; i < xtile.max_names; i++) {
  105. cfg->colsb[i] = xtile.bytes_per_row;
  106. cfg->rows[i] = xtile.max_rows;
  107. }
  108. }
  109. enum {
  110. /* Retrieve TMM0 from guest, stash it for TEST_RESTORE_TILEDATA */
  111. TEST_SAVE_TILEDATA = 1,
  112. /* Check TMM0 against tiledata */
  113. TEST_COMPARE_TILEDATA = 2,
  114. /* Restore TMM0 from earlier save */
  115. TEST_RESTORE_TILEDATA = 4,
  116. /* Full VM save/restore */
  117. TEST_SAVE_RESTORE = 8,
  118. };
  119. static void __attribute__((__flatten__)) guest_code(struct tile_config *amx_cfg,
  120. struct tile_data *tiledata,
  121. struct xstate *xstate)
  122. {
  123. int vector;
  124. GUEST_ASSERT(this_cpu_has(X86_FEATURE_XSAVE) &&
  125. this_cpu_has(X86_FEATURE_OSXSAVE));
  126. check_xtile_info();
  127. GUEST_SYNC(TEST_SAVE_RESTORE);
  128. /* xfd=0, enable amx */
  129. wrmsr(MSR_IA32_XFD, 0);
  130. GUEST_SYNC(TEST_SAVE_RESTORE);
  131. GUEST_ASSERT(rdmsr(MSR_IA32_XFD) == 0);
  132. set_tilecfg(amx_cfg);
  133. __ldtilecfg(amx_cfg);
  134. GUEST_SYNC(TEST_SAVE_RESTORE);
  135. /* Check save/restore when trap to userspace */
  136. __tileloadd(tiledata);
  137. GUEST_SYNC(TEST_SAVE_TILEDATA | TEST_COMPARE_TILEDATA | TEST_SAVE_RESTORE);
  138. /* xfd=0x40000, disable amx tiledata */
  139. wrmsr(MSR_IA32_XFD, XFEATURE_MASK_XTILE_DATA);
  140. /* host tries setting tiledata while guest XFD is set */
  141. GUEST_SYNC(TEST_RESTORE_TILEDATA);
  142. GUEST_SYNC(TEST_SAVE_RESTORE);
  143. wrmsr(MSR_IA32_XFD, 0);
  144. __tilerelease();
  145. GUEST_SYNC(TEST_SAVE_RESTORE);
  146. /*
  147. * After XSAVEC, XTILEDATA is cleared in the xstate_bv but is set in
  148. * the xcomp_bv.
  149. */
  150. xstate->header.xstate_bv = XFEATURE_MASK_XTILE_DATA;
  151. __xsavec(xstate, XFEATURE_MASK_XTILE_DATA);
  152. GUEST_ASSERT(!(xstate->header.xstate_bv & XFEATURE_MASK_XTILE_DATA));
  153. GUEST_ASSERT(xstate->header.xcomp_bv & XFEATURE_MASK_XTILE_DATA);
  154. /* #NM test */
  155. /* xfd=0x40000, disable amx tiledata */
  156. wrmsr(MSR_IA32_XFD, XFEATURE_MASK_XTILE_DATA);
  157. /*
  158. * XTILEDATA is cleared in xstate_bv but set in xcomp_bv, this property
  159. * remains the same even when amx tiledata is disabled by IA32_XFD.
  160. */
  161. xstate->header.xstate_bv = XFEATURE_MASK_XTILE_DATA;
  162. __xsavec(xstate, XFEATURE_MASK_XTILE_DATA);
  163. GUEST_ASSERT(!(xstate->header.xstate_bv & XFEATURE_MASK_XTILE_DATA));
  164. GUEST_ASSERT((xstate->header.xcomp_bv & XFEATURE_MASK_XTILE_DATA));
  165. GUEST_SYNC(TEST_SAVE_RESTORE);
  166. GUEST_ASSERT(rdmsr(MSR_IA32_XFD) == XFEATURE_MASK_XTILE_DATA);
  167. set_tilecfg(amx_cfg);
  168. __ldtilecfg(amx_cfg);
  169. /* Trigger #NM exception */
  170. vector = tileloadd_safe(tiledata);
  171. __GUEST_ASSERT(vector == NM_VECTOR,
  172. "Wanted #NM on tileloadd with XFD[18]=1, got %s",
  173. ex_str(vector));
  174. GUEST_ASSERT(!(get_cr0() & X86_CR0_TS));
  175. GUEST_ASSERT(rdmsr(MSR_IA32_XFD_ERR) == XFEATURE_MASK_XTILE_DATA);
  176. GUEST_ASSERT(rdmsr(MSR_IA32_XFD) == XFEATURE_MASK_XTILE_DATA);
  177. GUEST_SYNC(TEST_SAVE_RESTORE);
  178. GUEST_ASSERT(rdmsr(MSR_IA32_XFD_ERR) == XFEATURE_MASK_XTILE_DATA);
  179. GUEST_ASSERT(rdmsr(MSR_IA32_XFD) == XFEATURE_MASK_XTILE_DATA);
  180. /* Clear xfd_err */
  181. wrmsr(MSR_IA32_XFD_ERR, 0);
  182. /* xfd=0, enable amx */
  183. wrmsr(MSR_IA32_XFD, 0);
  184. GUEST_SYNC(TEST_SAVE_RESTORE);
  185. __tileloadd(tiledata);
  186. GUEST_SYNC(TEST_COMPARE_TILEDATA | TEST_SAVE_RESTORE);
  187. GUEST_DONE();
  188. }
  189. int main(int argc, char *argv[])
  190. {
  191. struct kvm_regs regs1, regs2;
  192. struct kvm_vcpu *vcpu;
  193. struct kvm_vm *vm;
  194. struct kvm_x86_state *state;
  195. struct kvm_x86_state *tile_state = NULL;
  196. int xsave_restore_size;
  197. vm_vaddr_t amx_cfg, tiledata, xstate;
  198. struct ucall uc;
  199. int ret;
  200. /*
  201. * Note, all off-by-default features must be enabled before anything
  202. * caches KVM_GET_SUPPORTED_CPUID, e.g. before using kvm_cpu_has().
  203. */
  204. vm_xsave_require_permission(XFEATURE_MASK_XTILE_DATA);
  205. TEST_REQUIRE(kvm_cpu_has(X86_FEATURE_XFD));
  206. TEST_REQUIRE(kvm_cpu_has(X86_FEATURE_XSAVE));
  207. TEST_REQUIRE(kvm_cpu_has(X86_FEATURE_AMX_TILE));
  208. TEST_REQUIRE(kvm_cpu_has(X86_FEATURE_XTILECFG));
  209. TEST_REQUIRE(kvm_cpu_has(X86_FEATURE_XTILEDATA));
  210. TEST_REQUIRE(kvm_cpu_has(X86_FEATURE_XTILEDATA_XFD));
  211. /* Create VM */
  212. vm = vm_create_with_one_vcpu(&vcpu, guest_code);
  213. TEST_ASSERT(kvm_cpu_has_p(X86_PROPERTY_XSTATE_MAX_SIZE),
  214. "KVM should enumerate max XSAVE size when XSAVE is supported");
  215. xsave_restore_size = kvm_cpu_property(X86_PROPERTY_XSTATE_MAX_SIZE);
  216. vcpu_regs_get(vcpu, &regs1);
  217. /* amx cfg for guest_code */
  218. amx_cfg = vm_vaddr_alloc_page(vm);
  219. memset(addr_gva2hva(vm, amx_cfg), 0x0, getpagesize());
  220. /* amx tiledata for guest_code */
  221. tiledata = vm_vaddr_alloc_pages(vm, 2);
  222. memset(addr_gva2hva(vm, tiledata), rand() | 1, 2 * getpagesize());
  223. /* XSAVE state for guest_code */
  224. xstate = vm_vaddr_alloc_pages(vm, DIV_ROUND_UP(XSAVE_SIZE, PAGE_SIZE));
  225. memset(addr_gva2hva(vm, xstate), 0, PAGE_SIZE * DIV_ROUND_UP(XSAVE_SIZE, PAGE_SIZE));
  226. vcpu_args_set(vcpu, 3, amx_cfg, tiledata, xstate);
  227. int iter = 0;
  228. for (;;) {
  229. vcpu_run(vcpu);
  230. TEST_ASSERT_KVM_EXIT_REASON(vcpu, KVM_EXIT_IO);
  231. switch (get_ucall(vcpu, &uc)) {
  232. case UCALL_ABORT:
  233. REPORT_GUEST_ASSERT(uc);
  234. /* NOT REACHED */
  235. case UCALL_SYNC:
  236. ++iter;
  237. if (uc.args[1] & TEST_SAVE_TILEDATA) {
  238. fprintf(stderr, "GUEST_SYNC #%d, save tiledata\n", iter);
  239. tile_state = vcpu_save_state(vcpu);
  240. }
  241. if (uc.args[1] & TEST_COMPARE_TILEDATA) {
  242. fprintf(stderr, "GUEST_SYNC #%d, check TMM0 contents\n", iter);
  243. /* Compacted mode, get amx offset by xsave area
  244. * size subtract 8K amx size.
  245. */
  246. u32 amx_offset = xsave_restore_size - NUM_TILES*TILE_SIZE;
  247. void *amx_start = (void *)tile_state->xsave + amx_offset;
  248. void *tiles_data = (void *)addr_gva2hva(vm, tiledata);
  249. /* Only check TMM0 register, 1 tile */
  250. ret = memcmp(amx_start, tiles_data, TILE_SIZE);
  251. TEST_ASSERT(ret == 0, "memcmp failed, ret=%d", ret);
  252. }
  253. if (uc.args[1] & TEST_RESTORE_TILEDATA) {
  254. fprintf(stderr, "GUEST_SYNC #%d, before KVM_SET_XSAVE\n", iter);
  255. vcpu_xsave_set(vcpu, tile_state->xsave);
  256. fprintf(stderr, "GUEST_SYNC #%d, after KVM_SET_XSAVE\n", iter);
  257. }
  258. if (uc.args[1] & TEST_SAVE_RESTORE) {
  259. fprintf(stderr, "GUEST_SYNC #%d, save/restore VM state\n", iter);
  260. state = vcpu_save_state(vcpu);
  261. memset(&regs1, 0, sizeof(regs1));
  262. vcpu_regs_get(vcpu, &regs1);
  263. kvm_vm_release(vm);
  264. /* Restore state in a new VM. */
  265. vcpu = vm_recreate_with_one_vcpu(vm);
  266. vcpu_load_state(vcpu, state);
  267. kvm_x86_state_cleanup(state);
  268. memset(&regs2, 0, sizeof(regs2));
  269. vcpu_regs_get(vcpu, &regs2);
  270. TEST_ASSERT(!memcmp(&regs1, &regs2, sizeof(regs2)),
  271. "Unexpected register values after vcpu_load_state; rdi: %lx rsi: %lx",
  272. (ulong) regs2.rdi, (ulong) regs2.rsi);
  273. }
  274. break;
  275. case UCALL_DONE:
  276. fprintf(stderr, "UCALL_DONE\n");
  277. goto done;
  278. default:
  279. TEST_FAIL("Unknown ucall %lu", uc.cmd);
  280. }
  281. }
  282. done:
  283. kvm_vm_free(vm);
  284. }