guest.c 26 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081
  1. // SPDX-License-Identifier: GPL-2.0-only
  2. /*
  3. * Copyright (C) 2012,2013 - ARM Ltd
  4. * Author: Marc Zyngier <marc.zyngier@arm.com>
  5. *
  6. * Derived from arch/arm/kvm/guest.c:
  7. * Copyright (C) 2012 - Virtual Open Systems and Columbia University
  8. * Author: Christoffer Dall <c.dall@virtualopensystems.com>
  9. */
  10. #include <linux/bits.h>
  11. #include <linux/errno.h>
  12. #include <linux/err.h>
  13. #include <linux/nospec.h>
  14. #include <linux/kvm_host.h>
  15. #include <linux/module.h>
  16. #include <linux/stddef.h>
  17. #include <linux/string.h>
  18. #include <linux/vmalloc.h>
  19. #include <linux/fs.h>
  20. #include <kvm/arm_hypercalls.h>
  21. #include <asm/cputype.h>
  22. #include <linux/uaccess.h>
  23. #include <asm/fpsimd.h>
  24. #include <asm/kvm.h>
  25. #include <asm/kvm_emulate.h>
  26. #include <asm/kvm_nested.h>
  27. #include <asm/sigcontext.h>
  28. #include "trace.h"
  29. const struct kvm_stats_desc kvm_vm_stats_desc[] = {
  30. KVM_GENERIC_VM_STATS()
  31. };
  32. const struct kvm_stats_header kvm_vm_stats_header = {
  33. .name_size = KVM_STATS_NAME_SIZE,
  34. .num_desc = ARRAY_SIZE(kvm_vm_stats_desc),
  35. .id_offset = sizeof(struct kvm_stats_header),
  36. .desc_offset = sizeof(struct kvm_stats_header) + KVM_STATS_NAME_SIZE,
  37. .data_offset = sizeof(struct kvm_stats_header) + KVM_STATS_NAME_SIZE +
  38. sizeof(kvm_vm_stats_desc),
  39. };
  40. const struct kvm_stats_desc kvm_vcpu_stats_desc[] = {
  41. KVM_GENERIC_VCPU_STATS(),
  42. STATS_DESC_COUNTER(VCPU, hvc_exit_stat),
  43. STATS_DESC_COUNTER(VCPU, wfe_exit_stat),
  44. STATS_DESC_COUNTER(VCPU, wfi_exit_stat),
  45. STATS_DESC_COUNTER(VCPU, mmio_exit_user),
  46. STATS_DESC_COUNTER(VCPU, mmio_exit_kernel),
  47. STATS_DESC_COUNTER(VCPU, signal_exits),
  48. STATS_DESC_COUNTER(VCPU, exits)
  49. };
  50. const struct kvm_stats_header kvm_vcpu_stats_header = {
  51. .name_size = KVM_STATS_NAME_SIZE,
  52. .num_desc = ARRAY_SIZE(kvm_vcpu_stats_desc),
  53. .id_offset = sizeof(struct kvm_stats_header),
  54. .desc_offset = sizeof(struct kvm_stats_header) + KVM_STATS_NAME_SIZE,
  55. .data_offset = sizeof(struct kvm_stats_header) + KVM_STATS_NAME_SIZE +
  56. sizeof(kvm_vcpu_stats_desc),
  57. };
  58. static bool core_reg_offset_is_vreg(u64 off)
  59. {
  60. return off >= KVM_REG_ARM_CORE_REG(fp_regs.vregs) &&
  61. off < KVM_REG_ARM_CORE_REG(fp_regs.fpsr);
  62. }
  63. static u64 core_reg_offset_from_id(u64 id)
  64. {
  65. return id & ~(KVM_REG_ARCH_MASK | KVM_REG_SIZE_MASK | KVM_REG_ARM_CORE);
  66. }
  67. static int core_reg_size_from_offset(const struct kvm_vcpu *vcpu, u64 off)
  68. {
  69. int size;
  70. switch (off) {
  71. case KVM_REG_ARM_CORE_REG(regs.regs[0]) ...
  72. KVM_REG_ARM_CORE_REG(regs.regs[30]):
  73. case KVM_REG_ARM_CORE_REG(regs.sp):
  74. case KVM_REG_ARM_CORE_REG(regs.pc):
  75. case KVM_REG_ARM_CORE_REG(regs.pstate):
  76. case KVM_REG_ARM_CORE_REG(sp_el1):
  77. case KVM_REG_ARM_CORE_REG(elr_el1):
  78. case KVM_REG_ARM_CORE_REG(spsr[0]) ...
  79. KVM_REG_ARM_CORE_REG(spsr[KVM_NR_SPSR - 1]):
  80. size = sizeof(__u64);
  81. break;
  82. case KVM_REG_ARM_CORE_REG(fp_regs.vregs[0]) ...
  83. KVM_REG_ARM_CORE_REG(fp_regs.vregs[31]):
  84. size = sizeof(__uint128_t);
  85. break;
  86. case KVM_REG_ARM_CORE_REG(fp_regs.fpsr):
  87. case KVM_REG_ARM_CORE_REG(fp_regs.fpcr):
  88. size = sizeof(__u32);
  89. break;
  90. default:
  91. return -EINVAL;
  92. }
  93. if (!IS_ALIGNED(off, size / sizeof(__u32)))
  94. return -EINVAL;
  95. /*
  96. * The KVM_REG_ARM64_SVE regs must be used instead of
  97. * KVM_REG_ARM_CORE for accessing the FPSIMD V-registers on
  98. * SVE-enabled vcpus:
  99. */
  100. if (vcpu_has_sve(vcpu) && core_reg_offset_is_vreg(off))
  101. return -EINVAL;
  102. return size;
  103. }
  104. static void *core_reg_addr(struct kvm_vcpu *vcpu, const struct kvm_one_reg *reg)
  105. {
  106. u64 off = core_reg_offset_from_id(reg->id);
  107. int size = core_reg_size_from_offset(vcpu, off);
  108. if (size < 0)
  109. return NULL;
  110. if (KVM_REG_SIZE(reg->id) != size)
  111. return NULL;
  112. switch (off) {
  113. case KVM_REG_ARM_CORE_REG(regs.regs[0]) ...
  114. KVM_REG_ARM_CORE_REG(regs.regs[30]):
  115. off -= KVM_REG_ARM_CORE_REG(regs.regs[0]);
  116. off /= 2;
  117. return &vcpu->arch.ctxt.regs.regs[off];
  118. case KVM_REG_ARM_CORE_REG(regs.sp):
  119. return &vcpu->arch.ctxt.regs.sp;
  120. case KVM_REG_ARM_CORE_REG(regs.pc):
  121. return &vcpu->arch.ctxt.regs.pc;
  122. case KVM_REG_ARM_CORE_REG(regs.pstate):
  123. return &vcpu->arch.ctxt.regs.pstate;
  124. case KVM_REG_ARM_CORE_REG(sp_el1):
  125. return __ctxt_sys_reg(&vcpu->arch.ctxt, SP_EL1);
  126. case KVM_REG_ARM_CORE_REG(elr_el1):
  127. return __ctxt_sys_reg(&vcpu->arch.ctxt, ELR_EL1);
  128. case KVM_REG_ARM_CORE_REG(spsr[KVM_SPSR_EL1]):
  129. return __ctxt_sys_reg(&vcpu->arch.ctxt, SPSR_EL1);
  130. case KVM_REG_ARM_CORE_REG(spsr[KVM_SPSR_ABT]):
  131. return &vcpu->arch.ctxt.spsr_abt;
  132. case KVM_REG_ARM_CORE_REG(spsr[KVM_SPSR_UND]):
  133. return &vcpu->arch.ctxt.spsr_und;
  134. case KVM_REG_ARM_CORE_REG(spsr[KVM_SPSR_IRQ]):
  135. return &vcpu->arch.ctxt.spsr_irq;
  136. case KVM_REG_ARM_CORE_REG(spsr[KVM_SPSR_FIQ]):
  137. return &vcpu->arch.ctxt.spsr_fiq;
  138. case KVM_REG_ARM_CORE_REG(fp_regs.vregs[0]) ...
  139. KVM_REG_ARM_CORE_REG(fp_regs.vregs[31]):
  140. off -= KVM_REG_ARM_CORE_REG(fp_regs.vregs[0]);
  141. off /= 4;
  142. return &vcpu->arch.ctxt.fp_regs.vregs[off];
  143. case KVM_REG_ARM_CORE_REG(fp_regs.fpsr):
  144. return &vcpu->arch.ctxt.fp_regs.fpsr;
  145. case KVM_REG_ARM_CORE_REG(fp_regs.fpcr):
  146. return &vcpu->arch.ctxt.fp_regs.fpcr;
  147. default:
  148. return NULL;
  149. }
  150. }
  151. static int get_core_reg(struct kvm_vcpu *vcpu, const struct kvm_one_reg *reg)
  152. {
  153. /*
  154. * Because the kvm_regs structure is a mix of 32, 64 and
  155. * 128bit fields, we index it as if it was a 32bit
  156. * array. Hence below, nr_regs is the number of entries, and
  157. * off the index in the "array".
  158. */
  159. __u32 __user *uaddr = (__u32 __user *)(unsigned long)reg->addr;
  160. int nr_regs = sizeof(struct kvm_regs) / sizeof(__u32);
  161. void *addr;
  162. u32 off;
  163. /* Our ID is an index into the kvm_regs struct. */
  164. off = core_reg_offset_from_id(reg->id);
  165. if (off >= nr_regs ||
  166. (off + (KVM_REG_SIZE(reg->id) / sizeof(__u32))) >= nr_regs)
  167. return -ENOENT;
  168. addr = core_reg_addr(vcpu, reg);
  169. if (!addr)
  170. return -EINVAL;
  171. if (copy_to_user(uaddr, addr, KVM_REG_SIZE(reg->id)))
  172. return -EFAULT;
  173. return 0;
  174. }
  175. static int set_core_reg(struct kvm_vcpu *vcpu, const struct kvm_one_reg *reg)
  176. {
  177. __u32 __user *uaddr = (__u32 __user *)(unsigned long)reg->addr;
  178. int nr_regs = sizeof(struct kvm_regs) / sizeof(__u32);
  179. __uint128_t tmp;
  180. void *valp = &tmp, *addr;
  181. u64 off;
  182. int err = 0;
  183. /* Our ID is an index into the kvm_regs struct. */
  184. off = core_reg_offset_from_id(reg->id);
  185. if (off >= nr_regs ||
  186. (off + (KVM_REG_SIZE(reg->id) / sizeof(__u32))) >= nr_regs)
  187. return -ENOENT;
  188. addr = core_reg_addr(vcpu, reg);
  189. if (!addr)
  190. return -EINVAL;
  191. if (KVM_REG_SIZE(reg->id) > sizeof(tmp))
  192. return -EINVAL;
  193. if (copy_from_user(valp, uaddr, KVM_REG_SIZE(reg->id))) {
  194. err = -EFAULT;
  195. goto out;
  196. }
  197. if (off == KVM_REG_ARM_CORE_REG(regs.pstate)) {
  198. u64 mode = (*(u64 *)valp) & PSR_AA32_MODE_MASK;
  199. switch (mode) {
  200. case PSR_AA32_MODE_USR:
  201. if (!kvm_supports_32bit_el0())
  202. return -EINVAL;
  203. break;
  204. case PSR_AA32_MODE_FIQ:
  205. case PSR_AA32_MODE_IRQ:
  206. case PSR_AA32_MODE_SVC:
  207. case PSR_AA32_MODE_ABT:
  208. case PSR_AA32_MODE_UND:
  209. case PSR_AA32_MODE_SYS:
  210. if (!vcpu_el1_is_32bit(vcpu))
  211. return -EINVAL;
  212. break;
  213. case PSR_MODE_EL2h:
  214. case PSR_MODE_EL2t:
  215. if (!vcpu_has_nv(vcpu))
  216. return -EINVAL;
  217. fallthrough;
  218. case PSR_MODE_EL0t:
  219. case PSR_MODE_EL1t:
  220. case PSR_MODE_EL1h:
  221. if (vcpu_el1_is_32bit(vcpu))
  222. return -EINVAL;
  223. break;
  224. default:
  225. err = -EINVAL;
  226. goto out;
  227. }
  228. }
  229. memcpy(addr, valp, KVM_REG_SIZE(reg->id));
  230. if (*vcpu_cpsr(vcpu) & PSR_MODE32_BIT) {
  231. int i, nr_reg;
  232. switch (*vcpu_cpsr(vcpu) & PSR_AA32_MODE_MASK) {
  233. /*
  234. * Either we are dealing with user mode, and only the
  235. * first 15 registers (+ PC) must be narrowed to 32bit.
  236. * AArch32 r0-r14 conveniently map to AArch64 x0-x14.
  237. */
  238. case PSR_AA32_MODE_USR:
  239. case PSR_AA32_MODE_SYS:
  240. nr_reg = 15;
  241. break;
  242. /*
  243. * Otherwise, this is a privileged mode, and *all* the
  244. * registers must be narrowed to 32bit.
  245. */
  246. default:
  247. nr_reg = 31;
  248. break;
  249. }
  250. for (i = 0; i < nr_reg; i++)
  251. vcpu_set_reg(vcpu, i, (u32)vcpu_get_reg(vcpu, i));
  252. *vcpu_pc(vcpu) = (u32)*vcpu_pc(vcpu);
  253. }
  254. out:
  255. return err;
  256. }
  257. #define vq_word(vq) (((vq) - SVE_VQ_MIN) / 64)
  258. #define vq_mask(vq) ((u64)1 << ((vq) - SVE_VQ_MIN) % 64)
  259. #define vq_present(vqs, vq) (!!((vqs)[vq_word(vq)] & vq_mask(vq)))
  260. static int get_sve_vls(struct kvm_vcpu *vcpu, const struct kvm_one_reg *reg)
  261. {
  262. unsigned int max_vq, vq;
  263. u64 vqs[KVM_ARM64_SVE_VLS_WORDS];
  264. if (!vcpu_has_sve(vcpu))
  265. return -ENOENT;
  266. if (WARN_ON(!sve_vl_valid(vcpu->arch.sve_max_vl)))
  267. return -EINVAL;
  268. memset(vqs, 0, sizeof(vqs));
  269. max_vq = vcpu_sve_max_vq(vcpu);
  270. for (vq = SVE_VQ_MIN; vq <= max_vq; ++vq)
  271. if (sve_vq_available(vq))
  272. vqs[vq_word(vq)] |= vq_mask(vq);
  273. if (copy_to_user((void __user *)reg->addr, vqs, sizeof(vqs)))
  274. return -EFAULT;
  275. return 0;
  276. }
  277. static int set_sve_vls(struct kvm_vcpu *vcpu, const struct kvm_one_reg *reg)
  278. {
  279. unsigned int max_vq, vq;
  280. u64 vqs[KVM_ARM64_SVE_VLS_WORDS];
  281. if (!vcpu_has_sve(vcpu))
  282. return -ENOENT;
  283. if (kvm_arm_vcpu_sve_finalized(vcpu))
  284. return -EPERM; /* too late! */
  285. if (WARN_ON(vcpu->arch.sve_state))
  286. return -EINVAL;
  287. if (copy_from_user(vqs, (const void __user *)reg->addr, sizeof(vqs)))
  288. return -EFAULT;
  289. max_vq = 0;
  290. for (vq = SVE_VQ_MIN; vq <= SVE_VQ_MAX; ++vq)
  291. if (vq_present(vqs, vq))
  292. max_vq = vq;
  293. if (max_vq > sve_vq_from_vl(kvm_sve_max_vl))
  294. return -EINVAL;
  295. /*
  296. * Vector lengths supported by the host can't currently be
  297. * hidden from the guest individually: instead we can only set a
  298. * maximum via ZCR_EL2.LEN. So, make sure the available vector
  299. * lengths match the set requested exactly up to the requested
  300. * maximum:
  301. */
  302. for (vq = SVE_VQ_MIN; vq <= max_vq; ++vq)
  303. if (vq_present(vqs, vq) != sve_vq_available(vq))
  304. return -EINVAL;
  305. /* Can't run with no vector lengths at all: */
  306. if (max_vq < SVE_VQ_MIN)
  307. return -EINVAL;
  308. /* vcpu->arch.sve_state will be alloc'd by kvm_vcpu_finalize_sve() */
  309. vcpu->arch.sve_max_vl = sve_vl_from_vq(max_vq);
  310. return 0;
  311. }
  312. #define SVE_REG_SLICE_SHIFT 0
  313. #define SVE_REG_SLICE_BITS 5
  314. #define SVE_REG_ID_SHIFT (SVE_REG_SLICE_SHIFT + SVE_REG_SLICE_BITS)
  315. #define SVE_REG_ID_BITS 5
  316. #define SVE_REG_SLICE_MASK \
  317. GENMASK(SVE_REG_SLICE_SHIFT + SVE_REG_SLICE_BITS - 1, \
  318. SVE_REG_SLICE_SHIFT)
  319. #define SVE_REG_ID_MASK \
  320. GENMASK(SVE_REG_ID_SHIFT + SVE_REG_ID_BITS - 1, SVE_REG_ID_SHIFT)
  321. #define SVE_NUM_SLICES (1 << SVE_REG_SLICE_BITS)
  322. #define KVM_SVE_ZREG_SIZE KVM_REG_SIZE(KVM_REG_ARM64_SVE_ZREG(0, 0))
  323. #define KVM_SVE_PREG_SIZE KVM_REG_SIZE(KVM_REG_ARM64_SVE_PREG(0, 0))
  324. /*
  325. * Number of register slices required to cover each whole SVE register.
  326. * NOTE: Only the first slice every exists, for now.
  327. * If you are tempted to modify this, you must also rework sve_reg_to_region()
  328. * to match:
  329. */
  330. #define vcpu_sve_slices(vcpu) 1
  331. /* Bounds of a single SVE register slice within vcpu->arch.sve_state */
  332. struct sve_state_reg_region {
  333. unsigned int koffset; /* offset into sve_state in kernel memory */
  334. unsigned int klen; /* length in kernel memory */
  335. unsigned int upad; /* extra trailing padding in user memory */
  336. };
  337. /*
  338. * Validate SVE register ID and get sanitised bounds for user/kernel SVE
  339. * register copy
  340. */
  341. static int sve_reg_to_region(struct sve_state_reg_region *region,
  342. struct kvm_vcpu *vcpu,
  343. const struct kvm_one_reg *reg)
  344. {
  345. /* reg ID ranges for Z- registers */
  346. const u64 zreg_id_min = KVM_REG_ARM64_SVE_ZREG(0, 0);
  347. const u64 zreg_id_max = KVM_REG_ARM64_SVE_ZREG(SVE_NUM_ZREGS - 1,
  348. SVE_NUM_SLICES - 1);
  349. /* reg ID ranges for P- registers and FFR (which are contiguous) */
  350. const u64 preg_id_min = KVM_REG_ARM64_SVE_PREG(0, 0);
  351. const u64 preg_id_max = KVM_REG_ARM64_SVE_FFR(SVE_NUM_SLICES - 1);
  352. unsigned int vq;
  353. unsigned int reg_num;
  354. unsigned int reqoffset, reqlen; /* User-requested offset and length */
  355. unsigned int maxlen; /* Maximum permitted length */
  356. size_t sve_state_size;
  357. const u64 last_preg_id = KVM_REG_ARM64_SVE_PREG(SVE_NUM_PREGS - 1,
  358. SVE_NUM_SLICES - 1);
  359. /* Verify that the P-regs and FFR really do have contiguous IDs: */
  360. BUILD_BUG_ON(KVM_REG_ARM64_SVE_FFR(0) != last_preg_id + 1);
  361. /* Verify that we match the UAPI header: */
  362. BUILD_BUG_ON(SVE_NUM_SLICES != KVM_ARM64_SVE_MAX_SLICES);
  363. reg_num = (reg->id & SVE_REG_ID_MASK) >> SVE_REG_ID_SHIFT;
  364. if (reg->id >= zreg_id_min && reg->id <= zreg_id_max) {
  365. if (!vcpu_has_sve(vcpu) || (reg->id & SVE_REG_SLICE_MASK) > 0)
  366. return -ENOENT;
  367. vq = vcpu_sve_max_vq(vcpu);
  368. reqoffset = SVE_SIG_ZREG_OFFSET(vq, reg_num) -
  369. SVE_SIG_REGS_OFFSET;
  370. reqlen = KVM_SVE_ZREG_SIZE;
  371. maxlen = SVE_SIG_ZREG_SIZE(vq);
  372. } else if (reg->id >= preg_id_min && reg->id <= preg_id_max) {
  373. if (!vcpu_has_sve(vcpu) || (reg->id & SVE_REG_SLICE_MASK) > 0)
  374. return -ENOENT;
  375. vq = vcpu_sve_max_vq(vcpu);
  376. reqoffset = SVE_SIG_PREG_OFFSET(vq, reg_num) -
  377. SVE_SIG_REGS_OFFSET;
  378. reqlen = KVM_SVE_PREG_SIZE;
  379. maxlen = SVE_SIG_PREG_SIZE(vq);
  380. } else {
  381. return -EINVAL;
  382. }
  383. sve_state_size = vcpu_sve_state_size(vcpu);
  384. if (WARN_ON(!sve_state_size))
  385. return -EINVAL;
  386. region->koffset = array_index_nospec(reqoffset, sve_state_size);
  387. region->klen = min(maxlen, reqlen);
  388. region->upad = reqlen - region->klen;
  389. return 0;
  390. }
  391. static int get_sve_reg(struct kvm_vcpu *vcpu, const struct kvm_one_reg *reg)
  392. {
  393. int ret;
  394. struct sve_state_reg_region region;
  395. char __user *uptr = (char __user *)reg->addr;
  396. /* Handle the KVM_REG_ARM64_SVE_VLS pseudo-reg as a special case: */
  397. if (reg->id == KVM_REG_ARM64_SVE_VLS)
  398. return get_sve_vls(vcpu, reg);
  399. /* Try to interpret reg ID as an architectural SVE register... */
  400. ret = sve_reg_to_region(&region, vcpu, reg);
  401. if (ret)
  402. return ret;
  403. if (!kvm_arm_vcpu_sve_finalized(vcpu))
  404. return -EPERM;
  405. if (copy_to_user(uptr, vcpu->arch.sve_state + region.koffset,
  406. region.klen) ||
  407. clear_user(uptr + region.klen, region.upad))
  408. return -EFAULT;
  409. return 0;
  410. }
  411. static int set_sve_reg(struct kvm_vcpu *vcpu, const struct kvm_one_reg *reg)
  412. {
  413. int ret;
  414. struct sve_state_reg_region region;
  415. const char __user *uptr = (const char __user *)reg->addr;
  416. /* Handle the KVM_REG_ARM64_SVE_VLS pseudo-reg as a special case: */
  417. if (reg->id == KVM_REG_ARM64_SVE_VLS)
  418. return set_sve_vls(vcpu, reg);
  419. /* Try to interpret reg ID as an architectural SVE register... */
  420. ret = sve_reg_to_region(&region, vcpu, reg);
  421. if (ret)
  422. return ret;
  423. if (!kvm_arm_vcpu_sve_finalized(vcpu))
  424. return -EPERM;
  425. if (copy_from_user(vcpu->arch.sve_state + region.koffset, uptr,
  426. region.klen))
  427. return -EFAULT;
  428. return 0;
  429. }
  430. int kvm_arch_vcpu_ioctl_get_regs(struct kvm_vcpu *vcpu, struct kvm_regs *regs)
  431. {
  432. return -EINVAL;
  433. }
  434. int kvm_arch_vcpu_ioctl_set_regs(struct kvm_vcpu *vcpu, struct kvm_regs *regs)
  435. {
  436. return -EINVAL;
  437. }
  438. static int copy_core_reg_indices(const struct kvm_vcpu *vcpu,
  439. u64 __user *uindices)
  440. {
  441. unsigned int i;
  442. int n = 0;
  443. for (i = 0; i < sizeof(struct kvm_regs) / sizeof(__u32); i++) {
  444. u64 reg = KVM_REG_ARM64 | KVM_REG_ARM_CORE | i;
  445. int size = core_reg_size_from_offset(vcpu, i);
  446. if (size < 0)
  447. continue;
  448. switch (size) {
  449. case sizeof(__u32):
  450. reg |= KVM_REG_SIZE_U32;
  451. break;
  452. case sizeof(__u64):
  453. reg |= KVM_REG_SIZE_U64;
  454. break;
  455. case sizeof(__uint128_t):
  456. reg |= KVM_REG_SIZE_U128;
  457. break;
  458. default:
  459. WARN_ON(1);
  460. continue;
  461. }
  462. if (uindices) {
  463. if (put_user(reg, uindices))
  464. return -EFAULT;
  465. uindices++;
  466. }
  467. n++;
  468. }
  469. return n;
  470. }
  471. static unsigned long num_core_regs(const struct kvm_vcpu *vcpu)
  472. {
  473. return copy_core_reg_indices(vcpu, NULL);
  474. }
  475. static unsigned long num_sve_regs(const struct kvm_vcpu *vcpu)
  476. {
  477. const unsigned int slices = vcpu_sve_slices(vcpu);
  478. if (!vcpu_has_sve(vcpu))
  479. return 0;
  480. /* Policed by KVM_GET_REG_LIST: */
  481. WARN_ON(!kvm_arm_vcpu_sve_finalized(vcpu));
  482. return slices * (SVE_NUM_PREGS + SVE_NUM_ZREGS + 1 /* FFR */)
  483. + 1; /* KVM_REG_ARM64_SVE_VLS */
  484. }
  485. static int copy_sve_reg_indices(const struct kvm_vcpu *vcpu,
  486. u64 __user *uindices)
  487. {
  488. const unsigned int slices = vcpu_sve_slices(vcpu);
  489. u64 reg;
  490. unsigned int i, n;
  491. int num_regs = 0;
  492. if (!vcpu_has_sve(vcpu))
  493. return 0;
  494. /* Policed by KVM_GET_REG_LIST: */
  495. WARN_ON(!kvm_arm_vcpu_sve_finalized(vcpu));
  496. /*
  497. * Enumerate this first, so that userspace can save/restore in
  498. * the order reported by KVM_GET_REG_LIST:
  499. */
  500. reg = KVM_REG_ARM64_SVE_VLS;
  501. if (put_user(reg, uindices++))
  502. return -EFAULT;
  503. ++num_regs;
  504. for (i = 0; i < slices; i++) {
  505. for (n = 0; n < SVE_NUM_ZREGS; n++) {
  506. reg = KVM_REG_ARM64_SVE_ZREG(n, i);
  507. if (put_user(reg, uindices++))
  508. return -EFAULT;
  509. num_regs++;
  510. }
  511. for (n = 0; n < SVE_NUM_PREGS; n++) {
  512. reg = KVM_REG_ARM64_SVE_PREG(n, i);
  513. if (put_user(reg, uindices++))
  514. return -EFAULT;
  515. num_regs++;
  516. }
  517. reg = KVM_REG_ARM64_SVE_FFR(i);
  518. if (put_user(reg, uindices++))
  519. return -EFAULT;
  520. num_regs++;
  521. }
  522. return num_regs;
  523. }
  524. /**
  525. * kvm_arm_num_regs - how many registers do we present via KVM_GET_ONE_REG
  526. * @vcpu: the vCPU pointer
  527. *
  528. * This is for all registers.
  529. */
  530. unsigned long kvm_arm_num_regs(struct kvm_vcpu *vcpu)
  531. {
  532. unsigned long res = 0;
  533. res += num_core_regs(vcpu);
  534. res += num_sve_regs(vcpu);
  535. res += kvm_arm_num_sys_reg_descs(vcpu);
  536. res += kvm_arm_get_fw_num_regs(vcpu);
  537. return res;
  538. }
  539. /**
  540. * kvm_arm_copy_reg_indices - get indices of all registers.
  541. * @vcpu: the vCPU pointer
  542. * @uindices: register list to copy
  543. *
  544. * We do core registers right here, then we append system regs.
  545. */
  546. int kvm_arm_copy_reg_indices(struct kvm_vcpu *vcpu, u64 __user *uindices)
  547. {
  548. int ret;
  549. ret = copy_core_reg_indices(vcpu, uindices);
  550. if (ret < 0)
  551. return ret;
  552. uindices += ret;
  553. ret = copy_sve_reg_indices(vcpu, uindices);
  554. if (ret < 0)
  555. return ret;
  556. uindices += ret;
  557. ret = kvm_arm_copy_fw_reg_indices(vcpu, uindices);
  558. if (ret < 0)
  559. return ret;
  560. uindices += kvm_arm_get_fw_num_regs(vcpu);
  561. return kvm_arm_copy_sys_reg_indices(vcpu, uindices);
  562. }
  563. int kvm_arm_get_reg(struct kvm_vcpu *vcpu, const struct kvm_one_reg *reg)
  564. {
  565. /* We currently use nothing arch-specific in upper 32 bits */
  566. if ((reg->id & ~KVM_REG_SIZE_MASK) >> 32 != KVM_REG_ARM64 >> 32)
  567. return -EINVAL;
  568. switch (reg->id & KVM_REG_ARM_COPROC_MASK) {
  569. case KVM_REG_ARM_CORE: return get_core_reg(vcpu, reg);
  570. case KVM_REG_ARM_FW:
  571. case KVM_REG_ARM_FW_FEAT_BMAP:
  572. return kvm_arm_get_fw_reg(vcpu, reg);
  573. case KVM_REG_ARM64_SVE: return get_sve_reg(vcpu, reg);
  574. }
  575. return kvm_arm_sys_reg_get_reg(vcpu, reg);
  576. }
  577. int kvm_arm_set_reg(struct kvm_vcpu *vcpu, const struct kvm_one_reg *reg)
  578. {
  579. /* We currently use nothing arch-specific in upper 32 bits */
  580. if ((reg->id & ~KVM_REG_SIZE_MASK) >> 32 != KVM_REG_ARM64 >> 32)
  581. return -EINVAL;
  582. switch (reg->id & KVM_REG_ARM_COPROC_MASK) {
  583. case KVM_REG_ARM_CORE: return set_core_reg(vcpu, reg);
  584. case KVM_REG_ARM_FW:
  585. case KVM_REG_ARM_FW_FEAT_BMAP:
  586. return kvm_arm_set_fw_reg(vcpu, reg);
  587. case KVM_REG_ARM64_SVE: return set_sve_reg(vcpu, reg);
  588. }
  589. return kvm_arm_sys_reg_set_reg(vcpu, reg);
  590. }
  591. int kvm_arch_vcpu_ioctl_get_sregs(struct kvm_vcpu *vcpu,
  592. struct kvm_sregs *sregs)
  593. {
  594. return -EINVAL;
  595. }
  596. int kvm_arch_vcpu_ioctl_set_sregs(struct kvm_vcpu *vcpu,
  597. struct kvm_sregs *sregs)
  598. {
  599. return -EINVAL;
  600. }
  601. int __kvm_arm_vcpu_get_events(struct kvm_vcpu *vcpu,
  602. struct kvm_vcpu_events *events)
  603. {
  604. events->exception.serror_has_esr = cpus_have_final_cap(ARM64_HAS_RAS_EXTN);
  605. events->exception.serror_pending = (vcpu->arch.hcr_el2 & HCR_VSE) ||
  606. vcpu_get_flag(vcpu, NESTED_SERROR_PENDING);
  607. if (events->exception.serror_pending && events->exception.serror_has_esr)
  608. events->exception.serror_esr = vcpu_get_vsesr(vcpu);
  609. /*
  610. * We never return a pending ext_dabt here because we deliver it to
  611. * the virtual CPU directly when setting the event and it's no longer
  612. * 'pending' at this point.
  613. */
  614. return 0;
  615. }
  616. static void commit_pending_events(struct kvm_vcpu *vcpu)
  617. {
  618. if (!vcpu_get_flag(vcpu, PENDING_EXCEPTION))
  619. return;
  620. /*
  621. * Reset the MMIO emulation state to avoid stepping PC after emulating
  622. * the exception entry.
  623. */
  624. vcpu->mmio_needed = false;
  625. kvm_call_hyp(__kvm_adjust_pc, vcpu);
  626. }
  627. int __kvm_arm_vcpu_set_events(struct kvm_vcpu *vcpu,
  628. struct kvm_vcpu_events *events)
  629. {
  630. bool serror_pending = events->exception.serror_pending;
  631. bool has_esr = events->exception.serror_has_esr;
  632. bool ext_dabt_pending = events->exception.ext_dabt_pending;
  633. u64 esr = events->exception.serror_esr;
  634. int ret = 0;
  635. /*
  636. * Immediately commit the pending SEA to the vCPU's architectural
  637. * state which is necessary since we do not return a pending SEA
  638. * to userspace via KVM_GET_VCPU_EVENTS.
  639. */
  640. if (ext_dabt_pending) {
  641. ret = kvm_inject_sea_dabt(vcpu, kvm_vcpu_get_hfar(vcpu));
  642. commit_pending_events(vcpu);
  643. }
  644. if (ret < 0)
  645. return ret;
  646. if (!serror_pending)
  647. return 0;
  648. if (!cpus_have_final_cap(ARM64_HAS_RAS_EXTN) && has_esr)
  649. return -EINVAL;
  650. if (has_esr && (esr & ~ESR_ELx_ISS_MASK))
  651. return -EINVAL;
  652. if (has_esr)
  653. ret = kvm_inject_serror_esr(vcpu, esr);
  654. else
  655. ret = kvm_inject_serror(vcpu);
  656. /*
  657. * We could've decided that the SError is due for immediate software
  658. * injection; commit the exception in case userspace decides it wants
  659. * to inject more exceptions for some strange reason.
  660. */
  661. commit_pending_events(vcpu);
  662. return (ret < 0) ? ret : 0;
  663. }
  664. u32 __attribute_const__ kvm_target_cpu(void)
  665. {
  666. unsigned long implementor = read_cpuid_implementor();
  667. unsigned long part_number = read_cpuid_part_number();
  668. switch (implementor) {
  669. case ARM_CPU_IMP_ARM:
  670. switch (part_number) {
  671. case ARM_CPU_PART_AEM_V8:
  672. return KVM_ARM_TARGET_AEM_V8;
  673. case ARM_CPU_PART_FOUNDATION:
  674. return KVM_ARM_TARGET_FOUNDATION_V8;
  675. case ARM_CPU_PART_CORTEX_A53:
  676. return KVM_ARM_TARGET_CORTEX_A53;
  677. case ARM_CPU_PART_CORTEX_A57:
  678. return KVM_ARM_TARGET_CORTEX_A57;
  679. }
  680. break;
  681. case ARM_CPU_IMP_APM:
  682. switch (part_number) {
  683. case APM_CPU_PART_XGENE:
  684. return KVM_ARM_TARGET_XGENE_POTENZA;
  685. }
  686. break;
  687. }
  688. /* Return a default generic target */
  689. return KVM_ARM_TARGET_GENERIC_V8;
  690. }
  691. int kvm_arch_vcpu_ioctl_get_fpu(struct kvm_vcpu *vcpu, struct kvm_fpu *fpu)
  692. {
  693. return -EINVAL;
  694. }
  695. int kvm_arch_vcpu_ioctl_set_fpu(struct kvm_vcpu *vcpu, struct kvm_fpu *fpu)
  696. {
  697. return -EINVAL;
  698. }
  699. int kvm_arch_vcpu_ioctl_translate(struct kvm_vcpu *vcpu,
  700. struct kvm_translation *tr)
  701. {
  702. return -EINVAL;
  703. }
  704. /**
  705. * kvm_arch_vcpu_ioctl_set_guest_debug - set up guest debugging
  706. * @vcpu: the vCPU pointer
  707. * @dbg: the ioctl data buffer
  708. *
  709. * This sets up and enables the VM for guest debugging. Userspace
  710. * passes in a control flag to enable different debug types and
  711. * potentially other architecture specific information in the rest of
  712. * the structure.
  713. */
  714. int kvm_arch_vcpu_ioctl_set_guest_debug(struct kvm_vcpu *vcpu,
  715. struct kvm_guest_debug *dbg)
  716. {
  717. trace_kvm_set_guest_debug(vcpu, dbg->control);
  718. if (dbg->control & ~KVM_GUESTDBG_VALID_MASK)
  719. return -EINVAL;
  720. if (!(dbg->control & KVM_GUESTDBG_ENABLE)) {
  721. vcpu->guest_debug = 0;
  722. vcpu_clear_flag(vcpu, HOST_SS_ACTIVE_PENDING);
  723. return 0;
  724. }
  725. vcpu->guest_debug = dbg->control;
  726. /* Hardware assisted Break and Watch points */
  727. if (vcpu->guest_debug & KVM_GUESTDBG_USE_HW)
  728. vcpu->arch.external_debug_state = dbg->arch;
  729. return 0;
  730. }
  731. int kvm_arm_vcpu_arch_set_attr(struct kvm_vcpu *vcpu,
  732. struct kvm_device_attr *attr)
  733. {
  734. int ret;
  735. switch (attr->group) {
  736. case KVM_ARM_VCPU_PMU_V3_CTRL:
  737. mutex_lock(&vcpu->kvm->arch.config_lock);
  738. ret = kvm_arm_pmu_v3_set_attr(vcpu, attr);
  739. mutex_unlock(&vcpu->kvm->arch.config_lock);
  740. break;
  741. case KVM_ARM_VCPU_TIMER_CTRL:
  742. ret = kvm_arm_timer_set_attr(vcpu, attr);
  743. break;
  744. case KVM_ARM_VCPU_PVTIME_CTRL:
  745. ret = kvm_arm_pvtime_set_attr(vcpu, attr);
  746. break;
  747. default:
  748. ret = -ENXIO;
  749. break;
  750. }
  751. return ret;
  752. }
  753. int kvm_arm_vcpu_arch_get_attr(struct kvm_vcpu *vcpu,
  754. struct kvm_device_attr *attr)
  755. {
  756. int ret;
  757. switch (attr->group) {
  758. case KVM_ARM_VCPU_PMU_V3_CTRL:
  759. ret = kvm_arm_pmu_v3_get_attr(vcpu, attr);
  760. break;
  761. case KVM_ARM_VCPU_TIMER_CTRL:
  762. ret = kvm_arm_timer_get_attr(vcpu, attr);
  763. break;
  764. case KVM_ARM_VCPU_PVTIME_CTRL:
  765. ret = kvm_arm_pvtime_get_attr(vcpu, attr);
  766. break;
  767. default:
  768. ret = -ENXIO;
  769. break;
  770. }
  771. return ret;
  772. }
  773. int kvm_arm_vcpu_arch_has_attr(struct kvm_vcpu *vcpu,
  774. struct kvm_device_attr *attr)
  775. {
  776. int ret;
  777. switch (attr->group) {
  778. case KVM_ARM_VCPU_PMU_V3_CTRL:
  779. ret = kvm_arm_pmu_v3_has_attr(vcpu, attr);
  780. break;
  781. case KVM_ARM_VCPU_TIMER_CTRL:
  782. ret = kvm_arm_timer_has_attr(vcpu, attr);
  783. break;
  784. case KVM_ARM_VCPU_PVTIME_CTRL:
  785. ret = kvm_arm_pvtime_has_attr(vcpu, attr);
  786. break;
  787. default:
  788. ret = -ENXIO;
  789. break;
  790. }
  791. return ret;
  792. }
  793. int kvm_vm_ioctl_mte_copy_tags(struct kvm *kvm,
  794. struct kvm_arm_copy_mte_tags *copy_tags)
  795. {
  796. gpa_t guest_ipa = copy_tags->guest_ipa;
  797. size_t length = copy_tags->length;
  798. void __user *tags = copy_tags->addr;
  799. gpa_t gfn;
  800. bool write = !(copy_tags->flags & KVM_ARM_TAGS_FROM_GUEST);
  801. int ret = 0;
  802. if (!kvm_has_mte(kvm))
  803. return -EINVAL;
  804. if (copy_tags->reserved[0] || copy_tags->reserved[1])
  805. return -EINVAL;
  806. if (copy_tags->flags & ~KVM_ARM_TAGS_FROM_GUEST)
  807. return -EINVAL;
  808. if (length & ~PAGE_MASK || guest_ipa & ~PAGE_MASK)
  809. return -EINVAL;
  810. /* Lengths above INT_MAX cannot be represented in the return value */
  811. if (length > INT_MAX)
  812. return -EINVAL;
  813. gfn = gpa_to_gfn(guest_ipa);
  814. mutex_lock(&kvm->slots_lock);
  815. if (write && atomic_read(&kvm->nr_memslots_dirty_logging)) {
  816. ret = -EBUSY;
  817. goto out;
  818. }
  819. while (length > 0) {
  820. struct page *page = __gfn_to_page(kvm, gfn, write);
  821. void *maddr;
  822. unsigned long num_tags;
  823. struct folio *folio;
  824. if (!page) {
  825. ret = -EFAULT;
  826. goto out;
  827. }
  828. if (!pfn_to_online_page(page_to_pfn(page))) {
  829. /* Reject ZONE_DEVICE memory */
  830. kvm_release_page_unused(page);
  831. ret = -EFAULT;
  832. goto out;
  833. }
  834. folio = page_folio(page);
  835. maddr = page_address(page);
  836. if (!write) {
  837. if ((folio_test_hugetlb(folio) &&
  838. folio_test_hugetlb_mte_tagged(folio)) ||
  839. page_mte_tagged(page))
  840. num_tags = mte_copy_tags_to_user(tags, maddr,
  841. MTE_GRANULES_PER_PAGE);
  842. else
  843. /* No tags in memory, so write zeros */
  844. num_tags = MTE_GRANULES_PER_PAGE -
  845. clear_user(tags, MTE_GRANULES_PER_PAGE);
  846. kvm_release_page_clean(page);
  847. } else {
  848. /*
  849. * Only locking to serialise with a concurrent
  850. * __set_ptes() in the VMM but still overriding the
  851. * tags, hence ignoring the return value.
  852. */
  853. if (folio_test_hugetlb(folio))
  854. folio_try_hugetlb_mte_tagging(folio);
  855. else
  856. try_page_mte_tagging(page);
  857. num_tags = mte_copy_tags_from_user(maddr, tags,
  858. MTE_GRANULES_PER_PAGE);
  859. /* uaccess failed, don't leave stale tags */
  860. if (num_tags != MTE_GRANULES_PER_PAGE)
  861. mte_clear_page_tags(maddr);
  862. if (folio_test_hugetlb(folio))
  863. folio_set_hugetlb_mte_tagged(folio);
  864. else
  865. set_page_mte_tagged(page);
  866. kvm_release_page_dirty(page);
  867. }
  868. if (num_tags != MTE_GRANULES_PER_PAGE) {
  869. ret = -EFAULT;
  870. goto out;
  871. }
  872. gfn++;
  873. tags += num_tags;
  874. length -= PAGE_SIZE;
  875. }
  876. out:
  877. mutex_unlock(&kvm->slots_lock);
  878. /* If some data has been copied report the number of bytes copied */
  879. if (length != copy_tags->length)
  880. return copy_tags->length - length;
  881. return ret;
  882. }