1 // SPDX-License-Identifier: GPL-2.0-only
5 * Copyright © 2021 Amazon.com, Inc. or its affiliates.
7 * Xen shared_info / pvclock testing
10 #include "test_util.h"
12 #include "processor.h"
#include <stdlib.h>
17 #include <sys/syscall.h>
/*
 * Guest-virtual and guest-physical base of the test region. Both are the
 * same value; main() adds the region in memslot SHINFO_REGION_SLOT and maps
 * SHINFO_REGION_GVA onto SHINFO_REGION_GPA.
 */
21 #define SHINFO_REGION_GVA 0xc0000000ULL
22 #define SHINFO_REGION_GPA 0xc0000000ULL
23 #define SHINFO_REGION_SLOT 10
24 #define PAGE_SIZE 4096
/*
 * PVTIME_ADDR is one page past the region base; main() registers it as the
 * vCPU time-info address. RUNSTATE_ADDR sits 0x20 bytes into that same page
 * and is registered as the runstate address.
 */
26 #define PVTIME_ADDR (SHINFO_REGION_GPA + PAGE_SIZE)
27 #define RUNSTATE_ADDR (SHINFO_REGION_GPA + PAGE_SIZE + 0x20)
/* The runstate area as addressed from inside the guest (see guest_code()). */
29 #define RUNSTATE_VADDR (SHINFO_REGION_GVA + PAGE_SIZE + 0x20)
/* The VM under test; assigned in main(). */
31 static struct kvm_vm *vm;
/* MSR index passed to KVM_XEN_HVM_CONFIG in main(). */
33 #define XEN_HYPERCALL_MSR 0x40000000
/*
 * Minimum 'runnable' time the guest expects after the yield test, and the
 * amount by which main() waits for get_run_delay() to grow.
 * NOTE(review): presumably nanoseconds, matching schedstat - confirm.
 */
35 #define MIN_STEAL_TIME 50000
/*
 * Per-vCPU time information. main() looks at two copies, one at
 * SHINFO_REGION_GPA + 0x40 + 0x20 and one at PVTIME_ADDR, and asserts that
 * the version field of each is non-zero and even.
 * NOTE(review): most members are not visible in this excerpt.
 */
37 struct pvclock_vcpu_time_info {
42 u32 tsc_to_system_mul;
46 } __attribute__((__packed__)); /* 32 bytes */
/*
 * Wall-clock record. main() reads version, sec and nsec from the copy at
 * SHINFO_REGION_GPA + 0xc00 and compares the time against host
 * CLOCK_REALTIME samples taken before and after the run.
 * NOTE(review): the members are not visible in this excerpt.
 */
48 struct pvclock_wall_clock {
52 } __attribute__((__packed__));
/*
 * Runstate area placed at RUNSTATE_ADDR. Both guest_code() and main() read
 * its state, state_entry_time and time[] members; main() asserts that
 * state_entry_time equals the sum of time[0..3].
 * NOTE(review): only state_entry_time is visible in this excerpt.
 */
54 struct vcpu_runstate_info {
56 uint64_t state_entry_time;
/*
 * Runstate values. They double as indices into vcpu_runstate_info.time[],
 * and guest_code() passes them to GUEST_SYNC() to ask the host to switch to
 * that state.
 */
60 #define RUNSTATE_running 0
61 #define RUNSTATE_runnable 1
62 #define RUNSTATE_blocked 2
63 #define RUNSTATE_offline 3
/*
 * Guest side of the test. After each sync with the host it inspects the
 * runstate area through its guest-virtual address and asserts that the host
 * left the expected values there.
 * NOTE(review): the sync calls that start the adjust, set and yield phases
 * are not visible in this excerpt.
 */
65 static void guest_code(void)
67 struct vcpu_runstate_info *rs = (void *)RUNSTATE_VADDR;
69 /* Test having the host set runstates manually */
/*
 * Each sync passes a runstate value; main() applies it with
 * KVM_XEN_VCPU_ATTR_TYPE_RUNSTATE_CURRENT. Once the guest resumes, the
 * requested state must have accumulated time and the current state must be
 * 0 (RUNSTATE_running).
 */
70 GUEST_SYNC(RUNSTATE_runnable);
71 GUEST_ASSERT(rs->time[RUNSTATE_runnable] != 0);
72 GUEST_ASSERT(rs->state == 0);
74 GUEST_SYNC(RUNSTATE_blocked);
75 GUEST_ASSERT(rs->time[RUNSTATE_blocked] != 0);
76 GUEST_ASSERT(rs->state == 0);
78 GUEST_SYNC(RUNSTATE_offline);
79 GUEST_ASSERT(rs->time[RUNSTATE_offline] != 0);
80 GUEST_ASSERT(rs->state == 0);
82 /* Test runstate time adjust */
/*
 * main() submits RUNSTATE_ADJUST deltas computed so that blocked becomes
 * 0x5a and offline becomes 0x6b6b.
 */
84 GUEST_ASSERT(rs->time[RUNSTATE_blocked] == 0x5a);
85 GUEST_ASSERT(rs->time[RUNSTATE_offline] == 0x6b6b);
87 /* Test runstate time set */
/*
 * main() writes RUNSTATE_DATA with blocked = 0x6b6b and offline = 0x5a,
 * i.e. the two values swapped relative to the adjust phase.
 */
89 GUEST_ASSERT(rs->state_entry_time >= 0x8000);
90 GUEST_ASSERT(rs->time[RUNSTATE_runnable] == 0);
91 GUEST_ASSERT(rs->time[RUNSTATE_blocked] == 0x6b6b);
92 GUEST_ASSERT(rs->time[RUNSTATE_offline] == 0x5a);
94 /* sched_yield() should result in some 'runnable' time */
/* main() waits until its own run delay has grown by MIN_STEAL_TIME first. */
96 GUEST_ASSERT(rs->time[RUNSTATE_runnable] >= MIN_STEAL_TIME);
/*
 * Return the calling thread's cumulative run delay, i.e. the second field
 * of its schedstat file in procfs.
 *
 * main() samples this before and after yielding to wait until at least
 * MIN_STEAL_TIME of delay has built up.
 *
 * The file is opened through /proc/thread-self, which refers to the calling
 * thread's own procfs entry, so no gettid() call or formatted path buffer
 * is needed.
 *
 * If the file cannot be opened or does not contain two numeric fields, the
 * test is terminated with a diagnostic. Previously an open failure led to a
 * NULL FILE pointer being passed to fscanf(), and a parse failure led to an
 * uninitialised value being returned.
 */
static long get_run_delay(void)
{
	static const char path[] = "/proc/thread-self/schedstat";
	long val[2];
	FILE *fp;
	int nread;

	fp = fopen(path, "r");
	if (!fp) {
		perror(path);
		exit(EXIT_FAILURE);
	}

	nread = fscanf(fp, "%ld %ld ", &val[0], &val[1]);
	fclose(fp);

	if (nread != 2) {
		fprintf(stderr, "%s: unexpected format\n", path);
		exit(EXIT_FAILURE);
	}

	return val[1];
}
/*
 * Three-way comparison of two timespec values.
 *
 * Seconds are compared first; nanoseconds only break a tie.
 *
 * Returns 1 if *a is later than *b, -1 if *a is earlier than *b, and 0 if
 * both are equal. Neither argument is modified, hence the const pointers;
 * callers passing non-const pointers are unaffected.
 */
static int cmp_timespec(const struct timespec *a, const struct timespec *b)
{
	if (a->tv_sec != b->tv_sec)
		return a->tv_sec > b->tv_sec ? 1 : -1;

	if (a->tv_nsec != b->tv_nsec)
		return a->tv_nsec > b->tv_nsec ? 1 : -1;

	return 0;
}
129 int main(int argc, char *argv[])
131 struct timespec min_ts, max_ts, vm_ts;
133 int xen_caps = kvm_check_cap(KVM_CAP_XEN_HVM);
134 if (!(xen_caps & KVM_XEN_HVM_CONFIG_SHARED_INFO) ) {
135 print_skip("KVM_XEN_HVM_CONFIG_SHARED_INFO not available");
139 bool do_runstate_tests = !!(xen_caps & KVM_XEN_HVM_CONFIG_RUNSTATE);
141 clock_gettime(CLOCK_REALTIME, &min_ts);
143 vm = vm_create_default(VCPU_ID, 0, (void *) guest_code);
144 vcpu_set_cpuid(vm, VCPU_ID, kvm_get_supported_cpuid());
146 /* Map a region for the shared_info page */
147 vm_userspace_mem_region_add(vm, VM_MEM_SRC_ANONYMOUS,
148 SHINFO_REGION_GPA, SHINFO_REGION_SLOT, 2, 0);
149 virt_map(vm, SHINFO_REGION_GVA, SHINFO_REGION_GPA, 2);
151 struct kvm_xen_hvm_config hvmc = {
152 .flags = KVM_XEN_HVM_CONFIG_INTERCEPT_HCALL,
153 .msr = XEN_HYPERCALL_MSR,
155 vm_ioctl(vm, KVM_XEN_HVM_CONFIG, &hvmc);
157 struct kvm_xen_hvm_attr lm = {
158 .type = KVM_XEN_ATTR_TYPE_LONG_MODE,
161 vm_ioctl(vm, KVM_XEN_HVM_SET_ATTR, &lm);
163 struct kvm_xen_hvm_attr ha = {
164 .type = KVM_XEN_ATTR_TYPE_SHARED_INFO,
165 .u.shared_info.gfn = SHINFO_REGION_GPA / PAGE_SIZE,
167 vm_ioctl(vm, KVM_XEN_HVM_SET_ATTR, &ha);
169 struct kvm_xen_vcpu_attr vi = {
170 .type = KVM_XEN_VCPU_ATTR_TYPE_VCPU_INFO,
171 .u.gpa = SHINFO_REGION_GPA + 0x40,
173 vcpu_ioctl(vm, VCPU_ID, KVM_XEN_VCPU_SET_ATTR, &vi);
175 struct kvm_xen_vcpu_attr pvclock = {
176 .type = KVM_XEN_VCPU_ATTR_TYPE_VCPU_TIME_INFO,
177 .u.gpa = PVTIME_ADDR,
179 vcpu_ioctl(vm, VCPU_ID, KVM_XEN_VCPU_SET_ATTR, &pvclock);
181 if (do_runstate_tests) {
182 struct kvm_xen_vcpu_attr st = {
183 .type = KVM_XEN_VCPU_ATTR_TYPE_RUNSTATE_ADDR,
184 .u.gpa = RUNSTATE_ADDR,
186 vcpu_ioctl(vm, VCPU_ID, KVM_XEN_VCPU_SET_ATTR, &st);
189 struct vcpu_runstate_info *rs = addr_gpa2hva(vm, RUNSTATE_ADDR);
193 volatile struct kvm_run *run = vcpu_state(vm, VCPU_ID);
196 vcpu_run(vm, VCPU_ID);
198 TEST_ASSERT(run->exit_reason == KVM_EXIT_IO,
199 "Got exit_reason other than KVM_EXIT_IO: %u (%s)\n",
201 exit_reason_str(run->exit_reason));
203 switch (get_ucall(vm, VCPU_ID, &uc)) {
205 TEST_FAIL("%s", (const char *)uc.args[0]);
208 struct kvm_xen_vcpu_attr rst;
211 /* If no runstate support, bail out early */
212 if (!do_runstate_tests)
215 TEST_ASSERT(rs->state_entry_time == rs->time[0] +
216 rs->time[1] + rs->time[2] + rs->time[3],
217 "runstate times don't add up");
219 switch (uc.args[1]) {
220 case RUNSTATE_running...RUNSTATE_offline:
221 rst.type = KVM_XEN_VCPU_ATTR_TYPE_RUNSTATE_CURRENT;
222 rst.u.runstate.state = uc.args[1];
223 vcpu_ioctl(vm, VCPU_ID, KVM_XEN_VCPU_SET_ATTR, &rst);
226 rst.type = KVM_XEN_VCPU_ATTR_TYPE_RUNSTATE_ADJUST;
227 memset(&rst.u, 0, sizeof(rst.u));
228 rst.u.runstate.state = (uint64_t)-1;
229 rst.u.runstate.time_blocked =
230 0x5a - rs->time[RUNSTATE_blocked];
231 rst.u.runstate.time_offline =
232 0x6b6b - rs->time[RUNSTATE_offline];
233 rst.u.runstate.time_runnable = -rst.u.runstate.time_blocked -
234 rst.u.runstate.time_offline;
235 vcpu_ioctl(vm, VCPU_ID, KVM_XEN_VCPU_SET_ATTR, &rst);
239 rst.type = KVM_XEN_VCPU_ATTR_TYPE_RUNSTATE_DATA;
240 memset(&rst.u, 0, sizeof(rst.u));
241 rst.u.runstate.state = RUNSTATE_running;
242 rst.u.runstate.state_entry_time = 0x6b6b + 0x5a;
243 rst.u.runstate.time_blocked = 0x6b6b;
244 rst.u.runstate.time_offline = 0x5a;
245 vcpu_ioctl(vm, VCPU_ID, KVM_XEN_VCPU_SET_ATTR, &rst);
248 /* Yield until scheduler delay exceeds target */
249 rundelay = get_run_delay() + MIN_STEAL_TIME;
252 } while (get_run_delay() < rundelay);
260 TEST_FAIL("Unknown ucall 0x%lx.", uc.cmd);
265 clock_gettime(CLOCK_REALTIME, &max_ts);
268 * Just a *really* basic check that things are being put in the
269 * right place. The actual calculations are much the same for
270 * Xen as they are for the KVM variants, so no need to check.
272 struct pvclock_wall_clock *wc;
273 struct pvclock_vcpu_time_info *ti, *ti2;
275 wc = addr_gpa2hva(vm, SHINFO_REGION_GPA + 0xc00);
276 ti = addr_gpa2hva(vm, SHINFO_REGION_GPA + 0x40 + 0x20);
277 ti2 = addr_gpa2hva(vm, PVTIME_ADDR);
279 vm_ts.tv_sec = wc->sec;
280 vm_ts.tv_nsec = wc->nsec;
281 TEST_ASSERT(wc->version && !(wc->version & 1),
282 "Bad wallclock version %x", wc->version);
283 TEST_ASSERT(cmp_timespec(&min_ts, &vm_ts) <= 0, "VM time too old");
284 TEST_ASSERT(cmp_timespec(&max_ts, &vm_ts) >= 0, "VM time too new");
286 TEST_ASSERT(ti->version && !(ti->version & 1),
287 "Bad time_info version %x", ti->version);
288 TEST_ASSERT(ti2->version && !(ti2->version & 1),
289 "Bad time_info version %x", ti->version);
291 if (do_runstate_tests) {
293 * Fetch runstate and check sanity. Strictly speaking in the
294 * general case we might not expect the numbers to be identical
295 * but in this case we know we aren't running the vCPU any more.
297 struct kvm_xen_vcpu_attr rst = {
298 .type = KVM_XEN_VCPU_ATTR_TYPE_RUNSTATE_DATA,
300 vcpu_ioctl(vm, VCPU_ID, KVM_XEN_VCPU_GET_ATTR, &rst);
302 TEST_ASSERT(rs->state == rst.u.runstate.state, "Runstate mismatch");
303 TEST_ASSERT(rs->state_entry_time == rst.u.runstate.state_entry_time,
304 "State entry time mismatch");
305 TEST_ASSERT(rs->time[RUNSTATE_running] == rst.u.runstate.time_running,
306 "Running time mismatch");
307 TEST_ASSERT(rs->time[RUNSTATE_runnable] == rst.u.runstate.time_runnable,
308 "Runnable time mismatch");
309 TEST_ASSERT(rs->time[RUNSTATE_blocked] == rst.u.runstate.time_blocked,
310 "Blocked time mismatch");
311 TEST_ASSERT(rs->time[RUNSTATE_offline] == rst.u.runstate.time_offline,
312 "Offline time mismatch");
314 TEST_ASSERT(rs->state_entry_time == rs->time[0] +
315 rs->time[1] + rs->time[2] + rs->time[3],
316 "runstate times don't add up");