xref: /xnu-12377.1.9/tests/arm_matrix.c (revision f6217f891ac0bb64f3d375211650a4c1ff8ca1ea)
1*f6217f89SApple OSS Distributions /*
2*f6217f89SApple OSS Distributions  * Copyright (c) 2019 Apple Computer, Inc. All rights reserved.
3*f6217f89SApple OSS Distributions  *
4*f6217f89SApple OSS Distributions  * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
5*f6217f89SApple OSS Distributions  *
6*f6217f89SApple OSS Distributions  * This file contains Original Code and/or Modifications of Original Code
7*f6217f89SApple OSS Distributions  * as defined in and that are subject to the Apple Public Source License
8*f6217f89SApple OSS Distributions  * Version 2.0 (the 'License'). You may not use this file except in
9*f6217f89SApple OSS Distributions  * compliance with the License. The rights granted to you under the License
10*f6217f89SApple OSS Distributions  * may not be used to create, or enable the creation or redistribution of,
11*f6217f89SApple OSS Distributions  * unlawful or unlicensed copies of an Apple operating system, or to
12*f6217f89SApple OSS Distributions  * circumvent, violate, or enable the circumvention or violation of, any
13*f6217f89SApple OSS Distributions  * terms of an Apple operating system software license agreement.
14*f6217f89SApple OSS Distributions  *
15*f6217f89SApple OSS Distributions  * Please obtain a copy of the License at
16*f6217f89SApple OSS Distributions  * http://www.opensource.apple.com/apsl/ and read it before using this file.
17*f6217f89SApple OSS Distributions  *
18*f6217f89SApple OSS Distributions  * The Original Code and all software distributed under the License are
19*f6217f89SApple OSS Distributions  * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20*f6217f89SApple OSS Distributions  * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21*f6217f89SApple OSS Distributions  * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22*f6217f89SApple OSS Distributions  * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23*f6217f89SApple OSS Distributions  * Please see the License for the specific language governing rights and
24*f6217f89SApple OSS Distributions  * limitations under the License.
25*f6217f89SApple OSS Distributions  *
26*f6217f89SApple OSS Distributions  * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
27*f6217f89SApple OSS Distributions  */
28*f6217f89SApple OSS Distributions /**
29*f6217f89SApple OSS Distributions  * On devices that support it, this test ensures that a mach exception is
30*f6217f89SApple OSS Distributions  * generated when a matrix-math exception is triggered, and that the
31*f6217f89SApple OSS Distributions  * matrix register file is correctly preserved or zeroed on context switch.
32*f6217f89SApple OSS Distributions  */
33*f6217f89SApple OSS Distributions 
34*f6217f89SApple OSS Distributions /*
35*f6217f89SApple OSS Distributions  * IMPLEMENTATION NOTE:
36*f6217f89SApple OSS Distributions  *
37*f6217f89SApple OSS Distributions  * This test code goes to some unusual lengths to avoid calling out to libc or
38*f6217f89SApple OSS Distributions  * libdarwintest while the CPU is in streaming SVE mode (i.e., between
39*f6217f89SApple OSS Distributions  * ops->start() and ops->stop()).  Both of these libraries are built with SIMD
40*f6217f89SApple OSS Distributions  * instructions that will cause the test executable to crash while in streaming
41*f6217f89SApple OSS Distributions  * SVE mode.
42*f6217f89SApple OSS Distributions  *
43*f6217f89SApple OSS Distributions  * Ordinarily this is the wrong way to solve this problem.  Functions that use
44*f6217f89SApple OSS Distributions  * streaming SVE mode should have annotations telling the compiler so, and the
45*f6217f89SApple OSS Distributions  * compiler will automatically generate appropriate interworking code.  However
46*f6217f89SApple OSS Distributions  * this interworking code will stash SME state to memory and temporarily exit
47*f6217f89SApple OSS Distributions  * streaming SVE mode.  We're specifically testing how xnu manages live SME
48*f6217f89SApple OSS Distributions  * register state, so we can't let the compiler stash and disable this state
49*f6217f89SApple OSS Distributions  * behind our backs.
50*f6217f89SApple OSS Distributions  */
51*f6217f89SApple OSS Distributions 
52*f6217f89SApple OSS Distributions #ifdef __arm64__
53*f6217f89SApple OSS Distributions #include <mach/error.h>
54*f6217f89SApple OSS Distributions #endif /* __arm64__ */
55*f6217f89SApple OSS Distributions 
56*f6217f89SApple OSS Distributions #include <darwintest.h>
57*f6217f89SApple OSS Distributions #include <pthread.h>
58*f6217f89SApple OSS Distributions #include <stdlib.h>
59*f6217f89SApple OSS Distributions #include <mach/mach.h>
60*f6217f89SApple OSS Distributions #include <mach/thread_act.h>
61*f6217f89SApple OSS Distributions #include <mach/thread_status.h>
62*f6217f89SApple OSS Distributions #include <mach/exception.h>
63*f6217f89SApple OSS Distributions #include <machine/cpu_capabilities.h>
64*f6217f89SApple OSS Distributions #include <sys/types.h>
65*f6217f89SApple OSS Distributions #include <sys/sysctl.h>
66*f6217f89SApple OSS Distributions 
67*f6217f89SApple OSS Distributions #include "arm_matrix.h"
68*f6217f89SApple OSS Distributions #include "exc_helpers.h"
69*f6217f89SApple OSS Distributions #include "test_utils.h"
70*f6217f89SApple OSS Distributions 
71*f6217f89SApple OSS Distributions T_GLOBAL_META(
72*f6217f89SApple OSS Distributions 	T_META_NAMESPACE("xnu.arm"),
73*f6217f89SApple OSS Distributions 	T_META_RADAR_COMPONENT_NAME("xnu"),
74*f6217f89SApple OSS Distributions 	T_META_RADAR_COMPONENT_VERSION("arm"),
75*f6217f89SApple OSS Distributions 	T_META_OWNER("ghackmann"),
76*f6217f89SApple OSS Distributions 	T_META_RUN_CONCURRENTLY(true)
77*f6217f89SApple OSS Distributions 	);
78*f6217f89SApple OSS Distributions 
79*f6217f89SApple OSS Distributions #ifdef __arm64__
80*f6217f89SApple OSS Distributions 
81*f6217f89SApple OSS Distributions #ifndef EXC_ARM_SME_DISALLOWED
82*f6217f89SApple OSS Distributions #define EXC_ARM_SME_DISALLOWED 2
83*f6217f89SApple OSS Distributions #endif
84*f6217f89SApple OSS Distributions 
85*f6217f89SApple OSS Distributions /* Whether we caught the EXC_BAD_INSTRUCTION mach exception or not. */
86*f6217f89SApple OSS Distributions static volatile bool mach_exc_caught = false;
87*f6217f89SApple OSS Distributions 
88*f6217f89SApple OSS Distributions static size_t
bad_instruction_exception_handler(__unused mach_port_t task,__unused mach_port_t thread,exception_type_t type,mach_exception_data_t codes,__unused uint64_t exception_pc)89*f6217f89SApple OSS Distributions bad_instruction_exception_handler(
90*f6217f89SApple OSS Distributions 	__unused mach_port_t task,
91*f6217f89SApple OSS Distributions 	__unused mach_port_t thread,
92*f6217f89SApple OSS Distributions 	exception_type_t type,
93*f6217f89SApple OSS Distributions 	mach_exception_data_t codes,
94*f6217f89SApple OSS Distributions 	__unused uint64_t exception_pc)
95*f6217f89SApple OSS Distributions {
96*f6217f89SApple OSS Distributions 	T_QUIET; T_ASSERT_EQ(type, EXC_BAD_INSTRUCTION, "Caught an EXC_BAD_INSTRUCTION exception");
97*f6217f89SApple OSS Distributions 	T_QUIET; T_ASSERT_EQ(codes[0], (uint64_t)EXC_ARM_UNDEFINED, "The subcode is EXC_ARM_UNDEFINED");
98*f6217f89SApple OSS Distributions 
99*f6217f89SApple OSS Distributions 	mach_exc_caught = true;
100*f6217f89SApple OSS Distributions 	return 4;
101*f6217f89SApple OSS Distributions }
102*f6217f89SApple OSS Distributions #endif
103*f6217f89SApple OSS Distributions 
104*f6217f89SApple OSS Distributions 
105*f6217f89SApple OSS Distributions #ifdef __arm64__
106*f6217f89SApple OSS Distributions static void
test_matrix_not_started(const struct arm_matrix_operations * ops)107*f6217f89SApple OSS Distributions test_matrix_not_started(const struct arm_matrix_operations *ops)
108*f6217f89SApple OSS Distributions {
109*f6217f89SApple OSS Distributions 	if (!ops->is_available()) {
110*f6217f89SApple OSS Distributions 		T_SKIP("Running on non-%s target, skipping...", ops->name);
111*f6217f89SApple OSS Distributions 	}
112*f6217f89SApple OSS Distributions 
113*f6217f89SApple OSS Distributions 	mach_port_t exc_port = create_exception_port(EXC_MASK_BAD_INSTRUCTION);
114*f6217f89SApple OSS Distributions 
115*f6217f89SApple OSS Distributions 	size_t size = ops->data_size();
116*f6217f89SApple OSS Distributions 	uint8_t *d = ops->alloc_data();
117*f6217f89SApple OSS Distributions 	bzero(d, size);
118*f6217f89SApple OSS Distributions 
119*f6217f89SApple OSS Distributions 	ops->start();
120*f6217f89SApple OSS Distributions 	ops->load_one_vector(d);
121*f6217f89SApple OSS Distributions 	ops->stop();
122*f6217f89SApple OSS Distributions 	T_PASS("%s instruction after start instruction should not cause an exception", ops->name);
123*f6217f89SApple OSS Distributions 
124*f6217f89SApple OSS Distributions 	mach_exc_caught = false;
125*f6217f89SApple OSS Distributions 	run_exception_handler(exc_port, bad_instruction_exception_handler);
126*f6217f89SApple OSS Distributions 	ops->load_one_vector(d);
127*f6217f89SApple OSS Distributions 	T_EXPECT_TRUE(mach_exc_caught, "%s instruction before start instruction should cause an exception", ops->name);
128*f6217f89SApple OSS Distributions 
129*f6217f89SApple OSS Distributions 	free(d);
130*f6217f89SApple OSS Distributions }
131*f6217f89SApple OSS Distributions #endif
132*f6217f89SApple OSS Distributions 
133*f6217f89SApple OSS Distributions 
134*f6217f89SApple OSS Distributions T_DECL(sme_not_started,
135*f6217f89SApple OSS Distributions     "Test that SME instructions before smstart generate mach exceptions.", T_META_TAG_VM_NOT_ELIGIBLE)
136*f6217f89SApple OSS Distributions {
137*f6217f89SApple OSS Distributions #ifndef __arm64__
138*f6217f89SApple OSS Distributions 	T_SKIP("Running on non-arm64 target, skipping...");
139*f6217f89SApple OSS Distributions #else
140*f6217f89SApple OSS Distributions 	test_matrix_not_started(&sme_operations);
141*f6217f89SApple OSS Distributions #endif
142*f6217f89SApple OSS Distributions }
143*f6217f89SApple OSS Distributions 
144*f6217f89SApple OSS Distributions #ifdef __arm64__
struct test_thread;

/*
 * Body of a per-CPU test thread.  Receives its own descriptor and returns
 * true when the thread's check passed.
 */
typedef bool (*thread_fn_t)(const struct test_thread *thread);

/* Descriptor handed to every thread spawned by test_on_each_cpu(). */
struct test_thread {
	/* Handle filled in by pthread_create(). */
	pthread_t thread;
	/* The other test thread that is pinned to the same CPU. */
	pthread_t companion_thread;
	/* Test body executed by test_thread_shim(). */
	thread_fn_t thread_fn;
	/* CPU the thread binds itself to before running thread_fn. */
	uint32_t cpuid;
	/* Index of this thread in the descriptor array. */
	uint32_t thread_id;
	/* Matrix-extension operations under test. */
	const struct arm_matrix_operations *ops;
};
156*f6217f89SApple OSS Distributions 
/*
 * Start barrier: number of participants that have not yet arrived at
 * test_thread_barrier().  Guarded by barrier_lock; barrier_cond is broadcast
 * when the count reaches zero.
 */
static uint32_t barrier;
static pthread_cond_t barrier_cond = PTHREAD_COND_INITIALIZER;
static pthread_mutex_t barrier_lock = PTHREAD_MUTEX_INITIALIZER;

/*
 * End barrier: number of test threads that have not yet finished their test
 * body.  Guarded by end_barrier_lock; end_barrier_cond is signalled when the
 * count reaches zero.
 */
static uint32_t end_barrier;
static pthread_cond_t end_barrier_cond = PTHREAD_COND_INITIALIZER;
static pthread_mutex_t end_barrier_lock = PTHREAD_MUTEX_INITIALIZER;
164*f6217f89SApple OSS Distributions 
165*f6217f89SApple OSS Distributions static void
test_thread_barrier(void)166*f6217f89SApple OSS Distributions test_thread_barrier(void)
167*f6217f89SApple OSS Distributions {
168*f6217f89SApple OSS Distributions 	/* Wait for all threads to reach this barrier */
169*f6217f89SApple OSS Distributions 	pthread_mutex_lock(&barrier_lock);
170*f6217f89SApple OSS Distributions 	barrier--;
171*f6217f89SApple OSS Distributions 	if (barrier) {
172*f6217f89SApple OSS Distributions 		while (barrier) {
173*f6217f89SApple OSS Distributions 			pthread_cond_wait(&barrier_cond, &barrier_lock);
174*f6217f89SApple OSS Distributions 		}
175*f6217f89SApple OSS Distributions 	} else {
176*f6217f89SApple OSS Distributions 		pthread_cond_broadcast(&barrier_cond);
177*f6217f89SApple OSS Distributions 	}
178*f6217f89SApple OSS Distributions 	pthread_mutex_unlock(&barrier_lock);
179*f6217f89SApple OSS Distributions }
180*f6217f89SApple OSS Distributions 
181*f6217f89SApple OSS Distributions static void
test_thread_notify_exited(void)182*f6217f89SApple OSS Distributions test_thread_notify_exited(void)
183*f6217f89SApple OSS Distributions {
184*f6217f89SApple OSS Distributions 	pthread_mutex_lock(&end_barrier_lock);
185*f6217f89SApple OSS Distributions 	if (0 == --end_barrier) {
186*f6217f89SApple OSS Distributions 		pthread_cond_signal(&end_barrier_cond);
187*f6217f89SApple OSS Distributions 	}
188*f6217f89SApple OSS Distributions 	pthread_mutex_unlock(&end_barrier_lock);
189*f6217f89SApple OSS Distributions }
190*f6217f89SApple OSS Distributions 
191*f6217f89SApple OSS Distributions static void
wait_for_test_threads(void)192*f6217f89SApple OSS Distributions wait_for_test_threads(void)
193*f6217f89SApple OSS Distributions {
194*f6217f89SApple OSS Distributions 	pthread_mutex_lock(&end_barrier_lock);
195*f6217f89SApple OSS Distributions 	while (end_barrier) {
196*f6217f89SApple OSS Distributions 		pthread_cond_wait(&end_barrier_cond, &end_barrier_lock);
197*f6217f89SApple OSS Distributions 	}
198*f6217f89SApple OSS Distributions 	pthread_mutex_unlock(&end_barrier_lock);
199*f6217f89SApple OSS Distributions }
200*f6217f89SApple OSS Distributions 
201*f6217f89SApple OSS Distributions static uint32_t
ncpus(void)202*f6217f89SApple OSS Distributions ncpus(void)
203*f6217f89SApple OSS Distributions {
204*f6217f89SApple OSS Distributions 	uint32_t ncpu;
205*f6217f89SApple OSS Distributions 	size_t ncpu_size = sizeof(ncpu);
206*f6217f89SApple OSS Distributions 	int err = sysctlbyname("hw.ncpu", &ncpu, &ncpu_size, NULL, 0);
207*f6217f89SApple OSS Distributions 	T_QUIET; T_ASSERT_POSIX_ZERO(err, "Retrieved CPU count");
208*f6217f89SApple OSS Distributions 
209*f6217f89SApple OSS Distributions 	return ncpu;
210*f6217f89SApple OSS Distributions }
211*f6217f89SApple OSS Distributions 
/*
 * Writes `cpuid` to the "kern.sched_thread_bind_cpu" sysctl and returns the
 * raw result of the call without asserting on it.
 */
static int
thread_bind_cpu_unchecked(uint32_t cpuid)
{
	/*
	 * libc's sysctl() implementation calls strlen(name), which is
	 * SIMD-accelerated.  Go straight to the libsyscall wrapper instead and
	 * let the compiler compute the name length from the string literal.
	 */
#define THREAD_BIND_CPU "kern.sched_thread_bind_cpu"
	extern int __sysctlbyname(const char *name, size_t namelen, void *oldp, size_t *oldlenp, void *newp, size_t newlen);

	/* sizeof counts the terminating NUL, hence the -1. */
	return __sysctlbyname(THREAD_BIND_CPU, sizeof(THREAD_BIND_CPU) - 1,
	           NULL, NULL, &cpuid, sizeof(cpuid));
}
226*f6217f89SApple OSS Distributions 
227*f6217f89SApple OSS Distributions static void
thread_bind_cpu(uint32_t cpuid)228*f6217f89SApple OSS Distributions thread_bind_cpu(uint32_t cpuid)
229*f6217f89SApple OSS Distributions {
230*f6217f89SApple OSS Distributions 	int err = thread_bind_cpu_unchecked(cpuid);
231*f6217f89SApple OSS Distributions 	T_QUIET; T_ASSERT_POSIX_ZERO(err, "Bound thread to CPU %u", cpuid);
232*f6217f89SApple OSS Distributions }
233*f6217f89SApple OSS Distributions 
234*f6217f89SApple OSS Distributions static void *
test_thread_shim(void * arg)235*f6217f89SApple OSS Distributions test_thread_shim(void *arg)
236*f6217f89SApple OSS Distributions {
237*f6217f89SApple OSS Distributions 	struct test_thread const *thread = arg;
238*f6217f89SApple OSS Distributions 
239*f6217f89SApple OSS Distributions 	thread_bind_cpu(thread->cpuid);
240*f6217f89SApple OSS Distributions 	bool const ret = thread->thread_fn(thread);
241*f6217f89SApple OSS Distributions 	test_thread_notify_exited();
242*f6217f89SApple OSS Distributions 	return (void *)(uintptr_t)ret;
243*f6217f89SApple OSS Distributions }
244*f6217f89SApple OSS Distributions 
245*f6217f89SApple OSS Distributions static void
test_on_each_cpu(thread_fn_t thread_fn,const struct arm_matrix_operations * ops,const char * desc)246*f6217f89SApple OSS Distributions test_on_each_cpu(thread_fn_t thread_fn, const struct arm_matrix_operations *ops, const char *desc)
247*f6217f89SApple OSS Distributions {
248*f6217f89SApple OSS Distributions 	uint32_t ncpu = ncpus();
249*f6217f89SApple OSS Distributions 	uint32_t nthreads = ncpu * 2;
250*f6217f89SApple OSS Distributions 	barrier = 1 /* This thread */ + nthreads;
251*f6217f89SApple OSS Distributions 	end_barrier = nthreads;
252*f6217f89SApple OSS Distributions 	struct test_thread *threads = calloc(nthreads, sizeof(threads[0]));
253*f6217f89SApple OSS Distributions 
254*f6217f89SApple OSS Distributions 	for (uint32_t i = 0; i < nthreads; i++) {
255*f6217f89SApple OSS Distributions 		threads[i].thread_fn = thread_fn;
256*f6217f89SApple OSS Distributions 		threads[i].cpuid = i % ncpu;
257*f6217f89SApple OSS Distributions 		threads[i].thread_id = i;
258*f6217f89SApple OSS Distributions 		threads[i].ops = ops;
259*f6217f89SApple OSS Distributions 
260*f6217f89SApple OSS Distributions 		int const err = pthread_create(&threads[i].thread, NULL, test_thread_shim, &threads[i]);
261*f6217f89SApple OSS Distributions 		T_QUIET; T_ASSERT_EQ(err, 0, "%s: created thread #%u", desc, i);
262*f6217f89SApple OSS Distributions 
263*f6217f89SApple OSS Distributions 		// The other of two threads under test pinned to the same CPU.
264*f6217f89SApple OSS Distributions 		threads[(ncpu + i) % nthreads].companion_thread = threads[i].thread;
265*f6217f89SApple OSS Distributions 	}
266*f6217f89SApple OSS Distributions 
267*f6217f89SApple OSS Distributions 	// Wait for all companion_threads to be set.
268*f6217f89SApple OSS Distributions 	test_thread_barrier();
269*f6217f89SApple OSS Distributions 
270*f6217f89SApple OSS Distributions 	// like pthread_join()ing all threads, but without the priority boosting shenanigans.
271*f6217f89SApple OSS Distributions 	wait_for_test_threads();
272*f6217f89SApple OSS Distributions 
273*f6217f89SApple OSS Distributions 	for (uint32_t i = 0; i < nthreads; i++) {
274*f6217f89SApple OSS Distributions 		void *thread_ret_ptr;
275*f6217f89SApple OSS Distributions 		int err = pthread_join(threads[i].thread, &thread_ret_ptr);
276*f6217f89SApple OSS Distributions 		T_QUIET; T_ASSERT_EQ(err, 0, "%s: joined thread #%u", desc, i);
277*f6217f89SApple OSS Distributions 
278*f6217f89SApple OSS Distributions 		bool thread_ret = (uintptr_t)thread_ret_ptr;
279*f6217f89SApple OSS Distributions 		if (thread_ret) {
280*f6217f89SApple OSS Distributions 			T_PASS("%s: thread #%u passed", desc, i);
281*f6217f89SApple OSS Distributions 		} else {
282*f6217f89SApple OSS Distributions 			T_FAIL("%s: thread #%u failed", desc, i);
283*f6217f89SApple OSS Distributions 		}
284*f6217f89SApple OSS Distributions 	}
285*f6217f89SApple OSS Distributions 
286*f6217f89SApple OSS Distributions 	free(threads);
287*f6217f89SApple OSS Distributions }
288*f6217f89SApple OSS Distributions 
289*f6217f89SApple OSS Distributions static bool
active_context_switch_thread(struct test_thread const * thread)290*f6217f89SApple OSS Distributions active_context_switch_thread(struct test_thread const* thread)
291*f6217f89SApple OSS Distributions {
292*f6217f89SApple OSS Distributions 	const struct arm_matrix_operations *ops = thread->ops;
293*f6217f89SApple OSS Distributions 	const uint32_t thread_id = thread->thread_id;
294*f6217f89SApple OSS Distributions 	size_t size = ops->data_size();
295*f6217f89SApple OSS Distributions 	uint8_t *d1 = ops->alloc_data();
296*f6217f89SApple OSS Distributions 	memset(d1, (char)thread_id, size);
297*f6217f89SApple OSS Distributions 
298*f6217f89SApple OSS Distributions 	uint8_t *d2 = ops->alloc_data();
299*f6217f89SApple OSS Distributions 
300*f6217f89SApple OSS Distributions 	test_thread_barrier();
301*f6217f89SApple OSS Distributions 
302*f6217f89SApple OSS Distributions 	// companion_thread will be valid only after the barrier.
303*f6217f89SApple OSS Distributions 	thread_t const companion_thread = pthread_mach_thread_np(thread->companion_thread);
304*f6217f89SApple OSS Distributions 	T_QUIET; T_ASSERT_NE(companion_thread, THREAD_NULL, "pthread_mach_thread_np");
305*f6217f89SApple OSS Distributions 
306*f6217f89SApple OSS Distributions 	bool ok = true;
307*f6217f89SApple OSS Distributions 	for (unsigned int i = 0; i < 100000 && ok; i++) {
308*f6217f89SApple OSS Distributions 		ops->start();
309*f6217f89SApple OSS Distributions 		ops->load_data(d1);
310*f6217f89SApple OSS Distributions 
311*f6217f89SApple OSS Distributions 		/*
312*f6217f89SApple OSS Distributions 		 * Rescheduling with the matrix registers active must preserve
313*f6217f89SApple OSS Distributions 		 * state, even after a context switch.
314*f6217f89SApple OSS Distributions 		 */
315*f6217f89SApple OSS Distributions 		thread_switch(companion_thread, SWITCH_OPTION_NONE, 0);
316*f6217f89SApple OSS Distributions 
317*f6217f89SApple OSS Distributions 		ops->store_data(d2);
318*f6217f89SApple OSS Distributions 		ops->stop();
319*f6217f89SApple OSS Distributions 
320*f6217f89SApple OSS Distributions 		if (memcmp(d1, d2, size)) {
321*f6217f89SApple OSS Distributions 			ok = false;
322*f6217f89SApple OSS Distributions 		}
323*f6217f89SApple OSS Distributions 	}
324*f6217f89SApple OSS Distributions 
325*f6217f89SApple OSS Distributions 	free(d2);
326*f6217f89SApple OSS Distributions 	free(d1);
327*f6217f89SApple OSS Distributions 	return ok;
328*f6217f89SApple OSS Distributions }
329*f6217f89SApple OSS Distributions 
330*f6217f89SApple OSS Distributions static bool
inactive_context_switch_thread(struct test_thread const * thread)331*f6217f89SApple OSS Distributions inactive_context_switch_thread(struct test_thread const* thread)
332*f6217f89SApple OSS Distributions {
333*f6217f89SApple OSS Distributions 	const struct arm_matrix_operations *ops = thread->ops;
334*f6217f89SApple OSS Distributions 	const uint32_t thread_id = thread->thread_id;
335*f6217f89SApple OSS Distributions 	size_t size = ops->data_size();
336*f6217f89SApple OSS Distributions 	uint8_t *d1 = ops->alloc_data();
337*f6217f89SApple OSS Distributions 	memset(d1, (char)thread_id, size);
338*f6217f89SApple OSS Distributions 
339*f6217f89SApple OSS Distributions 	uint8_t *d2 = ops->alloc_data();
340*f6217f89SApple OSS Distributions 
341*f6217f89SApple OSS Distributions 	test_thread_barrier();
342*f6217f89SApple OSS Distributions 
343*f6217f89SApple OSS Distributions 	// companion_thread will be valid only after the barrier.
344*f6217f89SApple OSS Distributions 	thread_t const companion_thread = pthread_mach_thread_np(thread->companion_thread);
345*f6217f89SApple OSS Distributions 	T_QUIET; T_ASSERT_NE(companion_thread, THREAD_NULL, "pthread_mach_thread_np");
346*f6217f89SApple OSS Distributions 
347*f6217f89SApple OSS Distributions 	bool ok = true;
348*f6217f89SApple OSS Distributions 	for (unsigned int i = 0; i < 100000 && ok; i++) {
349*f6217f89SApple OSS Distributions 		ops->start();
350*f6217f89SApple OSS Distributions 		ops->load_data(d1);
351*f6217f89SApple OSS Distributions 		ops->stop();
352*f6217f89SApple OSS Distributions 
353*f6217f89SApple OSS Distributions 		/*
354*f6217f89SApple OSS Distributions 		 * Rescheduling with the matrix registers inactive may preserve
355*f6217f89SApple OSS Distributions 		 * state or may zero it out.
356*f6217f89SApple OSS Distributions 		 */
357*f6217f89SApple OSS Distributions 		thread_switch(companion_thread, SWITCH_OPTION_NONE, 0);
358*f6217f89SApple OSS Distributions 
359*f6217f89SApple OSS Distributions 		ops->start();
360*f6217f89SApple OSS Distributions 		ops->store_data(d2);
361*f6217f89SApple OSS Distributions 		ops->stop();
362*f6217f89SApple OSS Distributions 
363*f6217f89SApple OSS Distributions 		for (size_t j = 0; j < size; j++) {
364*f6217f89SApple OSS Distributions 			if (d1[j] != d2[j] && d2[j] != 0) {
365*f6217f89SApple OSS Distributions 				ok = false;
366*f6217f89SApple OSS Distributions 			}
367*f6217f89SApple OSS Distributions 		}
368*f6217f89SApple OSS Distributions 	}
369*f6217f89SApple OSS Distributions 
370*f6217f89SApple OSS Distributions 	free(d2);
371*f6217f89SApple OSS Distributions 	free(d1);
372*f6217f89SApple OSS Distributions 	return ok;
373*f6217f89SApple OSS Distributions }
374*f6217f89SApple OSS Distributions 
375*f6217f89SApple OSS Distributions static void
test_thread_migration(const struct arm_matrix_operations * ops)376*f6217f89SApple OSS Distributions test_thread_migration(const struct arm_matrix_operations *ops)
377*f6217f89SApple OSS Distributions {
378*f6217f89SApple OSS Distributions 	size_t size = ops->data_size();
379*f6217f89SApple OSS Distributions 	uint8_t *d = ops->alloc_data();
380*f6217f89SApple OSS Distributions 	arc4random_buf(d, size);
381*f6217f89SApple OSS Distributions 
382*f6217f89SApple OSS Distributions 	uint32_t ncpu = ncpus();
383*f6217f89SApple OSS Distributions 	uint8_t *cpu_d[ncpu];
384*f6217f89SApple OSS Distributions 	for (uint32_t cpuid = 0; cpuid < ncpu; cpuid++) {
385*f6217f89SApple OSS Distributions 		cpu_d[cpuid] = ops->alloc_data();
386*f6217f89SApple OSS Distributions 		memset(cpu_d[cpuid], 0, size);
387*f6217f89SApple OSS Distributions 	}
388*f6217f89SApple OSS Distributions 
389*f6217f89SApple OSS Distributions 	ops->start();
390*f6217f89SApple OSS Distributions 	ops->load_data(d);
391*f6217f89SApple OSS Distributions 	for (uint32_t cpuid = 0; cpuid < ncpu; cpuid++) {
392*f6217f89SApple OSS Distributions 		int err = thread_bind_cpu_unchecked(cpuid);
393*f6217f89SApple OSS Distributions 		if (err) {
394*f6217f89SApple OSS Distributions 			ops->stop();
395*f6217f89SApple OSS Distributions 			T_ASSERT_POSIX_ZERO(err, "Bound thread to CPU %u", cpuid);
396*f6217f89SApple OSS Distributions 		}
397*f6217f89SApple OSS Distributions 		ops->store_data(cpu_d[cpuid]);
398*f6217f89SApple OSS Distributions 	}
399*f6217f89SApple OSS Distributions 	ops->stop();
400*f6217f89SApple OSS Distributions 
401*f6217f89SApple OSS Distributions 	for (uint32_t cpuid = 0; cpuid < ncpu; cpuid++) {
402*f6217f89SApple OSS Distributions 		int cmp = memcmp(d, cpu_d[cpuid], size);
403*f6217f89SApple OSS Distributions 		T_EXPECT_EQ(cmp, 0, "Matrix state migrated to CPU %u", cpuid);
404*f6217f89SApple OSS Distributions 		free(cpu_d[cpuid]);
405*f6217f89SApple OSS Distributions 	}
406*f6217f89SApple OSS Distributions 	free(d);
407*f6217f89SApple OSS Distributions }
408*f6217f89SApple OSS Distributions #endif
409*f6217f89SApple OSS Distributions 
410*f6217f89SApple OSS Distributions 
411*f6217f89SApple OSS Distributions T_DECL(sme_context_switch,
412*f6217f89SApple OSS Distributions     "Test that SME contexts are migrated during context switch and do not leak between process contexts.",
413*f6217f89SApple OSS Distributions     T_META_BOOTARGS_SET("enable_skstb=1"),
414*f6217f89SApple OSS Distributions     T_META_REQUIRES_SYSCTL_EQ("hw.optional.arm.FEAT_SME2", 1),
415*f6217f89SApple OSS Distributions     XNU_T_META_SOC_SPECIFIC, T_META_TAG_VM_NOT_ELIGIBLE)
416*f6217f89SApple OSS Distributions {
417*f6217f89SApple OSS Distributions #ifndef __arm64__
418*f6217f89SApple OSS Distributions 	T_SKIP("Running on non-arm64 target, skipping...");
419*f6217f89SApple OSS Distributions #else
420*f6217f89SApple OSS Distributions 	if (!sme_operations.is_available()) {
421*f6217f89SApple OSS Distributions 		T_SKIP("Running on non-SME target, skipping...");
422*f6217f89SApple OSS Distributions 	}
423*f6217f89SApple OSS Distributions 
424*f6217f89SApple OSS Distributions 	test_thread_migration(&sme_operations);
425*f6217f89SApple OSS Distributions 	test_on_each_cpu(active_context_switch_thread, &sme_operations, "SME context migrates when active");
426*f6217f89SApple OSS Distributions 	test_on_each_cpu(inactive_context_switch_thread, &sme_operations, "SME context does not leak across processes");
427*f6217f89SApple OSS Distributions #endif
428*f6217f89SApple OSS Distributions }
429*f6217f89SApple OSS Distributions 
430*f6217f89SApple OSS Distributions 
431*f6217f89SApple OSS Distributions #if __arm64__
432*f6217f89SApple OSS Distributions /*
433*f6217f89SApple OSS Distributions  * Sequence of events in thread_{get,set}_state test:
434*f6217f89SApple OSS Distributions  *
435*f6217f89SApple OSS Distributions  * 1. Parent creates child thread.
436*f6217f89SApple OSS Distributions  * 2. Child thread signals parent thread to proceed.
437*f6217f89SApple OSS Distributions  * 3. Parent populates child's matrix state registers via thread_set_state(),
438*f6217f89SApple OSS Distributions  *    and signals child thread to proceed.
439*f6217f89SApple OSS Distributions  * 4. Child arbitrarily updates each byte in its local matrix register state
440*f6217f89SApple OSS Distributions  *    by adding 1, and signals parent thread to proceed.
441*f6217f89SApple OSS Distributions  * 5. Parent reads back the child's updated matrix state with
442*f6217f89SApple OSS Distributions  *    thread_get_state(), and confirms that every byte has been modified as
443*f6217f89SApple OSS Distributions  *    expected.
444*f6217f89SApple OSS Distributions  */
/*
 * Hand-off state shared between the parent and child threads of the
 * thread_{get,set}_state test.  Guarded by thread_state_test_lock; every
 * change is announced on thread_state_test_cond.
 */
static enum thread_state_test_state {
	/* Initial value, before the child has reported in. */
	INIT,
	/* Child is running and waiting for the parent. */
	CHILD_READY,
	/* Parent has populated the child's matrix state. */
	PARENT_POPULATED_MATRIX_STATE,
	/* Child has modified its matrix state. */
	CHILD_UPDATED_MATRIX_STATE,
	/* Child may stop the matrix unit and exit. */
	DONE
} thread_state_test_state;

static pthread_cond_t thread_state_test_cond = PTHREAD_COND_INITIALIZER;
static pthread_mutex_t thread_state_test_lock = PTHREAD_MUTEX_INITIALIZER;
455*f6217f89SApple OSS Distributions 
456*f6217f89SApple OSS Distributions static void
wait_for_thread_state_test_state(enum thread_state_test_state state)457*f6217f89SApple OSS Distributions wait_for_thread_state_test_state(enum thread_state_test_state state)
458*f6217f89SApple OSS Distributions {
459*f6217f89SApple OSS Distributions 	pthread_mutex_lock(&thread_state_test_lock);
460*f6217f89SApple OSS Distributions 	while (thread_state_test_state != state) {
461*f6217f89SApple OSS Distributions 		pthread_cond_wait(&thread_state_test_cond, &thread_state_test_lock);
462*f6217f89SApple OSS Distributions 	}
463*f6217f89SApple OSS Distributions 	pthread_mutex_unlock(&thread_state_test_lock);
464*f6217f89SApple OSS Distributions }
465*f6217f89SApple OSS Distributions 
466*f6217f89SApple OSS Distributions static void
thread_set_state_test_state(enum thread_state_test_state state)467*f6217f89SApple OSS Distributions thread_set_state_test_state(enum thread_state_test_state state)
468*f6217f89SApple OSS Distributions {
469*f6217f89SApple OSS Distributions 	pthread_mutex_lock(&thread_state_test_lock);
470*f6217f89SApple OSS Distributions 	thread_state_test_state = state;
471*f6217f89SApple OSS Distributions 	pthread_cond_broadcast(&thread_state_test_cond);
472*f6217f89SApple OSS Distributions 	pthread_mutex_unlock(&thread_state_test_lock);
473*f6217f89SApple OSS Distributions }
474*f6217f89SApple OSS Distributions 
475*f6217f89SApple OSS Distributions static void *
test_matrix_thread_state_child(void * arg __unused)476*f6217f89SApple OSS Distributions test_matrix_thread_state_child(void *arg __unused)
477*f6217f89SApple OSS Distributions {
478*f6217f89SApple OSS Distributions 	const struct arm_matrix_operations *ops = arg;
479*f6217f89SApple OSS Distributions 
480*f6217f89SApple OSS Distributions 	size_t size = ops->data_size();
481*f6217f89SApple OSS Distributions 	uint8_t *d = ops->alloc_data();
482*f6217f89SApple OSS Distributions 
483*f6217f89SApple OSS Distributions 
484*f6217f89SApple OSS Distributions 	thread_set_state_test_state(CHILD_READY);
485*f6217f89SApple OSS Distributions 	wait_for_thread_state_test_state(PARENT_POPULATED_MATRIX_STATE);
486*f6217f89SApple OSS Distributions 	ops->store_data(d);
487*f6217f89SApple OSS Distributions 	for (size_t i = 0; i < size; i++) {
488*f6217f89SApple OSS Distributions 		d[i]++;
489*f6217f89SApple OSS Distributions 	}
490*f6217f89SApple OSS Distributions 	ops->load_data(d);
491*f6217f89SApple OSS Distributions 	thread_set_state_test_state(CHILD_UPDATED_MATRIX_STATE);
492*f6217f89SApple OSS Distributions 
493*f6217f89SApple OSS Distributions 	wait_for_thread_state_test_state(DONE);
494*f6217f89SApple OSS Distributions 	ops->stop();
495*f6217f89SApple OSS Distributions 	return NULL;
496*f6217f89SApple OSS Distributions }
497*f6217f89SApple OSS Distributions 
498*f6217f89SApple OSS Distributions static void
test_matrix_thread_state(const struct arm_matrix_operations * ops)499*f6217f89SApple OSS Distributions test_matrix_thread_state(const struct arm_matrix_operations *ops)
500*f6217f89SApple OSS Distributions {
501*f6217f89SApple OSS Distributions 	if (!ops->is_available()) {
502*f6217f89SApple OSS Distributions 		T_SKIP("Running on non-%s target, skipping...", ops->name);
503*f6217f89SApple OSS Distributions 	}
504*f6217f89SApple OSS Distributions 
505*f6217f89SApple OSS Distributions 	size_t size = ops->data_size();
506*f6217f89SApple OSS Distributions 	uint8_t *d = ops->alloc_data();
507*f6217f89SApple OSS Distributions 	arc4random_buf(d, size);
508*f6217f89SApple OSS Distributions 
509*f6217f89SApple OSS Distributions 	thread_state_test_state = INIT;
510*f6217f89SApple OSS Distributions 
511*f6217f89SApple OSS Distributions 	pthread_t thread;
512*f6217f89SApple OSS Distributions #pragma clang diagnostic push
513*f6217f89SApple OSS Distributions #pragma clang diagnostic ignored "-Wincompatible-pointer-types-discards-qualifiers"
514*f6217f89SApple OSS Distributions 	void *arg = ops;
515*f6217f89SApple OSS Distributions #pragma clang diagnostic pop
516*f6217f89SApple OSS Distributions 	int err = pthread_create(&thread, NULL, test_matrix_thread_state_child, arg);
517*f6217f89SApple OSS Distributions 	T_QUIET; T_ASSERT_EQ(err, 0, "pthread_create()");
518*f6217f89SApple OSS Distributions 
519*f6217f89SApple OSS Distributions 	mach_port_t mach_thread = pthread_mach_thread_np(thread);
520*f6217f89SApple OSS Distributions 	T_QUIET; T_ASSERT_NE(mach_thread, MACH_PORT_NULL, "pthread_mach_thread_np()");
521*f6217f89SApple OSS Distributions 
522*f6217f89SApple OSS Distributions 	wait_for_thread_state_test_state(CHILD_READY);
523*f6217f89SApple OSS Distributions 	kern_return_t kr = ops->thread_set_state(mach_thread, d);
524*f6217f89SApple OSS Distributions 	T_QUIET; T_ASSERT_EQ(kr, KERN_SUCCESS, "%s thread_set_state()", ops->name);
525*f6217f89SApple OSS Distributions 	thread_set_state_test_state(PARENT_POPULATED_MATRIX_STATE);
526*f6217f89SApple OSS Distributions 
527*f6217f89SApple OSS Distributions 	wait_for_thread_state_test_state(CHILD_UPDATED_MATRIX_STATE);
528*f6217f89SApple OSS Distributions 	uint8_t *thread_d = ops->alloc_data();
529*f6217f89SApple OSS Distributions 	kr = ops->thread_get_state(mach_thread, thread_d);
530*f6217f89SApple OSS Distributions 	T_QUIET; T_ASSERT_EQ(kr, KERN_SUCCESS, "%s thread_get_state()", ops->name);
531*f6217f89SApple OSS Distributions 	for (size_t i = 0; i < size; i++) {
532*f6217f89SApple OSS Distributions 		d[i]++;
533*f6217f89SApple OSS Distributions 	}
534*f6217f89SApple OSS Distributions 	T_EXPECT_EQ(memcmp(d, thread_d, size), 0, "thread_get_state() read expected %s data from child thread", ops->name);
535*f6217f89SApple OSS Distributions 
536*f6217f89SApple OSS Distributions 	thread_set_state_test_state(DONE);
537*f6217f89SApple OSS Distributions 	free(thread_d);
538*f6217f89SApple OSS Distributions 	free(d);
539*f6217f89SApple OSS Distributions 	pthread_join(thread, NULL);
540*f6217f89SApple OSS Distributions }
541*f6217f89SApple OSS Distributions 
542*f6217f89SApple OSS Distributions #endif
543*f6217f89SApple OSS Distributions 
544*f6217f89SApple OSS Distributions #ifdef __arm64__
545*f6217f89SApple OSS Distributions 
546*f6217f89SApple OSS Distributions T_DECL(sme_thread_state,
547*f6217f89SApple OSS Distributions     "Test thread_{get,set}_state with SME thread state.",
548*f6217f89SApple OSS Distributions     XNU_T_META_SOC_SPECIFIC)
549*f6217f89SApple OSS Distributions {
550*f6217f89SApple OSS Distributions 	test_matrix_thread_state(&sme_operations);
551*f6217f89SApple OSS Distributions }
552*f6217f89SApple OSS Distributions 
553*f6217f89SApple OSS Distributions T_DECL(sme_exception_ports,
554*f6217f89SApple OSS Distributions     "Test that thread_set_exception_ports rejects SME thread-state flavors.",
555*f6217f89SApple OSS Distributions     XNU_T_META_SOC_SPECIFIC)
556*f6217f89SApple OSS Distributions {
557*f6217f89SApple OSS Distributions 	mach_port_t exc_port;
558*f6217f89SApple OSS Distributions 	mach_port_t task = mach_task_self();
559*f6217f89SApple OSS Distributions 	mach_port_t thread = mach_thread_self();
560*f6217f89SApple OSS Distributions 
561*f6217f89SApple OSS Distributions 	kern_return_t kr = mach_port_allocate(task, MACH_PORT_RIGHT_RECEIVE, &exc_port);
562*f6217f89SApple OSS Distributions 	T_QUIET; T_ASSERT_MACH_SUCCESS(kr, "Allocated mach exception port");
563*f6217f89SApple OSS Distributions 	kr = mach_port_insert_right(task, exc_port, exc_port, MACH_MSG_TYPE_MAKE_SEND);
564*f6217f89SApple OSS Distributions 	T_QUIET; T_ASSERT_MACH_SUCCESS(kr, "Inserted a SEND right into the exception port");
565*f6217f89SApple OSS Distributions 
566*f6217f89SApple OSS Distributions 	kr = thread_set_exception_ports(thread, EXC_MASK_ALL, exc_port, EXCEPTION_STATE, ARM_THREAD_STATE64);
567*f6217f89SApple OSS Distributions 	T_EXPECT_MACH_SUCCESS(kr, "thread_set_exception_ports accepts flavor %u", (unsigned int)ARM_THREAD_STATE64);
568*f6217f89SApple OSS Distributions 
569*f6217f89SApple OSS Distributions 	for (thread_state_flavor_t flavor = ARM_SME_STATE; flavor <= ARM_SME2_STATE; flavor++) {
570*f6217f89SApple OSS Distributions 		kr = thread_set_exception_ports(thread, EXC_MASK_ALL, exc_port, EXCEPTION_STATE, flavor);
571*f6217f89SApple OSS Distributions 		T_EXPECT_MACH_ERROR(kr, KERN_INVALID_ARGUMENT, "thread_set_exception_ports rejects flavor %u", (unsigned int)flavor);
572*f6217f89SApple OSS Distributions 	}
573*f6217f89SApple OSS Distributions }
574*f6217f89SApple OSS Distributions 
575*f6217f89SApple OSS Distributions T_DECL(sme_max_svl_b_sysctl,
576*f6217f89SApple OSS Distributions     "Test the hw.optional.arm.sme_max_svl_b sysctl",
577*f6217f89SApple OSS Distributions     XNU_T_META_SOC_SPECIFIC)
578*f6217f89SApple OSS Distributions {
579*f6217f89SApple OSS Distributions 	unsigned int max_svl_b;
580*f6217f89SApple OSS Distributions 	size_t max_svl_b_size = sizeof(max_svl_b);
581*f6217f89SApple OSS Distributions 
582*f6217f89SApple OSS Distributions 	int err = sysctlbyname("hw.optional.arm.sme_max_svl_b", &max_svl_b, &max_svl_b_size, NULL, 0);
583*f6217f89SApple OSS Distributions 	T_QUIET; T_ASSERT_POSIX_SUCCESS(err, "sysctlbyname(hw.optional.arm.sme_max_svl_b)");
584*f6217f89SApple OSS Distributions 	if (sme_operations.is_available()) {
585*f6217f89SApple OSS Distributions 		/* Architecturally SVL must be a power-of-two between 128 and 2048 bits */
586*f6217f89SApple OSS Distributions 		const unsigned int ARCH_MIN_SVL_B = 128 / 8;
587*f6217f89SApple OSS Distributions 		const unsigned int ARCH_MAX_SVL_B = 2048 / 8;
588*f6217f89SApple OSS Distributions 
589*f6217f89SApple OSS Distributions 		T_EXPECT_EQ(__builtin_popcount(max_svl_b), 1, "Maximum SVL_B is a power of 2");
590*f6217f89SApple OSS Distributions 		T_EXPECT_GE(max_svl_b, ARCH_MIN_SVL_B, "Maximum SVL_B >= architectural minimum");
591*f6217f89SApple OSS Distributions 		T_EXPECT_LE(max_svl_b, ARCH_MAX_SVL_B, "Maximum SVL_B <= architectural maximum");
592*f6217f89SApple OSS Distributions 	} else {
593*f6217f89SApple OSS Distributions 		T_EXPECT_EQ(max_svl_b, 0, "Maximum SVL_B is 0 when SME is unavailable");
594*f6217f89SApple OSS Distributions 	}
595*f6217f89SApple OSS Distributions }
596*f6217f89SApple OSS Distributions #endif /* __arm64__ */
597