xref: /xnu-11215.1.10/tests/arm_matrix_sme.c (revision 8d741a5de7ff4191bf97d57b9f54c2f6d4a15585)
/*
 * Copyright (c) 2022 Apple Computer, Inc. All rights reserved.
 *
 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
 *
 * This file contains Original Code and/or Modifications of Original Code
 * as defined in and that are subject to the Apple Public Source License
 * Version 2.0 (the 'License'). You may not use this file except in
 * compliance with the License. The rights granted to you under the License
 * may not be used to create, or enable the creation or redistribution of,
 * unlawful or unlicensed copies of an Apple operating system, or to
 * circumvent, violate, or enable the circumvention or violation of, any
 * terms of an Apple operating system software license agreement.
 *
 * Please obtain a copy of the License at
 * http://www.opensource.apple.com/apsl/ and read it before using this file.
 *
 * The Original Code and all software distributed under the License are
 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
 * Please see the License for the specific language governing rights and
 * limitations under the License.
 *
 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
 */
28*8d741a5dSApple OSS Distributions 
29*8d741a5dSApple OSS Distributions #include <stdint.h>
30*8d741a5dSApple OSS Distributions #include <stdlib.h>
31*8d741a5dSApple OSS Distributions #include <sys/sysctl.h>
32*8d741a5dSApple OSS Distributions 
33*8d741a5dSApple OSS Distributions #include "arm_matrix.h"
34*8d741a5dSApple OSS Distributions 
/* Count of Z registers (z0..z31) that the load/store helpers below transfer. */
static const unsigned int SME_Z_VECTORS = 32;
/* Count of P registers (p0..p15) that the load/store helpers below transfer. */
static const unsigned int SME_P_VECTORS = 16;
37*8d741a5dSApple OSS Distributions 
/*
 * Reports which SME revision the machine advertises through sysctl:
 *   2 - hw.optional.arm.FEAT_SME2 is non-zero
 *   1 - only hw.optional.arm.FEAT_SME is non-zero
 *   0 - neither is set, or the sysctls could not be read
 *
 * The sysctls are queried on the first call only; the answer is cached in
 * function-local statics. No locking is performed around that cache.
 */
static unsigned int
sme_version(void)
{
	static unsigned int ret = 0;
	static bool already_read = false;

	if (!already_read) {
		/*
		 * Start from "feature absent" so that a failing lookup (for
		 * example a kernel that does not publish the node) yields a
		 * well-defined zero rather than an indeterminate value.
		 */
		unsigned int feat_sme = 0;
		unsigned int feat_sme2 = 0;
		size_t size;

		size = sizeof(feat_sme);
		if (sysctlbyname("hw.optional.arm.FEAT_SME", &feat_sme, &size,
		    NULL, 0) != 0) {
			feat_sme = 0;
		}

		/* The length argument is in/out, so re-arm it for each query. */
		size = sizeof(feat_sme2);
		if (sysctlbyname("hw.optional.arm.FEAT_SME2", &feat_sme2, &size,
		    NULL, 0) != 0) {
			feat_sme2 = 0;
		}

		if (feat_sme2) {
			ret = 2;
		} else if (feat_sme) {
			ret = 1;
		} else {
			ret = 0;
		}

		already_read = true;
	}

	return ret;
}
63*8d741a5dSApple OSS Distributions 
64*8d741a5dSApple OSS Distributions static uint16_t
arm_sme_svl_b(void)65*8d741a5dSApple OSS Distributions arm_sme_svl_b(void)
66*8d741a5dSApple OSS Distributions {
67*8d741a5dSApple OSS Distributions 	uint64_t ret = 0;
68*8d741a5dSApple OSS Distributions 	asm volatile (
69*8d741a5dSApple OSS Distributions                 "rdsvl	%[ret], #1"
70*8d741a5dSApple OSS Distributions                 : [ret] "=r"(ret)
71*8d741a5dSApple OSS Distributions         );
72*8d741a5dSApple OSS Distributions 	return (uint16_t)ret;
73*8d741a5dSApple OSS Distributions }
74*8d741a5dSApple OSS Distributions 
/*
 * Size in bytes of the ZA region of the save buffer: svl_b rows of svl_b
 * bytes each.
 *
 * The vector length is read once and widened to size_t before squaring, so
 * the multiplication is not carried out in (signed) int after integer
 * promotion of two uint16_t operands.
 */
static size_t
sme_za_size(void)
{
	const size_t svl_b = arm_sme_svl_b();

	return svl_b * svl_b;
}
80*8d741a5dSApple OSS Distributions 
81*8d741a5dSApple OSS Distributions static size_t
sme_z_size(void)82*8d741a5dSApple OSS Distributions sme_z_size(void)
83*8d741a5dSApple OSS Distributions {
84*8d741a5dSApple OSS Distributions 	return arm_sme_svl_b() * SME_Z_VECTORS;
85*8d741a5dSApple OSS Distributions }
86*8d741a5dSApple OSS Distributions 
87*8d741a5dSApple OSS Distributions static size_t
sme_p_size(void)88*8d741a5dSApple OSS Distributions sme_p_size(void)
89*8d741a5dSApple OSS Distributions {
90*8d741a5dSApple OSS Distributions 	return arm_sme_svl_b() * SME_P_VECTORS / 8;
91*8d741a5dSApple OSS Distributions }
92*8d741a5dSApple OSS Distributions 
/*
 * Size in bytes of the ZT0 region of the save buffer: 64 when
 * sme_version() reports 2 or later, otherwise 0 (no ZT0 region at all).
 */
static size_t
sme_zt0_size(void)
{
	return (sme_version() >= 2) ? 64 : 0;
}
102*8d741a5dSApple OSS Distributions 
/*
 * Total size in bytes of one save buffer: the ZA, Z, P and (when present)
 * ZT0 regions laid end to end.
 */
static size_t
sme_data_size(void)
{
	size_t total = sme_za_size();

	total += sme_z_size();
	total += sme_p_size();
	total += sme_zt0_size();

	return total;
}
108*8d741a5dSApple OSS Distributions 
/*
 * Allocates a buffer of sme_data_size() bytes with malloc().
 *
 * The contents are uninitialized and the result is NULL if malloc() fails;
 * checking for that is left to the caller.
 */
static void *
sme_alloc_data(void)
{
	const size_t nbytes = sme_data_size();

	return malloc(nbytes);
}
114*8d741a5dSApple OSS Distributions 
/* True when sme_version() reports any SME revision (i.e. a non-zero value). */
static bool
sme_is_available(void)
{
	return sme_version() != 0;
}
120*8d741a5dSApple OSS Distributions 
121*8d741a5dSApple OSS Distributions static void
sme_start(void)122*8d741a5dSApple OSS Distributions sme_start(void)
123*8d741a5dSApple OSS Distributions {
124*8d741a5dSApple OSS Distributions 	asm volatile ("smstart");
125*8d741a5dSApple OSS Distributions }
126*8d741a5dSApple OSS Distributions 
127*8d741a5dSApple OSS Distributions static void
sme_stop(void)128*8d741a5dSApple OSS Distributions sme_stop(void)
129*8d741a5dSApple OSS Distributions {
130*8d741a5dSApple OSS Distributions 	asm volatile ("smstop");
131*8d741a5dSApple OSS Distributions }
132*8d741a5dSApple OSS Distributions 
133*8d741a5dSApple OSS Distributions static void
sme_load_one_vector(const void * addr)134*8d741a5dSApple OSS Distributions sme_load_one_vector(const void *addr)
135*8d741a5dSApple OSS Distributions {
136*8d741a5dSApple OSS Distributions 	asm volatile (
137*8d741a5dSApple OSS Distributions                 "mov    w12, #0"                "\n"
138*8d741a5dSApple OSS Distributions                 "ldr    za[w12, #0], [%[addr]]" "\n"
139*8d741a5dSApple OSS Distributions                 :
140*8d741a5dSApple OSS Distributions                 : [addr] "r"(addr)
141*8d741a5dSApple OSS Distributions                 : "w12"
142*8d741a5dSApple OSS Distributions         );
143*8d741a5dSApple OSS Distributions }
144*8d741a5dSApple OSS Distributions 
145*8d741a5dSApple OSS Distributions static void
sme_load_data(const void * addr)146*8d741a5dSApple OSS Distributions sme_load_data(const void *addr)
147*8d741a5dSApple OSS Distributions {
148*8d741a5dSApple OSS Distributions 	const uint8_t *za = addr;
149*8d741a5dSApple OSS Distributions 	const uint8_t *z = za + sme_za_size();
150*8d741a5dSApple OSS Distributions 	const uint8_t *p = z + sme_z_size();
151*8d741a5dSApple OSS Distributions 	uint16_t svl_b = arm_sme_svl_b();
152*8d741a5dSApple OSS Distributions 
153*8d741a5dSApple OSS Distributions 	for (register uint16_t i asm("w12") = 0; i < svl_b; i += 16) {
154*8d741a5dSApple OSS Distributions 		asm volatile (
155*8d741a5dSApple OSS Distributions                         "ldr    za[%w[i],  #0], [%[addr],  #0, mul vl]"   "\n"
156*8d741a5dSApple OSS Distributions                         "ldr    za[%w[i],  #1], [%[addr],  #1, mul vl]"   "\n"
157*8d741a5dSApple OSS Distributions                         "ldr    za[%w[i],  #2], [%[addr],  #2, mul vl]"   "\n"
158*8d741a5dSApple OSS Distributions                         "ldr    za[%w[i],  #3], [%[addr],  #3, mul vl]"   "\n"
159*8d741a5dSApple OSS Distributions                         "ldr    za[%w[i],  #4], [%[addr],  #4, mul vl]"   "\n"
160*8d741a5dSApple OSS Distributions                         "ldr    za[%w[i],  #5], [%[addr],  #5, mul vl]"   "\n"
161*8d741a5dSApple OSS Distributions                         "ldr    za[%w[i],  #6], [%[addr],  #6, mul vl]"   "\n"
162*8d741a5dSApple OSS Distributions                         "ldr    za[%w[i],  #7], [%[addr],  #7, mul vl]"   "\n"
163*8d741a5dSApple OSS Distributions                         "ldr    za[%w[i],  #8], [%[addr],  #8, mul vl]"   "\n"
164*8d741a5dSApple OSS Distributions                         "ldr    za[%w[i],  #9], [%[addr],  #9, mul vl]"   "\n"
165*8d741a5dSApple OSS Distributions                         "ldr    za[%w[i], #10], [%[addr], #10, mul vl]"   "\n"
166*8d741a5dSApple OSS Distributions                         "ldr    za[%w[i], #11], [%[addr], #11, mul vl]"   "\n"
167*8d741a5dSApple OSS Distributions                         "ldr    za[%w[i], #12], [%[addr], #12, mul vl]"   "\n"
168*8d741a5dSApple OSS Distributions                         "ldr    za[%w[i], #13], [%[addr], #13, mul vl]"   "\n"
169*8d741a5dSApple OSS Distributions                         "ldr    za[%w[i], #14], [%[addr], #14, mul vl]"   "\n"
170*8d741a5dSApple OSS Distributions                         "ldr    za[%w[i], #15], [%[addr], #15, mul vl]"   "\n"
171*8d741a5dSApple OSS Distributions                         :
172*8d741a5dSApple OSS Distributions                         : [i] "r"(i),
173*8d741a5dSApple OSS Distributions                           [addr] "r"(za + (i * svl_b))
174*8d741a5dSApple OSS Distributions                 );
175*8d741a5dSApple OSS Distributions 	}
176*8d741a5dSApple OSS Distributions 
177*8d741a5dSApple OSS Distributions 	asm volatile (
178*8d741a5dSApple OSS Distributions                 "ldr    z0, [%[z],   #0, mul vl]"        "\n"
179*8d741a5dSApple OSS Distributions                 "ldr    z1, [%[z],   #1, mul vl]"        "\n"
180*8d741a5dSApple OSS Distributions                 "ldr    z2, [%[z],   #2, mul vl]"        "\n"
181*8d741a5dSApple OSS Distributions                 "ldr    z3, [%[z],   #3, mul vl]"        "\n"
182*8d741a5dSApple OSS Distributions                 "ldr    z4, [%[z],   #4, mul vl]"        "\n"
183*8d741a5dSApple OSS Distributions                 "ldr    z5, [%[z],   #5, mul vl]"        "\n"
184*8d741a5dSApple OSS Distributions                 "ldr    z6, [%[z],   #6, mul vl]"        "\n"
185*8d741a5dSApple OSS Distributions                 "ldr    z7, [%[z],   #7, mul vl]"        "\n"
186*8d741a5dSApple OSS Distributions                 "ldr    z8, [%[z],   #8, mul vl]"        "\n"
187*8d741a5dSApple OSS Distributions                 "ldr    z9, [%[z],   #9, mul vl]"        "\n"
188*8d741a5dSApple OSS Distributions                 "ldr   z10, [%[z],  #10, mul vl]"        "\n"
189*8d741a5dSApple OSS Distributions                 "ldr   z11, [%[z],  #11, mul vl]"        "\n"
190*8d741a5dSApple OSS Distributions                 "ldr   z12, [%[z],  #12, mul vl]"        "\n"
191*8d741a5dSApple OSS Distributions                 "ldr   z13, [%[z],  #13, mul vl]"        "\n"
192*8d741a5dSApple OSS Distributions                 "ldr   z14, [%[z],  #14, mul vl]"        "\n"
193*8d741a5dSApple OSS Distributions                 "ldr   z15, [%[z],  #15, mul vl]"        "\n"
194*8d741a5dSApple OSS Distributions                 "ldr   z16, [%[z],  #16, mul vl]"        "\n"
195*8d741a5dSApple OSS Distributions                 "ldr   z17, [%[z],  #17, mul vl]"        "\n"
196*8d741a5dSApple OSS Distributions                 "ldr   z18, [%[z],  #18, mul vl]"        "\n"
197*8d741a5dSApple OSS Distributions                 "ldr   z19, [%[z],  #19, mul vl]"        "\n"
198*8d741a5dSApple OSS Distributions                 "ldr   z20, [%[z],  #20, mul vl]"        "\n"
199*8d741a5dSApple OSS Distributions                 "ldr   z21, [%[z],  #21, mul vl]"        "\n"
200*8d741a5dSApple OSS Distributions                 "ldr   z22, [%[z],  #22, mul vl]"        "\n"
201*8d741a5dSApple OSS Distributions                 "ldr   z23, [%[z],  #23, mul vl]"        "\n"
202*8d741a5dSApple OSS Distributions                 "ldr   z24, [%[z],  #24, mul vl]"        "\n"
203*8d741a5dSApple OSS Distributions                 "ldr   z25, [%[z],  #25, mul vl]"        "\n"
204*8d741a5dSApple OSS Distributions                 "ldr   z26, [%[z],  #26, mul vl]"        "\n"
205*8d741a5dSApple OSS Distributions                 "ldr   z27, [%[z],  #27, mul vl]"        "\n"
206*8d741a5dSApple OSS Distributions                 "ldr   z28, [%[z],  #28, mul vl]"        "\n"
207*8d741a5dSApple OSS Distributions                 "ldr   z29, [%[z],  #29, mul vl]"        "\n"
208*8d741a5dSApple OSS Distributions                 "ldr   z30, [%[z],  #30, mul vl]"        "\n"
209*8d741a5dSApple OSS Distributions                 "ldr   z31, [%[z],  #31, mul vl]"        "\n"
210*8d741a5dSApple OSS Distributions                 :
211*8d741a5dSApple OSS Distributions                 : [z] "r"(z)
212*8d741a5dSApple OSS Distributions         );
213*8d741a5dSApple OSS Distributions 
214*8d741a5dSApple OSS Distributions 	asm volatile (
215*8d741a5dSApple OSS Distributions                 "ldr     p0, [%[p],  #0, mul vl]"        "\n"
216*8d741a5dSApple OSS Distributions                 "ldr     p1, [%[p],  #1, mul vl]"        "\n"
217*8d741a5dSApple OSS Distributions                 "ldr     p2, [%[p],  #2, mul vl]"        "\n"
218*8d741a5dSApple OSS Distributions                 "ldr     p3, [%[p],  #3, mul vl]"        "\n"
219*8d741a5dSApple OSS Distributions                 "ldr     p4, [%[p],  #4, mul vl]"        "\n"
220*8d741a5dSApple OSS Distributions                 "ldr     p5, [%[p],  #5, mul vl]"        "\n"
221*8d741a5dSApple OSS Distributions                 "ldr     p6, [%[p],  #6, mul vl]"        "\n"
222*8d741a5dSApple OSS Distributions                 "ldr     p7, [%[p],  #7, mul vl]"        "\n"
223*8d741a5dSApple OSS Distributions                 "ldr     p8, [%[p],  #8, mul vl]"        "\n"
224*8d741a5dSApple OSS Distributions                 "ldr     p9, [%[p],  #9, mul vl]"        "\n"
225*8d741a5dSApple OSS Distributions                 "ldr    p10, [%[p], #10, mul vl]"        "\n"
226*8d741a5dSApple OSS Distributions                 "ldr    p11, [%[p], #11, mul vl]"        "\n"
227*8d741a5dSApple OSS Distributions                 "ldr    p12, [%[p], #12, mul vl]"        "\n"
228*8d741a5dSApple OSS Distributions                 "ldr    p13, [%[p], #13, mul vl]"        "\n"
229*8d741a5dSApple OSS Distributions                 "ldr    p14, [%[p], #14, mul vl]"        "\n"
230*8d741a5dSApple OSS Distributions                 "ldr    p15, [%[p], #15, mul vl]"        "\n"
231*8d741a5dSApple OSS Distributions                 :
232*8d741a5dSApple OSS Distributions                 : [p] "r"(p)
233*8d741a5dSApple OSS Distributions         );
234*8d741a5dSApple OSS Distributions 
235*8d741a5dSApple OSS Distributions 	if (sme_zt0_size()) {
236*8d741a5dSApple OSS Distributions 		const uint8_t *zt0 = p + sme_p_size();
237*8d741a5dSApple OSS Distributions 		asm volatile (
238*8d741a5dSApple OSS Distributions                         "ldr	zt0, [%[zt0]]"
239*8d741a5dSApple OSS Distributions                         :
240*8d741a5dSApple OSS Distributions                         : [zt0] "r"(zt0)
241*8d741a5dSApple OSS Distributions                 );
242*8d741a5dSApple OSS Distributions 	}
243*8d741a5dSApple OSS Distributions }
244*8d741a5dSApple OSS Distributions 
245*8d741a5dSApple OSS Distributions static void
sme_store_data(void * addr)246*8d741a5dSApple OSS Distributions sme_store_data(void *addr)
247*8d741a5dSApple OSS Distributions {
248*8d741a5dSApple OSS Distributions 	uint8_t *za = addr;
249*8d741a5dSApple OSS Distributions 	uint8_t *z = za + sme_za_size();
250*8d741a5dSApple OSS Distributions 	uint8_t *p = z + sme_z_size();
251*8d741a5dSApple OSS Distributions 	uint16_t svl_b = arm_sme_svl_b();
252*8d741a5dSApple OSS Distributions 
253*8d741a5dSApple OSS Distributions 	for (register uint16_t i asm("w12") = 0; i < svl_b; i += 16) {
254*8d741a5dSApple OSS Distributions 		asm volatile (
255*8d741a5dSApple OSS Distributions                         "str    za[%w[i],  #0], [%[addr],  #0, mul vl]"   "\n"
256*8d741a5dSApple OSS Distributions                         "str    za[%w[i],  #1], [%[addr],  #1, mul vl]"   "\n"
257*8d741a5dSApple OSS Distributions                         "str    za[%w[i],  #2], [%[addr],  #2, mul vl]"   "\n"
258*8d741a5dSApple OSS Distributions                         "str    za[%w[i],  #3], [%[addr],  #3, mul vl]"   "\n"
259*8d741a5dSApple OSS Distributions                         "str    za[%w[i],  #4], [%[addr],  #4, mul vl]"   "\n"
260*8d741a5dSApple OSS Distributions                         "str    za[%w[i],  #5], [%[addr],  #5, mul vl]"   "\n"
261*8d741a5dSApple OSS Distributions                         "str    za[%w[i],  #6], [%[addr],  #6, mul vl]"   "\n"
262*8d741a5dSApple OSS Distributions                         "str    za[%w[i],  #7], [%[addr],  #7, mul vl]"   "\n"
263*8d741a5dSApple OSS Distributions                         "str    za[%w[i],  #8], [%[addr],  #8, mul vl]"   "\n"
264*8d741a5dSApple OSS Distributions                         "str    za[%w[i],  #9], [%[addr],  #9, mul vl]"   "\n"
265*8d741a5dSApple OSS Distributions                         "str    za[%w[i], #10], [%[addr], #10, mul vl]"   "\n"
266*8d741a5dSApple OSS Distributions                         "str    za[%w[i], #11], [%[addr], #11, mul vl]"   "\n"
267*8d741a5dSApple OSS Distributions                         "str    za[%w[i], #12], [%[addr], #12, mul vl]"   "\n"
268*8d741a5dSApple OSS Distributions                         "str    za[%w[i], #13], [%[addr], #13, mul vl]"   "\n"
269*8d741a5dSApple OSS Distributions                         "str    za[%w[i], #14], [%[addr], #14, mul vl]"   "\n"
270*8d741a5dSApple OSS Distributions                         "str    za[%w[i], #15], [%[addr], #15, mul vl]"   "\n"
271*8d741a5dSApple OSS Distributions                         :
272*8d741a5dSApple OSS Distributions                         : [i] "r"(i),
273*8d741a5dSApple OSS Distributions                           [addr] "r"(za + (i * svl_b))
274*8d741a5dSApple OSS Distributions                 );
275*8d741a5dSApple OSS Distributions 	}
276*8d741a5dSApple OSS Distributions 
277*8d741a5dSApple OSS Distributions 	asm volatile (
278*8d741a5dSApple OSS Distributions                 "str    z0, [%[z],   #0, mul vl]"        "\n"
279*8d741a5dSApple OSS Distributions                 "str    z1, [%[z],   #1, mul vl]"        "\n"
280*8d741a5dSApple OSS Distributions                 "str    z2, [%[z],   #2, mul vl]"        "\n"
281*8d741a5dSApple OSS Distributions                 "str    z3, [%[z],   #3, mul vl]"        "\n"
282*8d741a5dSApple OSS Distributions                 "str    z4, [%[z],   #4, mul vl]"        "\n"
283*8d741a5dSApple OSS Distributions                 "str    z5, [%[z],   #5, mul vl]"        "\n"
284*8d741a5dSApple OSS Distributions                 "str    z6, [%[z],   #6, mul vl]"        "\n"
285*8d741a5dSApple OSS Distributions                 "str    z7, [%[z],   #7, mul vl]"        "\n"
286*8d741a5dSApple OSS Distributions                 "str    z8, [%[z],   #8, mul vl]"        "\n"
287*8d741a5dSApple OSS Distributions                 "str    z9, [%[z],   #9, mul vl]"        "\n"
288*8d741a5dSApple OSS Distributions                 "str   z10, [%[z],  #10, mul vl]"        "\n"
289*8d741a5dSApple OSS Distributions                 "str   z11, [%[z],  #11, mul vl]"        "\n"
290*8d741a5dSApple OSS Distributions                 "str   z12, [%[z],  #12, mul vl]"        "\n"
291*8d741a5dSApple OSS Distributions                 "str   z13, [%[z],  #13, mul vl]"        "\n"
292*8d741a5dSApple OSS Distributions                 "str   z14, [%[z],  #14, mul vl]"        "\n"
293*8d741a5dSApple OSS Distributions                 "str   z15, [%[z],  #15, mul vl]"        "\n"
294*8d741a5dSApple OSS Distributions                 "str   z16, [%[z],  #16, mul vl]"        "\n"
295*8d741a5dSApple OSS Distributions                 "str   z17, [%[z],  #17, mul vl]"        "\n"
296*8d741a5dSApple OSS Distributions                 "str   z18, [%[z],  #18, mul vl]"        "\n"
297*8d741a5dSApple OSS Distributions                 "str   z19, [%[z],  #19, mul vl]"        "\n"
298*8d741a5dSApple OSS Distributions                 "str   z20, [%[z],  #20, mul vl]"        "\n"
299*8d741a5dSApple OSS Distributions                 "str   z21, [%[z],  #21, mul vl]"        "\n"
300*8d741a5dSApple OSS Distributions                 "str   z22, [%[z],  #22, mul vl]"        "\n"
301*8d741a5dSApple OSS Distributions                 "str   z23, [%[z],  #23, mul vl]"        "\n"
302*8d741a5dSApple OSS Distributions                 "str   z24, [%[z],  #24, mul vl]"        "\n"
303*8d741a5dSApple OSS Distributions                 "str   z25, [%[z],  #25, mul vl]"        "\n"
304*8d741a5dSApple OSS Distributions                 "str   z26, [%[z],  #26, mul vl]"        "\n"
305*8d741a5dSApple OSS Distributions                 "str   z27, [%[z],  #27, mul vl]"        "\n"
306*8d741a5dSApple OSS Distributions                 "str   z28, [%[z],  #28, mul vl]"        "\n"
307*8d741a5dSApple OSS Distributions                 "str   z29, [%[z],  #29, mul vl]"        "\n"
308*8d741a5dSApple OSS Distributions                 "str   z30, [%[z],  #30, mul vl]"        "\n"
309*8d741a5dSApple OSS Distributions                 "str   z31, [%[z],  #31, mul vl]"        "\n"
310*8d741a5dSApple OSS Distributions                 :
311*8d741a5dSApple OSS Distributions                 : [z] "r"(z)
312*8d741a5dSApple OSS Distributions         );
313*8d741a5dSApple OSS Distributions 
314*8d741a5dSApple OSS Distributions 	asm volatile (
315*8d741a5dSApple OSS Distributions                 "str     p0, [%[p],  #0, mul vl]"        "\n"
316*8d741a5dSApple OSS Distributions                 "str     p1, [%[p],  #1, mul vl]"        "\n"
317*8d741a5dSApple OSS Distributions                 "str     p2, [%[p],  #2, mul vl]"        "\n"
318*8d741a5dSApple OSS Distributions                 "str     p3, [%[p],  #3, mul vl]"        "\n"
319*8d741a5dSApple OSS Distributions                 "str     p4, [%[p],  #4, mul vl]"        "\n"
320*8d741a5dSApple OSS Distributions                 "str     p5, [%[p],  #5, mul vl]"        "\n"
321*8d741a5dSApple OSS Distributions                 "str     p6, [%[p],  #6, mul vl]"        "\n"
322*8d741a5dSApple OSS Distributions                 "str     p7, [%[p],  #7, mul vl]"        "\n"
323*8d741a5dSApple OSS Distributions                 "str     p8, [%[p],  #8, mul vl]"        "\n"
324*8d741a5dSApple OSS Distributions                 "str     p9, [%[p],  #9, mul vl]"        "\n"
325*8d741a5dSApple OSS Distributions                 "str    p10, [%[p], #10, mul vl]"        "\n"
326*8d741a5dSApple OSS Distributions                 "str    p11, [%[p], #11, mul vl]"        "\n"
327*8d741a5dSApple OSS Distributions                 "str    p12, [%[p], #12, mul vl]"        "\n"
328*8d741a5dSApple OSS Distributions                 "str    p13, [%[p], #13, mul vl]"        "\n"
329*8d741a5dSApple OSS Distributions                 "str    p14, [%[p], #14, mul vl]"        "\n"
330*8d741a5dSApple OSS Distributions                 "str    p15, [%[p], #15, mul vl]"        "\n"
331*8d741a5dSApple OSS Distributions                 :
332*8d741a5dSApple OSS Distributions                 : [p] "r"(p)
333*8d741a5dSApple OSS Distributions         );
334*8d741a5dSApple OSS Distributions 
335*8d741a5dSApple OSS Distributions 	if (sme_zt0_size()) {
336*8d741a5dSApple OSS Distributions 		uint8_t *zt0 = p + sme_p_size();
337*8d741a5dSApple OSS Distributions 		asm volatile (
338*8d741a5dSApple OSS Distributions                         "str	zt0, [%[zt0]]"
339*8d741a5dSApple OSS Distributions                         :
340*8d741a5dSApple OSS Distributions                         : [zt0] "r"(zt0)
341*8d741a5dSApple OSS Distributions                 );
342*8d741a5dSApple OSS Distributions 	}
343*8d741a5dSApple OSS Distributions }
344*8d741a5dSApple OSS Distributions 
345*8d741a5dSApple OSS Distributions const struct arm_matrix_operations sme_operations = {
346*8d741a5dSApple OSS Distributions 	.name = "SME",
347*8d741a5dSApple OSS Distributions 
348*8d741a5dSApple OSS Distributions 	.data_size = sme_data_size,
349*8d741a5dSApple OSS Distributions 	.alloc_data = sme_alloc_data,
350*8d741a5dSApple OSS Distributions 
351*8d741a5dSApple OSS Distributions 	.is_available = sme_is_available,
352*8d741a5dSApple OSS Distributions 	.start = sme_start,
353*8d741a5dSApple OSS Distributions 	.stop = sme_stop,
354*8d741a5dSApple OSS Distributions 
355*8d741a5dSApple OSS Distributions 	.load_one_vector = sme_load_one_vector,
356*8d741a5dSApple OSS Distributions 	.load_data = sme_load_data,
357*8d741a5dSApple OSS Distributions 	.store_data = sme_store_data,
358*8d741a5dSApple OSS Distributions };
359