Sun Jul 19 07:32:43 2020 UTC ()
fix build with clang/llvm.

clang's aarch64 assembler doesn't accept the optional number of lanes on a vector register lane index.
(but the Arm ARM says that an assembler must accept it)


(ryo)
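For illustration, a minimal standalone snippet (the label name is hypothetical, not from the tree) showing the element-only lane spelling that both GNU as and clang's integrated assembler accept; the spellings removed by this commit are kept in the comments:

	.text
	.globl	lane_syntax_demo
lane_syntax_demo:
	dup	v1.4s, v5.s[3]		/* was: dup v1.4s, v5.4s[3] -- clang rejects */
	mov	v1.s[0], v5.s[2]	/* was: mov v1.4s[0], v5.4s[2] */
	mov	v2.d[1], v5.d[0]	/* was: mov v2.2d[1], v5.2d[0] */
	ret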
diff -r1.4 -r1.5 src/sys/crypto/aes/arch/arm/aes_armv8_64.S

--- src/sys/crypto/aes/arch/arm/aes_armv8_64.S 2020/06/30 23:06:02 1.4
+++ src/sys/crypto/aes/arch/arm/aes_armv8_64.S 2020/07/19 07:32:43 1.5
@@ -1,14 +1,14 @@
-/* $NetBSD: aes_armv8_64.S,v 1.4 2020/06/30 23:06:02 riastradh Exp $ */
+/* $NetBSD: aes_armv8_64.S,v 1.5 2020/07/19 07:32:43 ryo Exp $ */
 
 /*-
  * Copyright (c) 2020 The NetBSD Foundation, Inc.
  * All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
@@ -228,46 +228,46 @@ ENTRY(aesarmv8_setenckey192)
 	eor	v5.16b, v5.16b, v3.16b
 	eor	v5.16b, v5.16b, v6.16b
 	eor	v5.16b, v5.16b, v7.16b
 
 	/*
 	 * At this point, rk is split across v2.4s = (rk[0],rk[1],...)
 	 * and v5.4s = (rk[2],rk[3],...); nrk is in v5.4s =
 	 * (...,nrk[0],nrk[1]); and we have yet to compute nrk[2] or
 	 * nrk[3], which requires rklo[0] and rklo[1] in v2.4s =
 	 * (rklo[0],rklo[1],...).
 	 */
 
 	/* v1.4s := (nrk[0], nrk[1], nrk[1], nrk[1]) */
-	dup	v1.4s, v5.4s[3]
-	mov	v1.4s[0], v5.4s[2]
+	dup	v1.4s, v5.s[3]
+	mov	v1.s[0], v5.s[2]
 
 	/*
 	 * v6.4s := (0, 0, rklo[0], rklo[1])
 	 * v7.4s := (0, 0, 0, rklo[0])
 	 */
 	ext	v6.16b, v0.16b, v2.16b, #8
 	ext	v7.16b, v0.16b, v2.16b, #4
 
 	/* v3.4s := (nrk[0], nrk[1], nrk[2], nrk[3]) */
 	eor	v3.16b, v1.16b, v6.16b
 	eor	v3.16b, v3.16b, v7.16b
 
 	/*
 	 * Recall v2.4s = (rk[0], rk[1], xxx, xxx)
 	 * and v5.4s = (rk[2], rk[3], xxx, xxx).  Set
 	 * v2.4s := (rk[0], rk[1], rk[2], rk[3])
 	 */
-	mov	v2.2d[1], v5.2d[0]
+	mov	v2.d[1], v5.d[0]
 
 	/* store two round keys */
 	stp	q2, q3, [x0], #0x20
 
 	/*
 	 * Live vector registers at this point:
 	 *
 	 *	q0 = zero
 	 *	q2 = rk
 	 *	q3 = nrk
 	 *	v5.4s = (rk[2], rk[3], nrk[0], nrk[1])
 	 *	q16 = unshiftrows_rotword_1
 	 *	q17 = unshiftrows_rotword_3
@@ -315,27 +315,27 @@ ENTRY(aesarmv8_setenckey192)
 
 	subs	x2, x2, #3	/* count down three rounds */
 	str	q1, [x0], #0x10	/* store third round key */
 	b.eq	2f
 
 	/*
 	 * v4.4s := (nrk[2], nrk[3], xxx, xxx)
 	 * v5.4s := (0, nrk[2], xxx, xxx)
 	 */
 	ext	v4.16b, v3.16b, v0.16b, #8
 	ext	v5.16b, v0.16b, v4.16b, #12
 
 	/* v2.4s := (nnrk[3], nnrk[3], xxx, xxx) */
-	dup	v2.4s, v1.4s[3]
+	dup	v2.4s, v1.s[3]
 
 	/*
 	 * v2.4s := (nnnrklo[0] = nnrk[3] ^ nrk[2],
 	 *	    nnnrklo[1] = nnrk[3] ^ nrk[2] ^ nrk[3],
 	 *	    xxx, xxx)
 	 */
 	eor	v2.16b, v2.16b, v4.16b
 	eor	v2.16b, v2.16b, v5.16b
 
 	b	1b
 
 2:	ret
 END(aesarmv8_setenckey192)