Re: [PATCH 07/27] arm64/sve: Low-level SVE architectural state manipulation functions

2017-08-21 Thread Dave Martin
On Mon, Aug 21, 2017 at 11:11:48AM +0100, Alex Bennée wrote:
> 
> Dave Martin  writes:
> 
> > Manipulating the SVE architectural state, including the vector and
> > predicate registers, first-fault register and the vector length,
> > requires the use of dedicated instructions added by SVE.
> >
> > This patch adds suitable assembly functions for saving and
> > restoring the SVE registers and querying the vector length.
> > Setting of the vector length is done as part of register restore.
> >
> > Since people building kernels may not all get an SVE-enabled
> > toolchain for a while, this patch uses macros that generate
> > explicit opcodes in place of assembler mnemonics.
> >
> > Signed-off-by: Dave Martin 
> > ---
> >  arch/arm64/include/asm/fpsimd.h   |   5 ++
> >  arch/arm64/include/asm/fpsimdmacros.h | 137 
> > ++
> >  arch/arm64/kernel/entry-fpsimd.S  |  17 +
> >  3 files changed, 159 insertions(+)

[...]

> > diff --git a/arch/arm64/include/asm/fpsimdmacros.h 
> > b/arch/arm64/include/asm/fpsimdmacros.h
> > index 0f5fdd3..5023064 100644
> > --- a/arch/arm64/include/asm/fpsimdmacros.h
> > +++ b/arch/arm64/include/asm/fpsimdmacros.h

[...]

> > +.macro _sve_str_v nz, nxbase, offset=0
> > +   _sve_check_zreg \nz
> > +   _check_general_reg \nxbase
> > +   _check_num (\offset), -0x100, 0xff
> > +   .inst   0xe5804000  \
> > +   | (\nz) \
> > +   | ((\nxbase) << 5)  \
> > +   | (((\offset) & 7) << 10)   \
> > +   | (((\offset) & 0x1f8) << 13)
> > +.endm
> 
> Can we have references to the ARM ARM titles (the section numbers keep
> changing) for each hand-hacked instruction please. Otherwise it is
> impossible to verify each one.

That's fair -- will do.

The supplement didn't exist at the time I first wrote this code...

[...]

Cheers
---Dave
___
kvmarm mailing list
kvmarm@lists.cs.columbia.edu
https://lists.cs.columbia.edu/mailman/listinfo/kvmarm


Re: [PATCH 07/27] arm64/sve: Low-level SVE architectural state manipulation functions

2017-08-21 Thread Alex Bennée

Dave Martin  writes:

> Manipulating the SVE architectural state, including the vector and
> predicate registers, first-fault register and the vector length,
> requires the use of dedicated instructions added by SVE.
>
> This patch adds suitable assembly functions for saving and
> restoring the SVE registers and querying the vector length.
> Setting of the vector length is done as part of register restore.
>
> Since people building kernels may not all get an SVE-enabled
> toolchain for a while, this patch uses macros that generate
> explicit opcodes in place of assembler mnemonics.
>
> Signed-off-by: Dave Martin 
> ---
>  arch/arm64/include/asm/fpsimd.h   |   5 ++
>  arch/arm64/include/asm/fpsimdmacros.h | 137 
> ++
>  arch/arm64/kernel/entry-fpsimd.S  |  17 +
>  3 files changed, 159 insertions(+)
>
> diff --git a/arch/arm64/include/asm/fpsimd.h b/arch/arm64/include/asm/fpsimd.h
> index 410c481..026a7c7 100644
> --- a/arch/arm64/include/asm/fpsimd.h
> +++ b/arch/arm64/include/asm/fpsimd.h
> @@ -67,6 +67,11 @@ extern void fpsimd_update_current_state(struct 
> fpsimd_state *state);
>
>  extern void fpsimd_flush_task_state(struct task_struct *target);
>
> +extern void sve_save_state(void *state, u32 *pfpsr);
> +extern void sve_load_state(void const *state, u32 const *pfpsr,
> +unsigned long vq_minus_1);
> +extern unsigned int sve_get_vl(void);
> +
>  /* For use by EFI runtime services calls only */
>  extern void __efi_fpsimd_begin(void);
>  extern void __efi_fpsimd_end(void);
> diff --git a/arch/arm64/include/asm/fpsimdmacros.h 
> b/arch/arm64/include/asm/fpsimdmacros.h
> index 0f5fdd3..5023064 100644
> --- a/arch/arm64/include/asm/fpsimdmacros.h
> +++ b/arch/arm64/include/asm/fpsimdmacros.h
> @@ -75,3 +75,140 @@
>   ldr w\tmpnr, [\state, #16 * 2 + 4]
>   fpsimd_restore_fpcr x\tmpnr, \state
>  .endm
> +
> +.macro _check_general_reg nr
> + .if (\nr) < 0 || (\nr) > 30
> + .error "Bad register number \nr."
> + .endif
> +.endm
> +
> +.macro _sve_check_zreg znr
> + .if (\znr) < 0 || (\znr) > 31
> + .error "Bad Scalable Vector Extension vector register number 
> \znr."
> + .endif
> +.endm
> +
> +.macro _sve_check_preg pnr
> + .if (\pnr) < 0 || (\pnr) > 15
> + .error "Bad Scalable Vector Extension predicate register number 
> \pnr."
> + .endif
> +.endm
> +
> +.macro _check_num n, min, max
> + .if (\n) < (\min) || (\n) > (\max)
> + .error "Number \n out of range [\min,\max]"
> + .endif
> +.endm
> +
> +.macro _sve_str_v nz, nxbase, offset=0
> + _sve_check_zreg \nz
> + _check_general_reg \nxbase
> + _check_num (\offset), -0x100, 0xff
> + .inst   0xe5804000  \
> + | (\nz) \
> + | ((\nxbase) << 5)  \
> + | (((\offset) & 7) << 10)   \
> + | (((\offset) & 0x1f8) << 13)
> +.endm

Can we have references to the ARM ARM titles (the section numbers keep
changing) for each hand-hacked instruction please. Otherwise it is
impossible to verify each one.

> +
> +.macro _sve_ldr_v nz, nxbase, offset=0
> + _sve_check_zreg \nz
> + _check_general_reg \nxbase
> + _check_num (\offset), -0x100, 0xff
> + .inst   0x85804000  \
> + | (\nz) \
> + | ((\nxbase) << 5)  \
> + | (((\offset) & 7) << 10)   \
> + | (((\offset) & 0x1f8) << 13)
> +.endm
> +
> +.macro _sve_str_p np, nxbase, offset=0
> + _sve_check_preg \np
> + _check_general_reg \nxbase
> + _check_num (\offset), -0x100, 0xff
> + .inst   0xe580  \
> + | (\np) \
> + | ((\nxbase) << 5)  \
> + | (((\offset) & 7) << 10)   \
> + | (((\offset) & 0x1f8) << 13)
> +.endm
> +
> +.macro _sve_ldr_p np, nxbase, offset=0
> + _sve_check_preg \np
> + _check_general_reg \nxbase
> + _check_num (\offset), -0x100, 0xff
> + .inst   0x8580  \
> + | (\np) \
> + | ((\nxbase) << 5)  \
> + | (((\offset) & 7) << 10)   \
> + | (((\offset) & 0x1f8) << 13)
> +.endm
> +
> +.macro _sve_rdvl nx, imm
> + _check_general_reg \nx
> + _check_num (\imm), -0x20, 0x1f
> + .inst   0x04bf5000  \
> + | (\nx) \
> + | (((\imm) & 0x3f) << 5)
> +.endm
> +
> +.macro _sve_rdffr np
> + _sve_check_preg \np
> + .inst   0x2519f000  \
> + | (\np)
> +.endm
> +
> +.macro _sve_wrffr np
> + _sve_check_preg \np
> + .inst   0x25289000  \
> + | ((\np) << 5)
> +.endm
> +
> +.macro __for from:req, 

[PATCH 07/27] arm64/sve: Low-level SVE architectural state manipulation functions

2017-08-09 Thread Dave Martin
Manipulating the SVE architectural state, including the vector and
predicate registers, first-fault register and the vector length,
requires the use of dedicated instructions added by SVE.

This patch adds suitable assembly functions for saving and
restoring the SVE registers and querying the vector length.
Setting of the vector length is done as part of register restore.

Since people building kernels may not all get an SVE-enabled
toolchain for a while, this patch uses macros that generate
explicit opcodes in place of assembler mnemonics.

Signed-off-by: Dave Martin 
---
 arch/arm64/include/asm/fpsimd.h   |   5 ++
 arch/arm64/include/asm/fpsimdmacros.h | 137 ++
 arch/arm64/kernel/entry-fpsimd.S  |  17 +
 3 files changed, 159 insertions(+)

diff --git a/arch/arm64/include/asm/fpsimd.h b/arch/arm64/include/asm/fpsimd.h
index 410c481..026a7c7 100644
--- a/arch/arm64/include/asm/fpsimd.h
+++ b/arch/arm64/include/asm/fpsimd.h
@@ -67,6 +67,11 @@ extern void fpsimd_update_current_state(struct fpsimd_state 
*state);
 
 extern void fpsimd_flush_task_state(struct task_struct *target);
 
+extern void sve_save_state(void *state, u32 *pfpsr);
+extern void sve_load_state(void const *state, u32 const *pfpsr,
+  unsigned long vq_minus_1);
+extern unsigned int sve_get_vl(void);
+
 /* For use by EFI runtime services calls only */
 extern void __efi_fpsimd_begin(void);
 extern void __efi_fpsimd_end(void);
diff --git a/arch/arm64/include/asm/fpsimdmacros.h 
b/arch/arm64/include/asm/fpsimdmacros.h
index 0f5fdd3..5023064 100644
--- a/arch/arm64/include/asm/fpsimdmacros.h
+++ b/arch/arm64/include/asm/fpsimdmacros.h
@@ -75,3 +75,140 @@
ldr w\tmpnr, [\state, #16 * 2 + 4]
fpsimd_restore_fpcr x\tmpnr, \state
 .endm
+
+.macro _check_general_reg nr
+   .if (\nr) < 0 || (\nr) > 30
+   .error "Bad register number \nr."
+   .endif
+.endm
+
+.macro _sve_check_zreg znr
+   .if (\znr) < 0 || (\znr) > 31
+   .error "Bad Scalable Vector Extension vector register number 
\znr."
+   .endif
+.endm
+
+.macro _sve_check_preg pnr
+   .if (\pnr) < 0 || (\pnr) > 15
+   .error "Bad Scalable Vector Extension predicate register number 
\pnr."
+   .endif
+.endm
+
+.macro _check_num n, min, max
+   .if (\n) < (\min) || (\n) > (\max)
+   .error "Number \n out of range [\min,\max]"
+   .endif
+.endm
+
+.macro _sve_str_v nz, nxbase, offset=0
+   _sve_check_zreg \nz
+   _check_general_reg \nxbase
+   _check_num (\offset), -0x100, 0xff
+   .inst   0xe5804000  \
+   | (\nz) \
+   | ((\nxbase) << 5)  \
+   | (((\offset) & 7) << 10)   \
+   | (((\offset) & 0x1f8) << 13)
+.endm
+
+.macro _sve_ldr_v nz, nxbase, offset=0
+   _sve_check_zreg \nz
+   _check_general_reg \nxbase
+   _check_num (\offset), -0x100, 0xff
+   .inst   0x85804000  \
+   | (\nz) \
+   | ((\nxbase) << 5)  \
+   | (((\offset) & 7) << 10)   \
+   | (((\offset) & 0x1f8) << 13)
+.endm
+
+.macro _sve_str_p np, nxbase, offset=0
+   _sve_check_preg \np
+   _check_general_reg \nxbase
+   _check_num (\offset), -0x100, 0xff
+   .inst   0xe580  \
+   | (\np) \
+   | ((\nxbase) << 5)  \
+   | (((\offset) & 7) << 10)   \
+   | (((\offset) & 0x1f8) << 13)
+.endm
+
+.macro _sve_ldr_p np, nxbase, offset=0
+   _sve_check_preg \np
+   _check_general_reg \nxbase
+   _check_num (\offset), -0x100, 0xff
+   .inst   0x8580  \
+   | (\np) \
+   | ((\nxbase) << 5)  \
+   | (((\offset) & 7) << 10)   \
+   | (((\offset) & 0x1f8) << 13)
+.endm
+
+.macro _sve_rdvl nx, imm
+   _check_general_reg \nx
+   _check_num (\imm), -0x20, 0x1f
+   .inst   0x04bf5000  \
+   | (\nx) \
+   | (((\imm) & 0x3f) << 5)
+.endm
+
+.macro _sve_rdffr np
+   _sve_check_preg \np
+   .inst   0x2519f000  \
+   | (\np)
+.endm
+
+.macro _sve_wrffr np
+   _sve_check_preg \np
+   .inst   0x25289000  \
+   | ((\np) << 5)
+.endm
+
+.macro __for from:req, to:req
+   .if (\from) == (\to)
+   _for__body \from
+   .else
+   __for \from, (\from) + ((\to) - (\from)) / 2
+   __for (\from) + ((\to) - (\from)) / 2 + 1, \to
+   .endif
+.endm
+
+.macro _for var:req, from:req, to:req, insn:vararg
+   .macro _for__body \var:req
+   \insn
+   .endm
+
+   __for