From: Roman Kisel <[email protected]> Sent: Wednesday, August 27, 2025 
6:06 PM
> 
> The existing Hyper-V wrappers for getting and setting MSRs are
> hv_get/set_msr(). Via hv_get/set_non_nested_msr(), they detect
> when running in a CoCo VM with a paravisor, and use the TDX or
> SNP guest-host communication protocol to bypass the paravisor
> and go directly to the host hypervisor for SynIC MSRs. The "set"
> function also implements the required special handling for the
> SINT MSRs.
> 
> Provide functions that allow manipulating the SynIC registers
> through the paravisor. Move vmbus_signal_eom() to a more
> appropriate location (which also avoids breaking KVM).
> 
> Signed-off-by: Roman Kisel <[email protected]>
> Reviewed-by: Alok Tiwari <[email protected]>

Reviewed-by: Michael Kelley <[email protected]>

> ---
>  arch/x86/kernel/cpu/mshyperv.c | 39 ++++++++++++++++++++++++++++++++++
>  drivers/hv/hv_common.c         | 13 ++++++++++++
>  drivers/hv/hyperv_vmbus.h      | 39 ++++++++++++++++++++++++++++++++++
>  include/asm-generic/mshyperv.h | 37 ++------------------------------
>  4 files changed, 93 insertions(+), 35 deletions(-)
> 
> diff --git a/arch/x86/kernel/cpu/mshyperv.c b/arch/x86/kernel/cpu/mshyperv.c
> index 95cd78004b11..a619b661275b 100644
> --- a/arch/x86/kernel/cpu/mshyperv.c
> +++ b/arch/x86/kernel/cpu/mshyperv.c
> @@ -109,6 +109,45 @@ bool hv_confidential_vmbus_available(void)
>       return eax &
> HYPERV_VS_PROPERTIES_EAX_CONFIDENTIAL_VMBUS_AVAILABLE;
>  }
> 
> +/*
> + * Attempt to get the SynIC register value from the paravisor.
> + *
> + * Not all paravisors support reading SynIC registers, so this function
> + * may fail. The register for the SynIC of the running CPU is accessed.
> + *
> + * Writes the SynIC register value into the memory pointed by val,
> + * and ~0ULL is on failure.
> + *
> + * Returns -ENODEV if the MSR is not a SynIC register, or another error
> + * code if getting the MSR fails (meaning the paravisor doesn't support
> + * relaying VMBus communucations).
> + */
> +int hv_para_get_synic_register(unsigned int reg, u64 *val)
> +{
> +     if (!ms_hyperv.paravisor_present || !hv_is_synic_msr(reg))
> +             return -ENODEV;
> +     return native_read_msr_safe(reg, val);
> +}
> +
> +/*
> + * Attempt to set the SynIC register value with the paravisor.
> + *
> + * Not all paravisors support setting SynIC registers, so this function
> + * may fail. The register for the SynIC of the running CPU is accessed.
> + *
> + * Sets the register to the value supplied.
> + *
> + * Returns: -ENODEV if the MSR is not a SynIC register, or another error
> + * code if writing to the MSR fails (meaning the paravisor doesn't support
> + * relaying VMBus communucations).
> + */
> +int hv_para_set_synic_register(unsigned int reg, u64 val)
> +{
> +     if (!ms_hyperv.paravisor_present || !hv_is_synic_msr(reg))
> +             return -ENODEV;
> +     return native_write_msr_safe(reg, val);
> +}
> +
>  u64 hv_get_msr(unsigned int reg)
>  {
>       if (hv_nested)
> diff --git a/drivers/hv/hv_common.c b/drivers/hv/hv_common.c
> index fae63c54e531..8285ba005a71 100644
> --- a/drivers/hv/hv_common.c
> +++ b/drivers/hv/hv_common.c
> @@ -722,6 +722,19 @@ bool __weak hv_confidential_vmbus_available(void)
>  }
>  EXPORT_SYMBOL_GPL(hv_confidential_vmbus_available);
> 
> +int __weak hv_para_get_synic_register(unsigned int reg, u64 *val)
> +{
> +     *val = ~0ULL;
> +     return -ENODEV;
> +}
> +EXPORT_SYMBOL_GPL(hv_para_get_synic_register);
> +
> +int __weak hv_para_set_synic_register(unsigned int reg, u64 val)
> +{
> +     return -ENODEV;
> +}
> +EXPORT_SYMBOL_GPL(hv_para_set_synic_register);
> +
>  void hv_identify_partition_type(void)
>  {
>       /* Assume guest role */
> diff --git a/drivers/hv/hyperv_vmbus.h b/drivers/hv/hyperv_vmbus.h
> index 6e4c3acc1169..e8b87fbb88cb 100644
> --- a/drivers/hv/hyperv_vmbus.h
> +++ b/drivers/hv/hyperv_vmbus.h
> @@ -15,6 +15,7 @@
>  #include <linux/list.h>
>  #include <linux/bitops.h>
>  #include <asm/sync_bitops.h>
> +#include <asm/mshyperv.h>
>  #include <linux/atomic.h>
>  #include <linux/hyperv.h>
>  #include <linux/interrupt.h>
> @@ -336,6 +337,44 @@ extern const struct vmbus_channel_message_table_entry
> 
>  bool vmbus_is_confidential(void);
> 
> +/* Free the message slot and signal end-of-message if required */
> +static inline void vmbus_signal_eom(struct hv_message *msg, u32 old_msg_type)
> +{
> +     /*
> +      * On crash we're reading some other CPU's message page and we need
> +      * to be careful: this other CPU may already had cleared the header
> +      * and the host may already had delivered some other message there.
> +      * In case we blindly write msg->header.message_type we're going
> +      * to lose it. We can still lose a message of the same type but
> +      * we count on the fact that there can only be one
> +      * CHANNELMSG_UNLOAD_RESPONSE and we don't care about other messages
> +      * on crash.
> +      */
> +     if (cmpxchg(&msg->header.message_type, old_msg_type,
> +                 HVMSG_NONE) != old_msg_type)
> +             return;
> +
> +     /*
> +      * The cmxchg() above does an implicit memory barrier to
> +      * ensure the write to MessageType (ie set to
> +      * HVMSG_NONE) happens before we read the
> +      * MessagePending and EOMing. Otherwise, the EOMing
> +      * will not deliver any more messages since there is
> +      * no empty slot
> +      */
> +     if (msg->header.message_flags.msg_pending) {
> +             /*
> +              * This will cause message queue rescan to
> +              * possibly deliver another msg from the
> +              * hypervisor
> +              */
> +             if (vmbus_is_confidential())
> +                     hv_para_set_synic_register(HV_MSR_EOM, 0);
> +             else
> +                     hv_set_msr(HV_MSR_EOM, 0);
> +     }
> +}
> +
>  struct hv_device *vmbus_device_create(const guid_t *type,
>                                     const guid_t *instance,
>                                     struct vmbus_channel *channel);
> diff --git a/include/asm-generic/mshyperv.h b/include/asm-generic/mshyperv.h
> index acb017f6c423..4b0b05faef70 100644
> --- a/include/asm-generic/mshyperv.h
> +++ b/include/asm-generic/mshyperv.h
> @@ -163,41 +163,6 @@ static inline u64 hv_generate_guest_id(u64 
> kernel_version)
>       return guest_id;
>  }
> 
> -/* Free the message slot and signal end-of-message if required */
> -static inline void vmbus_signal_eom(struct hv_message *msg, u32 old_msg_type)
> -{
> -     /*
> -      * On crash we're reading some other CPU's message page and we need
> -      * to be careful: this other CPU may already had cleared the header
> -      * and the host may already had delivered some other message there.
> -      * In case we blindly write msg->header.message_type we're going
> -      * to lose it. We can still lose a message of the same type but
> -      * we count on the fact that there can only be one
> -      * CHANNELMSG_UNLOAD_RESPONSE and we don't care about other messages
> -      * on crash.
> -      */
> -     if (cmpxchg(&msg->header.message_type, old_msg_type,
> -                 HVMSG_NONE) != old_msg_type)
> -             return;
> -
> -     /*
> -      * The cmxchg() above does an implicit memory barrier to
> -      * ensure the write to MessageType (ie set to
> -      * HVMSG_NONE) happens before we read the
> -      * MessagePending and EOMing. Otherwise, the EOMing
> -      * will not deliver any more messages since there is
> -      * no empty slot
> -      */
> -     if (msg->header.message_flags.msg_pending) {
> -             /*
> -              * This will cause message queue rescan to
> -              * possibly deliver another msg from the
> -              * hypervisor
> -              */
> -             hv_set_msr(HV_MSR_EOM, 0);
> -     }
> -}
> -
>  int hv_get_hypervisor_version(union hv_hypervisor_version_info *info);
> 
>  void hv_setup_vmbus_handler(void (*handler)(void));
> @@ -335,6 +300,8 @@ bool hv_isolation_type_snp(void);
>  bool hv_confidential_vmbus_available(void);
>  u64 hv_ghcb_hypercall(u64 control, void *input, void *output, u32 
> input_size);
>  u64 hv_tdx_hypercall(u64 control, u64 param1, u64 param2);
> +int hv_para_get_synic_register(unsigned int reg, u64 *val);
> +int hv_para_set_synic_register(unsigned int reg, u64 val);
>  void hyperv_cleanup(void);
>  bool hv_query_ext_cap(u64 cap_query);
>  void hv_setup_dma_ops(struct device *dev, bool coherent);
> --
> 2.43.0
> 


Reply via email to