Set/Way operations are used to perform maintenance on a given cache.
At the moment, Set/Way operations are not trapped and therefore a guest
OS will directly act on the local cache. However, a vCPU may migrate to
another pCPU in the middle of the sequence. This will result in a cache
with stale data (Set/Way operations are not propagated to other pCPUs),
potentially causing a crash. This may be the cause of the heisenbug
noticed in Osstest [1].
Furthermore, Set/Way operations are not available on system caches. This
means that an OS relying on those operations to fully clean the caches
before disabling the MMU, such as 32-bit Linux, may break because data
may sit in system caches and not in RAM.
For more details about Set/Way, see the talk "The Art of Virtualizing
Cache Maintenance" given at Xen Summit 2018 [2].
In the context of Xen, we need to trap Set/Way operations and emulate
them. Per the Arm ARM (B1.14.4 in DDI 0406C.c), Set/Way operations are
difficult to virtualize. So we can assume that a guest OS using them will
suffer the consequences (i.e. slowness) until developers remove all usage
of Set/Way.
As software is not allowed to infer the Set/Way to Physical Address
mapping, Xen will need to go through the guest P2M and clean &
invalidate all the mapped entries.
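Conceptually, the emulation amounts to something like the sketch below
(minimal and non-preemptible; p2m_next_mapped_gfn() is a hypothetical
iterator used only for illustration, whereas the actual implementation
relies on the preemptible p2m_cache_flush_range() added below):

    /* Minimal sketch: clean & invalidate every page mapped in the P2M. */
    static void flush_all_guest_ram(struct domain *d)
    {
        gfn_t gfn = _gfn(0);
        mfn_t mfn;

        /* p2m_next_mapped_gfn() is hypothetical: find the next mapping. */
        while ( p2m_next_mapped_gfn(d, &gfn, &mfn) )
        {
            void *va = map_domain_page(mfn);

            clean_and_invalidate_dcache_va_range(va, PAGE_SIZE);
            unmap_domain_page(va);
            gfn = gfn_add(gfn, 1);
        }
    }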
Because Set/Way operations happen in batches (a loop over all the
Sets/Ways of a cache, as illustrated below), Xen would need to go
through the P2M for every instruction. This is quite expensive and would
severely impact the guest OS. The implementation re-uses the KVM policy
to limit the number of flushes:
- If we trap a Set/Way operation, we enable VM trapping (i.e.
HCR_EL2.TVM) to detect the cache being turned on/off, and do a full
clean.
- We clean the caches when they are turned on and off.
- Once the caches are enabled, we stop trapping VM instructions.
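For illustration, a guest cleaning a whole cache level by Set/Way looks
roughly like this (a hypothetical, simplified version of the ARMv7
sequence; in real code nr_sets/nr_ways and the shifts are derived from
CCSIDR). Without the policy above, every MCR in the loop would trap and
require a full P2M walk:

    static void clean_inval_level_by_sw(unsigned int level,
                                        unsigned int nr_sets,
                                        unsigned int nr_ways,
                                        unsigned int set_shift,
                                        unsigned int way_shift)
    {
        unsigned int set, way;

        for ( set = 0; set < nr_sets; set++ )
            for ( way = 0; way < nr_ways; way++ )
            {
                uint32_t sw = (way << way_shift) | (set << set_shift) |
                              (level << 1);

                /* DCCISW: clean & invalidate data cache line by Set/Way. */
                asm volatile("mcr p15, 0, %0, c7, c14, 2"
                             :: "r" (sw) : "memory");
            }
    }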
[1] https://lists.xenproject.org/archives/html/xen-devel/2017-09/msg03191.html
[2] https://fr.slideshare.net/xen_com_mgr/virtualizing-cache
Signed-off-by: Julien Grall <julien.grall@arm.com>
Reviewed-by: Stefano Stabellini <sstabellini@kernel.org>
static bool vreg_emulate_##reg(struct cpu_user_regs *regs, \
uint64_t *r, bool read) \
{ \
+ struct vcpu *v = current; \
+ bool cache_enabled = vcpu_has_cache_enabled(v); \
+ \
GUEST_BUG_ON(read); \
WRITE_SYSREG64(*r, reg); \
\
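+    /* Set up a deferred flush if the write toggled SCTLR_EL1.{C,M}. */ \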
+ p2m_toggle_cache(v, cache_enabled); \
+ \
return true; \
}
set_user_reg(regs, regidx, v->arch.actlr);
break;
+ /*
+ * HCR_EL2.TSW
+ *
+ * ARMv8 (DDI 0487B.b): Table D1-42
+ */
+ case HSR_SYSREG_DCISW:
+ case HSR_SYSREG_DCCSW:
+ case HSR_SYSREG_DCCISW:
+ if ( !hsr.sysreg.read )
+ p2m_set_way_flush(current);
+ break;
+
/*
* HCR_EL2.TVM
*
#include <xen/iocap.h>
#include <xen/lib.h>
#include <xen/sched.h>
+#include <xen/softirq.h>
#include <asm/event.h>
#include <asm/flushtlb.h>
return rc;
}
+/*
+ * Clean & invalidate RAM associated to the guest vCPU.
+ *
+ * The function can only work with the current vCPU and should be called
+ * with IRQs enabled, as the vCPU could get preempted.
+ */
+void p2m_flush_vm(struct vcpu *v)
+{
+ int rc;
+ gfn_t start = _gfn(0);
+
+ ASSERT(v == current);
+ ASSERT(local_irq_is_enabled());
+ ASSERT(v->arch.need_flush_to_ram);
+
+ do
+ {
+ rc = p2m_cache_flush_range(v->domain, &start, _gfn(ULONG_MAX));
+ if ( rc == -ERESTART )
+ do_softirq();
+ } while ( rc == -ERESTART );
+
+ if ( rc != 0 )
+ gprintk(XENLOG_WARNING,
+ "P2M has not been correctly cleaned (rc = %d)\n",
+ rc);
+
+ v->arch.need_flush_to_ram = false;
+}
+
+/*
+ * See note at ARMv7 ARM B1.14.4 (DDI 0406C.c) (TL;DR: S/W ops are not
+ * easily virtualized).
+ *
+ * Main problems:
+ * - S/W ops are local to a CPU (not broadcast)
+ * - We have line migration behind our back (speculation)
+ * - System caches don't support S/W at all (damn!)
+ *
+ * In the face of the above, the best we can do is to try and convert
+ * S/W ops to VA ops. Because the guest is not allowed to infer the S/W
+ * to PA mapping, it can only use S/W to nuke the whole cache, which is
+ * rather a good thing for us.
+ *
+ * Also, it is only used when turning caches on/off ("The expected
+ * usage of the cache maintenance instructions that operate by set/way
+ * is associated with the powerdown and powerup of caches, if this is
+ * required by the implementation.").
+ *
+ * We use the following policy:
+ * - If we trap a S/W operation, we enable VM trapping to detect
+ * caches being turned on/off, and do a full clean.
+ *
+ * - We flush the caches on both caches being turned on and off.
+ *
+ * - Once the caches are enabled, we stop trapping VM ops.
+ */
+void p2m_set_way_flush(struct vcpu *v)
+{
+ /* This function can only work with the current vCPU. */
+ ASSERT(v == current);
+
+ if ( !(v->arch.hcr_el2 & HCR_TVM) )
+ {
+ v->arch.need_flush_to_ram = true;
+ vcpu_hcr_set_flags(v, HCR_TVM);
+ }
+}
+
+void p2m_toggle_cache(struct vcpu *v, bool was_enabled)
+{
+ bool now_enabled = vcpu_has_cache_enabled(v);
+
+ /* This function can only work with the current vCPU. */
+ ASSERT(v == current);
+
+ /*
+ * If switching the MMU+caches on, need to invalidate the caches.
+ * If switching it off, need to clean the caches.
+ * Clean + invalidate does the trick always.
+ */
+ if ( was_enabled != now_enabled )
+ v->arch.need_flush_to_ram = true;
+
+ /* Caches are now on, stop trapping VM ops (until a S/W op) */
+ if ( now_enabled )
+ vcpu_hcr_clear_flags(v, HCR_TVM);
+}
+
mfn_t gfn_to_mfn(struct domain *d, gfn_t gfn)
{
return p2m_lookup(d, gfn, NULL);
{
return (HCR_PTW|HCR_BSU_INNER|HCR_AMO|HCR_IMO|HCR_FMO|HCR_VM|
(vwfi != NATIVE ? (HCR_TWI|HCR_TWE) : 0) |
- HCR_TSC|HCR_TAC|HCR_SWIO|HCR_TIDCP|HCR_FB);
+ HCR_TSC|HCR_TAC|HCR_SWIO|HCR_TIDCP|HCR_FB|HCR_TSW);
}
static enum {
}
}
+/*
+ * Process pending work for the vCPU. Any call should be fast or
+ * implement preemption.
+ */
+static void check_for_vcpu_work(void)
+{
+ struct vcpu *v = current;
+
+ if ( likely(!v->arch.need_flush_to_ram) )
+ return;
+
+ /*
+ * Give a chance for the pCPU to process work before handling the vCPU
+ * pending work.
+ */
+ check_for_pcpu_work();
+
+ local_irq_enable();
+ p2m_flush_vm(v);
+ local_irq_disable();
+}
+
void leave_hypervisor_tail(void)
{
local_irq_disable();
+ check_for_vcpu_work();
check_for_pcpu_work();
vgic_sync_to_lrs();
#define TVM_REG(sz, func, reg...) \
static bool func(struct cpu_user_regs *regs, uint##sz##_t *r, bool read) \
{ \
+ struct vcpu *v = current; \
+ bool cache_enabled = vcpu_has_cache_enabled(v); \
+ \
GUEST_BUG_ON(read); \
WRITE_SYSREG##sz(*r, reg); \
\
+ p2m_toggle_cache(v, cache_enabled); \
+ \
return true; \
}
static bool vreg_emulate_##xreg(struct cpu_user_regs *regs, uint32_t *r, \
bool read, bool hi) \
{ \
+ struct vcpu *v = current; \
+ bool cache_enabled = vcpu_has_cache_enabled(v); \
register_t reg = READ_SYSREG(xreg); \
\
GUEST_BUG_ON(read); \
} \
WRITE_SYSREG(reg, xreg); \
\
+ p2m_toggle_cache(v, cache_enabled); \
+ \
return true; \
} \
\
set_user_reg(regs, regidx, v->arch.actlr);
break;
+ /*
+ * HCR_EL2.TSW
+ *
+ * ARMv7 (DDI 0406C.b): B1.14.6
+ * ARMv8 (DDI 0487B.b): Table D1-42
+ */
+ case HSR_CPREG32(DCISW):
+ case HSR_CPREG32(DCCSW):
+ case HSR_CPREG32(DCCISW):
+ if ( !cp32.read )
+ p2m_set_way_flush(current);
+ break;
+
/*
* HCR_EL2.TVM
*
struct vtimer phys_timer;
struct vtimer virt_timer;
bool vtimer_initialized;
+
+ /*
+ * The full P2M may require some cleaning (e.g. when emulating
+ * Set/Way). As the action can take a long time, it requires
+ * preemption. It is deferred until we return to the guest, where we
+ * can more easily check for softirqs and preempt the vCPU safely.
+ */
+ bool need_flush_to_ram;
+
} __cacheline_aligned;
void vcpu_show_execution_state(struct vcpu *);
#include <xen/rwlock.h>
#include <xen/mem_access.h>
+#include <asm/current.h>
+
#define paddr_bits PADDR_BITS
/* Holds the bit size of IPAs in p2m tables. */
*/
int p2m_cache_flush_range(struct domain *d, gfn_t *pstart, gfn_t end);
+void p2m_set_way_flush(struct vcpu *v);
+
+void p2m_toggle_cache(struct vcpu *v, bool was_enabled);
+
+void p2m_flush_vm(struct vcpu *v);
+
/*
* Map a region in the guest p2m with a specific p2m type.
* The memory attributes will be derived from the p2m type.
return -EOPNOTSUPP;
}
+/*
+ * A vCPU has the cache enabled only when both the MMU and the data
+ * cache are enabled.
+ */
+static inline bool vcpu_has_cache_enabled(struct vcpu *v)
+{
+ /* Only works with the current vCPU */
+ ASSERT(current == v);
+
+ return (READ_SYSREG32(SCTLR_EL1) & (SCTLR_C|SCTLR_M)) == (SCTLR_C|SCTLR_M);
+}
+
#endif /* _XEN_P2M_H */
/*