coresight: etm4x: Refactor probing routine
[linux-2.6-microblaze.git] / drivers / hwtracing / coresight / coresight-etm4x-core.c
index b20b6ff..c3e458a 100644 (file)
@@ -59,32 +59,98 @@ static u64 etm4_get_access_type(struct etmv4_config *config);
 
 static enum cpuhp_state hp_online;
 
-static void etm4_os_unlock(struct etmv4_drvdata *drvdata)
+struct etm4_init_arg {
+       struct etmv4_drvdata    *drvdata;
+       struct csdev_access     *csa;
+};
+
+/*
+ * Check if TRCSSPCICRn(i) is implemented for a given instance.
+ *
+ * TRCSSPCICRn is implemented only if :
+ *     TRCSSPCICR<n> is present only if all of the following are true:
+ *             TRCIDR4.NUMSSCC > n.
+ *             TRCIDR4.NUMPC > 0b0000 .
+ *             TRCSSCSR<n>.PC == 0b1
+ */
+static inline bool etm4x_sspcicrn_present(struct etmv4_drvdata *drvdata, int n)
+{
+       return (n < drvdata->nr_ss_cmp) &&
+              drvdata->nr_pe &&
+              (drvdata->config.ss_status[n] & TRCSSCSRn_PC);
+}
+
+u64 etm4x_sysreg_read(u32 offset, bool _relaxed, bool _64bit)
+{
+       u64 res = 0;
+
+       switch (offset) {
+       ETM4x_READ_SYSREG_CASES(res)
+       default :
+               pr_warn_ratelimited("etm4x: trying to read unsupported register @%x\n",
+                        offset);
+       }
+
+       if (!_relaxed)
+               __iormb(res);   /* Imitate the !relaxed I/O helpers */
+
+       return res;
+}
+
+void etm4x_sysreg_write(u64 val, u32 offset, bool _relaxed, bool _64bit)
+{
+       if (!_relaxed)
+               __iowmb();      /* Imitate the !relaxed I/O helpers */
+       if (!_64bit)
+               val &= GENMASK(31, 0);
+
+       switch (offset) {
+       ETM4x_WRITE_SYSREG_CASES(val)
+       default :
+               pr_warn_ratelimited("etm4x: trying to write to unsupported register @%x\n",
+                       offset);
+       }
+}
+
+static void etm4_os_unlock_csa(struct etmv4_drvdata *drvdata, struct csdev_access *csa)
 {
        /* Writing 0 to TRCOSLAR unlocks the trace registers */
-       writel_relaxed(0x0, drvdata->base + TRCOSLAR);
+       etm4x_relaxed_write32(csa, 0x0, TRCOSLAR);
        drvdata->os_unlock = true;
        isb();
 }
 
+static void etm4_os_unlock(struct etmv4_drvdata *drvdata)
+{
+       if (!WARN_ON(!drvdata->csdev))
+               etm4_os_unlock_csa(drvdata, &drvdata->csdev->access);
+
+}
+
 static void etm4_os_lock(struct etmv4_drvdata *drvdata)
 {
+       if (WARN_ON(!drvdata->csdev))
+               return;
+
        /* Writing 0x1 to TRCOSLAR locks the trace registers */
-       writel_relaxed(0x1, drvdata->base + TRCOSLAR);
+       etm4x_relaxed_write32(&drvdata->csdev->access, 0x1, TRCOSLAR);
        drvdata->os_unlock = false;
        isb();
 }
 
-static bool etm4_arch_supported(u8 arch)
+static void etm4_cs_lock(struct etmv4_drvdata *drvdata,
+                        struct csdev_access *csa)
 {
-       /* Mask out the minor version number */
-       switch (arch & 0xf0) {
-       case ETM_ARCH_V4:
-               break;
-       default:
-               return false;
-       }
-       return true;
+       /* Software Lock is only accessible via memory mapped interface */
+       if (csa->io_mem)
+               CS_LOCK(csa->base);
+}
+
+static void etm4_cs_unlock(struct etmv4_drvdata *drvdata,
+                          struct csdev_access *csa)
+{
+       if (csa->io_mem)
+               CS_UNLOCK(csa->base);
 }
 
 static int etm4_cpu_id(struct coresight_device *csdev)
@@ -201,57 +267,63 @@ static int etm4_enable_hw(struct etmv4_drvdata *drvdata)
 {
        int i, rc;
        struct etmv4_config *config = &drvdata->config;
-       struct device *etm_dev = &drvdata->csdev->dev;
+       struct coresight_device *csdev = drvdata->csdev;
+       struct device *etm_dev = &csdev->dev;
+       struct csdev_access *csa = &csdev->access;
 
-       CS_UNLOCK(drvdata->base);
+
+       etm4_cs_unlock(drvdata, csa);
        etm4_enable_arch_specific(drvdata);
 
        etm4_os_unlock(drvdata);
 
-       rc = coresight_claim_device_unlocked(drvdata->base);
+       rc = coresight_claim_device_unlocked(csdev);
        if (rc)
                goto done;
 
        /* Disable the trace unit before programming trace registers */
-       writel_relaxed(0, drvdata->base + TRCPRGCTLR);
+       etm4x_relaxed_write32(csa, 0, TRCPRGCTLR);
+
+       /*
+        * If we use system instructions, we need to synchronize the
+        * write to the TRCPRGCTLR, before accessing the TRCSTATR.
+        * See ARM IHI0064F, section
+        * "4.3.7 Synchronization of register updates"
+        */
+       if (!csa->io_mem)
+               isb();
 
        /* wait for TRCSTATR.IDLE to go up */
-       if (coresight_timeout(drvdata->base, TRCSTATR, TRCSTATR_IDLE_BIT, 1))
+       if (coresight_timeout(csa, TRCSTATR, TRCSTATR_IDLE_BIT, 1))
                dev_err(etm_dev,
                        "timeout while waiting for Idle Trace Status\n");
        if (drvdata->nr_pe)
-               writel_relaxed(config->pe_sel, drvdata->base + TRCPROCSELR);
-       writel_relaxed(config->cfg, drvdata->base + TRCCONFIGR);
+               etm4x_relaxed_write32(csa, config->pe_sel, TRCPROCSELR);
+       etm4x_relaxed_write32(csa, config->cfg, TRCCONFIGR);
        /* nothing specific implemented */
-       writel_relaxed(0x0, drvdata->base + TRCAUXCTLR);
-       writel_relaxed(config->eventctrl0, drvdata->base + TRCEVENTCTL0R);
-       writel_relaxed(config->eventctrl1, drvdata->base + TRCEVENTCTL1R);
-       writel_relaxed(config->stall_ctrl, drvdata->base + TRCSTALLCTLR);
-       writel_relaxed(config->ts_ctrl, drvdata->base + TRCTSCTLR);
-       writel_relaxed(config->syncfreq, drvdata->base + TRCSYNCPR);
-       writel_relaxed(config->ccctlr, drvdata->base + TRCCCCTLR);
-       writel_relaxed(config->bb_ctrl, drvdata->base + TRCBBCTLR);
-       writel_relaxed(drvdata->trcid, drvdata->base + TRCTRACEIDR);
-       writel_relaxed(config->vinst_ctrl, drvdata->base + TRCVICTLR);
-       writel_relaxed(config->viiectlr, drvdata->base + TRCVIIECTLR);
-       writel_relaxed(config->vissctlr,
-                      drvdata->base + TRCVISSCTLR);
+       etm4x_relaxed_write32(csa, 0x0, TRCAUXCTLR);
+       etm4x_relaxed_write32(csa, config->eventctrl0, TRCEVENTCTL0R);
+       etm4x_relaxed_write32(csa, config->eventctrl1, TRCEVENTCTL1R);
+       etm4x_relaxed_write32(csa, config->stall_ctrl, TRCSTALLCTLR);
+       etm4x_relaxed_write32(csa, config->ts_ctrl, TRCTSCTLR);
+       etm4x_relaxed_write32(csa, config->syncfreq, TRCSYNCPR);
+       etm4x_relaxed_write32(csa, config->ccctlr, TRCCCCTLR);
+       etm4x_relaxed_write32(csa, config->bb_ctrl, TRCBBCTLR);
+       etm4x_relaxed_write32(csa, drvdata->trcid, TRCTRACEIDR);
+       etm4x_relaxed_write32(csa, config->vinst_ctrl, TRCVICTLR);
+       etm4x_relaxed_write32(csa, config->viiectlr, TRCVIIECTLR);
+       etm4x_relaxed_write32(csa, config->vissctlr, TRCVISSCTLR);
        if (drvdata->nr_pe_cmp)
-               writel_relaxed(config->vipcssctlr,
-                              drvdata->base + TRCVIPCSSCTLR);
+               etm4x_relaxed_write32(csa, config->vipcssctlr, TRCVIPCSSCTLR);
        for (i = 0; i < drvdata->nrseqstate - 1; i++)
-               writel_relaxed(config->seq_ctrl[i],
-                              drvdata->base + TRCSEQEVRn(i));
-       writel_relaxed(config->seq_rst, drvdata->base + TRCSEQRSTEVR);
-       writel_relaxed(config->seq_state, drvdata->base + TRCSEQSTR);
-       writel_relaxed(config->ext_inp, drvdata->base + TRCEXTINSELR);
+               etm4x_relaxed_write32(csa, config->seq_ctrl[i], TRCSEQEVRn(i));
+       etm4x_relaxed_write32(csa, config->seq_rst, TRCSEQRSTEVR);
+       etm4x_relaxed_write32(csa, config->seq_state, TRCSEQSTR);
+       etm4x_relaxed_write32(csa, config->ext_inp, TRCEXTINSELR);
        for (i = 0; i < drvdata->nr_cntr; i++) {
-               writel_relaxed(config->cntrldvr[i],
-                              drvdata->base + TRCCNTRLDVRn(i));
-               writel_relaxed(config->cntr_ctrl[i],
-                              drvdata->base + TRCCNTCTLRn(i));
-               writel_relaxed(config->cntr_val[i],
-                              drvdata->base + TRCCNTVRn(i));
+               etm4x_relaxed_write32(csa, config->cntrldvr[i], TRCCNTRLDVRn(i));
+               etm4x_relaxed_write32(csa, config->cntr_ctrl[i], TRCCNTCTLRn(i));
+               etm4x_relaxed_write32(csa, config->cntr_val[i], TRCCNTVRn(i));
        }
 
        /*
@@ -259,54 +331,52 @@ static int etm4_enable_hw(struct etmv4_drvdata *drvdata)
         * such start at 2.
         */
        for (i = 2; i < drvdata->nr_resource * 2; i++)
-               writel_relaxed(config->res_ctrl[i],
-                              drvdata->base + TRCRSCTLRn(i));
+               etm4x_relaxed_write32(csa, config->res_ctrl[i], TRCRSCTLRn(i));
 
        for (i = 0; i < drvdata->nr_ss_cmp; i++) {
                /* always clear status bit on restart if using single-shot */
                if (config->ss_ctrl[i] || config->ss_pe_cmp[i])
                        config->ss_status[i] &= ~BIT(31);
-               writel_relaxed(config->ss_ctrl[i],
-                              drvdata->base + TRCSSCCRn(i));
-               writel_relaxed(config->ss_status[i],
-                              drvdata->base + TRCSSCSRn(i));
-               writel_relaxed(config->ss_pe_cmp[i],
-                              drvdata->base + TRCSSPCICRn(i));
+               etm4x_relaxed_write32(csa, config->ss_ctrl[i], TRCSSCCRn(i));
+               etm4x_relaxed_write32(csa, config->ss_status[i], TRCSSCSRn(i));
+               if (etm4x_sspcicrn_present(drvdata, i))
+                       etm4x_relaxed_write32(csa, config->ss_pe_cmp[i], TRCSSPCICRn(i));
        }
        for (i = 0; i < drvdata->nr_addr_cmp; i++) {
-               writeq_relaxed(config->addr_val[i],
-                              drvdata->base + TRCACVRn(i));
-               writeq_relaxed(config->addr_acc[i],
-                              drvdata->base + TRCACATRn(i));
+               etm4x_relaxed_write64(csa, config->addr_val[i], TRCACVRn(i));
+               etm4x_relaxed_write64(csa, config->addr_acc[i], TRCACATRn(i));
        }
        for (i = 0; i < drvdata->numcidc; i++)
-               writeq_relaxed(config->ctxid_pid[i],
-                              drvdata->base + TRCCIDCVRn(i));
-       writel_relaxed(config->ctxid_mask0, drvdata->base + TRCCIDCCTLR0);
+               etm4x_relaxed_write64(csa, config->ctxid_pid[i], TRCCIDCVRn(i));
+       etm4x_relaxed_write32(csa, config->ctxid_mask0, TRCCIDCCTLR0);
        if (drvdata->numcidc > 4)
-               writel_relaxed(config->ctxid_mask1, drvdata->base + TRCCIDCCTLR1);
+               etm4x_relaxed_write32(csa, config->ctxid_mask1, TRCCIDCCTLR1);
 
        for (i = 0; i < drvdata->numvmidc; i++)
-               writeq_relaxed(config->vmid_val[i],
-                              drvdata->base + TRCVMIDCVRn(i));
-       writel_relaxed(config->vmid_mask0, drvdata->base + TRCVMIDCCTLR0);
+               etm4x_relaxed_write64(csa, config->vmid_val[i], TRCVMIDCVRn(i));
+       etm4x_relaxed_write32(csa, config->vmid_mask0, TRCVMIDCCTLR0);
        if (drvdata->numvmidc > 4)
-               writel_relaxed(config->vmid_mask1, drvdata->base + TRCVMIDCCTLR1);
+               etm4x_relaxed_write32(csa, config->vmid_mask1, TRCVMIDCCTLR1);
 
        if (!drvdata->skip_power_up) {
+               u32 trcpdcr = etm4x_relaxed_read32(csa, TRCPDCR);
+
                /*
                 * Request to keep the trace unit powered and also
                 * emulation of powerdown
                 */
-               writel_relaxed(readl_relaxed(drvdata->base + TRCPDCR) |
-                              TRCPDCR_PU, drvdata->base + TRCPDCR);
+               etm4x_relaxed_write32(csa, trcpdcr | TRCPDCR_PU, TRCPDCR);
        }
 
        /* Enable the trace unit */
-       writel_relaxed(1, drvdata->base + TRCPRGCTLR);
+       etm4x_relaxed_write32(csa, 1, TRCPRGCTLR);
+
+       /* Synchronize the register updates for sysreg access */
+       if (!csa->io_mem)
+               isb();
 
        /* wait for TRCSTATR.IDLE to go back down to '0' */
-       if (coresight_timeout(drvdata->base, TRCSTATR, TRCSTATR_IDLE_BIT, 0))
+       if (coresight_timeout(csa, TRCSTATR, TRCSTATR_IDLE_BIT, 0))
                dev_err(etm_dev,
                        "timeout while waiting for Idle Trace Status\n");
 
@@ -318,7 +388,7 @@ static int etm4_enable_hw(struct etmv4_drvdata *drvdata)
        isb();
 
 done:
-       CS_LOCK(drvdata->base);
+       etm4_cs_lock(drvdata, csa);
 
        dev_dbg(etm_dev, "cpu: %d enable smp call done: %d\n",
                drvdata->cpu, rc);
@@ -570,20 +640,22 @@ static void etm4_disable_hw(void *info)
        u32 control;
        struct etmv4_drvdata *drvdata = info;
        struct etmv4_config *config = &drvdata->config;
-       struct device *etm_dev = &drvdata->csdev->dev;
+       struct coresight_device *csdev = drvdata->csdev;
+       struct device *etm_dev = &csdev->dev;
+       struct csdev_access *csa = &csdev->access;
        int i;
 
-       CS_UNLOCK(drvdata->base);
+       etm4_cs_unlock(drvdata, csa);
        etm4_disable_arch_specific(drvdata);
 
        if (!drvdata->skip_power_up) {
                /* power can be removed from the trace unit now */
-               control = readl_relaxed(drvdata->base + TRCPDCR);
+               control = etm4x_relaxed_read32(csa, TRCPDCR);
                control &= ~TRCPDCR_PU;
-               writel_relaxed(control, drvdata->base + TRCPDCR);
+               etm4x_relaxed_write32(csa, control, TRCPDCR);
        }
 
-       control = readl_relaxed(drvdata->base + TRCPRGCTLR);
+       control = etm4x_relaxed_read32(csa, TRCPRGCTLR);
 
        /* EN, bit[0] Trace unit enable bit */
        control &= ~0x1;
@@ -595,29 +667,27 @@ static void etm4_disable_hw(void *info)
         */
        dsb(sy);
        isb();
-       writel_relaxed(control, drvdata->base + TRCPRGCTLR);
+       etm4x_relaxed_write32(csa, control, TRCPRGCTLR);
 
        /* wait for TRCSTATR.PMSTABLE to go to '1' */
-       if (coresight_timeout(drvdata->base, TRCSTATR,
-                             TRCSTATR_PMSTABLE_BIT, 1))
+       if (coresight_timeout(csa, TRCSTATR, TRCSTATR_PMSTABLE_BIT, 1))
                dev_err(etm_dev,
                        "timeout while waiting for PM stable Trace Status\n");
 
        /* read the status of the single shot comparators */
        for (i = 0; i < drvdata->nr_ss_cmp; i++) {
                config->ss_status[i] =
-                       readl_relaxed(drvdata->base + TRCSSCSRn(i));
+                       etm4x_relaxed_read32(csa, TRCSSCSRn(i));
        }
 
        /* read back the current counter values */
        for (i = 0; i < drvdata->nr_cntr; i++) {
                config->cntr_val[i] =
-                       readl_relaxed(drvdata->base + TRCCNTVRn(i));
+                       etm4x_relaxed_read32(csa, TRCCNTVRn(i));
        }
 
-       coresight_disclaim_device_unlocked(drvdata->base);
-
-       CS_LOCK(drvdata->base);
+       coresight_disclaim_device_unlocked(csdev);
+       etm4_cs_lock(drvdata, csa);
 
        dev_dbg(&drvdata->csdev->dev,
                "cpu: %d disable smp call done\n", drvdata->cpu);
@@ -641,7 +711,7 @@ static int etm4_disable_perf(struct coresight_device *csdev,
         * scheduled again.  Configuration of the start/stop logic happens in
         * function etm4_set_event_filters().
         */
-       control = readl_relaxed(drvdata->base + TRCVICTLR);
+       control = etm4x_relaxed_read32(&csdev->access, TRCVICTLR);
        /* TRCVICTLR::SSSTATUS, bit[9] */
        filters->ssstatus = (control & BIT(9));
 
@@ -712,24 +782,110 @@ static const struct coresight_ops etm4_cs_ops = {
        .source_ops     = &etm4_source_ops,
 };
 
+static inline bool cpu_supports_sysreg_trace(void)
+{
+       u64 dfr0 = read_sysreg_s(SYS_ID_AA64DFR0_EL1);
+
+       return ((dfr0 >> ID_AA64DFR0_TRACEVER_SHIFT) & 0xfUL) > 0;
+}
+
+static bool etm4_init_sysreg_access(struct etmv4_drvdata *drvdata,
+                                   struct csdev_access *csa)
+{
+       u32 devarch;
+
+       if (!cpu_supports_sysreg_trace())
+               return false;
+
+       /*
+        * ETMs implementing sysreg access must implement TRCDEVARCH.
+        */
+       devarch = read_etm4x_sysreg_const_offset(TRCDEVARCH);
+       if ((devarch & ETM_DEVARCH_ID_MASK) != ETM_DEVARCH_ETMv4x_ARCH)
+               return false;
+       *csa = (struct csdev_access) {
+               .io_mem = false,
+               .read   = etm4x_sysreg_read,
+               .write  = etm4x_sysreg_write,
+       };
+
+       drvdata->arch = etm_devarch_to_arch(devarch);
+       return true;
+}
+
+static bool etm4_init_iomem_access(struct etmv4_drvdata *drvdata,
+                                  struct csdev_access *csa)
+{
+       u32 devarch = readl_relaxed(drvdata->base + TRCDEVARCH);
+       u32 idr1 = readl_relaxed(drvdata->base + TRCIDR1);
+
+       /*
+        * All ETMs must implement TRCDEVARCH to indicate that
+        * the component is an ETMv4. To support any broken
+        * implementations we fall back to TRCIDR1 check, which
+        * is not really reliable.
+        */
+       if ((devarch & ETM_DEVARCH_ID_MASK) == ETM_DEVARCH_ETMv4x_ARCH) {
+               drvdata->arch = etm_devarch_to_arch(devarch);
+       } else {
+               pr_warn("CPU%d: ETM4x incompatible TRCDEVARCH: %x, falling back to TRCIDR1\n",
+                       smp_processor_id(), devarch);
+
+               if (ETM_TRCIDR1_ARCH_MAJOR(idr1) != ETM_TRCIDR1_ARCH_ETMv4)
+                       return false;
+               drvdata->arch = etm_trcidr_to_arch(idr1);
+       }
+
+       *csa = CSDEV_ACCESS_IOMEM(drvdata->base);
+       return true;
+}
+
+static bool etm4_init_csdev_access(struct etmv4_drvdata *drvdata,
+                                  struct csdev_access *csa)
+{
+       /*
+        * Always choose the memory mapped io, if there is
+        * a memory map to prevent sysreg access on broken
+        * systems.
+        */
+       if (drvdata->base)
+               return etm4_init_iomem_access(drvdata, csa);
+
+       if (etm4_init_sysreg_access(drvdata, csa))
+               return true;
+
+       return false;
+}
+
 static void etm4_init_arch_data(void *info)
 {
        u32 etmidr0;
-       u32 etmidr1;
        u32 etmidr2;
        u32 etmidr3;
        u32 etmidr4;
        u32 etmidr5;
-       struct etmv4_drvdata *drvdata = info;
+       struct etm4_init_arg *init_arg = info;
+       struct etmv4_drvdata *drvdata;
+       struct csdev_access *csa;
        int i;
 
-       /* Make sure all registers are accessible */
-       etm4_os_unlock(drvdata);
+       drvdata = init_arg->drvdata;
+       csa = init_arg->csa;
+
+       /*
+        * If we are unable to detect the access mechanism,
+        * or unable to detect the trace unit type, fail
+        * early.
+        */
+       if (!etm4_init_csdev_access(drvdata, csa))
+               return;
 
-       CS_UNLOCK(drvdata->base);
+       /* Make sure all registers are accessible */
+       etm4_os_unlock_csa(drvdata, csa);
+       etm4_cs_unlock(drvdata, csa);
 
        /* find all capabilities of the tracing unit */
-       etmidr0 = readl_relaxed(drvdata->base + TRCIDR0);
+       etmidr0 = etm4x_relaxed_read32(csa, TRCIDR0);
 
        /* INSTP0, bits[2:1] P0 tracing support field */
        if (BMVAL(etmidr0, 1, 1) && BMVAL(etmidr0, 2, 2))
@@ -768,17 +924,8 @@ static void etm4_init_arch_data(void *info)
        /* TSSIZE, bits[28:24] Global timestamp size field */
        drvdata->ts_size = BMVAL(etmidr0, 24, 28);
 
-       /* base architecture of trace unit */
-       etmidr1 = readl_relaxed(drvdata->base + TRCIDR1);
-       /*
-        * TRCARCHMIN, bits[7:4] architecture the minor version number
-        * TRCARCHMAJ, bits[11:8] architecture major versin number
-        */
-       drvdata->arch = BMVAL(etmidr1, 4, 11);
-       drvdata->config.arch = drvdata->arch;
-
        /* maximum size of resources */
-       etmidr2 = readl_relaxed(drvdata->base + TRCIDR2);
+       etmidr2 = etm4x_relaxed_read32(csa, TRCIDR2);
        /* CIDSIZE, bits[9:5] Indicates the Context ID size */
        drvdata->ctxid_size = BMVAL(etmidr2, 5, 9);
        /* VMIDSIZE, bits[14:10] Indicates the VMID size */
@@ -786,11 +933,12 @@ static void etm4_init_arch_data(void *info)
        /* CCSIZE, bits[28:25] size of the cycle counter in bits minus 12 */
        drvdata->ccsize = BMVAL(etmidr2, 25, 28);
 
-       etmidr3 = readl_relaxed(drvdata->base + TRCIDR3);
+       etmidr3 = etm4x_relaxed_read32(csa, TRCIDR3);
        /* CCITMIN, bits[11:0] minimum threshold value that can be programmed */
        drvdata->ccitmin = BMVAL(etmidr3, 0, 11);
        /* EXLEVEL_S, bits[19:16] Secure state instruction tracing */
        drvdata->s_ex_level = BMVAL(etmidr3, 16, 19);
+       drvdata->config.s_ex_level = drvdata->s_ex_level;
        /* EXLEVEL_NS, bits[23:20] Non-secure state instruction tracing */
        drvdata->ns_ex_level = BMVAL(etmidr3, 20, 23);
 
@@ -836,7 +984,7 @@ static void etm4_init_arch_data(void *info)
                drvdata->nooverflow = false;
 
        /* number of resources trace unit supports */
-       etmidr4 = readl_relaxed(drvdata->base + TRCIDR4);
+       etmidr4 = etm4x_relaxed_read32(csa, TRCIDR4);
        /* NUMACPAIRS, bits[0:3] number of addr comparator pairs for tracing */
        drvdata->nr_addr_cmp = BMVAL(etmidr4, 0, 3);
        /* NUMPC, bits[15:12] number of PE comparator inputs for tracing */
@@ -852,7 +1000,7 @@ static void etm4_init_arch_data(void *info)
         * Otherwise for values 0x1 and above the number is N + 1 as per v4.2.
         */
        drvdata->nr_resource = BMVAL(etmidr4, 16, 19);
-       if ((drvdata->arch < ETM4X_ARCH_4V3) || (drvdata->nr_resource > 0))
+       if ((drvdata->arch < ETM_ARCH_V4_3) || (drvdata->nr_resource > 0))
                drvdata->nr_resource += 1;
        /*
         * NUMSSCC, bits[23:20] the number of single-shot
@@ -862,14 +1010,14 @@ static void etm4_init_arch_data(void *info)
        drvdata->nr_ss_cmp = BMVAL(etmidr4, 20, 23);
        for (i = 0; i < drvdata->nr_ss_cmp; i++) {
                drvdata->config.ss_status[i] =
-                       readl_relaxed(drvdata->base + TRCSSCSRn(i));
+                       etm4x_relaxed_read32(csa, TRCSSCSRn(i));
        }
        /* NUMCIDC, bits[27:24] number of Context ID comparators for tracing */
        drvdata->numcidc = BMVAL(etmidr4, 24, 27);
        /* NUMVMIDC, bits[31:28] number of VMID comparators for tracing */
        drvdata->numvmidc = BMVAL(etmidr4, 28, 31);
 
-       etmidr5 = readl_relaxed(drvdata->base + TRCIDR5);
+       etmidr5 = etm4x_relaxed_read32(csa, TRCIDR5);
        /* NUMEXTIN, bits[8:0] number of external inputs implemented */
        drvdata->nr_ext_inp = BMVAL(etmidr5, 0, 8);
        /* TRACEIDSIZE, bits[21:16] indicates the trace ID width */
@@ -891,23 +1039,19 @@ static void etm4_init_arch_data(void *info)
        drvdata->nrseqstate = BMVAL(etmidr5, 25, 27);
        /* NUMCNTR, bits[30:28] number of counters available for tracing */
        drvdata->nr_cntr = BMVAL(etmidr5, 28, 30);
-       CS_LOCK(drvdata->base);
+       etm4_cs_lock(drvdata, csa);
+}
+
+static inline u32 etm4_get_victlr_access_type(struct etmv4_config *config)
+{
+       return etm4_get_access_type(config) << TRCVICTLR_EXLEVEL_SHIFT;
 }
 
 /* Set ELx trace filter access in the TRCVICTLR register */
 static void etm4_set_victlr_access(struct etmv4_config *config)
 {
-       u64 access_type;
-
-       config->vinst_ctrl &= ~(ETM_EXLEVEL_S_VICTLR_MASK | ETM_EXLEVEL_NS_VICTLR_MASK);
-
-       /*
-        * TRCVICTLR::EXLEVEL_NS:EXLEVELS: Set kernel / user filtering
-        * bits in vinst_ctrl, same bit pattern as TRCACATRn values returned by
-        * etm4_get_access_type() but with a relative shift in this register.
-        */
-       access_type = etm4_get_access_type(config) << ETM_EXLEVEL_LSHIFT_TRCVICTLR;
-       config->vinst_ctrl |= (u32)access_type;
+       config->vinst_ctrl &= ~TRCVICTLR_EXLEVEL_MASK;
+       config->vinst_ctrl |= etm4_get_victlr_access_type(config);
 }
 
 static void etm4_set_default_config(struct etmv4_config *config)
@@ -937,12 +1081,9 @@ static u64 etm4_get_ns_access_type(struct etmv4_config *config)
        u64 access_type = 0;
 
        /*
-        * EXLEVEL_NS, bits[15:12]
-        * The Exception levels are:
-        *   Bit[12] Exception level 0 - Application
-        *   Bit[13] Exception level 1 - OS
-        *   Bit[14] Exception level 2 - Hypervisor
-        *   Bit[15] Never implemented
+        * EXLEVEL_NS, for NonSecure Exception levels.
+        * The mask here is a generic value and must be
+        * shifted to the corresponding field for the registers
         */
        if (!is_kernel_in_hyp_mode()) {
                /* Stay away from hypervisor mode for non-VHE */
@@ -959,27 +1100,26 @@ static u64 etm4_get_ns_access_type(struct etmv4_config *config)
        return access_type;
 }
 
+/*
+ * Construct the exception level masks for a given config.
+ * This must be shifted to the corresponding register field
+ * for usage.
+ */
 static u64 etm4_get_access_type(struct etmv4_config *config)
 {
-       u64 access_type = etm4_get_ns_access_type(config);
-       u64 s_hyp = (config->arch & 0x0f) >= 0x4 ? ETM_EXLEVEL_S_HYP : 0;
-
-       /*
-        * EXLEVEL_S, bits[11:8], don't trace anything happening
-        * in secure state.
-        */
-       access_type |= (ETM_EXLEVEL_S_APP       |
-                       ETM_EXLEVEL_S_OS        |
-                       s_hyp                   |
-                       ETM_EXLEVEL_S_MON);
+       /* All Secure exception levels are excluded from the trace */
+       return etm4_get_ns_access_type(config) | (u64)config->s_ex_level;
+}
 
-       return access_type;
+static u64 etm4_get_comparator_access_type(struct etmv4_config *config)
+{
+       return etm4_get_access_type(config) << TRCACATR_EXLEVEL_SHIFT;
 }
 
 static void etm4_set_comparator_filter(struct etmv4_config *config,
                                       u64 start, u64 stop, int comparator)
 {
-       u64 access_type = etm4_get_access_type(config);
+       u64 access_type = etm4_get_comparator_access_type(config);
 
        /* First half of default address comparator */
        config->addr_val[comparator] = start;
@@ -1014,7 +1154,7 @@ static void etm4_set_start_stop_filter(struct etmv4_config *config,
                                       enum etm_addr_type type)
 {
        int shift;
-       u64 access_type = etm4_get_access_type(config);
+       u64 access_type = etm4_get_comparator_access_type(config);
 
        /* Configure the comparator */
        config->addr_val[comparator] = address;
@@ -1255,7 +1395,15 @@ static int etm4_cpu_save(struct etmv4_drvdata *drvdata)
 {
        int i, ret = 0;
        struct etmv4_save_state *state;
-       struct device *etm_dev = &drvdata->csdev->dev;
+       struct coresight_device *csdev = drvdata->csdev;
+       struct csdev_access *csa;
+       struct device *etm_dev;
+
+       if (WARN_ON(!csdev))
+               return -ENODEV;
+
+       etm_dev = &csdev->dev;
+       csa = &csdev->access;
 
        /*
         * As recommended by 3.4.1 ("The procedure when powering down the PE")
@@ -1264,14 +1412,12 @@ static int etm4_cpu_save(struct etmv4_drvdata *drvdata)
        dsb(sy);
        isb();
 
-       CS_UNLOCK(drvdata->base);
-
+       etm4_cs_unlock(drvdata, csa);
        /* Lock the OS lock to disable trace and external debugger access */
        etm4_os_lock(drvdata);
 
        /* wait for TRCSTATR.PMSTABLE to go up */
-       if (coresight_timeout(drvdata->base, TRCSTATR,
-                             TRCSTATR_PMSTABLE_BIT, 1)) {
+       if (coresight_timeout(csa, TRCSTATR, TRCSTATR_PMSTABLE_BIT, 1)) {
                dev_err(etm_dev,
                        "timeout while waiting for PM Stable Status\n");
                etm4_os_unlock(drvdata);
@@ -1281,55 +1427,56 @@ static int etm4_cpu_save(struct etmv4_drvdata *drvdata)
 
        state = drvdata->save_state;
 
-       state->trcprgctlr = readl(drvdata->base + TRCPRGCTLR);
+       state->trcprgctlr = etm4x_read32(csa, TRCPRGCTLR);
        if (drvdata->nr_pe)
-               state->trcprocselr = readl(drvdata->base + TRCPROCSELR);
-       state->trcconfigr = readl(drvdata->base + TRCCONFIGR);
-       state->trcauxctlr = readl(drvdata->base + TRCAUXCTLR);
-       state->trceventctl0r = readl(drvdata->base + TRCEVENTCTL0R);
-       state->trceventctl1r = readl(drvdata->base + TRCEVENTCTL1R);
-       state->trcstallctlr = readl(drvdata->base + TRCSTALLCTLR);
-       state->trctsctlr = readl(drvdata->base + TRCTSCTLR);
-       state->trcsyncpr = readl(drvdata->base + TRCSYNCPR);
-       state->trcccctlr = readl(drvdata->base + TRCCCCTLR);
-       state->trcbbctlr = readl(drvdata->base + TRCBBCTLR);
-       state->trctraceidr = readl(drvdata->base + TRCTRACEIDR);
-       state->trcqctlr = readl(drvdata->base + TRCQCTLR);
-
-       state->trcvictlr = readl(drvdata->base + TRCVICTLR);
-       state->trcviiectlr = readl(drvdata->base + TRCVIIECTLR);
-       state->trcvissctlr = readl(drvdata->base + TRCVISSCTLR);
+               state->trcprocselr = etm4x_read32(csa, TRCPROCSELR);
+       state->trcconfigr = etm4x_read32(csa, TRCCONFIGR);
+       state->trcauxctlr = etm4x_read32(csa, TRCAUXCTLR);
+       state->trceventctl0r = etm4x_read32(csa, TRCEVENTCTL0R);
+       state->trceventctl1r = etm4x_read32(csa, TRCEVENTCTL1R);
+       state->trcstallctlr = etm4x_read32(csa, TRCSTALLCTLR);
+       state->trctsctlr = etm4x_read32(csa, TRCTSCTLR);
+       state->trcsyncpr = etm4x_read32(csa, TRCSYNCPR);
+       state->trcccctlr = etm4x_read32(csa, TRCCCCTLR);
+       state->trcbbctlr = etm4x_read32(csa, TRCBBCTLR);
+       state->trctraceidr = etm4x_read32(csa, TRCTRACEIDR);
+       state->trcqctlr = etm4x_read32(csa, TRCQCTLR);
+
+       state->trcvictlr = etm4x_read32(csa, TRCVICTLR);
+       state->trcviiectlr = etm4x_read32(csa, TRCVIIECTLR);
+       state->trcvissctlr = etm4x_read32(csa, TRCVISSCTLR);
        if (drvdata->nr_pe_cmp)
-               state->trcvipcssctlr = readl(drvdata->base + TRCVIPCSSCTLR);
-       state->trcvdctlr = readl(drvdata->base + TRCVDCTLR);
-       state->trcvdsacctlr = readl(drvdata->base + TRCVDSACCTLR);
-       state->trcvdarcctlr = readl(drvdata->base + TRCVDARCCTLR);
+               state->trcvipcssctlr = etm4x_read32(csa, TRCVIPCSSCTLR);
+       state->trcvdctlr = etm4x_read32(csa, TRCVDCTLR);
+       state->trcvdsacctlr = etm4x_read32(csa, TRCVDSACCTLR);
+       state->trcvdarcctlr = etm4x_read32(csa, TRCVDARCCTLR);
 
        for (i = 0; i < drvdata->nrseqstate - 1; i++)
-               state->trcseqevr[i] = readl(drvdata->base + TRCSEQEVRn(i));
+               state->trcseqevr[i] = etm4x_read32(csa, TRCSEQEVRn(i));
 
-       state->trcseqrstevr = readl(drvdata->base + TRCSEQRSTEVR);
-       state->trcseqstr = readl(drvdata->base + TRCSEQSTR);
-       state->trcextinselr = readl(drvdata->base + TRCEXTINSELR);
+       state->trcseqrstevr = etm4x_read32(csa, TRCSEQRSTEVR);
+       state->trcseqstr = etm4x_read32(csa, TRCSEQSTR);
+       state->trcextinselr = etm4x_read32(csa, TRCEXTINSELR);
 
        for (i = 0; i < drvdata->nr_cntr; i++) {
-               state->trccntrldvr[i] = readl(drvdata->base + TRCCNTRLDVRn(i));
-               state->trccntctlr[i] = readl(drvdata->base + TRCCNTCTLRn(i));
-               state->trccntvr[i] = readl(drvdata->base + TRCCNTVRn(i));
+               state->trccntrldvr[i] = etm4x_read32(csa, TRCCNTRLDVRn(i));
+               state->trccntctlr[i] = etm4x_read32(csa, TRCCNTCTLRn(i));
+               state->trccntvr[i] = etm4x_read32(csa, TRCCNTVRn(i));
        }
 
        for (i = 0; i < drvdata->nr_resource * 2; i++)
-               state->trcrsctlr[i] = readl(drvdata->base + TRCRSCTLRn(i));
+               state->trcrsctlr[i] = etm4x_read32(csa, TRCRSCTLRn(i));
 
        for (i = 0; i < drvdata->nr_ss_cmp; i++) {
-               state->trcssccr[i] = readl(drvdata->base + TRCSSCCRn(i));
-               state->trcsscsr[i] = readl(drvdata->base + TRCSSCSRn(i));
-               state->trcsspcicr[i] = readl(drvdata->base + TRCSSPCICRn(i));
+               state->trcssccr[i] = etm4x_read32(csa, TRCSSCCRn(i));
+               state->trcsscsr[i] = etm4x_read32(csa, TRCSSCSRn(i));
+               if (etm4x_sspcicrn_present(drvdata, i))
+                       state->trcsspcicr[i] = etm4x_read32(csa, TRCSSPCICRn(i));
        }
 
        for (i = 0; i < drvdata->nr_addr_cmp * 2; i++) {
-               state->trcacvr[i] = readq(drvdata->base + TRCACVRn(i));
-               state->trcacatr[i] = readq(drvdata->base + TRCACATRn(i));
+               state->trcacvr[i] = etm4x_read64(csa, TRCACVRn(i));
+               state->trcacatr[i] = etm4x_read64(csa, TRCACATRn(i));
        }
 
        /*
@@ -1340,25 +1487,26 @@ static int etm4_cpu_save(struct etmv4_drvdata *drvdata)
         */
 
        for (i = 0; i < drvdata->numcidc; i++)
-               state->trccidcvr[i] = readq(drvdata->base + TRCCIDCVRn(i));
+               state->trccidcvr[i] = etm4x_read64(csa, TRCCIDCVRn(i));
 
        for (i = 0; i < drvdata->numvmidc; i++)
-               state->trcvmidcvr[i] = readq(drvdata->base + TRCVMIDCVRn(i));
+               state->trcvmidcvr[i] = etm4x_read64(csa, TRCVMIDCVRn(i));
 
-       state->trccidcctlr0 = readl(drvdata->base + TRCCIDCCTLR0);
+       state->trccidcctlr0 = etm4x_read32(csa, TRCCIDCCTLR0);
        if (drvdata->numcidc > 4)
-               state->trccidcctlr1 = readl(drvdata->base + TRCCIDCCTLR1);
+               state->trccidcctlr1 = etm4x_read32(csa, TRCCIDCCTLR1);
 
-       state->trcvmidcctlr0 = readl(drvdata->base + TRCVMIDCCTLR0);
+       state->trcvmidcctlr0 = etm4x_read32(csa, TRCVMIDCCTLR0);
        if (drvdata->numvmidc > 4)
-               state->trcvmidcctlr1 = readl(drvdata->base + TRCVMIDCCTLR1);
+               state->trcvmidcctlr0 = etm4x_read32(csa, TRCVMIDCCTLR1);
 
-       state->trcclaimset = readl(drvdata->base + TRCCLAIMCLR);
+       state->trcclaimset = etm4x_read32(csa, TRCCLAIMCLR);
 
-       state->trcpdcr = readl(drvdata->base + TRCPDCR);
+       if (!drvdata->skip_power_up)
+               state->trcpdcr = etm4x_read32(csa, TRCPDCR);
 
        /* wait for TRCSTATR.IDLE to go up */
-       if (coresight_timeout(drvdata->base, TRCSTATR, TRCSTATR_IDLE_BIT, 1)) {
+       if (coresight_timeout(csa, TRCSTATR, TRCSTATR_IDLE_BIT, 1)) {
                dev_err(etm_dev,
                        "timeout while waiting for Idle Trace Status\n");
                etm4_os_unlock(drvdata);
@@ -1373,11 +1521,11 @@ static int etm4_cpu_save(struct etmv4_drvdata *drvdata)
         * potentially save power on systems that respect the TRCPDCR_PU
         * despite requesting software to save/restore state.
         */
-       writel_relaxed((state->trcpdcr & ~TRCPDCR_PU),
-                       drvdata->base + TRCPDCR);
-
+       if (!drvdata->skip_power_up)
+               etm4x_relaxed_write32(csa, (state->trcpdcr & ~TRCPDCR_PU),
+                                     TRCPDCR);
 out:
-       CS_LOCK(drvdata->base);
+       etm4_cs_lock(drvdata, csa);
        return ret;
 }
 
@@ -1385,91 +1533,82 @@ static void etm4_cpu_restore(struct etmv4_drvdata *drvdata)
 {
        int i;
        struct etmv4_save_state *state = drvdata->save_state;
+       struct csdev_access tmp_csa = CSDEV_ACCESS_IOMEM(drvdata->base);
+       struct csdev_access *csa = &tmp_csa;
 
-       CS_UNLOCK(drvdata->base);
-
-       writel_relaxed(state->trcclaimset, drvdata->base + TRCCLAIMSET);
+       etm4_cs_unlock(drvdata, csa);
+       etm4x_relaxed_write32(csa, state->trcclaimset, TRCCLAIMSET);
 
-       writel_relaxed(state->trcprgctlr, drvdata->base + TRCPRGCTLR);
+       etm4x_relaxed_write32(csa, state->trcprgctlr, TRCPRGCTLR);
        if (drvdata->nr_pe)
-               writel_relaxed(state->trcprocselr, drvdata->base + TRCPROCSELR);
-       writel_relaxed(state->trcconfigr, drvdata->base + TRCCONFIGR);
-       writel_relaxed(state->trcauxctlr, drvdata->base + TRCAUXCTLR);
-       writel_relaxed(state->trceventctl0r, drvdata->base + TRCEVENTCTL0R);
-       writel_relaxed(state->trceventctl1r, drvdata->base + TRCEVENTCTL1R);
-       writel_relaxed(state->trcstallctlr, drvdata->base + TRCSTALLCTLR);
-       writel_relaxed(state->trctsctlr, drvdata->base + TRCTSCTLR);
-       writel_relaxed(state->trcsyncpr, drvdata->base + TRCSYNCPR);
-       writel_relaxed(state->trcccctlr, drvdata->base + TRCCCCTLR);
-       writel_relaxed(state->trcbbctlr, drvdata->base + TRCBBCTLR);
-       writel_relaxed(state->trctraceidr, drvdata->base + TRCTRACEIDR);
-       writel_relaxed(state->trcqctlr, drvdata->base + TRCQCTLR);
-
-       writel_relaxed(state->trcvictlr, drvdata->base + TRCVICTLR);
-       writel_relaxed(state->trcviiectlr, drvdata->base + TRCVIIECTLR);
-       writel_relaxed(state->trcvissctlr, drvdata->base + TRCVISSCTLR);
+               etm4x_relaxed_write32(csa, state->trcprocselr, TRCPROCSELR);
+       etm4x_relaxed_write32(csa, state->trcconfigr, TRCCONFIGR);
+       etm4x_relaxed_write32(csa, state->trcauxctlr, TRCAUXCTLR);
+       etm4x_relaxed_write32(csa, state->trceventctl0r, TRCEVENTCTL0R);
+       etm4x_relaxed_write32(csa, state->trceventctl1r, TRCEVENTCTL1R);
+       etm4x_relaxed_write32(csa, state->trcstallctlr, TRCSTALLCTLR);
+       etm4x_relaxed_write32(csa, state->trctsctlr, TRCTSCTLR);
+       etm4x_relaxed_write32(csa, state->trcsyncpr, TRCSYNCPR);
+       etm4x_relaxed_write32(csa, state->trcccctlr, TRCCCCTLR);
+       etm4x_relaxed_write32(csa, state->trcbbctlr, TRCBBCTLR);
+       etm4x_relaxed_write32(csa, state->trctraceidr, TRCTRACEIDR);
+       etm4x_relaxed_write32(csa, state->trcqctlr, TRCQCTLR);
+
+       etm4x_relaxed_write32(csa, state->trcvictlr, TRCVICTLR);
+       etm4x_relaxed_write32(csa, state->trcviiectlr, TRCVIIECTLR);
+       etm4x_relaxed_write32(csa, state->trcvissctlr, TRCVISSCTLR);
        if (drvdata->nr_pe_cmp)
-               writel_relaxed(state->trcvipcssctlr, drvdata->base + TRCVIPCSSCTLR);
-       writel_relaxed(state->trcvdctlr, drvdata->base + TRCVDCTLR);
-       writel_relaxed(state->trcvdsacctlr, drvdata->base + TRCVDSACCTLR);
-       writel_relaxed(state->trcvdarcctlr, drvdata->base + TRCVDARCCTLR);
+               etm4x_relaxed_write32(csa, state->trcvipcssctlr, TRCVIPCSSCTLR);
+       etm4x_relaxed_write32(csa, state->trcvdctlr, TRCVDCTLR);
+       etm4x_relaxed_write32(csa, state->trcvdsacctlr, TRCVDSACCTLR);
+       etm4x_relaxed_write32(csa, state->trcvdarcctlr, TRCVDARCCTLR);
 
        for (i = 0; i < drvdata->nrseqstate - 1; i++)
-               writel_relaxed(state->trcseqevr[i],
-                              drvdata->base + TRCSEQEVRn(i));
+               etm4x_relaxed_write32(csa, state->trcseqevr[i], TRCSEQEVRn(i));
 
-       writel_relaxed(state->trcseqrstevr, drvdata->base + TRCSEQRSTEVR);
-       writel_relaxed(state->trcseqstr, drvdata->base + TRCSEQSTR);
-       writel_relaxed(state->trcextinselr, drvdata->base + TRCEXTINSELR);
+       etm4x_relaxed_write32(csa, state->trcseqrstevr, TRCSEQRSTEVR);
+       etm4x_relaxed_write32(csa, state->trcseqstr, TRCSEQSTR);
+       etm4x_relaxed_write32(csa, state->trcextinselr, TRCEXTINSELR);
 
        for (i = 0; i < drvdata->nr_cntr; i++) {
-               writel_relaxed(state->trccntrldvr[i],
-                              drvdata->base + TRCCNTRLDVRn(i));
-               writel_relaxed(state->trccntctlr[i],
-                              drvdata->base + TRCCNTCTLRn(i));
-               writel_relaxed(state->trccntvr[i],
-                              drvdata->base + TRCCNTVRn(i));
+               etm4x_relaxed_write32(csa, state->trccntrldvr[i], TRCCNTRLDVRn(i));
+               etm4x_relaxed_write32(csa, state->trccntctlr[i], TRCCNTCTLRn(i));
+               etm4x_relaxed_write32(csa, state->trccntvr[i], TRCCNTVRn(i));
        }
 
        for (i = 0; i < drvdata->nr_resource * 2; i++)
-               writel_relaxed(state->trcrsctlr[i],
-                              drvdata->base + TRCRSCTLRn(i));
+               etm4x_relaxed_write32(csa, state->trcrsctlr[i], TRCRSCTLRn(i));
 
        for (i = 0; i < drvdata->nr_ss_cmp; i++) {
-               writel_relaxed(state->trcssccr[i],
-                              drvdata->base + TRCSSCCRn(i));
-               writel_relaxed(state->trcsscsr[i],
-                              drvdata->base + TRCSSCSRn(i));
-               writel_relaxed(state->trcsspcicr[i],
-                              drvdata->base + TRCSSPCICRn(i));
+               etm4x_relaxed_write32(csa, state->trcssccr[i], TRCSSCCRn(i));
+               etm4x_relaxed_write32(csa, state->trcsscsr[i], TRCSSCSRn(i));
+               if (etm4x_sspcicrn_present(drvdata, i))
+                       etm4x_relaxed_write32(csa, state->trcsspcicr[i], TRCSSPCICRn(i));
        }
 
        for (i = 0; i < drvdata->nr_addr_cmp * 2; i++) {
-               writeq_relaxed(state->trcacvr[i],
-                              drvdata->base + TRCACVRn(i));
-               writeq_relaxed(state->trcacatr[i],
-                              drvdata->base + TRCACATRn(i));
+               etm4x_relaxed_write64(csa, state->trcacvr[i], TRCACVRn(i));
+               etm4x_relaxed_write64(csa, state->trcacatr[i], TRCACATRn(i));
        }
 
        for (i = 0; i < drvdata->numcidc; i++)
-               writeq_relaxed(state->trccidcvr[i],
-                              drvdata->base + TRCCIDCVRn(i));
+               etm4x_relaxed_write64(csa, state->trccidcvr[i], TRCCIDCVRn(i));
 
        for (i = 0; i < drvdata->numvmidc; i++)
-               writeq_relaxed(state->trcvmidcvr[i],
-                              drvdata->base + TRCVMIDCVRn(i));
+               etm4x_relaxed_write64(csa, state->trcvmidcvr[i], TRCVMIDCVRn(i));
 
-       writel_relaxed(state->trccidcctlr0, drvdata->base + TRCCIDCCTLR0);
+       etm4x_relaxed_write32(csa, state->trccidcctlr0, TRCCIDCCTLR0);
        if (drvdata->numcidc > 4)
-               writel_relaxed(state->trccidcctlr1, drvdata->base + TRCCIDCCTLR1);
+               etm4x_relaxed_write32(csa, state->trccidcctlr1, TRCCIDCCTLR1);
 
-       writel_relaxed(state->trcvmidcctlr0, drvdata->base + TRCVMIDCCTLR0);
+       etm4x_relaxed_write32(csa, state->trcvmidcctlr0, TRCVMIDCCTLR0);
        if (drvdata->numvmidc > 4)
-               writel_relaxed(state->trcvmidcctlr1, drvdata->base + TRCVMIDCCTLR1);
+               etm4x_relaxed_write32(csa, state->trcvmidcctlr0, TRCVMIDCCTLR1);
 
-       writel_relaxed(state->trcclaimset, drvdata->base + TRCCLAIMSET);
+       etm4x_relaxed_write32(csa, state->trcclaimset, TRCCLAIMSET);
 
-       writel_relaxed(state->trcpdcr, drvdata->base + TRCPDCR);
+       if (!drvdata->skip_power_up)
+               etm4x_relaxed_write32(csa, state->trcpdcr, TRCPDCR);
 
        drvdata->state_needs_restore = false;
 
@@ -1482,7 +1621,7 @@ static void etm4_cpu_restore(struct etmv4_drvdata *drvdata)
 
        /* Unlock the OS lock to re-enable trace and external debug access */
        etm4_os_unlock(drvdata);
-       CS_LOCK(drvdata->base);
+       etm4_cs_lock(drvdata, csa);
 }
 
 static int etm4_cpu_pm_notify(struct notifier_block *nb, unsigned long cmd,
@@ -1569,15 +1708,13 @@ static void etm4_pm_clear(void)
        }
 }
 
-static int etm4_probe(struct amba_device *adev, const struct amba_id *id)
+static int etm4_probe(struct device *dev, void __iomem *base, u32 etm_pid)
 {
        int ret;
-       void __iomem *base;
-       struct device *dev = &adev->dev;
        struct coresight_platform_data *pdata = NULL;
        struct etmv4_drvdata *drvdata;
-       struct resource *res = &adev->res;
        struct coresight_desc desc = { 0 };
+       struct etm4_init_arg init_arg = { 0 };
 
        drvdata = devm_kzalloc(dev, sizeof(*drvdata), GFP_KERNEL);
        if (!drvdata)
@@ -1599,11 +1736,6 @@ static int etm4_probe(struct amba_device *adev, const struct amba_id *id)
        if (fwnode_property_present(dev_fwnode(dev), "qcom,skip-power-up"))
                drvdata->skip_power_up = true;
 
-       /* Validity for the resource is already checked by the AMBA core */
-       base = devm_ioremap_resource(dev, res);
-       if (IS_ERR(base))
-               return PTR_ERR(base);
-
        drvdata->base = base;
 
        spin_lock_init(&drvdata->spinlock);
@@ -1616,11 +1748,14 @@ static int etm4_probe(struct amba_device *adev, const struct amba_id *id)
        if (!desc.name)
                return -ENOMEM;
 
+       init_arg.drvdata = drvdata;
+       init_arg.csa = &desc.access;
+
        if (smp_call_function_single(drvdata->cpu,
-                               etm4_init_arch_data,  drvdata, 1))
+                               etm4_init_arch_data,  &init_arg, 1))
                dev_err(dev, "ETM arch init failed\n");
 
-       if (etm4_arch_supported(drvdata->arch) == false)
+       if (!drvdata->arch)
                return -EINVAL;
 
        etm4_init_trace_id(drvdata);
@@ -1630,7 +1765,7 @@ static int etm4_probe(struct amba_device *adev, const struct amba_id *id)
        if (IS_ERR(pdata))
                return PTR_ERR(pdata);
 
-       adev->dev.platform_data = pdata;
+       dev->platform_data = pdata;
 
        desc.type = CORESIGHT_DEV_TYPE_SOURCE;
        desc.subtype.source_subtype = CORESIGHT_DEV_SUBTYPE_SOURCE_PROC;
@@ -1650,25 +1785,44 @@ static int etm4_probe(struct amba_device *adev, const struct amba_id *id)
 
        etmdrvdata[drvdata->cpu] = drvdata;
 
-       pm_runtime_put(&adev->dev);
        dev_info(&drvdata->csdev->dev, "CPU%d: ETM v%d.%d initialized\n",
-                drvdata->cpu, drvdata->arch >> 4, drvdata->arch & 0xf);
+                drvdata->cpu, ETM_ARCH_MAJOR_VERSION(drvdata->arch),
+                ETM_ARCH_MINOR_VERSION(drvdata->arch));
 
        if (boot_enable) {
                coresight_enable(drvdata->csdev);
                drvdata->boot_enable = true;
        }
 
-       etm4_check_arch_features(drvdata, id->id);
+       etm4_check_arch_features(drvdata, etm_pid);
 
        return 0;
 }
 
+static int etm4_probe_amba(struct amba_device *adev, const struct amba_id *id)
+{
+       void __iomem *base;
+       struct device *dev = &adev->dev;
+       struct resource *res = &adev->res;
+       int ret;
+
+       /* Validity for the resource is already checked by the AMBA core */
+       base = devm_ioremap_resource(dev, res);
+       if (IS_ERR(base))
+               return PTR_ERR(base);
+
+       ret = etm4_probe(dev, base, id->id);
+       if (!ret)
+               pm_runtime_put(&adev->dev);
+
+       return ret;
+}
+
 static struct amba_cs_uci_id uci_id_etm4[] = {
        {
                /*  ETMv4 UCI data */
-               .devarch        = 0x47704a13,
-               .devarch_mask   = 0xfff0ffff,
+               .devarch        = ETM_DEVARCH_ETMv4x_ARCH,
+               .devarch_mask   = ETM_DEVARCH_ID_MASK,
                .devtype        = 0x00000013,
        }
 };
@@ -1680,15 +1834,12 @@ static void clear_etmdrvdata(void *info)
        etmdrvdata[cpu] = NULL;
 }
 
-static int etm4_remove(struct amba_device *adev)
+static int __exit etm4_remove_dev(struct etmv4_drvdata *drvdata)
 {
-       struct etmv4_drvdata *drvdata = dev_get_drvdata(&adev->dev);
-
        etm_perf_symlink(drvdata->csdev, false);
-
        /*
-        * Taking hotplug lock here to avoid racing between etm4_remove and
-        * CPU hotplug call backs.
+        * Taking hotplug lock here to avoid racing between etm4_remove_dev()
+        * and CPU hotplug call backs.
         */
        cpus_read_lock();
        /*
@@ -1707,12 +1858,23 @@ static int etm4_remove(struct amba_device *adev)
        return 0;
 }
 
+static int __exit etm4_remove_amba(struct amba_device *adev)
+{
+       struct etmv4_drvdata *drvdata = dev_get_drvdata(&adev->dev);
+
+       if (drvdata)
+               return etm4_remove_dev(drvdata);
+       return 0;
+}
+
 static const struct amba_id etm4_ids[] = {
        CS_AMBA_ID(0x000bb95d),                 /* Cortex-A53 */
        CS_AMBA_ID(0x000bb95e),                 /* Cortex-A57 */
        CS_AMBA_ID(0x000bb95a),                 /* Cortex-A72 */
        CS_AMBA_ID(0x000bb959),                 /* Cortex-A73 */
        CS_AMBA_UCI_ID(0x000bb9da, uci_id_etm4),/* Cortex-A35 */
+       CS_AMBA_UCI_ID(0x000bbd05, uci_id_etm4),/* Cortex-A55 */
+       CS_AMBA_UCI_ID(0x000bbd0a, uci_id_etm4),/* Cortex-A75 */
        CS_AMBA_UCI_ID(0x000bbd0c, uci_id_etm4),/* Neoverse N1 */
        CS_AMBA_UCI_ID(0x000f0205, uci_id_etm4),/* Qualcomm Kryo */
        CS_AMBA_UCI_ID(0x000f0211, uci_id_etm4),/* Qualcomm Kryo */
@@ -1728,14 +1890,14 @@ static const struct amba_id etm4_ids[] = {
 
 MODULE_DEVICE_TABLE(amba, etm4_ids);
 
-static struct amba_driver etm4x_driver = {
+static struct amba_driver etm4x_amba_driver = {
        .drv = {
                .name   = "coresight-etm4x",
                .owner  = THIS_MODULE,
                .suppress_bind_attrs = true,
        },
-       .probe          = etm4_probe,
-       .remove         = etm4_remove,
+       .probe          = etm4_probe_amba,
+       .remove         = etm4_remove_amba,
        .id_table       = etm4_ids,
 };
 
@@ -1749,7 +1911,7 @@ static int __init etm4x_init(void)
        if (ret)
                return ret;
 
-       ret = amba_driver_register(&etm4x_driver);
+       ret = amba_driver_register(&etm4x_amba_driver);
        if (ret) {
                pr_err("Error registering etm4x driver\n");
                etm4_pm_clear();
@@ -1760,7 +1922,7 @@ static int __init etm4x_init(void)
 
 static void __exit etm4x_exit(void)
 {
-       amba_driver_unregister(&etm4x_driver);
+       amba_driver_unregister(&etm4x_amba_driver);
        etm4_pm_clear();
 }