From 0f2b6eb4ef0c24d668fd8310e632b53deebbc970 Mon Sep 17 00:00:00 2001 From: Taylor R Campbell Date: Sun, 13 Feb 2022 13:57:22 +0000 Subject: [PATCH] acpi_pcc(4): Membar audit. - When submitting a command, use atomic_store_release so that the command we're submitting is initialized before we clear the status bits allowing it to proceed. The previous ordering -- membar_sync and then store status bits -- was correct, but membar_sync is stronger than necessary. - When waiting for a command to complete, use atomic_load_acquire to read the status, so that whatever memory operations were involved in the command's execution happen before all memory operations dependent on the status being completed. The previous ordering -- membar_sync and then load status bits -- would fail to guarantee this memory ordering, and membar_sync is stronger than necessary. No need for membar_sync because there's no store-before-load ordering required anywhere here. --- sys/dev/acpi/acpi_pcc.c | 14 ++++++++------ 1 file changed, 8 insertions(+), 6 deletions(-) diff --git a/sys/dev/acpi/acpi_pcc.c b/sys/dev/acpi/acpi_pcc.c index 0d9c0c618624..f79a53c41313 100644 --- a/sys/dev/acpi/acpi_pcc.c +++ b/sys/dev/acpi/acpi_pcc.c @@ -43,7 +43,6 @@ __KERNEL_RCSID(0, "$NetBSD: acpi_pcc.c,v 1.1 2020/12/13 20:27:53 jmcneill Exp $" #include #include -#define PCC_MEMORY_BARRIER() membar_sync() #if defined(__aarch64__) #define PCC_DMA_BARRIER() __asm __volatile("dsb sy" ::: "memory") #else @@ -221,8 +220,8 @@ pcc_wait_command(struct pcc_subspace *ss, bool first) shmem = ss->ss_data; retry = imax(1000, ss->ss_turnaround + ss->ss_latency * 100); while (retry > 0) { - PCC_MEMORY_BARRIER(); - if ((shmem->Status & PCC_STATUS_COMMAND_COMPLETE) != 0) + if ((atomic_load_acquire(&shmem->Status) & + PCC_STATUS_COMMAND_COMPLETE) != 0) return AE_OK; delay(10); retry -= 10; @@ -266,6 +265,7 @@ pcc_send_command(struct pcc_subspace *ss, ACPI_GENERIC_ADDRESS *reg, volatile ACPI_PCCT_SHARED_MEMORY *shmem = ss->ss_data; uint8_t *data = __UNVOLATILE(shmem + 1); UINT64 tmp, mask; + UINT16 status; KASSERT(ss->ss_type == ACPI_PCCT_TYPE_GENERIC_SUBSPACE || ss->ss_type == ACPI_PCCT_TYPE_HW_REDUCED_SUBSPACE || @@ -281,9 +281,11 @@ pcc_send_command(struct pcc_subspace *ss, ACPI_GENERIC_ADDRESS *reg, tmp |= __SHIFTIN(val, mask); ACPI_MOVE_64_TO_64(data + reg->Address, &tmp); } - PCC_MEMORY_BARRIER(); - shmem->Status &= ~(PCC_STATUS_COMMAND_COMPLETE | - PCC_STATUS_COMMAND_ERROR); + status = shmem->Status; + status &= ~PCC_STATUS_COMMAND_COMPLETE; + status &= ~PCC_STATUS_COMMAND_ERROR; + atomic_store_release(&shmem->Status, status); + PCC_DMA_BARRIER(); return pcc_doorbell(&ss->ss_doorbell_reg);