Message ID | 20220319062833.3136528-6-jane.chu@oracle.com (mailing list archive) |
---|---|
State | New, archived |
Headers | show |
Series | DAX poison recovery | expand |
> -static void hwpoison_clear(struct pmem_device *pmem, > - phys_addr_t phys, unsigned int len) > +static phys_addr_t to_phys(struct pmem_device *pmem, phys_addr_t offset) > { > + return pmem->phys_addr + offset; > +} > + > +static sector_t to_sect(struct pmem_device *pmem, phys_addr_t offset) > +{ > + return (offset - pmem->data_offset) / 512; > +} > + > +static phys_addr_t to_offset(struct pmem_device *pmem, sector_t sector) > +{ > + return sector * 512 + pmem->data_offset; > +} The multiplicate / divison using 512 could use shifts using SECTOR_SHIFT. > + > +static void clear_hwpoison(struct pmem_device *pmem, phys_addr_t offset, > + unsigned int len) > +static void clear_bb(struct pmem_device *pmem, sector_t sector, long blks) All these functions lack a pmem_ prefix. > +static blk_status_t __pmem_clear_poison(struct pmem_device *pmem, > + phys_addr_t offset, unsigned int len, > + unsigned int *blks) > +{ > + phys_addr_t phys = to_phys(pmem, offset); > long cleared; > + blk_status_t rc; > > + cleared = nvdimm_clear_poison(to_dev(pmem), phys, len); > + *blks = cleared / 512; > + rc = (cleared < len) ? BLK_STS_IOERR : BLK_STS_OK; > + if (cleared <= 0 || *blks == 0) > + return rc; This look odd. I think just returing the cleared byte value would make much more sense: static long __pmem_clear_poison(struct pmem_device *pmem, phys_addr_t offset, unsigned int len) { long cleared = nvdimm_clear_poison(to_dev(pmem), phys, len); if (cleared > 0) { clear_hwpoison(pmem, offset, cleared); arch_invalidate_pmem(pmem->virt_addr + offset, len); } return cleared; }
On 3/22/2022 1:53 AM, Christoph Hellwig wrote: >> -static void hwpoison_clear(struct pmem_device *pmem, >> - phys_addr_t phys, unsigned int len) >> +static phys_addr_t to_phys(struct pmem_device *pmem, phys_addr_t offset) >> { >> + return pmem->phys_addr + offset; >> +} >> + >> +static sector_t to_sect(struct pmem_device *pmem, phys_addr_t offset) >> +{ >> + return (offset - pmem->data_offset) / 512; >> +} >> + >> +static phys_addr_t to_offset(struct pmem_device *pmem, sector_t sector) >> +{ >> + return sector * 512 + pmem->data_offset; >> +} > > The multiplicate / divison using 512 could use shifts using > SECTOR_SHIFT. Nice, will do. > >> + >> +static void clear_hwpoison(struct pmem_device *pmem, phys_addr_t offset, >> + unsigned int len) > >> +static void clear_bb(struct pmem_device *pmem, sector_t sector, long blks) > > All these functions lack a pmem_ prefix. Did you mean all of the helpers or just "clear_hwpoison" and "clear_bb"? The reason I ask is that there are existing static helpers without pmem_ prefix, just short function names. > >> +static blk_status_t __pmem_clear_poison(struct pmem_device *pmem, >> + phys_addr_t offset, unsigned int len, >> + unsigned int *blks) >> +{ >> + phys_addr_t phys = to_phys(pmem, offset); >> long cleared; >> + blk_status_t rc; >> >> + cleared = nvdimm_clear_poison(to_dev(pmem), phys, len); >> + *blks = cleared / 512; >> + rc = (cleared < len) ? BLK_STS_IOERR : BLK_STS_OK; >> + if (cleared <= 0 || *blks == 0) >> + return rc; > > This look odd. I think just returing the cleared byte value would > make much more sense: > > static long __pmem_clear_poison(struct pmem_device *pmem, > phys_addr_t offset, unsigned int len) > { > long cleared = nvdimm_clear_poison(to_dev(pmem), phys, len); > > if (cleared > 0) { > clear_hwpoison(pmem, offset, cleared); > arch_invalidate_pmem(pmem->virt_addr + offset, len); > } > > return cleared; > } Yes, this is cleaner, will do. Thanks! -jane
diff --git a/drivers/nvdimm/pmem.c b/drivers/nvdimm/pmem.c index 7cdaa279beca..18f357fbef69 100644 --- a/drivers/nvdimm/pmem.c +++ b/drivers/nvdimm/pmem.c @@ -45,10 +45,27 @@ static struct nd_region *to_region(struct pmem_device *pmem) return to_nd_region(to_dev(pmem)->parent); } -static void hwpoison_clear(struct pmem_device *pmem, - phys_addr_t phys, unsigned int len) +static phys_addr_t to_phys(struct pmem_device *pmem, phys_addr_t offset) { + return pmem->phys_addr + offset; +} + +static sector_t to_sect(struct pmem_device *pmem, phys_addr_t offset) +{ + return (offset - pmem->data_offset) / 512; +} + +static phys_addr_t to_offset(struct pmem_device *pmem, sector_t sector) +{ + return sector * 512 + pmem->data_offset; +} + +static void clear_hwpoison(struct pmem_device *pmem, phys_addr_t offset, + unsigned int len) +{ + phys_addr_t phys = to_phys(pmem, offset); unsigned long pfn_start, pfn_end, pfn; + unsigned int blks = len / 512; /* only pmem in the linear map supports HWPoison */ if (is_vmalloc_addr(pmem->virt_addr)) @@ -67,33 +84,47 @@ static void hwpoison_clear(struct pmem_device *pmem, if (test_and_clear_pmem_poison(page)) clear_mce_nospec(pfn); } + + dev_dbg(to_dev(pmem), "%#llx clear %u sector%s\n", + (unsigned long long) to_sect(pmem, offset), blks, + blks > 1 ? "s" : ""); } -static blk_status_t pmem_clear_poison(struct pmem_device *pmem, - phys_addr_t offset, unsigned int len) +static void clear_bb(struct pmem_device *pmem, sector_t sector, long blks) { - struct device *dev = to_dev(pmem); - sector_t sector; + badblocks_clear(&pmem->bb, sector, blks); + if (pmem->bb_state) + sysfs_notify_dirent(pmem->bb_state); +} + +static blk_status_t __pmem_clear_poison(struct pmem_device *pmem, + phys_addr_t offset, unsigned int len, + unsigned int *blks) +{ + phys_addr_t phys = to_phys(pmem, offset); long cleared; - blk_status_t rc = BLK_STS_OK; - - sector = (offset - pmem->data_offset) / 512; - - cleared = nvdimm_clear_poison(dev, pmem->phys_addr + offset, len); - if (cleared < len) - rc = BLK_STS_IOERR; - if (cleared > 0 && cleared / 512) { - hwpoison_clear(pmem, pmem->phys_addr + offset, cleared); - cleared /= 512; - dev_dbg(dev, "%#llx clear %ld sector%s\n", - (unsigned long long) sector, cleared, - cleared > 1 ? "s" : ""); - badblocks_clear(&pmem->bb, sector, cleared); - if (pmem->bb_state) - sysfs_notify_dirent(pmem->bb_state); - } + blk_status_t rc; + cleared = nvdimm_clear_poison(to_dev(pmem), phys, len); + *blks = cleared / 512; + rc = (cleared < len) ? BLK_STS_IOERR : BLK_STS_OK; + if (cleared <= 0 || *blks == 0) + return rc; + + clear_hwpoison(pmem, offset, cleared); arch_invalidate_pmem(pmem->virt_addr + offset, len); + return rc; +} + +static blk_status_t pmem_clear_poison(struct pmem_device *pmem, + phys_addr_t offset, unsigned int len) +{ + unsigned int blks; + blk_status_t rc; + + rc = __pmem_clear_poison(pmem, offset, len, &blks); + if (blks > 0) + clear_bb(pmem, to_sect(pmem, offset), blks); return rc; } @@ -143,7 +174,7 @@ static blk_status_t pmem_do_read(struct pmem_device *pmem, sector_t sector, unsigned int len) { blk_status_t rc; - phys_addr_t pmem_off = sector * 512 + pmem->data_offset; + phys_addr_t pmem_off = to_offset(pmem, sector); void *pmem_addr = pmem->virt_addr + pmem_off; if (unlikely(is_bad_pmem(&pmem->bb, sector, len))) @@ -158,7 +189,7 @@ static blk_status_t pmem_do_write(struct pmem_device *pmem, struct page *page, unsigned int page_off, sector_t sector, unsigned int len) { - phys_addr_t pmem_off = sector * 512 + pmem->data_offset; + phys_addr_t pmem_off = to_offset(pmem, sector); void *pmem_addr = pmem->virt_addr + pmem_off; if (unlikely(is_bad_pmem(&pmem->bb, sector, len))) {
Refactor the pmem_clear_poison() in order to share common code later. Signed-off-by: Jane Chu <jane.chu@oracle.com> --- drivers/nvdimm/pmem.c | 81 ++++++++++++++++++++++++++++++------------- 1 file changed, 56 insertions(+), 25 deletions(-)