Commit 20d48595 authored by Masahiro Yamada's avatar Masahiro Yamada Committed by Boris Brezillon

mtd: nand: denali: fix bitflips calculation in handle_ecc()

This function is wrong in multiple ways:

[1] Counting corrected bytes instead of corrected bits.

The following code is counting the number of corrected _bytes_.

    /* correct the ECC error */
    buf[offset] ^= err_cor_value;
    mtd->ecc_stats.corrected++;
    bitflips++;

What the core framework expects is the number of corrected _bits_.
They can be different if multiple bitflips occur within one byte.

[2] total number of errors instead of max of per-sector errors

The core framework expects that corrected errors are counted per
sector, then the max value should be taken.  The current code simply
iterates over the whole page, i.e. counts the total number of
correction in the page.  This means "too many bitflips" is triggered
earlier than it should be, i.e. the NAND device is worn out sooner.

Besides those bugs, this function is unreadable due to the deep
nesting.  Notice the whole code in this function is wrapped in
if (irq_status & INTR__ECC_ERR), so this conditional can be moved
out of the function.  Also, use shorter names for local variables.

Re-work the function to fix all the issues.
Signed-off-by: default avatarMasahiro Yamada <yamada.masahiro@socionext.com>
Signed-off-by: default avatarBoris Brezillon <boris.brezillon@free-electrons.com>
parent 8927ad39
...@@ -836,80 +836,80 @@ static bool is_erased(uint8_t *buf, int len) ...@@ -836,80 +836,80 @@ static bool is_erased(uint8_t *buf, int len)
#define ECC_SECTOR(x) (((x) & ECC_ERROR_ADDRESS__SECTOR_NR) >> 12) #define ECC_SECTOR(x) (((x) & ECC_ERROR_ADDRESS__SECTOR_NR) >> 12)
#define ECC_BYTE(x) (((x) & ECC_ERROR_ADDRESS__OFFSET)) #define ECC_BYTE(x) (((x) & ECC_ERROR_ADDRESS__OFFSET))
#define ECC_CORRECTION_VALUE(x) ((x) & ERR_CORRECTION_INFO__BYTEMASK) #define ECC_CORRECTION_VALUE(x) ((x) & ERR_CORRECTION_INFO__BYTEMASK)
#define ECC_ERROR_CORRECTABLE(x) (!((x) & ERR_CORRECTION_INFO__ERROR_TYPE)) #define ECC_ERROR_UNCORRECTABLE(x) ((x) & ERR_CORRECTION_INFO__ERROR_TYPE)
#define ECC_ERR_DEVICE(x) (((x) & ERR_CORRECTION_INFO__DEVICE_NR) >> 8) #define ECC_ERR_DEVICE(x) (((x) & ERR_CORRECTION_INFO__DEVICE_NR) >> 8)
#define ECC_LAST_ERR(x) ((x) & ERR_CORRECTION_INFO__LAST_ERR_INFO) #define ECC_LAST_ERR(x) ((x) & ERR_CORRECTION_INFO__LAST_ERR_INFO)
static bool handle_ecc(struct denali_nand_info *denali, uint8_t *buf, static int handle_ecc(struct mtd_info *mtd, struct denali_nand_info *denali,
uint32_t irq_status, unsigned int *max_bitflips) uint8_t *buf, bool *check_erased_page)
{ {
bool check_erased_page = false;
unsigned int bitflips = 0; unsigned int bitflips = 0;
unsigned int max_bitflips = 0;
uint32_t err_addr, err_cor_info;
unsigned int err_byte, err_sector, err_device;
uint8_t err_cor_value;
unsigned int prev_sector = 0;
if (irq_status & INTR__ECC_ERR) { /* read the ECC errors. we'll ignore them for now */
/* read the ECC errors. we'll ignore them for now */ denali_set_intr_modes(denali, false);
uint32_t err_address, err_correction_info, err_byte,
err_sector, err_device, err_correction_value; do {
denali_set_intr_modes(denali, false); err_addr = ioread32(denali->flash_reg + ECC_ERROR_ADDRESS);
err_sector = ECC_SECTOR(err_addr);
do { err_byte = ECC_BYTE(err_addr);
err_address = ioread32(denali->flash_reg +
ECC_ERROR_ADDRESS); err_cor_info = ioread32(denali->flash_reg + ERR_CORRECTION_INFO);
err_sector = ECC_SECTOR(err_address); err_cor_value = ECC_CORRECTION_VALUE(err_cor_info);
err_byte = ECC_BYTE(err_address); err_device = ECC_ERR_DEVICE(err_cor_info);
err_correction_info = ioread32(denali->flash_reg + /* reset the bitflip counter when crossing ECC sector */
ERR_CORRECTION_INFO); if (err_sector != prev_sector)
err_correction_value = bitflips = 0;
ECC_CORRECTION_VALUE(err_correction_info);
err_device = ECC_ERR_DEVICE(err_correction_info); if (ECC_ERROR_UNCORRECTABLE(err_cor_info)) {
/*
if (ECC_ERROR_CORRECTABLE(err_correction_info)) { * if the error is not correctable, need to look at the
/* * page to see if it is an erased page. if so, then
* If err_byte is larger than ECC_SECTOR_SIZE, * it's not a real ECC error
* means error happened in OOB, so we ignore */
* it. It's no need for us to correct it *check_erased_page = true;
* err_device is represented the NAND error } else if (err_byte < ECC_SECTOR_SIZE) {
* bits are happened in if there are more /*
* than one NAND connected. * If err_byte is larger than ECC_SECTOR_SIZE, means error
*/ * happened in OOB, so we ignore it. It's no need for
if (err_byte < ECC_SECTOR_SIZE) { * us to correct it err_device is represented the NAND
struct mtd_info *mtd = * error bits are happened in if there are more than
nand_to_mtd(&denali->nand); * one NAND connected.
int offset; */
int offset;
offset = (err_sector * unsigned int flips_in_byte;
ECC_SECTOR_SIZE +
err_byte) * offset = (err_sector * ECC_SECTOR_SIZE + err_byte) *
denali->devnum + denali->devnum + err_device;
err_device;
/* correct the ECC error */ /* correct the ECC error */
buf[offset] ^= err_correction_value; flips_in_byte = hweight8(buf[offset] ^ err_cor_value);
mtd->ecc_stats.corrected++; buf[offset] ^= err_cor_value;
bitflips++; mtd->ecc_stats.corrected += flips_in_byte;
} bitflips += flips_in_byte;
} else {
/* max_bitflips = max(max_bitflips, bitflips);
* if the error is not correctable, need to }
* look at the page to see if it is an erased
* page. if so, then it's not a real ECC error prev_sector = err_sector;
*/ } while (!ECC_LAST_ERR(err_cor_info));
check_erased_page = true;
} /*
} while (!ECC_LAST_ERR(err_correction_info)); * Once handle all ecc errors, controller will trigger a
/* * ECC_TRANSACTION_DONE interrupt, so here just wait for
* Once handle all ecc errors, controller will triger * a while for this interrupt
* a ECC_TRANSACTION_DONE interrupt, so here just wait */
* for a while for this interrupt while (!(read_interrupt_status(denali) & INTR__ECC_TRANSACTION_DONE))
*/ cpu_relax();
while (!(read_interrupt_status(denali) & clear_interrupts(denali);
INTR__ECC_TRANSACTION_DONE)) denali_set_intr_modes(denali, true);
cpu_relax();
clear_interrupts(denali); return max_bitflips;
denali_set_intr_modes(denali, true);
}
*max_bitflips = bitflips;
return check_erased_page;
} }
/* programs the controller to either enable/disable DMA transfers */ /* programs the controller to either enable/disable DMA transfers */
...@@ -1045,7 +1045,7 @@ static int denali_read_oob(struct mtd_info *mtd, struct nand_chip *chip, ...@@ -1045,7 +1045,7 @@ static int denali_read_oob(struct mtd_info *mtd, struct nand_chip *chip,
static int denali_read_page(struct mtd_info *mtd, struct nand_chip *chip, static int denali_read_page(struct mtd_info *mtd, struct nand_chip *chip,
uint8_t *buf, int oob_required, int page) uint8_t *buf, int oob_required, int page)
{ {
unsigned int max_bitflips; unsigned int max_bitflips = 0;
struct denali_nand_info *denali = mtd_to_denali(mtd); struct denali_nand_info *denali = mtd_to_denali(mtd);
dma_addr_t addr = denali->buf.dma_buf; dma_addr_t addr = denali->buf.dma_buf;
...@@ -1077,7 +1077,8 @@ static int denali_read_page(struct mtd_info *mtd, struct nand_chip *chip, ...@@ -1077,7 +1077,8 @@ static int denali_read_page(struct mtd_info *mtd, struct nand_chip *chip,
memcpy(buf, denali->buf.buf, mtd->writesize); memcpy(buf, denali->buf.buf, mtd->writesize);
check_erased_page = handle_ecc(denali, buf, irq_status, &max_bitflips); if (irq_status & INTR__ECC_ERR)
max_bitflips = handle_ecc(mtd, denali, buf, &check_erased_page);
denali_enable_dma(denali, false); denali_enable_dma(denali, false);
if (check_erased_page) { if (check_erased_page) {
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment