diff mbox series

[v2] mmc: dw_mmc: Add data CRC error injection

Message ID 20210701080534.23138-1-vincent.whitchurch@axis.com
State New
Headers show
Series [v2] mmc: dw_mmc: Add data CRC error injection | expand

Commit Message

Vincent Whitchurch July 1, 2021, 8:05 a.m. UTC
This driver has had problems when handling data errors.  Add fault
injection support so that the abort handling can be easily triggered and
regression-tested.  An hrtimer is used to inject a data CRC error at a
random point (0-24 ms after the command interrupt) during multi-block
data transfers.

Note that for the recent problem with hangs in the case of some data CRC
errors, a udelay(10) inserted at the start of send_stop_abort() greatly
helped in triggering the error, but I've not included this as part of
the fault injection support since it seemed too specific.

Signed-off-by: Vincent Whitchurch <vincent.whitchurch@axis.com>
---

Notes:
    v2: Add missing includes.

 drivers/mmc/host/dw_mmc.c | 73 +++++++++++++++++++++++++++++++++++++++
 drivers/mmc/host/dw_mmc.h |  7 ++++
 2 files changed, 80 insertions(+)

Comments

Jaehoon Chung July 25, 2021, 9:41 p.m. UTC | #1
On 7/1/21 5:05 PM, Vincent Whitchurch wrote:
> This driver has had problems when handling data errors.  Add fault

> injection support so that the abort handling can be easily triggered and

> regression-tested.  A hrtimer is used to indicate a data CRC error at

> various points during the data transfer.

> 

> Note that for the recent problem with hangs in the case of some data CRC

> errors, a udelay(10) inserted at the start of send_stop_abort() greatly

> helped in triggering the error, but I've not included this as part of

> the fault injection support since it seemed too specific.

> 

> Signed-off-by: Vincent Whitchurch <vincent.whitchurch@axis.com>


Reviewed-by: Jaehoon Chung <jh80.chung@samsung.com>


Best Regards,
Jaehoon Chung

> ---

> 

> Notes:

>     v2: Add missing includes.

> 

>  drivers/mmc/host/dw_mmc.c | 73 +++++++++++++++++++++++++++++++++++++++

>  drivers/mmc/host/dw_mmc.h |  7 ++++

>  2 files changed, 80 insertions(+)

> 

> diff --git a/drivers/mmc/host/dw_mmc.c b/drivers/mmc/host/dw_mmc.c

> index d333130d1531..dbbb94e6ff4b 100644

> --- a/drivers/mmc/host/dw_mmc.c

> +++ b/drivers/mmc/host/dw_mmc.c

> @@ -17,9 +17,11 @@

>  #include <linux/interrupt.h>

>  #include <linux/iopoll.h>

>  #include <linux/ioport.h>

> +#include <linux/ktime.h>

>  #include <linux/module.h>

>  #include <linux/platform_device.h>

>  #include <linux/pm_runtime.h>

> +#include <linux/prandom.h>

>  #include <linux/seq_file.h>

>  #include <linux/slab.h>

>  #include <linux/stat.h>

> @@ -181,6 +183,9 @@ static void dw_mci_init_debugfs(struct dw_mci_slot *slot)

>  			   &host->pending_events);

>  	debugfs_create_xul("completed_events", S_IRUSR, root,

>  			   &host->completed_events);

> +#ifdef CONFIG_FAULT_INJECTION

> +	fault_create_debugfs_attr("fail_data_crc", root, &host->fail_data_crc);

> +#endif

>  }

>  #endif /* defined(CONFIG_DEBUG_FS) */

>  

> @@ -1788,6 +1793,68 @@ static const struct mmc_host_ops dw_mci_ops = {

>  	.prepare_hs400_tuning	= dw_mci_prepare_hs400_tuning,

>  };

>  

> +#ifdef CONFIG_FAULT_INJECTION

> +static enum hrtimer_restart dw_mci_fault_timer(struct hrtimer *t)

> +{

> +	struct dw_mci *host = container_of(t, struct dw_mci, fault_timer);

> +	unsigned long flags;

> +

> +	spin_lock_irqsave(&host->irq_lock, flags);

> +

> +	if (!host->data_status)

> +		host->data_status = SDMMC_INT_DCRC;

> +	set_bit(EVENT_DATA_ERROR, &host->pending_events);

> +	tasklet_schedule(&host->tasklet);

> +

> +	spin_unlock_irqrestore(&host->irq_lock, flags);

> +

> +	return HRTIMER_NORESTART;

> +}

> +

> +static void dw_mci_start_fault_timer(struct dw_mci *host)

> +{

> +	struct mmc_data *data = host->data;

> +

> +	if (!data || data->blocks <= 1)

> +		return;

> +

> +	if (!should_fail(&host->fail_data_crc, 1))

> +		return;

> +

> +	/*

> +	 * Try to inject the error at random points during the data transfer.

> +	 */

> +	hrtimer_start(&host->fault_timer,

> +		      ms_to_ktime(prandom_u32() % 25),

> +		      HRTIMER_MODE_REL);

> +}

> +

> +static void dw_mci_stop_fault_timer(struct dw_mci *host)

> +{

> +	hrtimer_cancel(&host->fault_timer);

> +}

> +

> +static void dw_mci_init_fault(struct dw_mci *host)

> +{

> +	host->fail_data_crc = (struct fault_attr) FAULT_ATTR_INITIALIZER;

> +

> +	hrtimer_init(&host->fault_timer, CLOCK_MONOTONIC, HRTIMER_MODE_REL);

> +	host->fault_timer.function = dw_mci_fault_timer;

> +}

> +#else

> +static void dw_mci_init_fault(struct dw_mci *host)

> +{

> +}

> +

> +static void dw_mci_start_fault_timer(struct dw_mci *host)

> +{

> +}

> +

> +static void dw_mci_stop_fault_timer(struct dw_mci *host)

> +{

> +}

> +#endif

> +

>  static void dw_mci_request_end(struct dw_mci *host, struct mmc_request *mrq)

>  	__releases(&host->lock)

>  	__acquires(&host->lock)

> @@ -2102,6 +2169,7 @@ static void dw_mci_tasklet_func(struct tasklet_struct *t)

>  				break;

>  			}

>  

> +			dw_mci_stop_fault_timer(host);

>  			host->data = NULL;

>  			set_bit(EVENT_DATA_COMPLETE, &host->completed_events);

>  			err = dw_mci_data_complete(host, data);

> @@ -2151,6 +2219,7 @@ static void dw_mci_tasklet_func(struct tasklet_struct *t)

>  			if (mrq->cmd->error && mrq->data)

>  				dw_mci_reset(host);

>  

> +			dw_mci_stop_fault_timer(host);

>  			host->cmd = NULL;

>  			host->data = NULL;

>  

> @@ -2600,6 +2669,8 @@ static void dw_mci_cmd_interrupt(struct dw_mci *host, u32 status)

>  

>  	set_bit(EVENT_CMD_COMPLETE, &host->pending_events);

>  	tasklet_schedule(&host->tasklet);

> +

> +	dw_mci_start_fault_timer(host);

>  }

>  

>  static void dw_mci_handle_cd(struct dw_mci *host)

> @@ -3223,6 +3294,8 @@ int dw_mci_probe(struct dw_mci *host)

>  	spin_lock_init(&host->irq_lock);

>  	INIT_LIST_HEAD(&host->queue);

>  

> +	dw_mci_init_fault(host);

> +

>  	/*

>  	 * Get the host data width - this assumes that HCON has been set with

>  	 * the correct values.

> diff --git a/drivers/mmc/host/dw_mmc.h b/drivers/mmc/host/dw_mmc.h

> index da5923a92e60..ce05d81477d9 100644

> --- a/drivers/mmc/host/dw_mmc.h

> +++ b/drivers/mmc/host/dw_mmc.h

> @@ -14,6 +14,8 @@

>  #include <linux/mmc/core.h>

>  #include <linux/dmaengine.h>

>  #include <linux/reset.h>

> +#include <linux/fault-inject.h>

> +#include <linux/hrtimer.h>

>  #include <linux/interrupt.h>

>  

>  enum dw_mci_state {

> @@ -230,6 +232,11 @@ struct dw_mci {

>  	struct timer_list       cmd11_timer;

>  	struct timer_list       cto_timer;

>  	struct timer_list       dto_timer;

> +

> +#ifdef CONFIG_FAULT_INJECTION

> +	struct fault_attr	fail_data_crc;

> +	struct hrtimer		fault_timer;

> +#endif

>  };

>  

>  /* DMA ops for Internal/External DMAC interface */

>
Ulf Hansson Aug. 4, 2021, 11:34 a.m. UTC | #2
On Thu, 1 Jul 2021 at 10:05, Vincent Whitchurch
<vincent.whitchurch@axis.com> wrote:
>

> This driver has had problems when handling data errors.  Add fault

> injection support so that the abort handling can be easily triggered and

> regression-tested.  A hrtimer is used to indicate a data CRC error at

> various points during the data transfer.

>

> Note that for the recent problem with hangs in the case of some data CRC

> errors, a udelay(10) inserted at the start of send_stop_abort() greatly

> helped in triggering the error, but I've not included this as part of

> the fault injection support since it seemed too specific.

>

> Signed-off-by: Vincent Whitchurch <vincent.whitchurch@axis.com>


Applied for next, thanks!

Kind regards
Uffe


> ---

>

> Notes:

>     v2: Add missing includes.

>

>  drivers/mmc/host/dw_mmc.c | 73 +++++++++++++++++++++++++++++++++++++++

>  drivers/mmc/host/dw_mmc.h |  7 ++++

>  2 files changed, 80 insertions(+)

>

> diff --git a/drivers/mmc/host/dw_mmc.c b/drivers/mmc/host/dw_mmc.c

> index d333130d1531..dbbb94e6ff4b 100644

> --- a/drivers/mmc/host/dw_mmc.c

> +++ b/drivers/mmc/host/dw_mmc.c

> @@ -17,9 +17,11 @@

>  #include <linux/interrupt.h>

>  #include <linux/iopoll.h>

>  #include <linux/ioport.h>

> +#include <linux/ktime.h>

>  #include <linux/module.h>

>  #include <linux/platform_device.h>

>  #include <linux/pm_runtime.h>

> +#include <linux/prandom.h>

>  #include <linux/seq_file.h>

>  #include <linux/slab.h>

>  #include <linux/stat.h>

> @@ -181,6 +183,9 @@ static void dw_mci_init_debugfs(struct dw_mci_slot *slot)

>                            &host->pending_events);

>         debugfs_create_xul("completed_events", S_IRUSR, root,

>                            &host->completed_events);

> +#ifdef CONFIG_FAULT_INJECTION

> +       fault_create_debugfs_attr("fail_data_crc", root, &host->fail_data_crc);

> +#endif

>  }

>  #endif /* defined(CONFIG_DEBUG_FS) */

>

> @@ -1788,6 +1793,68 @@ static const struct mmc_host_ops dw_mci_ops = {

>         .prepare_hs400_tuning   = dw_mci_prepare_hs400_tuning,

>  };

>

> +#ifdef CONFIG_FAULT_INJECTION

> +static enum hrtimer_restart dw_mci_fault_timer(struct hrtimer *t)

> +{

> +       struct dw_mci *host = container_of(t, struct dw_mci, fault_timer);

> +       unsigned long flags;

> +

> +       spin_lock_irqsave(&host->irq_lock, flags);

> +

> +       if (!host->data_status)

> +               host->data_status = SDMMC_INT_DCRC;

> +       set_bit(EVENT_DATA_ERROR, &host->pending_events);

> +       tasklet_schedule(&host->tasklet);

> +

> +       spin_unlock_irqrestore(&host->irq_lock, flags);

> +

> +       return HRTIMER_NORESTART;

> +}

> +

> +static void dw_mci_start_fault_timer(struct dw_mci *host)

> +{

> +       struct mmc_data *data = host->data;

> +

> +       if (!data || data->blocks <= 1)

> +               return;

> +

> +       if (!should_fail(&host->fail_data_crc, 1))

> +               return;

> +

> +       /*

> +        * Try to inject the error at random points during the data transfer.

> +        */

> +       hrtimer_start(&host->fault_timer,

> +                     ms_to_ktime(prandom_u32() % 25),

> +                     HRTIMER_MODE_REL);

> +}

> +

> +static void dw_mci_stop_fault_timer(struct dw_mci *host)

> +{

> +       hrtimer_cancel(&host->fault_timer);

> +}

> +

> +static void dw_mci_init_fault(struct dw_mci *host)

> +{

> +       host->fail_data_crc = (struct fault_attr) FAULT_ATTR_INITIALIZER;

> +

> +       hrtimer_init(&host->fault_timer, CLOCK_MONOTONIC, HRTIMER_MODE_REL);

> +       host->fault_timer.function = dw_mci_fault_timer;

> +}

> +#else

> +static void dw_mci_init_fault(struct dw_mci *host)

> +{

> +}

> +

> +static void dw_mci_start_fault_timer(struct dw_mci *host)

> +{

> +}

> +

> +static void dw_mci_stop_fault_timer(struct dw_mci *host)

> +{

> +}

> +#endif

> +

>  static void dw_mci_request_end(struct dw_mci *host, struct mmc_request *mrq)

>         __releases(&host->lock)

>         __acquires(&host->lock)

> @@ -2102,6 +2169,7 @@ static void dw_mci_tasklet_func(struct tasklet_struct *t)

>                                 break;

>                         }

>

> +                       dw_mci_stop_fault_timer(host);

>                         host->data = NULL;

>                         set_bit(EVENT_DATA_COMPLETE, &host->completed_events);

>                         err = dw_mci_data_complete(host, data);

> @@ -2151,6 +2219,7 @@ static void dw_mci_tasklet_func(struct tasklet_struct *t)

>                         if (mrq->cmd->error && mrq->data)

>                                 dw_mci_reset(host);

>

> +                       dw_mci_stop_fault_timer(host);

>                         host->cmd = NULL;

>                         host->data = NULL;

>

> @@ -2600,6 +2669,8 @@ static void dw_mci_cmd_interrupt(struct dw_mci *host, u32 status)

>

>         set_bit(EVENT_CMD_COMPLETE, &host->pending_events);

>         tasklet_schedule(&host->tasklet);

> +

> +       dw_mci_start_fault_timer(host);

>  }

>

>  static void dw_mci_handle_cd(struct dw_mci *host)

> @@ -3223,6 +3294,8 @@ int dw_mci_probe(struct dw_mci *host)

>         spin_lock_init(&host->irq_lock);

>         INIT_LIST_HEAD(&host->queue);

>

> +       dw_mci_init_fault(host);

> +

>         /*

>          * Get the host data width - this assumes that HCON has been set with

>          * the correct values.

> diff --git a/drivers/mmc/host/dw_mmc.h b/drivers/mmc/host/dw_mmc.h

> index da5923a92e60..ce05d81477d9 100644

> --- a/drivers/mmc/host/dw_mmc.h

> +++ b/drivers/mmc/host/dw_mmc.h

> @@ -14,6 +14,8 @@

>  #include <linux/mmc/core.h>

>  #include <linux/dmaengine.h>

>  #include <linux/reset.h>

> +#include <linux/fault-inject.h>

> +#include <linux/hrtimer.h>

>  #include <linux/interrupt.h>

>

>  enum dw_mci_state {

> @@ -230,6 +232,11 @@ struct dw_mci {

>         struct timer_list       cmd11_timer;

>         struct timer_list       cto_timer;

>         struct timer_list       dto_timer;

> +

> +#ifdef CONFIG_FAULT_INJECTION

> +       struct fault_attr       fail_data_crc;

> +       struct hrtimer          fault_timer;

> +#endif

>  };

>

>  /* DMA ops for Internal/External DMAC interface */

> --

> 2.28.0

>
diff mbox series

Patch

diff --git a/drivers/mmc/host/dw_mmc.c b/drivers/mmc/host/dw_mmc.c
index d333130d1531..dbbb94e6ff4b 100644
--- a/drivers/mmc/host/dw_mmc.c
+++ b/drivers/mmc/host/dw_mmc.c
@@ -17,9 +17,11 @@ 
 #include <linux/interrupt.h>
 #include <linux/iopoll.h>
 #include <linux/ioport.h>
+#include <linux/ktime.h>
 #include <linux/module.h>
 #include <linux/platform_device.h>
 #include <linux/pm_runtime.h>
+#include <linux/prandom.h>
 #include <linux/seq_file.h>
 #include <linux/slab.h>
 #include <linux/stat.h>
@@ -181,6 +183,9 @@  static void dw_mci_init_debugfs(struct dw_mci_slot *slot)
 			   &host->pending_events);
 	debugfs_create_xul("completed_events", S_IRUSR, root,
 			   &host->completed_events);
+#ifdef CONFIG_FAULT_INJECTION
+	fault_create_debugfs_attr("fail_data_crc", root, &host->fail_data_crc);
+#endif
 }
 #endif /* defined(CONFIG_DEBUG_FS) */
 
@@ -1788,6 +1793,68 @@  static const struct mmc_host_ops dw_mci_ops = {
 	.prepare_hs400_tuning	= dw_mci_prepare_hs400_tuning,
 };
 
+#ifdef CONFIG_FAULT_INJECTION
+static enum hrtimer_restart dw_mci_fault_timer(struct hrtimer *t)
+{
+	struct dw_mci *host = container_of(t, struct dw_mci, fault_timer);
+	unsigned long flags;
+
+	spin_lock_irqsave(&host->irq_lock, flags);
+
+	if (!host->data_status)
+		host->data_status = SDMMC_INT_DCRC;
+	set_bit(EVENT_DATA_ERROR, &host->pending_events);
+	tasklet_schedule(&host->tasklet);
+
+	spin_unlock_irqrestore(&host->irq_lock, flags);
+
+	return HRTIMER_NORESTART;
+}
+
+static void dw_mci_start_fault_timer(struct dw_mci *host)
+{
+	struct mmc_data *data = host->data;
+
+	if (!data || data->blocks <= 1)
+		return;
+
+	if (!should_fail(&host->fail_data_crc, 1))
+		return;
+
+	/*
+	 * Try to inject the error at random points during the data transfer.
+	 */
+	hrtimer_start(&host->fault_timer,
+		      ms_to_ktime(prandom_u32() % 25),
+		      HRTIMER_MODE_REL);
+}
+
+static void dw_mci_stop_fault_timer(struct dw_mci *host)
+{
+	hrtimer_cancel(&host->fault_timer);
+}
+
+static void dw_mci_init_fault(struct dw_mci *host)
+{
+	host->fail_data_crc = (struct fault_attr) FAULT_ATTR_INITIALIZER;
+
+	hrtimer_init(&host->fault_timer, CLOCK_MONOTONIC, HRTIMER_MODE_REL);
+	host->fault_timer.function = dw_mci_fault_timer;
+}
+#else
+static void dw_mci_init_fault(struct dw_mci *host)
+{
+}
+
+static void dw_mci_start_fault_timer(struct dw_mci *host)
+{
+}
+
+static void dw_mci_stop_fault_timer(struct dw_mci *host)
+{
+}
+#endif
+
 static void dw_mci_request_end(struct dw_mci *host, struct mmc_request *mrq)
 	__releases(&host->lock)
 	__acquires(&host->lock)
@@ -2102,6 +2169,7 @@  static void dw_mci_tasklet_func(struct tasklet_struct *t)
 				break;
 			}
 
+			dw_mci_stop_fault_timer(host);
 			host->data = NULL;
 			set_bit(EVENT_DATA_COMPLETE, &host->completed_events);
 			err = dw_mci_data_complete(host, data);
@@ -2151,6 +2219,7 @@  static void dw_mci_tasklet_func(struct tasklet_struct *t)
 			if (mrq->cmd->error && mrq->data)
 				dw_mci_reset(host);
 
+			dw_mci_stop_fault_timer(host);
 			host->cmd = NULL;
 			host->data = NULL;
 
@@ -2600,6 +2669,8 @@  static void dw_mci_cmd_interrupt(struct dw_mci *host, u32 status)
 
 	set_bit(EVENT_CMD_COMPLETE, &host->pending_events);
 	tasklet_schedule(&host->tasklet);
+
+	dw_mci_start_fault_timer(host);
 }
 
 static void dw_mci_handle_cd(struct dw_mci *host)
@@ -3223,6 +3294,8 @@  int dw_mci_probe(struct dw_mci *host)
 	spin_lock_init(&host->irq_lock);
 	INIT_LIST_HEAD(&host->queue);
 
+	dw_mci_init_fault(host);
+
 	/*
 	 * Get the host data width - this assumes that HCON has been set with
 	 * the correct values.
diff --git a/drivers/mmc/host/dw_mmc.h b/drivers/mmc/host/dw_mmc.h
index da5923a92e60..ce05d81477d9 100644
--- a/drivers/mmc/host/dw_mmc.h
+++ b/drivers/mmc/host/dw_mmc.h
@@ -14,6 +14,8 @@ 
 #include <linux/mmc/core.h>
 #include <linux/dmaengine.h>
 #include <linux/reset.h>
+#include <linux/fault-inject.h>
+#include <linux/hrtimer.h>
 #include <linux/interrupt.h>
 
 enum dw_mci_state {
@@ -230,6 +232,11 @@  struct dw_mci {
 	struct timer_list       cmd11_timer;
 	struct timer_list       cto_timer;
 	struct timer_list       dto_timer;
+
+#ifdef CONFIG_FAULT_INJECTION
+	struct fault_attr	fail_data_crc;
+	struct hrtimer		fault_timer;
+#endif
 };
 
 /* DMA ops for Internal/External DMAC interface */