On Sun, Nov 22, 2015 at 02:05:16PM +0000, Simon Arlott wrote:
> There is a level triggered interrupt for the watchdog timer as part of
> the bcm63xx_timer device. The interrupt occurs when the hardware watchdog
> timer reaches 50% of the remaining time.
> 
> It is not possible to mask the interrupt within the bcm63xx_timer device.
> To get around this limitation, handle the interrupt by restarting the
> watchdog with the current remaining time (which will be half the previous
> timeout) so that the interrupt occurs again at 1/4th, 1/8th, etc. of the
> original timeout value until the watchdog forces a reboot.
> 
> The software timer was restarting the hardware watchdog with a 85 second
> timeout until the software timer expired, and then causing a panic()
> about 42.5 seconds later when the hardware interrupt occurred. The
> hardware watchdog would not reboot until a further 42.5 seconds had
> passed.
> 
> Remove the software timer and rely on the hardware timer directly,
> reducing the maximum timeout from 256 seconds to 85 seconds
> (2^32 / WDT_HZ).
> 

Florian,

can you have a look into this patch and confirm that there is no better
way to clear the interrupt status ?

Thanks,
Guenter

> Signed-off-by: Simon Arlott <si...@fire.lp0.eu>
> ---
>  drivers/watchdog/bcm63xx_wdt.c | 124 
> ++++++++++++++++++++++++-----------------
>  1 file changed, 72 insertions(+), 52 deletions(-)
> 
> diff --git a/drivers/watchdog/bcm63xx_wdt.c b/drivers/watchdog/bcm63xx_wdt.c
> index ab26fd9..f88fc97 100644
> --- a/drivers/watchdog/bcm63xx_wdt.c
> +++ b/drivers/watchdog/bcm63xx_wdt.c
> @@ -3,6 +3,7 @@
>   *
>   *  Copyright (C) 2007, Miguel Gaio <miguel.g...@efixo.com>
>   *  Copyright (C) 2008, Florian Fainelli <flor...@openwrt.org>
> + *  Copyright 2015 Simon Arlott
>   *
>   *  This program is free software; you can redistribute it and/or
>   *  modify it under the terms of the GNU General Public License
> @@ -20,11 +21,10 @@
>  #include <linux/miscdevice.h>
>  #include <linux/module.h>
>  #include <linux/moduleparam.h>
> +#include <linux/spinlock.h>
>  #include <linux/types.h>
>  #include <linux/uaccess.h>
>  #include <linux/watchdog.h>
> -#include <linux/timer.h>
> -#include <linux/jiffies.h>
>  #include <linux/interrupt.h>
>  #include <linux/ptrace.h>
>  #include <linux/resource.h>
> @@ -37,16 +37,17 @@
>  
>  #define PFX KBUILD_MODNAME
>  
> -#define WDT_HZ               50000000 /* Fclk */
> -#define WDT_DEFAULT_TIME     30      /* seconds */
> -#define WDT_MAX_TIME         256     /* seconds */
> +#define WDT_HZ                       50000000                /* Fclk */
> +#define WDT_DEFAULT_TIME     30                      /* seconds */
> +#define WDT_MAX_TIME         (0xffffffff / WDT_HZ)   /* seconds */
>  
> -static struct {
> +struct bcm63xx_wdt_hw {
> +     raw_spinlock_t lock;
>       void __iomem *regs;
> -     struct timer_list timer;
>       unsigned long inuse;
> -     atomic_t ticks;
> -} bcm63xx_wdt_device;
> +     bool running;
> +};
> +static struct bcm63xx_wdt_hw bcm63xx_wdt_device;
>  
>  static int expect_close;
>  
> @@ -59,48 +60,67 @@ MODULE_PARM_DESC(nowayout, "Watchdog cannot be stopped 
> once started (default="
>  /* HW functions */
>  static void bcm63xx_wdt_hw_start(void)
>  {
> -     bcm_writel(0xfffffffe, bcm63xx_wdt_device.regs + WDT_DEFVAL_REG);
> +     unsigned long flags;
> +
> +     raw_spin_lock_irqsave(&bcm63xx_wdt_device.lock, flags);
> +     bcm_writel(wdt_time * WDT_HZ, bcm63xx_wdt_device.regs + WDT_DEFVAL_REG);
>       bcm_writel(WDT_START_1, bcm63xx_wdt_device.regs + WDT_CTL_REG);
>       bcm_writel(WDT_START_2, bcm63xx_wdt_device.regs + WDT_CTL_REG);
> +     bcm63xx_wdt_device.running = true;
> +     raw_spin_unlock_irqrestore(&bcm63xx_wdt_device.lock, flags);
>  }
>  
>  static void bcm63xx_wdt_hw_stop(void)
>  {
> +     unsigned long flags;
> +
> +     raw_spin_lock_irqsave(&bcm63xx_wdt_device.lock, flags);
>       bcm_writel(WDT_STOP_1, bcm63xx_wdt_device.regs + WDT_CTL_REG);
>       bcm_writel(WDT_STOP_2, bcm63xx_wdt_device.regs + WDT_CTL_REG);
> +     bcm63xx_wdt_device.running = false;
> +     raw_spin_unlock_irqrestore(&bcm63xx_wdt_device.lock, flags);
>  }
>  
> +/* The watchdog interrupt occurs when half the timeout is remaining */
>  static void bcm63xx_wdt_isr(void *data)
>  {
> -     struct pt_regs *regs = get_irq_regs();
> -
> -     die(PFX " fire", regs);
> -}
> -
> -static void bcm63xx_timer_tick(unsigned long unused)
> -{
> -     if (!atomic_dec_and_test(&bcm63xx_wdt_device.ticks)) {
> -             bcm63xx_wdt_hw_start();
> -             mod_timer(&bcm63xx_wdt_device.timer, jiffies + HZ);
> -     } else
> -             pr_crit("watchdog will restart system\n");
> -}
> -
> -static void bcm63xx_wdt_pet(void)
> -{
> -     atomic_set(&bcm63xx_wdt_device.ticks, wdt_time);
> -}
> -
> -static void bcm63xx_wdt_start(void)
> -{
> -     bcm63xx_wdt_pet();
> -     bcm63xx_timer_tick(0);
> -}
> +     struct bcm63xx_wdt_hw *hw = &bcm63xx_wdt_device;
> +     unsigned long flags;
> +
> +     raw_spin_lock_irqsave(&hw->lock, flags);
> +     if (!hw->running) {
> +             /* Stop the watchdog as it shouldn't be running */
> +             bcm_writel(WDT_STOP_1, hw->regs + WDT_CTL_REG);
> +             bcm_writel(WDT_STOP_2, hw->regs + WDT_CTL_REG);
> +     } else {
> +             u32 timeleft = bcm_readl(hw->regs + WDT_CTL_REG);
> +             u32 ms;
> +
> +             if (timeleft >= 2) {
> +                     /* The only way to clear this level triggered interrupt
> +                      * without disrupting the normal running of the watchdog
> +                      * is to restart the watchdog with the current remaining
> +                      * time value (which will be half the previous timeout)
> +                      * so the interrupt occurs again at 1/4th, 1/8th, etc.
> +                      * of the original timeout value until we reboot.
> +                      *
> +                      * This is done with a lock held in case userspace is
> +                      * trying to restart the watchdog on another CPU.
> +                      */
> +                     bcm_writel(timeleft, hw->regs + WDT_DEFVAL_REG);
> +                     bcm_writel(WDT_START_1, hw->regs + WDT_CTL_REG);
> +                     bcm_writel(WDT_START_2, hw->regs + WDT_CTL_REG);
> +             } else {
> +                     /* The watchdog cannot be started with a time of less
> +                      * than 2 ticks (it won't fire).
> +                      */
> +                     die(PFX ": watchdog timer expired\n", get_irq_regs());
> +             }
>  
> -static void bcm63xx_wdt_pause(void)
> -{
> -     del_timer_sync(&bcm63xx_wdt_device.timer);
> -     bcm63xx_wdt_hw_stop();
> +             ms = timeleft / (WDT_HZ / 1000);
> +             pr_alert("warning timer fired, reboot in %ums\n", ms);
> +     }
> +     raw_spin_unlock_irqrestore(&hw->lock, flags);
>  }
>  
>  static int bcm63xx_wdt_settimeout(int new_time)
> @@ -118,17 +138,17 @@ static int bcm63xx_wdt_open(struct inode *inode, struct 
> file *file)
>       if (test_and_set_bit(0, &bcm63xx_wdt_device.inuse))
>               return -EBUSY;
>  
> -     bcm63xx_wdt_start();
> +     bcm63xx_wdt_hw_start();
>       return nonseekable_open(inode, file);
>  }
>  
>  static int bcm63xx_wdt_release(struct inode *inode, struct file *file)
>  {
>       if (expect_close == 42)
> -             bcm63xx_wdt_pause();
> +             bcm63xx_wdt_hw_stop();
>       else {
>               pr_crit("Unexpected close, not stopping watchdog!\n");
> -             bcm63xx_wdt_start();
> +             bcm63xx_wdt_hw_start();
>       }
>       clear_bit(0, &bcm63xx_wdt_device.inuse);
>       expect_close = 0;
> @@ -153,7 +173,7 @@ static ssize_t bcm63xx_wdt_write(struct file *file, const 
> char *data,
>                                       expect_close = 42;
>                       }
>               }
> -             bcm63xx_wdt_pet();
> +             bcm63xx_wdt_hw_start();
>       }
>       return len;
>  }
> @@ -187,18 +207,18 @@ static long bcm63xx_wdt_ioctl(struct file *file, 
> unsigned int cmd,
>                       return -EFAULT;
>  
>               if (new_value & WDIOS_DISABLECARD) {
> -                     bcm63xx_wdt_pause();
> +                     bcm63xx_wdt_hw_stop();
>                       retval = 0;
>               }
>               if (new_value & WDIOS_ENABLECARD) {
> -                     bcm63xx_wdt_start();
> +                     bcm63xx_wdt_hw_start();
>                       retval = 0;
>               }
>  
>               return retval;
>  
>       case WDIOC_KEEPALIVE:
> -             bcm63xx_wdt_pet();
> +             bcm63xx_wdt_hw_start();
>               return 0;
>  
>       case WDIOC_SETTIMEOUT:
> @@ -208,7 +228,7 @@ static long bcm63xx_wdt_ioctl(struct file *file, unsigned 
> int cmd,
>               if (bcm63xx_wdt_settimeout(new_value))
>                       return -EINVAL;
>  
> -             bcm63xx_wdt_pet();
> +             bcm63xx_wdt_hw_start();
>  
>       case WDIOC_GETTIMEOUT:
>               return put_user(wdt_time, p);
> @@ -240,8 +260,6 @@ static int bcm63xx_wdt_probe(struct platform_device *pdev)
>       int ret;
>       struct resource *r;
>  
> -     setup_timer(&bcm63xx_wdt_device.timer, bcm63xx_timer_tick, 0L);
> -
>       r = platform_get_resource(pdev, IORESOURCE_MEM, 0);
>       if (!r) {
>               dev_err(&pdev->dev, "failed to get resources\n");
> @@ -255,6 +273,8 @@ static int bcm63xx_wdt_probe(struct platform_device *pdev)
>               return -ENXIO;
>       }
>  
> +     raw_spin_lock_init(&bcm63xx_wdt_device.lock);
> +
>       ret = bcm63xx_timer_register(TIMER_WDT_ID, bcm63xx_wdt_isr, NULL);
>       if (ret < 0) {
>               dev_err(&pdev->dev, "failed to register wdt timer isr\n");
> @@ -264,8 +284,8 @@ static int bcm63xx_wdt_probe(struct platform_device *pdev)
>       if (bcm63xx_wdt_settimeout(wdt_time)) {
>               bcm63xx_wdt_settimeout(WDT_DEFAULT_TIME);
>               dev_info(&pdev->dev,
> -                     ": wdt_time value must be 1 <= wdt_time <= 256, using 
> %d\n",
> -                     wdt_time);
> +                     ": wdt_time value must be 1 <= wdt_time <= %d, using 
> %d\n",
> +                     WDT_MAX_TIME, wdt_time);
>       }
>  
>       ret = misc_register(&bcm63xx_wdt_miscdev);
> @@ -287,7 +307,7 @@ unregister_timer:
>  static int bcm63xx_wdt_remove(struct platform_device *pdev)
>  {
>       if (!nowayout)
> -             bcm63xx_wdt_pause();
> +             bcm63xx_wdt_hw_stop();
>  
>       misc_deregister(&bcm63xx_wdt_miscdev);
>       bcm63xx_timer_unregister(TIMER_WDT_ID);
> @@ -296,7 +316,7 @@ static int bcm63xx_wdt_remove(struct platform_device 
> *pdev)
>  
>  static void bcm63xx_wdt_shutdown(struct platform_device *pdev)
>  {
> -     bcm63xx_wdt_pause();
> +     bcm63xx_wdt_hw_stop();
>  }
>  
>  static struct platform_driver bcm63xx_wdt_driver = {
> -- 
> 2.1.4
> 
> -- 
> Simon Arlott
--
To unsubscribe from this list: send the line "unsubscribe linux-kernel" in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html
Please read the FAQ at  http://www.tux.org/lkml/

Reply via email to