RE: [char-misc-next v3 6/8] watchdog: mei_wdt: register wd device only if required
From: Winkler, Tomas
Date: Wed Dec 23 2015 - 18:01:15 EST
next v3 6/8] watchdog: mei_wdt: register wd device only
> if required
>
> On 12/21/2015 03:17 PM, Tomas Winkler wrote:
> > From: Alexander Usyskin <alexander.usyskin@xxxxxxxxx>
> >
> > For Intel Broadwell and newer platforms, the ME device can inform
> > the host whether the watchdog functionality is activated or not.
> > If the watchdog functionality is not activated then the watchdog interface
> > can be not registered and eliminate unnecessary pings and hence lower the
> > power consumption by avoiding waking up the device.
> > The feature can be deactivated also without reboot
> > in that case the watchdog device should be unregistered at runtime.
> >
> > Signed-off-by: Alexander Usyskin <alexander.usyskin@xxxxxxxxx>
> > Signed-off-by: Tomas Winkler <tomas.winkler@xxxxxxxxx>
> > ---
> > V2: rework unregistration
> > V3: rebase; implement unregistraion also at runtime
> >
> > drivers/watchdog/mei_wdt.c | 183
> +++++++++++++++++++++++++++++++++++++++++----
> > 1 file changed, 169 insertions(+), 14 deletions(-)
> >
> > diff --git a/drivers/watchdog/mei_wdt.c b/drivers/watchdog/mei_wdt.c
> > index ab9aec218d69..3cd80aa75db1 100644
> > --- a/drivers/watchdog/mei_wdt.c
> > +++ b/drivers/watchdog/mei_wdt.c
> > @@ -16,6 +16,7 @@
> > #include <linux/slab.h>
> > #include <linux/interrupt.h>
> > #include <linux/debugfs.h>
> > +#include <linux/completion.h>
> > #include <linux/watchdog.h>
> >
> > #include <linux/uuid.h>
> > @@ -38,24 +39,30 @@
> >
> > /* Sub Commands */
> > #define MEI_MC_START_WD_TIMER_REQ 0x13
> > +#define MEI_MC_START_WD_TIMER_RES 0x83
> > +#define MEI_WDT_STATUS_SUCCESS 0
> > +#define MEI_WDT_WDSTATE_NOT_REQUIRED 0x1
> > #define MEI_MC_STOP_WD_TIMER_REQ 0x14
> >
> > /**
> > * enum mei_wdt_state - internal watchdog state
> > *
> > + * @MEI_WDT_PROBE: wd in probing stage
> > * @MEI_WDT_IDLE: wd is idle and not opened
> > * @MEI_WDT_START: wd was opened, start was called
> > * @MEI_WDT_RUNNING: wd is expecting keep alive pings
> > * @MEI_WDT_STOPPING: wd is stopping and will move to IDLE
> > + * @MEI_WDT_NOT_REQUIRED: wd device is not required
> > */
> > enum mei_wdt_state {
> > + MEI_WDT_PROBE,
> > MEI_WDT_IDLE,
> > MEI_WDT_START,
> > MEI_WDT_RUNNING,
> > MEI_WDT_STOPPING,
> > + MEI_WDT_NOT_REQUIRED,
> > };
> >
> > -#if IS_ENABLED(CONFIG_DEBUG_FS)
> > static const char *mei_wdt_state_str(enum mei_wdt_state state)
> > {
> > switch (state) {
> > @@ -71,7 +78,6 @@ static const char *mei_wdt_state_str(enum
> mei_wdt_state state)
> > return "unknown";
> > }
> > }
> > -#endif /* CONFIG_DEBUG_FS */
> >
> > struct mei_wdt;
> >
> > @@ -94,6 +100,10 @@ struct mei_wdt_dev {
> > *
> > * @cldev: mei watchdog client device
> > * @state: watchdog internal state
> > + * @resp_required: ping required response
> > + * @response: ping response completion
> > + * @unregister: unregister worker
> > + * @reg_lock: watchdog device registration lock
> > * @timeout: watchdog current timeout
> > *
> > * @dbgfs_dir: debugfs dir entry
> > @@ -103,6 +113,10 @@ struct mei_wdt {
> >
> > struct mei_cl_device *cldev;
> > enum mei_wdt_state state;
> > + bool resp_required;
> > + struct completion response;
> > + struct work_struct unregister;
> > + struct mutex reg_lock;
> > u16 timeout;
> >
> > #if IS_ENABLED(CONFIG_DEBUG_FS)
> > @@ -139,6 +153,19 @@ struct mei_wdt_start_request {
> > } __packed;
> >
> > /**
> > + * struct mei_wdt_start_response watchdog start/ping response
> > + *
> > + * @hdr: Management Control Command Header
> > + * @status: operation status
> > + * @wdstate: watchdog status bit mask
> > + */
> > +struct mei_wdt_start_response {
> > + struct mei_mc_hdr hdr;
> > + u8 status;
> > + u8 wdstate;
> > +} __packed;
> > +
> > +/**
> > * struct mei_wdt_stop_request - watchdog stop
> > *
> > * @hdr: Management Control Command Header
> > @@ -277,13 +304,18 @@ static int mei_wdt_ops_ping(struct watchdog_device
> *wdd)
> > if (wdt->state != MEI_WDT_START && wdt->state !=
> MEI_WDT_RUNNING)
> > return 0;
> >
> > + if (wdt->resp_required)
> > + init_completion(&wdt->response);
> > +
> > + wdt->state = MEI_WDT_RUNNING;
> > ret = mei_wdt_ping(wdt);
> > if (ret)
> > return ret;
> >
> > - wdt->state = MEI_WDT_RUNNING;
>
> The state is now set to RUNNING even if the ping failed.
> Is that on purpose ?
Yes, the state is checked in the response handler.
>
> > + if (wdt->resp_required)
> > + ret = wait_for_completion_killable(&wdt->response);
> >
> > - return 0;
> > + return ret;
> > }
> >
> > /**
> > @@ -358,15 +390,22 @@ static struct watchdog_info wd_info = {
> > */
> > static void mei_wdt_unregister(struct mei_wdt *wdt)
> > {
> > - struct mei_wdt_dev *mwd = wdt->mwd;
> > + struct mei_wdt_dev *mwd;
> >
> > - if (!mwd)
> > - return;
> > + mutex_lock(&wdt->reg_lock);
> > +
> > + if (!wdt->mwd)
> > + goto out;
> > +
>
> Is this because the error on registration was ignored ?
> Trying to understand the rationale for this check.
Protection against double call, mostly from testing hooks which are not part of the series.
>
> > + mwd = wdt->mwd;
> >
> > watchdog_unregister_device(&mwd->wdd);
> > +
>
> It would be better to make such changes in an earlier patch and avoid the
> whitespace change here.
>
> > wdt->mwd = NULL;
> > - wdt->state = MEI_WDT_IDLE;
> > kref_put(&mwd->refcnt, mei_wdt_release);
> > +
> > +out:
> > + mutex_unlock(&wdt->reg_lock);
> > }
> >
> > /**
> > @@ -387,9 +426,13 @@ static int mei_wdt_register(struct mei_wdt *wdt)
> >
> > dev = &wdt->cldev->dev;
> >
> > + mutex_lock(&wdt->reg_lock);
> > +
> > mwd = kzalloc(sizeof(struct mei_wdt_dev), GFP_KERNEL);
> > - if (!mwd)
> > - return -ENOMEM;
> > + if (!mwd) {
> > + ret = -ENOMEM;
> > + goto out;
> > + }
> >
> > mwd->wdt = wdt;
> > mwd->wdd.info = &wd_info;
> > @@ -405,13 +448,104 @@ static int mei_wdt_register(struct mei_wdt *wdt)
> > if (ret) {
> > dev_err(dev, "unable to register watchdog device = %d.\n", ret);
> > kref_put(&mwd->refcnt, mei_wdt_release);
> > - return ret;
> > + goto out;
> > }
> >
> > wdt->mwd = mwd;
> > +out:
> > + mutex_unlock(&wdt->reg_lock);
> > return 0;
>
> Do you want to return ret here ? Otherwise some of the code above does
> not really make sense (ie setting ret).
Thanks, good catch.
> > }
> >
> > +static void mei_wdt_unregister_work(struct work_struct *work)
> > +{
> > + struct mei_wdt *wdt = container_of(work, struct mei_wdt, unregister);
> > +
> > + mei_wdt_unregister(wdt);
> > +}
> > +
> > +/**
> > + * mei_wdt_event_rx - callback for data receive
> > + *
> > + * @cldev: bus device
> > + */
> > +static void mei_wdt_event_rx(struct mei_cl_device *cldev)
> > +{
> > + struct mei_wdt *wdt = mei_cldev_get_drvdata(cldev);
> > + struct mei_wdt_start_response res;
> > + const size_t res_len = sizeof(res);
> > + int ret;
> > +
> > + ret = mei_cldev_recv(wdt->cldev, (u8 *)&res, res_len);
> > + if (ret < 0) {
> > + dev_err(&cldev->dev, "failure in recv %d\n", ret);
>
> Not objecting, just concerned. Can those error messages
> result in filling up the kernel log if the mei hardware has a problem ?
I hope no, the HW will reset eventually.
> From an operational perspective, is it acceptable to ignore the errors ?
Not really, we want to know when it happens and from what flow.
> > + return;
> > + }
> > +
> > + /* Empty response can be sent on stop */
> > + if (ret == 0)
> > + return;
> > +
> > + if (ret < sizeof(struct mei_mc_hdr)) {
> > + dev_err(&cldev->dev, "recv small data %d\n", ret);
> > + return;
> > + }
> > +
> > + if (res.hdr.command != MEI_MANAGEMENT_CONTROL ||
> > + res.hdr.versionnumber != MEI_MC_VERSION_NUMBER) {
> > + dev_err(&cldev->dev, "wrong command received\n");
> > + return;
> > + }
> > +
> > + if (res.hdr.subcommand != MEI_MC_START_WD_TIMER_RES) {
> > + dev_warn(&cldev->dev, "unsupported command %d :%s[%d]\n",
> > + res.hdr.subcommand,
> > + mei_wdt_state_str(wdt->state),
> > + wdt->state);
> > + return;
> > + }
> > +
> > + if (wdt->state == MEI_WDT_RUNNING) {
> > + if (res.wdstate & MEI_WDT_WDSTATE_NOT_REQUIRED) {
> > + wdt->state = MEI_WDT_NOT_REQUIRED;
> > + schedule_work(&wdt->unregister);
> > + }
> > + goto out;
> > + }
> > +
> > + if (wdt->state == MEI_WDT_PROBE) {
> > + if (res.wdstate & MEI_WDT_WDSTATE_NOT_REQUIRED) {
> > + wdt->state = MEI_WDT_NOT_REQUIRED;
> > + } else {
> > + /* stop the ping register watchdog device */
>
> Should this be "stop the watchdog" ?
Maybe this needs rephrasing
>
> > + mei_wdt_stop(wdt);
> > + mei_wdt_register(wdt);
> > + }
> > + return;
> > + }
> > +
> > + dev_warn(&cldev->dev, "not in correct state %s[%d]\n",
> > + mei_wdt_state_str(wdt->state), wdt->state);
> > +
> > +out:
> > + if (!completion_done(&wdt->response))
> > + complete(&wdt->response);
> > +}
> > +
> > +/**
> > + * mei_wdt_event - callback for event receive
> > + *
> > + * @cldev: bus device
> > + * @events: event mask
> > + * @context: callback context
> > + */
> > +static void mei_wdt_event(struct mei_cl_device *cldev,
> > + u32 events, void *context)
> > +{
> > + if (events & BIT(MEI_CL_EVENT_RX))
> > + mei_wdt_event_rx(cldev);
> > +}
> > +
> > #if IS_ENABLED(CONFIG_DEBUG_FS)
> >
> > static ssize_t mei_dbgfs_read_state(struct file *file, char __user *ubuf,
> > @@ -482,8 +616,13 @@ static int mei_wdt_probe(struct mei_cl_device *cldev,
> > return -ENOMEM;
> >
> > wdt->timeout = MEI_WDT_DEFAULT_TIMEOUT;
> > - wdt->state = MEI_WDT_IDLE;
> > + wdt->state = MEI_WDT_PROBE;
> > wdt->cldev = cldev;
> > + wdt->resp_required = mei_cldev_ver(cldev) > 0x1;
> > + mutex_init(&wdt->reg_lock);
> > + init_completion(&wdt->response);
> > + INIT_WORK(&wdt->unregister, mei_wdt_unregister_work);
> > +
> > mei_cldev_set_drvdata(cldev, wdt);
> >
> > ret = mei_cldev_enable(cldev);
> > @@ -492,9 +631,19 @@ static int mei_wdt_probe(struct mei_cl_device *cldev,
> > goto err_out;
> > }
> >
> > + ret = mei_cldev_register_event_cb(wdt->cldev, BIT(MEI_CL_EVENT_RX),
> > + mei_wdt_event, NULL);
> > + if (ret) {
> > + dev_err(&cldev->dev, "Could not register event ret=%d\n", ret);
> > + goto err_disable;
> > + }
> > +
> Can there be an event before the call to mei_wdt_register() ?
> If so, it that case handled correctly ?
Yes, there is an first internal ping that checks whether the feature is enabled
>
> > wd_info.firmware_version = mei_cldev_ver(cldev);
> >
> > - ret = mei_wdt_register(wdt);
> > + if (wdt->resp_required)
> > + ret = mei_wdt_ping(wdt);
> > + else
> > + ret = mei_wdt_register(wdt);
> > if (ret)
> > goto err_disable;
> >
> > @@ -515,6 +664,12 @@ static int mei_wdt_remove(struct mei_cl_device
> *cldev)
> > {
> > struct mei_wdt *wdt = mei_cldev_get_drvdata(cldev);
> >
> > + /* Free the caller in case of fw initiated or unexpected reset */
> > + if (!completion_done(&wdt->response))
> > + complete(&wdt->response);
> > +
> > + cancel_work_sync(&wdt->unregister);
> > +
> > mei_wdt_unregister(wdt);
> >
> can there be an event callback after mei_wdt_unregister() but before
> mei_cldev_disable() ?
> If so, is the situation handled or would it result in a race condition ?
Not really, unless there is some glitch in the FW
> [ I think it is ok in both cases, just trying to make sure I didn't miss anything ]
>
> > mei_cldev_disable(cldev);
> > @@ -530,7 +685,7 @@ static int mei_wdt_remove(struct mei_cl_device *cldev)
> > 0x89, 0x9D, 0xA9, 0x15, 0x14, 0xCB, 0x32, 0xAB)
> >
> > static struct mei_cl_device_id mei_wdt_tbl[] = {
> > - { .uuid = MEI_UUID_WD, .version = 0x1},
> > + { .uuid = MEI_UUID_WD, .version = MEI_CL_VERSION_ANY },
> > /* required last entry */
> > { }
> > };
> >
--
To unsubscribe from this list: send the line "unsubscribe linux-kernel" in
the body of a message to majordomo@xxxxxxxxxxxxxxx
More majordomo info at http://vger.kernel.org/majordomo-info.html
Please read the FAQ at http://www.tux.org/lkml/