hwmon: (occ) Delay hwmon registration until user request

Instead of registering the hwmon device at probe time, use the
existing "occ_active" sysfs file to control when the driver polls
the OCC for sensor data and registers with hwmon. The reason for
this change is that the SBE, which is the device by which the
driver communicates with the OCC, cannot handle communications
during certain system state transitions, resulting in
unrecoverable system errors.

Signed-off-by: Eddie James <eajames@linux.ibm.com>
Link: https://lore.kernel.org/r/20220427140443.11428-1-eajames@linux.ibm.com
Signed-off-by: Guenter Roeck <linux@roeck-us.net>
This commit is contained in:
Eddie James 2022-04-27 09:04:43 -05:00 committed by Guenter Roeck
parent c3963bc0a0
commit 849b0156d9
5 changed files with 157 additions and 91 deletions

View File

@ -1149,44 +1149,75 @@ static void occ_parse_poll_response(struct occ *occ)
sizeof(*header), size + sizeof(*header)); sizeof(*header), size + sizeof(*header));
} }
int occ_setup(struct occ *occ, const char *name) int occ_active(struct occ *occ, bool active)
{
int rc = mutex_lock_interruptible(&occ->lock);
if (rc)
return rc;
if (active) {
if (occ->active) {
rc = -EALREADY;
goto unlock;
}
occ->error_count = 0;
occ->last_safe = 0;
rc = occ_poll(occ);
if (rc < 0) {
dev_err(occ->bus_dev,
"failed to get OCC poll response=%02x: %d\n",
occ->resp.return_status, rc);
goto unlock;
}
occ->active = true;
occ->next_update = jiffies + OCC_UPDATE_FREQUENCY;
occ_parse_poll_response(occ);
rc = occ_setup_sensor_attrs(occ);
if (rc) {
dev_err(occ->bus_dev,
"failed to setup sensor attrs: %d\n", rc);
goto unlock;
}
occ->hwmon = hwmon_device_register_with_groups(occ->bus_dev,
"occ", occ,
occ->groups);
if (IS_ERR(occ->hwmon)) {
rc = PTR_ERR(occ->hwmon);
occ->hwmon = NULL;
dev_err(occ->bus_dev,
"failed to register hwmon device: %d\n", rc);
goto unlock;
}
} else {
if (!occ->active) {
rc = -EALREADY;
goto unlock;
}
if (occ->hwmon)
hwmon_device_unregister(occ->hwmon);
occ->active = false;
occ->hwmon = NULL;
}
unlock:
mutex_unlock(&occ->lock);
return rc;
}
int occ_setup(struct occ *occ)
{ {
int rc; int rc;
mutex_init(&occ->lock); mutex_init(&occ->lock);
occ->groups[0] = &occ->group; occ->groups[0] = &occ->group;
/* no need to lock */
rc = occ_poll(occ);
if (rc == -ESHUTDOWN) {
dev_info(occ->bus_dev, "host is not ready\n");
return rc;
} else if (rc < 0) {
dev_err(occ->bus_dev,
"failed to get OCC poll response=%02x: %d\n",
occ->resp.return_status, rc);
return rc;
}
occ->next_update = jiffies + OCC_UPDATE_FREQUENCY;
occ_parse_poll_response(occ);
rc = occ_setup_sensor_attrs(occ);
if (rc) {
dev_err(occ->bus_dev, "failed to setup sensor attrs: %d\n",
rc);
return rc;
}
occ->hwmon = devm_hwmon_device_register_with_groups(occ->bus_dev, name,
occ, occ->groups);
if (IS_ERR(occ->hwmon)) {
rc = PTR_ERR(occ->hwmon);
dev_err(occ->bus_dev, "failed to register hwmon device: %d\n",
rc);
return rc;
}
rc = occ_setup_sysfs(occ); rc = occ_setup_sysfs(occ);
if (rc) if (rc)
dev_err(occ->bus_dev, "failed to setup sysfs: %d\n", rc); dev_err(occ->bus_dev, "failed to setup sysfs: %d\n", rc);
@ -1195,6 +1226,15 @@ int occ_setup(struct occ *occ, const char *name)
} }
EXPORT_SYMBOL_GPL(occ_setup); EXPORT_SYMBOL_GPL(occ_setup);
void occ_shutdown(struct occ *occ)
{
occ_shutdown_sysfs(occ);
if (occ->hwmon)
hwmon_device_unregister(occ->hwmon);
}
EXPORT_SYMBOL_GPL(occ_shutdown);
MODULE_AUTHOR("Eddie James <eajames@linux.ibm.com>"); MODULE_AUTHOR("Eddie James <eajames@linux.ibm.com>");
MODULE_DESCRIPTION("Common OCC hwmon code"); MODULE_DESCRIPTION("Common OCC hwmon code");
MODULE_LICENSE("GPL"); MODULE_LICENSE("GPL");

View File

@ -106,6 +106,7 @@ struct occ {
struct attribute_group group; struct attribute_group group;
const struct attribute_group *groups[2]; const struct attribute_group *groups[2];
bool active;
int error; /* final transfer error after retry */ int error; /* final transfer error after retry */
int last_error; /* latest transfer error */ int last_error; /* latest transfer error */
unsigned int error_count; /* number of xfr errors observed */ unsigned int error_count; /* number of xfr errors observed */
@ -123,9 +124,11 @@ struct occ {
u8 prev_mode; u8 prev_mode;
}; };
int occ_setup(struct occ *occ, const char *name); int occ_active(struct occ *occ, bool active);
int occ_setup(struct occ *occ);
int occ_setup_sysfs(struct occ *occ); int occ_setup_sysfs(struct occ *occ);
void occ_shutdown(struct occ *occ); void occ_shutdown(struct occ *occ);
void occ_shutdown_sysfs(struct occ *occ);
void occ_sysfs_poll_done(struct occ *occ); void occ_sysfs_poll_done(struct occ *occ);
int occ_update_response(struct occ *occ); int occ_update_response(struct occ *occ);

View File

@ -223,7 +223,7 @@ static int p8_i2c_occ_probe(struct i2c_client *client)
occ->poll_cmd_data = 0x10; /* P8 OCC poll data */ occ->poll_cmd_data = 0x10; /* P8 OCC poll data */
occ->send_cmd = p8_i2c_occ_send_cmd; occ->send_cmd = p8_i2c_occ_send_cmd;
return occ_setup(occ, "p8_occ"); return occ_setup(occ);
} }
static int p8_i2c_occ_remove(struct i2c_client *client) static int p8_i2c_occ_remove(struct i2c_client *client)

View File

@ -145,7 +145,7 @@ static int p9_sbe_occ_probe(struct platform_device *pdev)
occ->poll_cmd_data = 0x20; /* P9 OCC poll data */ occ->poll_cmd_data = 0x20; /* P9 OCC poll data */
occ->send_cmd = p9_sbe_occ_send_cmd; occ->send_cmd = p9_sbe_occ_send_cmd;
rc = occ_setup(occ, "p9_occ"); rc = occ_setup(occ);
if (rc == -ESHUTDOWN) if (rc == -ESHUTDOWN)
rc = -ENODEV; /* Host is shutdown, don't spew errors */ rc = -ENODEV; /* Host is shutdown, don't spew errors */

View File

@ -6,13 +6,13 @@
#include <linux/export.h> #include <linux/export.h>
#include <linux/hwmon-sysfs.h> #include <linux/hwmon-sysfs.h>
#include <linux/kernel.h> #include <linux/kernel.h>
#include <linux/kstrtox.h>
#include <linux/sysfs.h> #include <linux/sysfs.h>
#include "common.h" #include "common.h"
/* OCC status register */ /* OCC status register */
#define OCC_STAT_MASTER BIT(7) #define OCC_STAT_MASTER BIT(7)
#define OCC_STAT_ACTIVE BIT(0)
/* OCC extended status register */ /* OCC extended status register */
#define OCC_EXT_STAT_DVFS_OT BIT(7) #define OCC_EXT_STAT_DVFS_OT BIT(7)
@ -22,6 +22,25 @@
#define OCC_EXT_STAT_DVFS_VDD BIT(3) #define OCC_EXT_STAT_DVFS_VDD BIT(3)
#define OCC_EXT_STAT_GPU_THROTTLE GENMASK(2, 0) #define OCC_EXT_STAT_GPU_THROTTLE GENMASK(2, 0)
static ssize_t occ_active_store(struct device *dev,
struct device_attribute *attr,
const char *buf, size_t count)
{
int rc;
bool active;
struct occ *occ = dev_get_drvdata(dev);
rc = kstrtobool(buf, &active);
if (rc)
return rc;
rc = occ_active(occ, active);
if (rc)
return rc;
return count;
}
static ssize_t occ_sysfs_show(struct device *dev, static ssize_t occ_sysfs_show(struct device *dev,
struct device_attribute *attr, char *buf) struct device_attribute *attr, char *buf)
{ {
@ -31,54 +50,64 @@ static ssize_t occ_sysfs_show(struct device *dev,
struct occ_poll_response_header *header; struct occ_poll_response_header *header;
struct sensor_device_attribute *sattr = to_sensor_dev_attr(attr); struct sensor_device_attribute *sattr = to_sensor_dev_attr(attr);
rc = occ_update_response(occ); if (occ->active) {
if (rc) rc = occ_update_response(occ);
return rc; if (rc)
return rc;
header = (struct occ_poll_response_header *)occ->resp.data; header = (struct occ_poll_response_header *)occ->resp.data;
switch (sattr->index) { switch (sattr->index) {
case 0: case 0:
val = !!(header->status & OCC_STAT_MASTER); val = !!(header->status & OCC_STAT_MASTER);
break; break;
case 1: case 1:
val = !!(header->status & OCC_STAT_ACTIVE);
break;
case 2:
val = !!(header->ext_status & OCC_EXT_STAT_DVFS_OT);
break;
case 3:
val = !!(header->ext_status & OCC_EXT_STAT_DVFS_POWER);
break;
case 4:
val = !!(header->ext_status & OCC_EXT_STAT_MEM_THROTTLE);
break;
case 5:
val = !!(header->ext_status & OCC_EXT_STAT_QUICK_DROP);
break;
case 6:
val = header->occ_state;
break;
case 7:
if (header->status & OCC_STAT_MASTER)
val = hweight8(header->occs_present);
else
val = 1; val = 1;
break; break;
case 8: case 2:
val = header->ips_status; val = !!(header->ext_status & OCC_EXT_STAT_DVFS_OT);
break; break;
case 9: case 3:
val = header->mode; val = !!(header->ext_status & OCC_EXT_STAT_DVFS_POWER);
break; break;
case 10: case 4:
val = !!(header->ext_status & OCC_EXT_STAT_DVFS_VDD); val = !!(header->ext_status &
break; OCC_EXT_STAT_MEM_THROTTLE);
case 11: break;
val = header->ext_status & OCC_EXT_STAT_GPU_THROTTLE; case 5:
break; val = !!(header->ext_status & OCC_EXT_STAT_QUICK_DROP);
default: break;
return -EINVAL; case 6:
val = header->occ_state;
break;
case 7:
if (header->status & OCC_STAT_MASTER)
val = hweight8(header->occs_present);
else
val = 1;
break;
case 8:
val = header->ips_status;
break;
case 9:
val = header->mode;
break;
case 10:
val = !!(header->ext_status & OCC_EXT_STAT_DVFS_VDD);
break;
case 11:
val = header->ext_status & OCC_EXT_STAT_GPU_THROTTLE;
break;
default:
return -EINVAL;
}
} else {
if (sattr->index == 1)
val = 0;
else if (sattr->index <= 11)
val = -ENODATA;
else
return -EINVAL;
} }
return sysfs_emit(buf, "%d\n", val); return sysfs_emit(buf, "%d\n", val);
@ -95,7 +124,8 @@ static ssize_t occ_error_show(struct device *dev,
} }
static SENSOR_DEVICE_ATTR(occ_master, 0444, occ_sysfs_show, NULL, 0); static SENSOR_DEVICE_ATTR(occ_master, 0444, occ_sysfs_show, NULL, 0);
static SENSOR_DEVICE_ATTR(occ_active, 0444, occ_sysfs_show, NULL, 1); static SENSOR_DEVICE_ATTR(occ_active, 0644, occ_sysfs_show, occ_active_store,
1);
static SENSOR_DEVICE_ATTR(occ_dvfs_overtemp, 0444, occ_sysfs_show, NULL, 2); static SENSOR_DEVICE_ATTR(occ_dvfs_overtemp, 0444, occ_sysfs_show, NULL, 2);
static SENSOR_DEVICE_ATTR(occ_dvfs_power, 0444, occ_sysfs_show, NULL, 3); static SENSOR_DEVICE_ATTR(occ_dvfs_power, 0444, occ_sysfs_show, NULL, 3);
static SENSOR_DEVICE_ATTR(occ_mem_throttle, 0444, occ_sysfs_show, NULL, 4); static SENSOR_DEVICE_ATTR(occ_mem_throttle, 0444, occ_sysfs_show, NULL, 4);
@ -139,7 +169,7 @@ void occ_sysfs_poll_done(struct occ *occ)
* On the first poll response, we haven't yet created the sysfs * On the first poll response, we haven't yet created the sysfs
* attributes, so don't make any notify calls. * attributes, so don't make any notify calls.
*/ */
if (!occ->hwmon) if (!occ->active)
goto done; goto done;
if ((header->status & OCC_STAT_MASTER) != if ((header->status & OCC_STAT_MASTER) !=
@ -148,12 +178,6 @@ void occ_sysfs_poll_done(struct occ *occ)
sysfs_notify(&occ->bus_dev->kobj, NULL, name); sysfs_notify(&occ->bus_dev->kobj, NULL, name);
} }
if ((header->status & OCC_STAT_ACTIVE) !=
(occ->prev_stat & OCC_STAT_ACTIVE)) {
name = sensor_dev_attr_occ_active.dev_attr.attr.name;
sysfs_notify(&occ->bus_dev->kobj, NULL, name);
}
if ((header->ext_status & OCC_EXT_STAT_DVFS_OT) != if ((header->ext_status & OCC_EXT_STAT_DVFS_OT) !=
(occ->prev_ext_stat & OCC_EXT_STAT_DVFS_OT)) { (occ->prev_ext_stat & OCC_EXT_STAT_DVFS_OT)) {
name = sensor_dev_attr_occ_dvfs_overtemp.dev_attr.attr.name; name = sensor_dev_attr_occ_dvfs_overtemp.dev_attr.attr.name;
@ -227,8 +251,7 @@ int occ_setup_sysfs(struct occ *occ)
return sysfs_create_group(&occ->bus_dev->kobj, &occ_sysfs); return sysfs_create_group(&occ->bus_dev->kobj, &occ_sysfs);
} }
void occ_shutdown(struct occ *occ) void occ_shutdown_sysfs(struct occ *occ)
{ {
sysfs_remove_group(&occ->bus_dev->kobj, &occ_sysfs); sysfs_remove_group(&occ->bus_dev->kobj, &occ_sysfs);
} }
EXPORT_SYMBOL_GPL(occ_shutdown);