mirror of
git://git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git
synced 2025-09-18 22:14:16 +00:00

Under some circumstances, firmware in the QAT devices could become unresponsive. The Heartbeat feature provides a mechanism to detect unresponsive devices. The QAT FW periodically writes to memory a set of counters that allow to detect the liveness of a device. This patch adds logic to enable the reporting of those counters, analyze them and report if a device is alive or not. In particular this adds (1) heartbeat enabling, reading and detection logic (2) reporting of heartbeat status and configuration via debugfs (3) documentation for the newly created sysfs entries (4) configuration of FW settings related to heartbeat, e.g. tick period (5) logic to convert time in ms (provided by the user) to clock ticks This patch introduces a new folder in debugfs called heartbeat with the following attributes: - status - queries_sent - queries_failed - config All attributes except config are reading only. In particular: - `status` file returns 0 when device is operational and -1 otherwise. - `queries_sent` returns the total number of heartbeat queries sent. - `queries_failed` returns the total number of heartbeat queries failed. - `config` allows to adjust the frequency at which the firmware writes counters to memory. This period is given in milliseconds and it is fixed for GEN4 devices. Signed-off-by: Damian Muszynski <damian.muszynski@intel.com> Reviewed-by: Giovanni Cabiddu <giovanni.cabiddu@intel.com> Reviewed-by: Andy Shevchenko <andriy.shevchenko@linux.intel.com> Signed-off-by: Herbert Xu <herbert@gondor.apana.org.au>
73 lines
1.7 KiB
C
73 lines
1.7 KiB
C
/* SPDX-License-Identifier: GPL-2.0-only */
|
|
/* Copyright(c) 2023 Intel Corporation */
|
|
|
|
#ifndef ADF_HEARTBEAT_H_
|
|
#define ADF_HEARTBEAT_H_
|
|
|
|
#include <linux/types.h>
|
|
|
|
struct adf_accel_dev;
|
|
struct dentry;
|
|
|
|
#define ADF_CFG_HB_TIMER_MIN_MS 200
|
|
#define ADF_CFG_HB_TIMER_DEFAULT_MS 500
|
|
#define ADF_CFG_HB_COUNT_THRESHOLD 3
|
|
|
|
enum adf_device_heartbeat_status {
|
|
HB_DEV_UNRESPONSIVE = 0,
|
|
HB_DEV_ALIVE,
|
|
HB_DEV_UNSUPPORTED,
|
|
};
|
|
|
|
struct adf_heartbeat {
|
|
unsigned int hb_sent_counter;
|
|
unsigned int hb_failed_counter;
|
|
unsigned int hb_timer;
|
|
u64 last_hb_check_time;
|
|
struct hb_dma_addr {
|
|
dma_addr_t phy_addr;
|
|
void *virt_addr;
|
|
} dma;
|
|
struct {
|
|
struct dentry *base_dir;
|
|
struct dentry *status;
|
|
struct dentry *cfg;
|
|
struct dentry *sent;
|
|
struct dentry *failed;
|
|
} dbgfs;
|
|
};
|
|
|
|
#ifdef CONFIG_DEBUG_FS
|
|
int adf_heartbeat_init(struct adf_accel_dev *accel_dev);
|
|
int adf_heartbeat_start(struct adf_accel_dev *accel_dev);
|
|
void adf_heartbeat_shutdown(struct adf_accel_dev *accel_dev);
|
|
|
|
int adf_heartbeat_ms_to_ticks(struct adf_accel_dev *accel_dev, unsigned int time_ms,
|
|
uint32_t *value);
|
|
int adf_heartbeat_save_cfg_param(struct adf_accel_dev *accel_dev,
|
|
unsigned int timer_ms);
|
|
void adf_heartbeat_status(struct adf_accel_dev *accel_dev,
|
|
enum adf_device_heartbeat_status *hb_status);
|
|
|
|
#else
|
|
static inline int adf_heartbeat_init(struct adf_accel_dev *accel_dev)
|
|
{
|
|
return 0;
|
|
}
|
|
|
|
static inline int adf_heartbeat_start(struct adf_accel_dev *accel_dev)
|
|
{
|
|
return 0;
|
|
}
|
|
|
|
static inline void adf_heartbeat_shutdown(struct adf_accel_dev *accel_dev)
|
|
{
|
|
}
|
|
|
|
static inline int adf_heartbeat_save_cfg_param(struct adf_accel_dev *accel_dev,
|
|
unsigned int timer_ms)
|
|
{
|
|
return 0;
|
|
}
|
|
#endif
|
|
#endif /* ADF_HEARTBEAT_H_ */
|