[PATCH] nvme-pci: expose active quirks in sysfs

Maurizio Lombardi mlombard at bsdbackstore.eu
Wed Oct 29 23:18:30 PDT 2025


On Thu Oct 30, 2025 at 12:25 AM CET, Chaitanya Kulkarni wrote:
> On 10/29/25 01:02, Maurizio Lombardi wrote:
>> On Wed Oct 29, 2025 at 6:47 AM CET, Chaitanya Kulkarni wrote:
>>> On 10/28/25 10:00, Maurizio Lombardi wrote:
>>>> On Tue Oct 28, 2025 at 5:32 PM CET, Bart Van Assche wrote:
>>>>> On 10/28/25 7:29 AM, Maurizio Lombardi wrote:
>>>>>> Currently, there is no straightforward way for a user to inspect
>>>>>> the quirks value from userspace.
>>>>>> Add a new read-only sysfs attribute "quirks";
>>>>>> reading this file will display the hexadecimal
>>>>>> value of the ctrl->quirks bitmask for the given NVMe device.
>>>>> This patch changes the constants in enum nvme_quirks from
>>>>> kernel-internal constants into an ABI. I'm not sure that's what we
>>>>> want.
>>>> I understand your concern.
>>>> I could respin it to export the names of the active quirks
>>>> rather than the raw bitmask, if there is an interest in having
>>>> this feature.
>>>>
>>>> Maurizio
>>>>
>>> question here: do we need to care about some kind of security before we
>>> expose controller information that is internal to the driver ?
>>> CAP_SYS_ADMIN ? -ck
>> IMO I don't think it's an information that needs to be hidden.
>> After all, any user could run "lscpi -nn", get the vendor and device
>> id and cross-reference them with the pci table in the source code
>> to get the enabled quirks, this sysfs entry would just make it faster.
>>
>> Maurizio
>
> Yes it is definitely useful after only decoding :-
>
> linux-block (for-next) # cat /sys/class/nvme/nvme0/quirks
> 0x0000000000040000
>
> Active quirks:
>    BOGUS_NID
> linux-block (for-next) #

Ah you anticipated me, I was preparing a somewhat similar patch.

************************

Currently, there is no straightforward way for a user to inspect
which quirks are active for a given device from userspace.

Add a new "quirks" sysfs attribute to the nvme controller device.

Reading this file will display a human-readable list
of all active quirks, with each quirk name on a new line.
If no quirks are active, it will display "none".

Signed-off-by: Maurizio Lombardi <mlombard at redhat.com>
---

V2: Do not expose kernel-internal constants to userspace.
    Move the quirks attribute to the controller device, where it belongs.

 drivers/nvme/host/nvme.h  | 54 +++++++++++++++++++++++++++++++++++++++
 drivers/nvme/host/sysfs.c | 23 +++++++++++++++++
 2 files changed, 77 insertions(+)

diff --git a/drivers/nvme/host/nvme.h b/drivers/nvme/host/nvme.h
index 102fae6a231c..647f19dd57e9 100644
--- a/drivers/nvme/host/nvme.h
+++ b/drivers/nvme/host/nvme.h
@@ -180,6 +180,60 @@ enum nvme_quirks {
 	NVME_QUIRK_DMAPOOL_ALIGN_512		= (1 << 22),
 };

+static inline char *nvme_quirk_name(enum nvme_quirks q)
+{
+	switch (q) {
+	case NVME_QUIRK_STRIPE_SIZE:
+		return "stripe_size";
+	case NVME_QUIRK_IDENTIFY_CNS:
+		return "identify_cns";
+	case NVME_QUIRK_DEALLOCATE_ZEROES:
+		return "deallocate_zeroes";
+	case NVME_QUIRK_DELAY_BEFORE_CHK_RDY:
+		return "delay_before_chk_rdy";
+	case NVME_QUIRK_NO_APST:
+		return "no_apst";
+	case NVME_QUIRK_NO_DEEPEST_PS:
+		return "no_deepest_ps";
+	case NVME_QUIRK_QDEPTH_ONE:
+		return "qdepth_one";
+	case NVME_QUIRK_MEDIUM_PRIO_SQ:
+		return "medium_prio_sq";
+	case NVME_QUIRK_IGNORE_DEV_SUBNQN:
+		return "ignore_dev_subnqn";
+	case NVME_QUIRK_DISABLE_WRITE_ZEROES:
+		return "disable_write_zeroes";
+	case NVME_QUIRK_SIMPLE_SUSPEND:
+		return "simple_suspend";
+	case NVME_QUIRK_SINGLE_VECTOR:
+		return "single_vector";
+	case NVME_QUIRK_128_BYTES_SQES:
+		return "128_bytes_sqes";
+	case NVME_QUIRK_SHARED_TAGS:
+		return "shared_tags";
+	case NVME_QUIRK_NO_TEMP_THRESH_CHANGE:
+		return "no_temp_thresh_change";
+	case NVME_QUIRK_NO_NS_DESC_LIST:
+		return "no_ns_desc_list";
+	case NVME_QUIRK_DMA_ADDRESS_BITS_48:
+		return "dma_address_bits_48";
+	case NVME_QUIRK_SKIP_CID_GEN:
+		return "skip_cid_gen";
+	case NVME_QUIRK_BOGUS_NID:
+		return "bogus_nid";
+	case NVME_QUIRK_NO_SECONDARY_TEMP_THRESH:
+		return "no_secondary_temp_thresh";
+	case NVME_QUIRK_FORCE_NO_SIMPLE_SUSPEND:
+		return "force_no_simple_suspend";
+	case NVME_QUIRK_BROKEN_MSI:
+		return "broken_msi";
+	case NVME_QUIRK_DMAPOOL_ALIGN_512:
+		return "dmapool_align_512";
+	}
+
+	return "unknown";
+}
+
 /*
  * Common request structure for NVMe passthrough.  All drivers must have
  * this structure as the first member of their request-private data.
diff --git a/drivers/nvme/host/sysfs.c b/drivers/nvme/host/sysfs.c
index 29430949ce2f..16c6fea4b2db 100644
--- a/drivers/nvme/host/sysfs.c
+++ b/drivers/nvme/host/sysfs.c
@@ -601,6 +601,28 @@ static ssize_t dctype_show(struct device *dev,
 }
 static DEVICE_ATTR_RO(dctype);

+static ssize_t quirks_show(struct device *dev, struct device_attribute *attr,
+                char *buf)
+{
+	int count = 0, i;
+	struct nvme_ctrl *ctrl = dev_get_drvdata(dev);
+	unsigned long quirks = ctrl->quirks;
+
+	if (!quirks)
+		return sysfs_emit(buf, "none\n");
+
+	for (i = 0; quirks; ++i) {
+		if (quirks & 1) {
+			count += sysfs_emit_at(buf, count, "%s\n",
+					nvme_quirk_name(BIT(i)));
+		}
+		quirks >>= 1;
+	}
+
+	return count;
+}
+static DEVICE_ATTR_RO(quirks);
+
 #ifdef CONFIG_NVME_HOST_AUTH
 static ssize_t nvme_ctrl_dhchap_secret_show(struct device *dev,
 		struct device_attribute *attr, char *buf)
@@ -742,6 +764,7 @@ static struct attribute *nvme_dev_attrs[] = {
 	&dev_attr_kato.attr,
 	&dev_attr_cntrltype.attr,
 	&dev_attr_dctype.attr,
+	&dev_attr_quirks.attr,
 #ifdef CONFIG_NVME_HOST_AUTH
 	&dev_attr_dhchap_secret.attr,
 	&dev_attr_dhchap_ctrl_secret.attr,
--
2.47.3

>
>
> diff --git a/drivers/nvme/host/pci.c b/drivers/nvme/host/pci.c
> index c916176bd9f0..1b9ad818b12d 100644
> --- a/drivers/nvme/host/pci.c
> +++ b/drivers/nvme/host/pci.c
> @@ -2497,6 +2497,80 @@ static ssize_t cmbsz_show(struct device *dev, struct device_attribute *attr,
>   }
>   static DEVICE_ATTR_RO(cmbsz);
>   
> +static int nvme_get_quirks_string(unsigned long quirks, char *buf, size_t buf_len)
> +{
> +	size_t len = 0;
> +
> +	if (!quirks) {
> +		len = scnprintf(buf, buf_len, "No quirks enabled\n");
> +		return len;
> +	}
> +
> +	len += scnprintf(buf + len, buf_len - len, "Active quirks:\n");
> +
> +	if (quirks & NVME_QUIRK_STRIPE_SIZE)
> +		len += scnprintf(buf + len, buf_len - len, "  STRIPE_SIZE\n");
> +	if (quirks & NVME_QUIRK_IDENTIFY_CNS)
> +		len += scnprintf(buf + len, buf_len - len, "  IDENTIFY_CNS\n");
> +	if (quirks & NVME_QUIRK_DEALLOCATE_ZEROES)
> +		len += scnprintf(buf + len, buf_len - len, "  DEALLOCATE_ZEROES\n");
> +	if (quirks & NVME_QUIRK_DELAY_BEFORE_CHK_RDY)
> +		len += scnprintf(buf + len, buf_len - len, "  DELAY_BEFORE_CHK_RDY\n");
> +	if (quirks & NVME_QUIRK_NO_APST)
> +		len += scnprintf(buf + len, buf_len - len, "  NO_APST\n");
> +	if (quirks & NVME_QUIRK_NO_DEEPEST_PS)
> +		len += scnprintf(buf + len, buf_len - len, "  NO_DEEPEST_PS\n");
> +	if (quirks & NVME_QUIRK_QDEPTH_ONE)
> +		len += scnprintf(buf + len, buf_len - len, "  QDEPTH_ONE\n");
> +	if (quirks & NVME_QUIRK_MEDIUM_PRIO_SQ)
> +		len += scnprintf(buf + len, buf_len - len, "  MEDIUM_PRIO_SQ\n");
> +	if (quirks & NVME_QUIRK_IGNORE_DEV_SUBNQN)
> +		len += scnprintf(buf + len, buf_len - len, "  IGNORE_DEV_SUBNQN\n");
> +	if (quirks & NVME_QUIRK_DISABLE_WRITE_ZEROES)
> +		len += scnprintf(buf + len, buf_len - len, "  DISABLE_WRITE_ZEROES\n");
> +	if (quirks & NVME_QUIRK_SIMPLE_SUSPEND)
> +		len += scnprintf(buf + len, buf_len - len, "  SIMPLE_SUSPEND\n");
> +	if (quirks & NVME_QUIRK_SINGLE_VECTOR)
> +		len += scnprintf(buf + len, buf_len - len, "  SINGLE_VECTOR\n");
> +	if (quirks & NVME_QUIRK_128_BYTES_SQES)
> +		len += scnprintf(buf + len, buf_len - len, "  128_BYTES_SQES\n");
> +	if (quirks & NVME_QUIRK_SHARED_TAGS)
> +		len += scnprintf(buf + len, buf_len - len, "  SHARED_TAGS\n");
> +	if (quirks & NVME_QUIRK_NO_TEMP_THRESH_CHANGE)
> +		len += scnprintf(buf + len, buf_len - len, "  NO_TEMP_THRESH_CHANGE\n");
> +	if (quirks & NVME_QUIRK_NO_NS_DESC_LIST)
> +		len += scnprintf(buf + len, buf_len - len, "  NO_NS_DESC_LIST\n");
> +	if (quirks & NVME_QUIRK_DMA_ADDRESS_BITS_48)
> +		len += scnprintf(buf + len, buf_len - len, "  DMA_ADDRESS_BITS_48\n");
> +	if (quirks & NVME_QUIRK_SKIP_CID_GEN)
> +		len += scnprintf(buf + len, buf_len - len, "  SKIP_CID_GEN\n");
> +	if (quirks & NVME_QUIRK_BOGUS_NID)
> +		len += scnprintf(buf + len, buf_len - len, "  BOGUS_NID\n");
> +	if (quirks & NVME_QUIRK_NO_SECONDARY_TEMP_THRESH)
> +		len += scnprintf(buf + len, buf_len - len, "  NO_SECONDARY_TEMP_THRESH\n");
> +	if (quirks & NVME_QUIRK_FORCE_NO_SIMPLE_SUSPEND)
> +		len += scnprintf(buf + len, buf_len - len, "  FORCE_NO_SIMPLE_SUSPEND\n");
> +	if (quirks & NVME_QUIRK_BROKEN_MSI)
> +		len += scnprintf(buf + len, buf_len - len, "  BROKEN_MSI\n");
> +	if (quirks & NVME_QUIRK_DMAPOOL_ALIGN_512)
> +		len += scnprintf(buf + len, buf_len - len, "  DMAPOOL_ALIGN_512\n");
> +
> +	return len;
> +}
> +
> +static ssize_t quirks_show(struct device *dev, struct device_attribute *attr,
> +			   char *buf)
> +{
> +	struct nvme_dev *ndev = to_nvme_dev(dev_get_drvdata(dev));
> +	int len;
> +
> +	len = sysfs_emit(buf, "0x%016lx\n\n", ndev->ctrl.quirks);
> +	len += nvme_get_quirks_string(ndev->ctrl.quirks, buf + len, PAGE_SIZE - len);
> +
> +	return len;
> +}
> +static DEVICE_ATTR_RO(quirks);
> +
>   static ssize_t hmb_show(struct device *dev, struct device_attribute *attr,
>   			char *buf)
>   {
> @@ -2557,6 +2631,7 @@ static struct attribute *nvme_pci_attrs[] = {
>   	&dev_attr_cmbloc.attr,
>   	&dev_attr_cmbsz.attr,
>   	&dev_attr_hmb.attr,
> +	&dev_attr_quirks.attr,
>   	NULL,
>   };
>   




More information about the Linux-nvme mailing list