]> git.proxmox.com Git - pve-kernel.git/blame - patches/kernel/0003-pci-Enable-overrides-for-missing-ACS-capabilities-4..patch
rebase patches on top of Ubuntu-5.15.0-24.24
[pve-kernel.git] / patches / kernel / 0003-pci-Enable-overrides-for-missing-ACS-capabilities-4..patch
CommitLineData
59d5af67 1From 0000000000000000000000000000000000000000 Mon Sep 17 00:00:00 2001
ba2f1a67 2From: Mark Weiman <mark.weiman@markzz.com>
55f9bfa9
FG
3Date: Wed, 7 Feb 2018 16:04:03 -0500
4Subject: [PATCH] pci: Enable overrides for missing ACS capabilities (4.15)
b9e76370
FG
5MIME-Version: 1.0
6Content-Type: text/plain; charset=UTF-8
7Content-Transfer-Encoding: 8bit
ba2f1a67
FG
8
9This an updated version of Alex Williamson's patch from:
10https://lkml.org/lkml/2013/5/30/513
11
12Original commit message follows:
ba2f1a67
FG
13PCIe ACS (Access Control Services) is the PCIe 2.0+ feature that
14allows us to control whether transactions are allowed to be redirected
15in various subnodes of a PCIe topology. For instance, if two
16endpoints are below a root port or downsteam switch port, the
17downstream port may optionally redirect transactions between the
18devices, bypassing upstream devices. The same can happen internally
19on multifunction devices. The transaction may never be visible to the
20upstream devices.
21
22One upstream device that we particularly care about is the IOMMU. If
23a redirection occurs in the topology below the IOMMU, then the IOMMU
24cannot provide isolation between devices. This is why the PCIe spec
25encourages topologies to include ACS support. Without it, we have to
26assume peer-to-peer DMA within a hierarchy can bypass IOMMU isolation.
27
28Unfortunately, far too many topologies do not support ACS to make this
29a steadfast requirement. Even the latest chipsets from Intel are only
30sporadically supporting ACS. We have trouble getting interconnect
31vendors to include the PCIe spec required PCIe capability, let alone
32suggested features.
33
34Therefore, we need to add some flexibility. The pcie_acs_override=
35boot option lets users opt-in specific devices or sets of devices to
36assume ACS support. The "downstream" option assumes full ACS support
37on root ports and downstream switch ports. The "multifunction"
38option assumes the subset of ACS features available on multifunction
39endpoints and upstream switch ports are supported. The "id:nnnn:nnnn"
40option enables ACS support on devices matching the provided vendor
41and device IDs, allowing more strategic ACS overrides. These options
42may be combined in any order. A maximum of 16 id specific overrides
43are available. It's suggested to use the most limited set of options
44necessary to avoid completely disabling ACS across the topology.
45Note to hardware vendors, we have facilities to permanently quirk
46specific devices which enforce isolation but not provide an ACS
47capability. Please contact me to have your devices added and save
48your customers the hassle of this boot option.
b9e76370
FG
49
50Signed-off-by: Fabian Grünbichler <f.gruenbichler@proxmox.com>
ff71f8b9 51Signed-off-by: Thomas Lamprecht <t.lamprecht@proxmox.com>
ba2f1a67 52---
0c12c00b 53 .../admin-guide/kernel-parameters.txt | 9 ++
ff71f8b9
TL
54 drivers/pci/quirks.c | 102 ++++++++++++++++++
55 2 files changed, 111 insertions(+)
ba2f1a67
FG
56
57diff --git a/Documentation/admin-guide/kernel-parameters.txt b/Documentation/admin-guide/kernel-parameters.txt
f641ad16 58index 369d7f3f63cb..92f35bf44f49 100644
ba2f1a67
FG
59--- a/Documentation/admin-guide/kernel-parameters.txt
60+++ b/Documentation/admin-guide/kernel-parameters.txt
55227d53 61@@ -3908,6 +3908,15 @@
4618decf
TL
62 Also, it enforces the PCI Local Bus spec
63 rule that those bits should be 0 in system reset
64 events (useful for kexec/kdump cases).
ba2f1a67 65+ pci_acs_override =
4618decf 66+ [PCIE] Override missing PCIe ACS support for:
ba2f1a67
FG
67+ downstream
68+ All downstream ports - full ACS capabilities
55f9bfa9
FG
69+ multifunction
70+ Add multifunction devices - multifunction ACS subset
ba2f1a67 71+ id:nnnn:nnnn
55f9bfa9 72+ Specific device - full ACS capabilities
ba2f1a67
FG
73+ Specified as vid:did (vendor/device ID) in hex
74 noioapicquirk [APIC] Disable all boot interrupt quirks.
75 Safety option to keep boot IRQs enabled. This
76 should never be necessary.
77diff --git a/drivers/pci/quirks.c b/drivers/pci/quirks.c
1615b3ee 78index bf3af7d81bdc..04ef248fb1af 100644
ba2f1a67
FG
79--- a/drivers/pci/quirks.c
80+++ b/drivers/pci/quirks.c
4fce1205 81@@ -193,6 +193,106 @@ static int __init pci_apply_final_quirks(void)
ff71f8b9 82 }
ba2f1a67
FG
83 fs_initcall_sync(pci_apply_final_quirks);
84
85+static bool acs_on_downstream;
86+static bool acs_on_multifunction;
87+
88+#define NUM_ACS_IDS 16
89+struct acs_on_id {
90+ unsigned short vendor;
91+ unsigned short device;
92+};
93+static struct acs_on_id acs_on_ids[NUM_ACS_IDS];
94+static u8 max_acs_id;
95+
96+static __init int pcie_acs_override_setup(char *p)
97+{
98+ if (!p)
99+ return -EINVAL;
100+
101+ while (*p) {
102+ if (!strncmp(p, "downstream", 10))
103+ acs_on_downstream = true;
104+ if (!strncmp(p, "multifunction", 13))
105+ acs_on_multifunction = true;
106+ if (!strncmp(p, "id:", 3)) {
107+ char opt[5];
108+ int ret;
109+ long val;
110+
111+ if (max_acs_id >= NUM_ACS_IDS - 1) {
112+ pr_warn("Out of PCIe ACS override slots (%d)\n",
113+ NUM_ACS_IDS);
114+ goto next;
115+ }
116+
117+ p += 3;
118+ snprintf(opt, 5, "%s", p);
119+ ret = kstrtol(opt, 16, &val);
120+ if (ret) {
121+ pr_warn("PCIe ACS ID parse error %d\n", ret);
122+ goto next;
123+ }
124+ acs_on_ids[max_acs_id].vendor = val;
ba2f1a67 125+ p += strcspn(p, ":");
cfe8ba0b 126+ if (*p != ':') {
ba2f1a67
FG
127+ pr_warn("PCIe ACS invalid ID\n");
128+ goto next;
129+ }
130+
131+ p++;
132+ snprintf(opt, 5, "%s", p);
133+ ret = kstrtol(opt, 16, &val);
134+ if (ret) {
135+ pr_warn("PCIe ACS ID parse error %d\n", ret);
136+ goto next;
137+ }
138+ acs_on_ids[max_acs_id].device = val;
139+ max_acs_id++;
140+ }
141+next:
142+ p += strcspn(p, ",");
143+ if (*p == ',')
144+ p++;
145+ }
146+
147+ if (acs_on_downstream || acs_on_multifunction || max_acs_id)
148+ pr_warn("Warning: PCIe ACS overrides enabled; This may allow non-IOMMU protected peer-to-peer DMA\n");
149+
150+ return 0;
151+}
152+early_param("pcie_acs_override", pcie_acs_override_setup);
153+
154+static int pcie_acs_overrides(struct pci_dev *dev, u16 acs_flags)
155+{
156+ int i;
157+
158+ /* Never override ACS for legacy devices or devices with ACS caps */
159+ if (!pci_is_pcie(dev) ||
160+ pci_find_ext_capability(dev, PCI_EXT_CAP_ID_ACS))
161+ return -ENOTTY;
162+
163+ for (i = 0; i < max_acs_id; i++)
164+ if (acs_on_ids[i].vendor == dev->vendor &&
165+ acs_on_ids[i].device == dev->device)
166+ return 1;
167+
168+ switch (pci_pcie_type(dev)) {
55f9bfa9
FG
169+ case PCI_EXP_TYPE_DOWNSTREAM:
170+ case PCI_EXP_TYPE_ROOT_PORT:
171+ if (acs_on_downstream)
172+ return 1;
173+ break;
174+ case PCI_EXP_TYPE_ENDPOINT:
175+ case PCI_EXP_TYPE_UPSTREAM:
176+ case PCI_EXP_TYPE_LEG_END:
177+ case PCI_EXP_TYPE_RC_END:
178+ if (acs_on_multifunction && dev->multifunction)
179+ return 1;
ba2f1a67
FG
180+ }
181+
182+ return -ENOTTY;
183+}
754ba827 184+
ba2f1a67 185 /*
ff71f8b9
TL
186 * Decoding should be disabled for a PCI device during BAR sizing to avoid
187 * conflict. But doing so may cause problems on host bridge and perhaps other
55227d53 188@@ -4915,6 +5015,8 @@ static const struct pci_dev_acs_enabled {
46951972 189 { PCI_VENDOR_ID_CAVIUM, 0xA060, pci_quirk_mf_endpoint_acs },
55f9bfa9
FG
190 /* APM X-Gene */
191 { PCI_VENDOR_ID_AMCC, 0xE004, pci_quirk_xgene_acs },
ff71f8b9 192+ /* Enable overrides for missing ACS capabilities */
ba2f1a67 193+ { PCI_ANY_ID, PCI_ANY_ID, pcie_acs_overrides },
ff71f8b9
TL
194 /* Ampere Computing */
195 { PCI_VENDOR_ID_AMPERE, 0xE005, pci_quirk_xgene_acs },
196 { PCI_VENDOR_ID_AMPERE, 0xE006, pci_quirk_xgene_acs },