blob: 39888cfe6b23e94d3552f1086cd23c6772f874f1 [file] [log] [blame]
/*
 * drivers/pci/iov.c
 *
 * Copyright (C) 2009 Intel Corporation, Yu Zhao <yu.zhao@intel.com>
 *
 * PCI Express I/O Virtualization (IOV) support.
 *   Single Root IOV 1.0
 *   Address Translation Service 1.0
 */
10
11#include <linux/pci.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090012#include <linux/slab.h>
Yu Zhaod1b054d2009-03-20 11:25:11 +080013#include <linux/mutex.h>
Paul Gortmaker363c75d2011-05-27 09:37:25 -040014#include <linux/export.h>
Yu Zhaod1b054d2009-03-20 11:25:11 +080015#include <linux/string.h>
16#include <linux/delay.h>
Joerg Roedel5cdede22011-04-04 15:55:18 +020017#include <linux/pci-ats.h>
Yu Zhaod1b054d2009-03-20 11:25:11 +080018#include "pci.h"
19
/* Size of the on-stack buffer that holds a "virtfn%u" sysfs link name. */
#define VIRTFN_ID_LEN	16
Yu Zhaod1b054d2009-03-20 11:25:11 +080021
Wei Yangb07579c2015-03-25 16:23:48 +080022int pci_iov_virtfn_bus(struct pci_dev *dev, int vf_id)
Yu Zhaoa28724b2009-03-20 11:25:13 +080023{
Wei Yangb07579c2015-03-25 16:23:48 +080024 if (!dev->is_physfn)
25 return -EINVAL;
Yu Zhaoa28724b2009-03-20 11:25:13 +080026 return dev->bus->number + ((dev->devfn + dev->sriov->offset +
Wei Yangb07579c2015-03-25 16:23:48 +080027 dev->sriov->stride * vf_id) >> 8);
Yu Zhaoa28724b2009-03-20 11:25:13 +080028}
29
Wei Yangb07579c2015-03-25 16:23:48 +080030int pci_iov_virtfn_devfn(struct pci_dev *dev, int vf_id)
Yu Zhaoa28724b2009-03-20 11:25:13 +080031{
Wei Yangb07579c2015-03-25 16:23:48 +080032 if (!dev->is_physfn)
33 return -EINVAL;
Yu Zhaoa28724b2009-03-20 11:25:13 +080034 return (dev->devfn + dev->sriov->offset +
Wei Yangb07579c2015-03-25 16:23:48 +080035 dev->sriov->stride * vf_id) & 0xff;
Yu Zhaoa28724b2009-03-20 11:25:13 +080036}
37
Wei Yangf59dca22015-03-25 16:23:46 +080038/*
39 * Per SR-IOV spec sec 3.3.10 and 3.3.11, First VF Offset and VF Stride may
40 * change when NumVFs changes.
41 *
42 * Update iov->offset and iov->stride when NumVFs is written.
43 */
44static inline void pci_iov_set_numvfs(struct pci_dev *dev, int nr_virtfn)
45{
46 struct pci_sriov *iov = dev->sriov;
47
48 pci_write_config_word(dev, iov->pos + PCI_SRIOV_NUM_VF, nr_virtfn);
49 pci_read_config_word(dev, iov->pos + PCI_SRIOV_VF_OFFSET, &iov->offset);
50 pci_read_config_word(dev, iov->pos + PCI_SRIOV_VF_STRIDE, &iov->stride);
51}
52
Wei Yang4449f072015-03-25 16:23:47 +080053/*
54 * The PF consumes one bus number. NumVFs, First VF Offset, and VF Stride
55 * determine how many additional bus numbers will be consumed by VFs.
56 *
Alexander Duyckea9a8852015-10-29 16:20:50 -050057 * Iterate over all valid NumVFs, validate offset and stride, and calculate
58 * the maximum number of bus numbers that could ever be required.
Wei Yang4449f072015-03-25 16:23:47 +080059 */
Alexander Duyckea9a8852015-10-29 16:20:50 -050060static int compute_max_vf_buses(struct pci_dev *dev)
Wei Yang4449f072015-03-25 16:23:47 +080061{
62 struct pci_sriov *iov = dev->sriov;
Alexander Duyckea9a8852015-10-29 16:20:50 -050063 int nr_virtfn, busnr, rc = 0;
Wei Yang4449f072015-03-25 16:23:47 +080064
Alexander Duyckea9a8852015-10-29 16:20:50 -050065 for (nr_virtfn = iov->total_VFs; nr_virtfn; nr_virtfn--) {
Wei Yang4449f072015-03-25 16:23:47 +080066 pci_iov_set_numvfs(dev, nr_virtfn);
Alexander Duyckea9a8852015-10-29 16:20:50 -050067 if (!iov->offset || (nr_virtfn > 1 && !iov->stride)) {
68 rc = -EIO;
69 goto out;
70 }
71
Wei Yangb07579c2015-03-25 16:23:48 +080072 busnr = pci_iov_virtfn_bus(dev, nr_virtfn - 1);
Alexander Duyckea9a8852015-10-29 16:20:50 -050073 if (busnr > iov->max_VF_buses)
74 iov->max_VF_buses = busnr;
Wei Yang4449f072015-03-25 16:23:47 +080075 }
76
Alexander Duyckea9a8852015-10-29 16:20:50 -050077out:
78 pci_iov_set_numvfs(dev, 0);
79 return rc;
Wei Yang4449f072015-03-25 16:23:47 +080080}
81
Yu Zhaodd7cc442009-03-20 11:25:15 +080082static struct pci_bus *virtfn_add_bus(struct pci_bus *bus, int busnr)
83{
Yu Zhaodd7cc442009-03-20 11:25:15 +080084 struct pci_bus *child;
85
86 if (bus->number == busnr)
87 return bus;
88
89 child = pci_find_bus(pci_domain_nr(bus), busnr);
90 if (child)
91 return child;
92
93 child = pci_add_new_bus(bus, NULL, busnr);
94 if (!child)
95 return NULL;
96
Yinghai Lub7eac052012-05-17 18:51:13 -070097 pci_bus_insert_busn_res(child, busnr, busnr);
Yu Zhaodd7cc442009-03-20 11:25:15 +080098
99 return child;
100}
101
Jiang Liudc087f22013-05-25 21:48:37 +0800102static void virtfn_remove_bus(struct pci_bus *physbus, struct pci_bus *virtbus)
Yu Zhaodd7cc442009-03-20 11:25:15 +0800103{
Jiang Liudc087f22013-05-25 21:48:37 +0800104 if (physbus != virtbus && list_empty(&virtbus->devices))
105 pci_remove_bus(virtbus);
Yu Zhaodd7cc442009-03-20 11:25:15 +0800106}
107
Wei Yang0e6c9122015-03-25 16:23:44 +0800108resource_size_t pci_iov_resource_size(struct pci_dev *dev, int resno)
109{
110 if (!dev->is_physfn)
111 return 0;
112
113 return dev->sriov->barsz[resno - PCI_IOV_RESOURCES];
114}
115
Wei Yangc194f7e2016-03-04 10:53:03 +1100116int pci_iov_add_virtfn(struct pci_dev *dev, int id, int reset)
Yu Zhaodd7cc442009-03-20 11:25:15 +0800117{
118 int i;
Jiang Liudc087f22013-05-25 21:48:37 +0800119 int rc = -ENOMEM;
Yu Zhaodd7cc442009-03-20 11:25:15 +0800120 u64 size;
121 char buf[VIRTFN_ID_LEN];
122 struct pci_dev *virtfn;
123 struct resource *res;
124 struct pci_sriov *iov = dev->sriov;
Gu Zheng8b1fce02013-05-25 21:48:31 +0800125 struct pci_bus *bus;
Yu Zhaodd7cc442009-03-20 11:25:15 +0800126
127 mutex_lock(&iov->dev->sriov->lock);
Wei Yangb07579c2015-03-25 16:23:48 +0800128 bus = virtfn_add_bus(dev->bus, pci_iov_virtfn_bus(dev, id));
Jiang Liudc087f22013-05-25 21:48:37 +0800129 if (!bus)
130 goto failed;
131
132 virtfn = pci_alloc_dev(bus);
133 if (!virtfn)
134 goto failed0;
135
Wei Yangb07579c2015-03-25 16:23:48 +0800136 virtfn->devfn = pci_iov_virtfn_devfn(dev, id);
Yu Zhaodd7cc442009-03-20 11:25:15 +0800137 virtfn->vendor = dev->vendor;
138 pci_read_config_word(dev, iov->pos + PCI_SRIOV_VF_DID, &virtfn->device);
Po Liu156c5532016-08-29 15:28:01 +0800139 rc = pci_setup_device(virtfn);
140 if (rc)
141 goto failed0;
142
Yu Zhaodd7cc442009-03-20 11:25:15 +0800143 virtfn->dev.parent = dev->dev.parent;
Xudong Haofbf33f52013-05-31 12:21:29 +0800144 virtfn->physfn = pci_dev_get(dev);
145 virtfn->is_virtfn = 1;
Alex Williamsonaa9319772014-01-09 08:36:08 -0700146 virtfn->multifunction = 0;
Yu Zhaodd7cc442009-03-20 11:25:15 +0800147
148 for (i = 0; i < PCI_SRIOV_NUM_BARS; i++) {
Bjorn Helgaasc1fe1f92015-03-25 16:23:45 +0800149 res = &dev->resource[i + PCI_IOV_RESOURCES];
Yu Zhaodd7cc442009-03-20 11:25:15 +0800150 if (!res->parent)
151 continue;
152 virtfn->resource[i].name = pci_name(virtfn);
153 virtfn->resource[i].flags = res->flags;
Wei Yang0e6c9122015-03-25 16:23:44 +0800154 size = pci_iov_resource_size(dev, i + PCI_IOV_RESOURCES);
Yu Zhaodd7cc442009-03-20 11:25:15 +0800155 virtfn->resource[i].start = res->start + size * id;
156 virtfn->resource[i].end = virtfn->resource[i].start + size - 1;
157 rc = request_resource(res, &virtfn->resource[i]);
158 BUG_ON(rc);
159 }
160
161 if (reset)
Yu Zhao8c1c6992009-06-13 15:52:13 +0800162 __pci_reset_function(virtfn);
Yu Zhaodd7cc442009-03-20 11:25:15 +0800163
164 pci_device_add(virtfn, virtfn->bus);
165 mutex_unlock(&iov->dev->sriov->lock);
166
Yijing Wangc893d132014-05-30 11:01:03 +0800167 pci_bus_add_device(virtfn);
Yu Zhaodd7cc442009-03-20 11:25:15 +0800168 sprintf(buf, "virtfn%u", id);
169 rc = sysfs_create_link(&dev->dev.kobj, &virtfn->dev.kobj, buf);
170 if (rc)
171 goto failed1;
172 rc = sysfs_create_link(&virtfn->dev.kobj, &dev->dev.kobj, "physfn");
173 if (rc)
174 goto failed2;
175
176 kobject_uevent(&virtfn->dev.kobj, KOBJ_CHANGE);
177
178 return 0;
179
180failed2:
181 sysfs_remove_link(&dev->dev.kobj, buf);
182failed1:
183 pci_dev_put(dev);
184 mutex_lock(&iov->dev->sriov->lock);
Yinghai Lu210647a2012-02-25 13:54:20 -0800185 pci_stop_and_remove_bus_device(virtfn);
Jiang Liudc087f22013-05-25 21:48:37 +0800186failed0:
187 virtfn_remove_bus(dev->bus, bus);
188failed:
Yu Zhaodd7cc442009-03-20 11:25:15 +0800189 mutex_unlock(&iov->dev->sriov->lock);
190
191 return rc;
192}
193
Wei Yangc194f7e2016-03-04 10:53:03 +1100194void pci_iov_remove_virtfn(struct pci_dev *dev, int id, int reset)
Yu Zhaodd7cc442009-03-20 11:25:15 +0800195{
196 char buf[VIRTFN_ID_LEN];
Yu Zhaodd7cc442009-03-20 11:25:15 +0800197 struct pci_dev *virtfn;
198 struct pci_sriov *iov = dev->sriov;
199
Jiang Liudc087f22013-05-25 21:48:37 +0800200 virtfn = pci_get_domain_bus_and_slot(pci_domain_nr(dev->bus),
Wei Yangb07579c2015-03-25 16:23:48 +0800201 pci_iov_virtfn_bus(dev, id),
202 pci_iov_virtfn_devfn(dev, id));
Yu Zhaodd7cc442009-03-20 11:25:15 +0800203 if (!virtfn)
204 return;
205
Yu Zhaodd7cc442009-03-20 11:25:15 +0800206 if (reset) {
207 device_release_driver(&virtfn->dev);
Yu Zhao8c1c6992009-06-13 15:52:13 +0800208 __pci_reset_function(virtfn);
Yu Zhaodd7cc442009-03-20 11:25:15 +0800209 }
210
211 sprintf(buf, "virtfn%u", id);
212 sysfs_remove_link(&dev->dev.kobj, buf);
Yinghai Lu09cedbe2012-02-04 22:55:01 -0800213 /*
214 * pci_stop_dev() could have been called for this virtfn already,
215 * so the directory for the virtfn may have been removed before.
216 * Double check to avoid spurious sysfs warnings.
217 */
218 if (virtfn->dev.kobj.sd)
219 sysfs_remove_link(&virtfn->dev.kobj, "physfn");
Yu Zhaodd7cc442009-03-20 11:25:15 +0800220
221 mutex_lock(&iov->dev->sriov->lock);
Yinghai Lu210647a2012-02-25 13:54:20 -0800222 pci_stop_and_remove_bus_device(virtfn);
Jiang Liudc087f22013-05-25 21:48:37 +0800223 virtfn_remove_bus(dev->bus, virtfn->bus);
Yu Zhaodd7cc442009-03-20 11:25:15 +0800224 mutex_unlock(&iov->dev->sriov->lock);
225
Jiang Liudc087f22013-05-25 21:48:37 +0800226 /* balance pci_get_domain_bus_and_slot() */
227 pci_dev_put(virtfn);
Yu Zhaodd7cc442009-03-20 11:25:15 +0800228 pci_dev_put(dev);
229}
230
/*
 * Weak default hook invoked by sriov_enable() before the VFs are added;
 * @num_vfs is the number of VFs about to be instantiated.  This default
 * does nothing and reports success; being __weak, a strong definition
 * elsewhere replaces it at link time.
 */
int __weak pcibios_sriov_enable(struct pci_dev *pdev, u16 num_vfs)
{
	return 0;
}
235
/*
 * Weak default hook invoked after the VFs of @pdev have been removed
 * (from sriov_disable() and from the sriov_enable() error path).  This
 * default does nothing and reports success; being __weak, a strong
 * definition elsewhere replaces it at link time.
 */
int __weak pcibios_sriov_disable(struct pci_dev *pdev)
{
	return 0;
}
240
Yu Zhaodd7cc442009-03-20 11:25:15 +0800241static int sriov_enable(struct pci_dev *dev, int nr_virtfn)
242{
243 int rc;
Alexander Duyck3443c382015-10-29 16:21:05 -0500244 int i;
Yu Zhaodd7cc442009-03-20 11:25:15 +0800245 int nres;
Alexander Duyckce288ec2015-10-29 16:20:57 -0500246 u16 initial;
Yu Zhaodd7cc442009-03-20 11:25:15 +0800247 struct resource *res;
248 struct pci_dev *pdev;
249 struct pci_sriov *iov = dev->sriov;
Ram Paibbef98a2011-11-06 10:33:10 +0800250 int bars = 0;
Wei Yangb07579c2015-03-25 16:23:48 +0800251 int bus;
Yu Zhaodd7cc442009-03-20 11:25:15 +0800252
253 if (!nr_virtfn)
254 return 0;
255
Bjorn Helgaas6b136722012-11-09 20:27:53 -0700256 if (iov->num_VFs)
Yu Zhaodd7cc442009-03-20 11:25:15 +0800257 return -EINVAL;
258
259 pci_read_config_word(dev, iov->pos + PCI_SRIOV_INITIAL_VF, &initial);
Bjorn Helgaas6b136722012-11-09 20:27:53 -0700260 if (initial > iov->total_VFs ||
261 (!(iov->cap & PCI_SRIOV_CAP_VFM) && (initial != iov->total_VFs)))
Yu Zhaodd7cc442009-03-20 11:25:15 +0800262 return -EIO;
263
Bjorn Helgaas6b136722012-11-09 20:27:53 -0700264 if (nr_virtfn < 0 || nr_virtfn > iov->total_VFs ||
Yu Zhaodd7cc442009-03-20 11:25:15 +0800265 (!(iov->cap & PCI_SRIOV_CAP_VFM) && (nr_virtfn > initial)))
266 return -EINVAL;
267
Yu Zhaodd7cc442009-03-20 11:25:15 +0800268 nres = 0;
269 for (i = 0; i < PCI_SRIOV_NUM_BARS; i++) {
Ram Paibbef98a2011-11-06 10:33:10 +0800270 bars |= (1 << (i + PCI_IOV_RESOURCES));
Bjorn Helgaasc1fe1f92015-03-25 16:23:45 +0800271 res = &dev->resource[i + PCI_IOV_RESOURCES];
Yu Zhaodd7cc442009-03-20 11:25:15 +0800272 if (res->parent)
273 nres++;
274 }
275 if (nres != iov->nres) {
276 dev_err(&dev->dev, "not enough MMIO resources for SR-IOV\n");
277 return -ENOMEM;
278 }
279
Wei Yangb07579c2015-03-25 16:23:48 +0800280 bus = pci_iov_virtfn_bus(dev, nr_virtfn - 1);
Bjorn Helgaas68f8e9f2015-03-25 16:23:42 +0800281 if (bus > dev->bus->busn_res.end) {
282 dev_err(&dev->dev, "can't enable %d VFs (bus %02x out of range of %pR)\n",
283 nr_virtfn, bus, &dev->bus->busn_res);
Yu Zhaodd7cc442009-03-20 11:25:15 +0800284 return -ENOMEM;
285 }
286
Ram Paibbef98a2011-11-06 10:33:10 +0800287 if (pci_enable_resources(dev, bars)) {
288 dev_err(&dev->dev, "SR-IOV: IOV BARS not allocated\n");
289 return -ENOMEM;
290 }
291
Yu Zhaodd7cc442009-03-20 11:25:15 +0800292 if (iov->link != dev->devfn) {
293 pdev = pci_get_slot(dev->bus, iov->link);
294 if (!pdev)
295 return -ENODEV;
296
Jiang Liudc087f22013-05-25 21:48:37 +0800297 if (!pdev->is_physfn) {
298 pci_dev_put(pdev);
Stefan Assmann652d1102013-07-31 16:47:56 -0600299 return -ENOSYS;
Jiang Liudc087f22013-05-25 21:48:37 +0800300 }
Yu Zhaodd7cc442009-03-20 11:25:15 +0800301
302 rc = sysfs_create_link(&dev->dev.kobj,
303 &pdev->dev.kobj, "dep_link");
Jiang Liudc087f22013-05-25 21:48:37 +0800304 pci_dev_put(pdev);
Yu Zhaodd7cc442009-03-20 11:25:15 +0800305 if (rc)
306 return rc;
307 }
308
Wei Yangf59dca22015-03-25 16:23:46 +0800309 pci_iov_set_numvfs(dev, nr_virtfn);
Yu Zhaodd7cc442009-03-20 11:25:15 +0800310 iov->ctrl |= PCI_SRIOV_CTRL_VFE | PCI_SRIOV_CTRL_MSE;
Jan Kiszkafb51ccb2011-11-04 09:45:59 +0100311 pci_cfg_access_lock(dev);
Yu Zhaodd7cc442009-03-20 11:25:15 +0800312 pci_write_config_word(dev, iov->pos + PCI_SRIOV_CTRL, iov->ctrl);
313 msleep(100);
Jan Kiszkafb51ccb2011-11-04 09:45:59 +0100314 pci_cfg_access_unlock(dev);
Yu Zhaodd7cc442009-03-20 11:25:15 +0800315
Bjorn Helgaas6b136722012-11-09 20:27:53 -0700316 iov->initial_VFs = initial;
Yu Zhaodd7cc442009-03-20 11:25:15 +0800317 if (nr_virtfn < initial)
318 initial = nr_virtfn;
319
Alexander Duyckc23b6132015-10-29 16:21:20 -0500320 rc = pcibios_sriov_enable(dev, initial);
321 if (rc) {
322 dev_err(&dev->dev, "failure %d from pcibios_sriov_enable()\n", rc);
323 goto err_pcibios;
Wei Yang995df522015-03-25 16:23:49 +0800324 }
325
Yu Zhaodd7cc442009-03-20 11:25:15 +0800326 for (i = 0; i < initial; i++) {
Wei Yangc194f7e2016-03-04 10:53:03 +1100327 rc = pci_iov_add_virtfn(dev, i, 0);
Yu Zhaodd7cc442009-03-20 11:25:15 +0800328 if (rc)
329 goto failed;
330 }
331
332 kobject_uevent(&dev->dev.kobj, KOBJ_CHANGE);
Bjorn Helgaas6b136722012-11-09 20:27:53 -0700333 iov->num_VFs = nr_virtfn;
Yu Zhaodd7cc442009-03-20 11:25:15 +0800334
335 return 0;
336
337failed:
Alexander Duyck3443c382015-10-29 16:21:05 -0500338 while (i--)
Wei Yangc194f7e2016-03-04 10:53:03 +1100339 pci_iov_remove_virtfn(dev, i, 0);
Yu Zhaodd7cc442009-03-20 11:25:15 +0800340
Alexander Duyckc23b6132015-10-29 16:21:20 -0500341 pcibios_sriov_disable(dev);
342err_pcibios:
Yu Zhaodd7cc442009-03-20 11:25:15 +0800343 iov->ctrl &= ~(PCI_SRIOV_CTRL_VFE | PCI_SRIOV_CTRL_MSE);
Jan Kiszkafb51ccb2011-11-04 09:45:59 +0100344 pci_cfg_access_lock(dev);
Yu Zhaodd7cc442009-03-20 11:25:15 +0800345 pci_write_config_word(dev, iov->pos + PCI_SRIOV_CTRL, iov->ctrl);
346 ssleep(1);
Jan Kiszkafb51ccb2011-11-04 09:45:59 +0100347 pci_cfg_access_unlock(dev);
Yu Zhaodd7cc442009-03-20 11:25:15 +0800348
349 if (iov->link != dev->devfn)
350 sysfs_remove_link(&dev->dev.kobj, "dep_link");
351
Alexander Duyckb3908642015-10-29 16:21:16 -0500352 pci_iov_set_numvfs(dev, 0);
Yu Zhaodd7cc442009-03-20 11:25:15 +0800353 return rc;
354}
355
356static void sriov_disable(struct pci_dev *dev)
357{
358 int i;
359 struct pci_sriov *iov = dev->sriov;
360
Bjorn Helgaas6b136722012-11-09 20:27:53 -0700361 if (!iov->num_VFs)
Yu Zhaodd7cc442009-03-20 11:25:15 +0800362 return;
363
Bjorn Helgaas6b136722012-11-09 20:27:53 -0700364 for (i = 0; i < iov->num_VFs; i++)
Wei Yangc194f7e2016-03-04 10:53:03 +1100365 pci_iov_remove_virtfn(dev, i, 0);
Yu Zhaodd7cc442009-03-20 11:25:15 +0800366
Wei Yang995df522015-03-25 16:23:49 +0800367 pcibios_sriov_disable(dev);
368
Yu Zhaodd7cc442009-03-20 11:25:15 +0800369 iov->ctrl &= ~(PCI_SRIOV_CTRL_VFE | PCI_SRIOV_CTRL_MSE);
Jan Kiszkafb51ccb2011-11-04 09:45:59 +0100370 pci_cfg_access_lock(dev);
Yu Zhaodd7cc442009-03-20 11:25:15 +0800371 pci_write_config_word(dev, iov->pos + PCI_SRIOV_CTRL, iov->ctrl);
372 ssleep(1);
Jan Kiszkafb51ccb2011-11-04 09:45:59 +0100373 pci_cfg_access_unlock(dev);
Yu Zhaodd7cc442009-03-20 11:25:15 +0800374
375 if (iov->link != dev->devfn)
376 sysfs_remove_link(&dev->dev.kobj, "dep_link");
377
Bjorn Helgaas6b136722012-11-09 20:27:53 -0700378 iov->num_VFs = 0;
Wei Yangf59dca22015-03-25 16:23:46 +0800379 pci_iov_set_numvfs(dev, 0);
Yu Zhaodd7cc442009-03-20 11:25:15 +0800380}
381
Yu Zhaod1b054d2009-03-20 11:25:11 +0800382static int sriov_init(struct pci_dev *dev, int pos)
383{
Wei Yang0e6c9122015-03-25 16:23:44 +0800384 int i, bar64;
Yu Zhaod1b054d2009-03-20 11:25:11 +0800385 int rc;
386 int nres;
387 u32 pgsz;
Alexander Duyckea9a8852015-10-29 16:20:50 -0500388 u16 ctrl, total;
Yu Zhaod1b054d2009-03-20 11:25:11 +0800389 struct pci_sriov *iov;
390 struct resource *res;
391 struct pci_dev *pdev;
392
Yu Zhaod1b054d2009-03-20 11:25:11 +0800393 pci_read_config_word(dev, pos + PCI_SRIOV_CTRL, &ctrl);
394 if (ctrl & PCI_SRIOV_CTRL_VFE) {
395 pci_write_config_word(dev, pos + PCI_SRIOV_CTRL, 0);
396 ssleep(1);
397 }
398
Yu Zhaod1b054d2009-03-20 11:25:11 +0800399 ctrl = 0;
400 list_for_each_entry(pdev, &dev->bus->devices, bus_list)
401 if (pdev->is_physfn)
402 goto found;
403
404 pdev = NULL;
405 if (pci_ari_enabled(dev->bus))
406 ctrl |= PCI_SRIOV_CTRL_ARI;
407
408found:
409 pci_write_config_word(dev, pos + PCI_SRIOV_CTRL, ctrl);
Yu Zhaod1b054d2009-03-20 11:25:11 +0800410
Ben Sheltonff45f9d2015-10-29 16:20:31 -0500411 pci_read_config_word(dev, pos + PCI_SRIOV_TOTAL_VF, &total);
412 if (!total)
413 return 0;
Yu Zhaod1b054d2009-03-20 11:25:11 +0800414
415 pci_read_config_dword(dev, pos + PCI_SRIOV_SUP_PGSIZE, &pgsz);
416 i = PAGE_SHIFT > 12 ? PAGE_SHIFT - 12 : 0;
417 pgsz &= ~((1 << i) - 1);
418 if (!pgsz)
419 return -EIO;
420
421 pgsz &= ~(pgsz - 1);
Vaidyanathan Srinivasan8161fe92012-02-02 23:11:20 +0530422 pci_write_config_dword(dev, pos + PCI_SRIOV_SYS_PGSIZE, pgsz);
Yu Zhaod1b054d2009-03-20 11:25:11 +0800423
Wei Yang0e6c9122015-03-25 16:23:44 +0800424 iov = kzalloc(sizeof(*iov), GFP_KERNEL);
425 if (!iov)
426 return -ENOMEM;
427
Yu Zhaod1b054d2009-03-20 11:25:11 +0800428 nres = 0;
429 for (i = 0; i < PCI_SRIOV_NUM_BARS; i++) {
Bjorn Helgaasc1fe1f92015-03-25 16:23:45 +0800430 res = &dev->resource[i + PCI_IOV_RESOURCES];
David Daney11183992015-10-29 17:35:40 -0500431 /*
432 * If it is already FIXED, don't change it, something
433 * (perhaps EA or header fixups) wants it this way.
434 */
435 if (res->flags & IORESOURCE_PCI_FIXED)
436 bar64 = (res->flags & IORESOURCE_MEM_64) ? 1 : 0;
437 else
438 bar64 = __pci_read_base(dev, pci_bar_unknown, res,
439 pos + PCI_SRIOV_BAR + i * 4);
Yu Zhaod1b054d2009-03-20 11:25:11 +0800440 if (!res->flags)
441 continue;
442 if (resource_size(res) & (PAGE_SIZE - 1)) {
443 rc = -EIO;
444 goto failed;
445 }
Wei Yang0e6c9122015-03-25 16:23:44 +0800446 iov->barsz[i] = resource_size(res);
Yu Zhaod1b054d2009-03-20 11:25:11 +0800447 res->end = res->start + resource_size(res) * total - 1;
Wei Yange88ae012015-03-25 16:23:43 +0800448 dev_info(&dev->dev, "VF(n) BAR%d space: %pR (contains BAR%d for %d VFs)\n",
449 i, res, i, total);
Wei Yang0e6c9122015-03-25 16:23:44 +0800450 i += bar64;
Yu Zhaod1b054d2009-03-20 11:25:11 +0800451 nres++;
452 }
453
Yu Zhaod1b054d2009-03-20 11:25:11 +0800454 iov->pos = pos;
455 iov->nres = nres;
456 iov->ctrl = ctrl;
Bjorn Helgaas6b136722012-11-09 20:27:53 -0700457 iov->total_VFs = total;
Yu Zhaod1b054d2009-03-20 11:25:11 +0800458 iov->pgsz = pgsz;
459 iov->self = dev;
460 pci_read_config_dword(dev, pos + PCI_SRIOV_CAP, &iov->cap);
461 pci_read_config_byte(dev, pos + PCI_SRIOV_FUNC_LINK, &iov->link);
Yijing Wang62f87c02012-07-24 17:20:03 +0800462 if (pci_pcie_type(dev) == PCI_EXP_TYPE_RC_END)
Yu Zhao4d135db2009-05-20 17:11:57 +0800463 iov->link = PCI_DEVFN(PCI_SLOT(dev->devfn), iov->link);
Yu Zhaod1b054d2009-03-20 11:25:11 +0800464
465 if (pdev)
466 iov->dev = pci_dev_get(pdev);
Yu Zhaoe277d2f2009-05-18 13:51:33 +0800467 else
Yu Zhaod1b054d2009-03-20 11:25:11 +0800468 iov->dev = dev;
Yu Zhaoe277d2f2009-05-18 13:51:33 +0800469
470 mutex_init(&iov->lock);
Yu Zhaod1b054d2009-03-20 11:25:11 +0800471
472 dev->sriov = iov;
473 dev->is_physfn = 1;
Alexander Duyckea9a8852015-10-29 16:20:50 -0500474 rc = compute_max_vf_buses(dev);
475 if (rc)
476 goto fail_max_buses;
Yu Zhaod1b054d2009-03-20 11:25:11 +0800477
478 return 0;
479
Alexander Duyckea9a8852015-10-29 16:20:50 -0500480fail_max_buses:
481 dev->sriov = NULL;
482 dev->is_physfn = 0;
Yu Zhaod1b054d2009-03-20 11:25:11 +0800483failed:
484 for (i = 0; i < PCI_SRIOV_NUM_BARS; i++) {
Bjorn Helgaasc1fe1f92015-03-25 16:23:45 +0800485 res = &dev->resource[i + PCI_IOV_RESOURCES];
Yu Zhaod1b054d2009-03-20 11:25:11 +0800486 res->flags = 0;
487 }
488
Wei Yang0e6c9122015-03-25 16:23:44 +0800489 kfree(iov);
Yu Zhaod1b054d2009-03-20 11:25:11 +0800490 return rc;
491}
492
493static void sriov_release(struct pci_dev *dev)
494{
Bjorn Helgaas6b136722012-11-09 20:27:53 -0700495 BUG_ON(dev->sriov->num_VFs);
Yu Zhaodd7cc442009-03-20 11:25:15 +0800496
Yu Zhaoe277d2f2009-05-18 13:51:33 +0800497 if (dev != dev->sriov->dev)
Yu Zhaod1b054d2009-03-20 11:25:11 +0800498 pci_dev_put(dev->sriov->dev);
499
Yu Zhaoe277d2f2009-05-18 13:51:33 +0800500 mutex_destroy(&dev->sriov->lock);
501
Yu Zhaod1b054d2009-03-20 11:25:11 +0800502 kfree(dev->sriov);
503 dev->sriov = NULL;
504}
505
Yu Zhao8c5cdb62009-03-20 11:25:12 +0800506static void sriov_restore_state(struct pci_dev *dev)
507{
508 int i;
509 u16 ctrl;
510 struct pci_sriov *iov = dev->sriov;
511
512 pci_read_config_word(dev, iov->pos + PCI_SRIOV_CTRL, &ctrl);
513 if (ctrl & PCI_SRIOV_CTRL_VFE)
514 return;
515
516 for (i = PCI_IOV_RESOURCES; i <= PCI_IOV_RESOURCE_END; i++)
517 pci_update_resource(dev, i);
518
519 pci_write_config_dword(dev, iov->pos + PCI_SRIOV_SYS_PGSIZE, iov->pgsz);
Wei Yangf59dca22015-03-25 16:23:46 +0800520 pci_iov_set_numvfs(dev, iov->num_VFs);
Yu Zhao8c5cdb62009-03-20 11:25:12 +0800521 pci_write_config_word(dev, iov->pos + PCI_SRIOV_CTRL, iov->ctrl);
522 if (iov->ctrl & PCI_SRIOV_CTRL_VFE)
523 msleep(100);
524}
525
Yu Zhaod1b054d2009-03-20 11:25:11 +0800526/**
527 * pci_iov_init - initialize the IOV capability
528 * @dev: the PCI device
529 *
530 * Returns 0 on success, or negative on failure.
531 */
532int pci_iov_init(struct pci_dev *dev)
533{
534 int pos;
535
Kenji Kaneshige5f4d91a2009-11-11 14:36:17 +0900536 if (!pci_is_pcie(dev))
Yu Zhaod1b054d2009-03-20 11:25:11 +0800537 return -ENODEV;
538
539 pos = pci_find_ext_capability(dev, PCI_EXT_CAP_ID_SRIOV);
540 if (pos)
541 return sriov_init(dev, pos);
542
543 return -ENODEV;
544}
545
546/**
547 * pci_iov_release - release resources used by the IOV capability
548 * @dev: the PCI device
549 */
550void pci_iov_release(struct pci_dev *dev)
551{
552 if (dev->is_physfn)
553 sriov_release(dev);
554}
555
556/**
557 * pci_iov_resource_bar - get position of the SR-IOV BAR
558 * @dev: the PCI device
559 * @resno: the resource number
Yu Zhaod1b054d2009-03-20 11:25:11 +0800560 *
561 * Returns position of the BAR encapsulated in the SR-IOV capability.
562 */
Myron Stowe26ff46c2014-11-11 08:04:50 -0700563int pci_iov_resource_bar(struct pci_dev *dev, int resno)
Yu Zhaod1b054d2009-03-20 11:25:11 +0800564{
565 if (resno < PCI_IOV_RESOURCES || resno > PCI_IOV_RESOURCE_END)
566 return 0;
567
568 BUG_ON(!dev->is_physfn);
569
Yu Zhaod1b054d2009-03-20 11:25:11 +0800570 return dev->sriov->pos + PCI_SRIOV_BAR +
571 4 * (resno - PCI_IOV_RESOURCES);
572}
Yu Zhao8c5cdb62009-03-20 11:25:12 +0800573
Bjorn Helgaas6a5f3e62017-03-17 00:48:22 +0000574/**
575 * pci_iov_update_resource - update a VF BAR
576 * @dev: the PCI device
577 * @resno: the resource number
578 *
579 * Update a VF BAR in the SR-IOV capability of a PF.
580 */
581void pci_iov_update_resource(struct pci_dev *dev, int resno)
582{
583 struct pci_sriov *iov = dev->is_physfn ? dev->sriov : NULL;
584 struct resource *res = dev->resource + resno;
585 int vf_bar = resno - PCI_IOV_RESOURCES;
586 struct pci_bus_region region;
587 u32 new;
588 int reg;
589
590 /*
591 * The generic pci_restore_bars() path calls this for all devices,
592 * including VFs and non-SR-IOV devices. If this is not a PF, we
593 * have nothing to do.
594 */
595 if (!iov)
596 return;
597
598 /*
599 * Ignore unimplemented BARs, unused resource slots for 64-bit
600 * BARs, and non-movable resources, e.g., those described via
601 * Enhanced Allocation.
602 */
603 if (!res->flags)
604 return;
605
606 if (res->flags & IORESOURCE_UNSET)
607 return;
608
609 if (res->flags & IORESOURCE_PCI_FIXED)
610 return;
611
612 pcibios_resource_to_bus(dev->bus, &region, res);
613 new = region.start;
614 new |= res->flags & ~PCI_BASE_ADDRESS_MEM_MASK;
615
616 reg = iov->pos + PCI_SRIOV_BAR + 4 * vf_bar;
617 pci_write_config_dword(dev, reg, new);
618 if (res->flags & IORESOURCE_MEM_64) {
619 new = region.start >> 16 >> 16;
620 pci_write_config_dword(dev, reg + 4, new);
621 }
622}
623
/*
 * Weak default for the alignment of IOV resource @resno of @dev: the
 * size of a single VF BAR as reported by pci_iov_resource_size().
 * Being __weak, a strong definition elsewhere replaces it at link time.
 */
resource_size_t __weak pcibios_iov_resource_alignment(struct pci_dev *dev,
						      int resno)
{
	return pci_iov_resource_size(dev, resno);
}
629
Yu Zhao8c5cdb62009-03-20 11:25:12 +0800630/**
Chris Wright6faf17f2009-08-28 13:00:06 -0700631 * pci_sriov_resource_alignment - get resource alignment for VF BAR
632 * @dev: the PCI device
633 * @resno: the resource number
634 *
635 * Returns the alignment of the VF BAR found in the SR-IOV capability.
636 * This is not the same as the resource size which is defined as
637 * the VF BAR size multiplied by the number of VFs. The alignment
638 * is just the VF BAR size.
639 */
Cam Macdonell0e522472010-09-07 17:25:20 -0700640resource_size_t pci_sriov_resource_alignment(struct pci_dev *dev, int resno)
Chris Wright6faf17f2009-08-28 13:00:06 -0700641{
Wei Yang978d2d62015-03-25 16:23:50 +0800642 return pcibios_iov_resource_alignment(dev, resno);
Chris Wright6faf17f2009-08-28 13:00:06 -0700643}
644
645/**
Yu Zhao8c5cdb62009-03-20 11:25:12 +0800646 * pci_restore_iov_state - restore the state of the IOV capability
647 * @dev: the PCI device
648 */
649void pci_restore_iov_state(struct pci_dev *dev)
650{
651 if (dev->is_physfn)
652 sriov_restore_state(dev);
653}
Yu Zhaoa28724b2009-03-20 11:25:13 +0800654
655/**
656 * pci_iov_bus_range - find bus range used by Virtual Function
657 * @bus: the PCI bus
658 *
659 * Returns max number of buses (exclude current one) used by Virtual
660 * Functions.
661 */
662int pci_iov_bus_range(struct pci_bus *bus)
663{
664 int max = 0;
Yu Zhaoa28724b2009-03-20 11:25:13 +0800665 struct pci_dev *dev;
666
667 list_for_each_entry(dev, &bus->devices, bus_list) {
668 if (!dev->is_physfn)
669 continue;
Wei Yang4449f072015-03-25 16:23:47 +0800670 if (dev->sriov->max_VF_buses > max)
671 max = dev->sriov->max_VF_buses;
Yu Zhaoa28724b2009-03-20 11:25:13 +0800672 }
673
674 return max ? max - bus->number : 0;
675}
Yu Zhaodd7cc442009-03-20 11:25:15 +0800676
677/**
678 * pci_enable_sriov - enable the SR-IOV capability
679 * @dev: the PCI device
Randy Dunlap52a88732009-04-01 17:45:30 -0700680 * @nr_virtfn: number of virtual functions to enable
Yu Zhaodd7cc442009-03-20 11:25:15 +0800681 *
682 * Returns 0 on success, or negative on failure.
683 */
684int pci_enable_sriov(struct pci_dev *dev, int nr_virtfn)
685{
686 might_sleep();
687
688 if (!dev->is_physfn)
Stefan Assmann652d1102013-07-31 16:47:56 -0600689 return -ENOSYS;
Yu Zhaodd7cc442009-03-20 11:25:15 +0800690
691 return sriov_enable(dev, nr_virtfn);
692}
693EXPORT_SYMBOL_GPL(pci_enable_sriov);
694
695/**
696 * pci_disable_sriov - disable the SR-IOV capability
697 * @dev: the PCI device
698 */
699void pci_disable_sriov(struct pci_dev *dev)
700{
701 might_sleep();
702
703 if (!dev->is_physfn)
704 return;
705
706 sriov_disable(dev);
707}
708EXPORT_SYMBOL_GPL(pci_disable_sriov);
Yu Zhao74bb1bc2009-03-20 11:25:16 +0800709
710/**
Williams, Mitch Afb8a0d92010-02-10 01:43:04 +0000711 * pci_num_vf - return number of VFs associated with a PF device_release_driver
712 * @dev: the PCI device
713 *
714 * Returns number of VFs, or 0 if SR-IOV is not enabled.
715 */
716int pci_num_vf(struct pci_dev *dev)
717{
Bjorn Helgaas1452cd72012-11-09 20:35:01 -0700718 if (!dev->is_physfn)
Williams, Mitch Afb8a0d92010-02-10 01:43:04 +0000719 return 0;
Bjorn Helgaas1452cd72012-11-09 20:35:01 -0700720
721 return dev->sriov->num_VFs;
Williams, Mitch Afb8a0d92010-02-10 01:43:04 +0000722}
723EXPORT_SYMBOL_GPL(pci_num_vf);
Donald Dutilebff73152012-11-05 15:20:37 -0500724
725/**
Alexander Duyck5a8eb242013-04-25 04:42:29 +0000726 * pci_vfs_assigned - returns number of VFs are assigned to a guest
727 * @dev: the PCI device
728 *
729 * Returns number of VFs belonging to this device that are assigned to a guest.
Stefan Assmann652d1102013-07-31 16:47:56 -0600730 * If device is not a physical function returns 0.
Alexander Duyck5a8eb242013-04-25 04:42:29 +0000731 */
732int pci_vfs_assigned(struct pci_dev *dev)
733{
734 struct pci_dev *vfdev;
735 unsigned int vfs_assigned = 0;
736 unsigned short dev_id;
737
738 /* only search if we are a PF */
739 if (!dev->is_physfn)
740 return 0;
741
742 /*
743 * determine the device ID for the VFs, the vendor ID will be the
744 * same as the PF so there is no need to check for that one
745 */
746 pci_read_config_word(dev, dev->sriov->pos + PCI_SRIOV_VF_DID, &dev_id);
747
748 /* loop through all the VFs to see if we own any that are assigned */
749 vfdev = pci_get_device(dev->vendor, dev_id, NULL);
750 while (vfdev) {
751 /*
752 * It is considered assigned if it is a virtual function with
753 * our dev as the physical function and the assigned bit is set
754 */
755 if (vfdev->is_virtfn && (vfdev->physfn == dev) &&
Ethan Zhaobe634972014-09-09 10:21:28 +0800756 pci_is_dev_assigned(vfdev))
Alexander Duyck5a8eb242013-04-25 04:42:29 +0000757 vfs_assigned++;
758
759 vfdev = pci_get_device(dev->vendor, dev_id, vfdev);
760 }
761
762 return vfs_assigned;
763}
764EXPORT_SYMBOL_GPL(pci_vfs_assigned);
765
766/**
Donald Dutilebff73152012-11-05 15:20:37 -0500767 * pci_sriov_set_totalvfs -- reduce the TotalVFs available
768 * @dev: the PCI PF device
Randy Dunlap2094f162013-01-09 17:12:52 -0800769 * @numvfs: number that should be used for TotalVFs supported
Donald Dutilebff73152012-11-05 15:20:37 -0500770 *
771 * Should be called from PF driver's probe routine with
772 * device's mutex held.
773 *
774 * Returns 0 if PF is an SRIOV-capable device and
Stefan Assmann652d1102013-07-31 16:47:56 -0600775 * value of numvfs valid. If not a PF return -ENOSYS;
776 * if numvfs is invalid return -EINVAL;
Donald Dutilebff73152012-11-05 15:20:37 -0500777 * if VFs already enabled, return -EBUSY.
778 */
779int pci_sriov_set_totalvfs(struct pci_dev *dev, u16 numvfs)
780{
Stefan Assmann652d1102013-07-31 16:47:56 -0600781 if (!dev->is_physfn)
782 return -ENOSYS;
783 if (numvfs > dev->sriov->total_VFs)
Donald Dutilebff73152012-11-05 15:20:37 -0500784 return -EINVAL;
785
786 /* Shouldn't change if VFs already enabled */
787 if (dev->sriov->ctrl & PCI_SRIOV_CTRL_VFE)
788 return -EBUSY;
789 else
Bjorn Helgaas6b136722012-11-09 20:27:53 -0700790 dev->sriov->driver_max_VFs = numvfs;
Donald Dutilebff73152012-11-05 15:20:37 -0500791
792 return 0;
793}
794EXPORT_SYMBOL_GPL(pci_sriov_set_totalvfs);
795
796/**
Jonghwan Choiddc191f2013-07-08 14:02:43 -0600797 * pci_sriov_get_totalvfs -- get total VFs supported on this device
Donald Dutilebff73152012-11-05 15:20:37 -0500798 * @dev: the PCI PF device
799 *
800 * For a PCIe device with SRIOV support, return the PCIe
Bjorn Helgaas6b136722012-11-09 20:27:53 -0700801 * SRIOV capability value of TotalVFs or the value of driver_max_VFs
Stefan Assmann652d1102013-07-31 16:47:56 -0600802 * if the driver reduced it. Otherwise 0.
Donald Dutilebff73152012-11-05 15:20:37 -0500803 */
804int pci_sriov_get_totalvfs(struct pci_dev *dev)
805{
Bjorn Helgaas1452cd72012-11-09 20:35:01 -0700806 if (!dev->is_physfn)
Stefan Assmann652d1102013-07-31 16:47:56 -0600807 return 0;
Donald Dutilebff73152012-11-05 15:20:37 -0500808
Bjorn Helgaas6b136722012-11-09 20:27:53 -0700809 if (dev->sriov->driver_max_VFs)
810 return dev->sriov->driver_max_VFs;
Bjorn Helgaas1452cd72012-11-09 20:35:01 -0700811
812 return dev->sriov->total_VFs;
Donald Dutilebff73152012-11-05 15:20:37 -0500813}
814EXPORT_SYMBOL_GPL(pci_sriov_get_totalvfs);