forked from Minki/linux
a1eb03f546
The reason we defer kfree until release function is because it's a general rule for kobjects: kfree of the reference counter itself is only legal in the release function. Previous patch didn't make this clear, document this in code. Cc: stable@vger.kernel.org Signed-off-by: Michael S. Tsirkin <mst@redhat.com>
317 lines
8.8 KiB
C
317 lines
8.8 KiB
C
/*
|
|
* Virtio PCI driver - legacy device support
|
|
*
|
|
* This module allows virtio devices to be used over a virtual PCI device.
|
|
* This can be used with QEMU based VMMs like KVM or Xen.
|
|
*
|
|
* Copyright IBM Corp. 2007
|
|
* Copyright Red Hat, Inc. 2014
|
|
*
|
|
* Authors:
|
|
* Anthony Liguori <aliguori@us.ibm.com>
|
|
* Rusty Russell <rusty@rustcorp.com.au>
|
|
* Michael S. Tsirkin <mst@redhat.com>
|
|
*
|
|
* This work is licensed under the terms of the GNU GPL, version 2 or later.
|
|
* See the COPYING file in the top-level directory.
|
|
*
|
|
*/
|
|
|
|
#include "virtio_pci_common.h"
|
|
|
|
/* virtio config->get_features() implementation */
|
|
static u64 vp_get_features(struct virtio_device *vdev)
|
|
{
|
|
struct virtio_pci_device *vp_dev = to_vp_device(vdev);
|
|
|
|
/* When someone needs more than 32 feature bits, we'll need to
|
|
* steal a bit to indicate that the rest are somewhere else. */
|
|
return ioread32(vp_dev->ioaddr + VIRTIO_PCI_HOST_FEATURES);
|
|
}
|
|
|
|
/* virtio config->finalize_features() implementation */
|
|
static int vp_finalize_features(struct virtio_device *vdev)
|
|
{
|
|
struct virtio_pci_device *vp_dev = to_vp_device(vdev);
|
|
|
|
/* Give virtio_ring a chance to accept features. */
|
|
vring_transport_features(vdev);
|
|
|
|
/* Make sure we don't have any features > 32 bits! */
|
|
BUG_ON((u32)vdev->features != vdev->features);
|
|
|
|
/* We only support 32 feature bits. */
|
|
iowrite32(vdev->features, vp_dev->ioaddr + VIRTIO_PCI_GUEST_FEATURES);
|
|
|
|
return 0;
|
|
}
|
|
|
|
/* virtio config->get() implementation */
|
|
static void vp_get(struct virtio_device *vdev, unsigned offset,
|
|
void *buf, unsigned len)
|
|
{
|
|
struct virtio_pci_device *vp_dev = to_vp_device(vdev);
|
|
void __iomem *ioaddr = vp_dev->ioaddr +
|
|
VIRTIO_PCI_CONFIG(vp_dev) + offset;
|
|
u8 *ptr = buf;
|
|
int i;
|
|
|
|
for (i = 0; i < len; i++)
|
|
ptr[i] = ioread8(ioaddr + i);
|
|
}
|
|
|
|
/* the config->set() implementation. it's symmetric to the config->get()
|
|
* implementation */
|
|
static void vp_set(struct virtio_device *vdev, unsigned offset,
|
|
const void *buf, unsigned len)
|
|
{
|
|
struct virtio_pci_device *vp_dev = to_vp_device(vdev);
|
|
void __iomem *ioaddr = vp_dev->ioaddr +
|
|
VIRTIO_PCI_CONFIG(vp_dev) + offset;
|
|
const u8 *ptr = buf;
|
|
int i;
|
|
|
|
for (i = 0; i < len; i++)
|
|
iowrite8(ptr[i], ioaddr + i);
|
|
}
|
|
|
|
/* config->{get,set}_status() implementations */
|
|
static u8 vp_get_status(struct virtio_device *vdev)
|
|
{
|
|
struct virtio_pci_device *vp_dev = to_vp_device(vdev);
|
|
return ioread8(vp_dev->ioaddr + VIRTIO_PCI_STATUS);
|
|
}
|
|
|
|
static void vp_set_status(struct virtio_device *vdev, u8 status)
|
|
{
|
|
struct virtio_pci_device *vp_dev = to_vp_device(vdev);
|
|
/* We should never be setting status to 0. */
|
|
BUG_ON(status == 0);
|
|
iowrite8(status, vp_dev->ioaddr + VIRTIO_PCI_STATUS);
|
|
}
|
|
|
|
static void vp_reset(struct virtio_device *vdev)
|
|
{
|
|
struct virtio_pci_device *vp_dev = to_vp_device(vdev);
|
|
/* 0 status means a reset. */
|
|
iowrite8(0, vp_dev->ioaddr + VIRTIO_PCI_STATUS);
|
|
/* Flush out the status write, and flush in device writes,
|
|
* including MSi-X interrupts, if any. */
|
|
ioread8(vp_dev->ioaddr + VIRTIO_PCI_STATUS);
|
|
/* Flush pending VQ/configuration callbacks. */
|
|
vp_synchronize_vectors(vdev);
|
|
}
|
|
|
|
static u16 vp_config_vector(struct virtio_pci_device *vp_dev, u16 vector)
|
|
{
|
|
/* Setup the vector used for configuration events */
|
|
iowrite16(vector, vp_dev->ioaddr + VIRTIO_MSI_CONFIG_VECTOR);
|
|
/* Verify we had enough resources to assign the vector */
|
|
/* Will also flush the write out to device */
|
|
return ioread16(vp_dev->ioaddr + VIRTIO_MSI_CONFIG_VECTOR);
|
|
}
|
|
|
|
static struct virtqueue *setup_vq(struct virtio_pci_device *vp_dev,
|
|
struct virtio_pci_vq_info *info,
|
|
unsigned index,
|
|
void (*callback)(struct virtqueue *vq),
|
|
const char *name,
|
|
u16 msix_vec)
|
|
{
|
|
struct virtqueue *vq;
|
|
unsigned long size;
|
|
u16 num;
|
|
int err;
|
|
|
|
/* Select the queue we're interested in */
|
|
iowrite16(index, vp_dev->ioaddr + VIRTIO_PCI_QUEUE_SEL);
|
|
|
|
/* Check if queue is either not available or already active. */
|
|
num = ioread16(vp_dev->ioaddr + VIRTIO_PCI_QUEUE_NUM);
|
|
if (!num || ioread32(vp_dev->ioaddr + VIRTIO_PCI_QUEUE_PFN))
|
|
return ERR_PTR(-ENOENT);
|
|
|
|
info->num = num;
|
|
info->msix_vector = msix_vec;
|
|
|
|
size = PAGE_ALIGN(vring_size(num, VIRTIO_PCI_VRING_ALIGN));
|
|
info->queue = alloc_pages_exact(size, GFP_KERNEL|__GFP_ZERO);
|
|
if (info->queue == NULL)
|
|
return ERR_PTR(-ENOMEM);
|
|
|
|
/* activate the queue */
|
|
iowrite32(virt_to_phys(info->queue) >> VIRTIO_PCI_QUEUE_ADDR_SHIFT,
|
|
vp_dev->ioaddr + VIRTIO_PCI_QUEUE_PFN);
|
|
|
|
/* create the vring */
|
|
vq = vring_new_virtqueue(index, info->num,
|
|
VIRTIO_PCI_VRING_ALIGN, &vp_dev->vdev,
|
|
true, info->queue, vp_notify, callback, name);
|
|
if (!vq) {
|
|
err = -ENOMEM;
|
|
goto out_activate_queue;
|
|
}
|
|
|
|
vq->priv = (void __force *)vp_dev->ioaddr + VIRTIO_PCI_QUEUE_NOTIFY;
|
|
|
|
if (msix_vec != VIRTIO_MSI_NO_VECTOR) {
|
|
iowrite16(msix_vec, vp_dev->ioaddr + VIRTIO_MSI_QUEUE_VECTOR);
|
|
msix_vec = ioread16(vp_dev->ioaddr + VIRTIO_MSI_QUEUE_VECTOR);
|
|
if (msix_vec == VIRTIO_MSI_NO_VECTOR) {
|
|
err = -EBUSY;
|
|
goto out_assign;
|
|
}
|
|
}
|
|
|
|
return vq;
|
|
|
|
out_assign:
|
|
vring_del_virtqueue(vq);
|
|
out_activate_queue:
|
|
iowrite32(0, vp_dev->ioaddr + VIRTIO_PCI_QUEUE_PFN);
|
|
free_pages_exact(info->queue, size);
|
|
return ERR_PTR(err);
|
|
}
|
|
|
|
static void del_vq(struct virtio_pci_vq_info *info)
|
|
{
|
|
struct virtqueue *vq = info->vq;
|
|
struct virtio_pci_device *vp_dev = to_vp_device(vq->vdev);
|
|
unsigned long size;
|
|
|
|
iowrite16(vq->index, vp_dev->ioaddr + VIRTIO_PCI_QUEUE_SEL);
|
|
|
|
if (vp_dev->msix_enabled) {
|
|
iowrite16(VIRTIO_MSI_NO_VECTOR,
|
|
vp_dev->ioaddr + VIRTIO_MSI_QUEUE_VECTOR);
|
|
/* Flush the write out to device */
|
|
ioread8(vp_dev->ioaddr + VIRTIO_PCI_ISR);
|
|
}
|
|
|
|
vring_del_virtqueue(vq);
|
|
|
|
/* Select and deactivate the queue */
|
|
iowrite32(0, vp_dev->ioaddr + VIRTIO_PCI_QUEUE_PFN);
|
|
|
|
size = PAGE_ALIGN(vring_size(info->num, VIRTIO_PCI_VRING_ALIGN));
|
|
free_pages_exact(info->queue, size);
|
|
}
|
|
|
|
static const struct virtio_config_ops virtio_pci_config_ops = {
|
|
.get = vp_get,
|
|
.set = vp_set,
|
|
.get_status = vp_get_status,
|
|
.set_status = vp_set_status,
|
|
.reset = vp_reset,
|
|
.find_vqs = vp_find_vqs,
|
|
.del_vqs = vp_del_vqs,
|
|
.get_features = vp_get_features,
|
|
.finalize_features = vp_finalize_features,
|
|
.bus_name = vp_bus_name,
|
|
.set_vq_affinity = vp_set_vq_affinity,
|
|
};
|
|
|
|
static void virtio_pci_release_dev(struct device *_d)
|
|
{
|
|
struct virtio_device *vdev = dev_to_virtio(_d);
|
|
struct virtio_pci_device *vp_dev = to_vp_device(vdev);
|
|
|
|
/* As struct device is a kobject, it's not safe to
|
|
* free the memory (including the reference counter itself)
|
|
* until it's release callback. */
|
|
kfree(vp_dev);
|
|
}
|
|
|
|
/* the PCI probing function */
|
|
int virtio_pci_legacy_probe(struct pci_dev *pci_dev,
|
|
const struct pci_device_id *id)
|
|
{
|
|
struct virtio_pci_device *vp_dev;
|
|
int err;
|
|
|
|
/* We only own devices >= 0x1000 and <= 0x103f: leave the rest. */
|
|
if (pci_dev->device < 0x1000 || pci_dev->device > 0x103f)
|
|
return -ENODEV;
|
|
|
|
if (pci_dev->revision != VIRTIO_PCI_ABI_VERSION) {
|
|
printk(KERN_ERR "virtio_pci: expected ABI version %d, got %d\n",
|
|
VIRTIO_PCI_ABI_VERSION, pci_dev->revision);
|
|
return -ENODEV;
|
|
}
|
|
|
|
/* allocate our structure and fill it out */
|
|
vp_dev = kzalloc(sizeof(struct virtio_pci_device), GFP_KERNEL);
|
|
if (vp_dev == NULL)
|
|
return -ENOMEM;
|
|
|
|
vp_dev->vdev.dev.parent = &pci_dev->dev;
|
|
vp_dev->vdev.dev.release = virtio_pci_release_dev;
|
|
vp_dev->vdev.config = &virtio_pci_config_ops;
|
|
vp_dev->pci_dev = pci_dev;
|
|
INIT_LIST_HEAD(&vp_dev->virtqueues);
|
|
spin_lock_init(&vp_dev->lock);
|
|
|
|
/* Disable MSI/MSIX to bring device to a known good state. */
|
|
pci_msi_off(pci_dev);
|
|
|
|
/* enable the device */
|
|
err = pci_enable_device(pci_dev);
|
|
if (err)
|
|
goto out;
|
|
|
|
err = pci_request_regions(pci_dev, "virtio-pci");
|
|
if (err)
|
|
goto out_enable_device;
|
|
|
|
vp_dev->ioaddr = pci_iomap(pci_dev, 0, 0);
|
|
if (vp_dev->ioaddr == NULL) {
|
|
err = -ENOMEM;
|
|
goto out_req_regions;
|
|
}
|
|
|
|
vp_dev->isr = vp_dev->ioaddr + VIRTIO_PCI_ISR;
|
|
|
|
pci_set_drvdata(pci_dev, vp_dev);
|
|
pci_set_master(pci_dev);
|
|
|
|
/* we use the subsystem vendor/device id as the virtio vendor/device
|
|
* id. this allows us to use the same PCI vendor/device id for all
|
|
* virtio devices and to identify the particular virtio driver by
|
|
* the subsystem ids */
|
|
vp_dev->vdev.id.vendor = pci_dev->subsystem_vendor;
|
|
vp_dev->vdev.id.device = pci_dev->subsystem_device;
|
|
|
|
vp_dev->config_vector = vp_config_vector;
|
|
vp_dev->setup_vq = setup_vq;
|
|
vp_dev->del_vq = del_vq;
|
|
|
|
/* finally register the virtio device */
|
|
err = register_virtio_device(&vp_dev->vdev);
|
|
if (err)
|
|
goto out_set_drvdata;
|
|
|
|
return 0;
|
|
|
|
out_set_drvdata:
|
|
pci_iounmap(pci_dev, vp_dev->ioaddr);
|
|
out_req_regions:
|
|
pci_release_regions(pci_dev);
|
|
out_enable_device:
|
|
pci_disable_device(pci_dev);
|
|
out:
|
|
kfree(vp_dev);
|
|
return err;
|
|
}
|
|
|
|
void virtio_pci_legacy_remove(struct pci_dev *pci_dev)
|
|
{
|
|
struct virtio_pci_device *vp_dev = pci_get_drvdata(pci_dev);
|
|
|
|
unregister_virtio_device(&vp_dev->vdev);
|
|
|
|
vp_del_vqs(&vp_dev->vdev);
|
|
pci_iounmap(pci_dev, vp_dev->ioaddr);
|
|
pci_release_regions(pci_dev);
|
|
pci_disable_device(pci_dev);
|
|
}
|