d223f98f02
The compute shader dispatch interface is pretty simple -- just pass in the regs that userspace has passed us, with no CLs to run. However, with no CL to run it means that we need to do manual cache flushing of the L2 after the HW execution completes (for SSBO, atomic, and image_load_store writes that are the output of compute shaders). This doesn't yet expose the L2 cache's ability to have a region of the address space not write back to memory (which could be used for shared_var storage). So far, the Mesa side has been tested on V3D v4.2 simpenrose (passing the ES31 tests), and on the kernel side on 7278 (failing atomic compswap tests in a way that doesn't reproduce on simpenrose). v2: Fix excessive allocation for the clean_job (reported by Dan Carpenter). Keep refs on jobs until clean_job is finished, to avoid spurious MMU errors if the output BOs are freed by userspace before L2 cleaning is finished. Signed-off-by: Eric Anholt <eric@anholt.net> Link: https://patchwork.freedesktop.org/patch/msgid/20190416225856.20264-4-eric@anholt.net Acked-by: Rob Clark <robdclark@gmail.com>
298 lines
6.0 KiB
C
298 lines
6.0 KiB
C
// SPDX-License-Identifier: GPL-2.0+
|
|
/* Copyright (C) 2015-2018 Broadcom */
|
|
|
|
#if !defined(_V3D_TRACE_H_) || defined(TRACE_HEADER_MULTI_READ)
|
|
#define _V3D_TRACE_H_
|
|
|
|
#include <linux/stringify.h>
|
|
#include <linux/types.h>
|
|
#include <linux/tracepoint.h>
|
|
|
|
#undef TRACE_SYSTEM
|
|
#define TRACE_SYSTEM v3d
|
|
#define TRACE_INCLUDE_FILE v3d_trace
|
|
|
|
TRACE_EVENT(v3d_submit_cl_ioctl,
|
|
TP_PROTO(struct drm_device *dev, u32 ct1qba, u32 ct1qea),
|
|
TP_ARGS(dev, ct1qba, ct1qea),
|
|
|
|
TP_STRUCT__entry(
|
|
__field(u32, dev)
|
|
__field(u32, ct1qba)
|
|
__field(u32, ct1qea)
|
|
),
|
|
|
|
TP_fast_assign(
|
|
__entry->dev = dev->primary->index;
|
|
__entry->ct1qba = ct1qba;
|
|
__entry->ct1qea = ct1qea;
|
|
),
|
|
|
|
TP_printk("dev=%u, RCL 0x%08x..0x%08x",
|
|
__entry->dev,
|
|
__entry->ct1qba,
|
|
__entry->ct1qea)
|
|
);
|
|
|
|
TRACE_EVENT(v3d_submit_cl,
|
|
TP_PROTO(struct drm_device *dev, bool is_render,
|
|
uint64_t seqno,
|
|
u32 ctnqba, u32 ctnqea),
|
|
TP_ARGS(dev, is_render, seqno, ctnqba, ctnqea),
|
|
|
|
TP_STRUCT__entry(
|
|
__field(u32, dev)
|
|
__field(bool, is_render)
|
|
__field(u64, seqno)
|
|
__field(u32, ctnqba)
|
|
__field(u32, ctnqea)
|
|
),
|
|
|
|
TP_fast_assign(
|
|
__entry->dev = dev->primary->index;
|
|
__entry->is_render = is_render;
|
|
__entry->seqno = seqno;
|
|
__entry->ctnqba = ctnqba;
|
|
__entry->ctnqea = ctnqea;
|
|
),
|
|
|
|
TP_printk("dev=%u, %s, seqno=%llu, 0x%08x..0x%08x",
|
|
__entry->dev,
|
|
__entry->is_render ? "RCL" : "BCL",
|
|
__entry->seqno,
|
|
__entry->ctnqba,
|
|
__entry->ctnqea)
|
|
);
|
|
|
|
TRACE_EVENT(v3d_bcl_irq,
|
|
TP_PROTO(struct drm_device *dev,
|
|
uint64_t seqno),
|
|
TP_ARGS(dev, seqno),
|
|
|
|
TP_STRUCT__entry(
|
|
__field(u32, dev)
|
|
__field(u64, seqno)
|
|
),
|
|
|
|
TP_fast_assign(
|
|
__entry->dev = dev->primary->index;
|
|
__entry->seqno = seqno;
|
|
),
|
|
|
|
TP_printk("dev=%u, seqno=%llu",
|
|
__entry->dev,
|
|
__entry->seqno)
|
|
);
|
|
|
|
TRACE_EVENT(v3d_rcl_irq,
|
|
TP_PROTO(struct drm_device *dev,
|
|
uint64_t seqno),
|
|
TP_ARGS(dev, seqno),
|
|
|
|
TP_STRUCT__entry(
|
|
__field(u32, dev)
|
|
__field(u64, seqno)
|
|
),
|
|
|
|
TP_fast_assign(
|
|
__entry->dev = dev->primary->index;
|
|
__entry->seqno = seqno;
|
|
),
|
|
|
|
TP_printk("dev=%u, seqno=%llu",
|
|
__entry->dev,
|
|
__entry->seqno)
|
|
);
|
|
|
|
TRACE_EVENT(v3d_tfu_irq,
|
|
TP_PROTO(struct drm_device *dev,
|
|
uint64_t seqno),
|
|
TP_ARGS(dev, seqno),
|
|
|
|
TP_STRUCT__entry(
|
|
__field(u32, dev)
|
|
__field(u64, seqno)
|
|
),
|
|
|
|
TP_fast_assign(
|
|
__entry->dev = dev->primary->index;
|
|
__entry->seqno = seqno;
|
|
),
|
|
|
|
TP_printk("dev=%u, seqno=%llu",
|
|
__entry->dev,
|
|
__entry->seqno)
|
|
);
|
|
|
|
TRACE_EVENT(v3d_csd_irq,
|
|
TP_PROTO(struct drm_device *dev,
|
|
uint64_t seqno),
|
|
TP_ARGS(dev, seqno),
|
|
|
|
TP_STRUCT__entry(
|
|
__field(u32, dev)
|
|
__field(u64, seqno)
|
|
),
|
|
|
|
TP_fast_assign(
|
|
__entry->dev = dev->primary->index;
|
|
__entry->seqno = seqno;
|
|
),
|
|
|
|
TP_printk("dev=%u, seqno=%llu",
|
|
__entry->dev,
|
|
__entry->seqno)
|
|
);
|
|
|
|
TRACE_EVENT(v3d_submit_tfu_ioctl,
|
|
TP_PROTO(struct drm_device *dev, u32 iia),
|
|
TP_ARGS(dev, iia),
|
|
|
|
TP_STRUCT__entry(
|
|
__field(u32, dev)
|
|
__field(u32, iia)
|
|
),
|
|
|
|
TP_fast_assign(
|
|
__entry->dev = dev->primary->index;
|
|
__entry->iia = iia;
|
|
),
|
|
|
|
TP_printk("dev=%u, IIA 0x%08x",
|
|
__entry->dev,
|
|
__entry->iia)
|
|
);
|
|
|
|
TRACE_EVENT(v3d_submit_tfu,
|
|
TP_PROTO(struct drm_device *dev,
|
|
uint64_t seqno),
|
|
TP_ARGS(dev, seqno),
|
|
|
|
TP_STRUCT__entry(
|
|
__field(u32, dev)
|
|
__field(u64, seqno)
|
|
),
|
|
|
|
TP_fast_assign(
|
|
__entry->dev = dev->primary->index;
|
|
__entry->seqno = seqno;
|
|
),
|
|
|
|
TP_printk("dev=%u, seqno=%llu",
|
|
__entry->dev,
|
|
__entry->seqno)
|
|
);
|
|
|
|
TRACE_EVENT(v3d_submit_csd_ioctl,
|
|
TP_PROTO(struct drm_device *dev, u32 cfg5, u32 cfg6),
|
|
TP_ARGS(dev, cfg5, cfg6),
|
|
|
|
TP_STRUCT__entry(
|
|
__field(u32, dev)
|
|
__field(u32, cfg5)
|
|
__field(u32, cfg6)
|
|
),
|
|
|
|
TP_fast_assign(
|
|
__entry->dev = dev->primary->index;
|
|
__entry->cfg5 = cfg5;
|
|
__entry->cfg6 = cfg6;
|
|
),
|
|
|
|
TP_printk("dev=%u, CFG5 0x%08x, CFG6 0x%08x",
|
|
__entry->dev,
|
|
__entry->cfg5,
|
|
__entry->cfg6)
|
|
);
|
|
|
|
TRACE_EVENT(v3d_submit_csd,
|
|
TP_PROTO(struct drm_device *dev,
|
|
uint64_t seqno),
|
|
TP_ARGS(dev, seqno),
|
|
|
|
TP_STRUCT__entry(
|
|
__field(u32, dev)
|
|
__field(u64, seqno)
|
|
),
|
|
|
|
TP_fast_assign(
|
|
__entry->dev = dev->primary->index;
|
|
__entry->seqno = seqno;
|
|
),
|
|
|
|
TP_printk("dev=%u, seqno=%llu",
|
|
__entry->dev,
|
|
__entry->seqno)
|
|
);
|
|
|
|
TRACE_EVENT(v3d_cache_clean_begin,
|
|
TP_PROTO(struct drm_device *dev),
|
|
TP_ARGS(dev),
|
|
|
|
TP_STRUCT__entry(
|
|
__field(u32, dev)
|
|
),
|
|
|
|
TP_fast_assign(
|
|
__entry->dev = dev->primary->index;
|
|
),
|
|
|
|
TP_printk("dev=%u",
|
|
__entry->dev)
|
|
);
|
|
|
|
TRACE_EVENT(v3d_cache_clean_end,
|
|
TP_PROTO(struct drm_device *dev),
|
|
TP_ARGS(dev),
|
|
|
|
TP_STRUCT__entry(
|
|
__field(u32, dev)
|
|
),
|
|
|
|
TP_fast_assign(
|
|
__entry->dev = dev->primary->index;
|
|
),
|
|
|
|
TP_printk("dev=%u",
|
|
__entry->dev)
|
|
);
|
|
|
|
TRACE_EVENT(v3d_reset_begin,
|
|
TP_PROTO(struct drm_device *dev),
|
|
TP_ARGS(dev),
|
|
|
|
TP_STRUCT__entry(
|
|
__field(u32, dev)
|
|
),
|
|
|
|
TP_fast_assign(
|
|
__entry->dev = dev->primary->index;
|
|
),
|
|
|
|
TP_printk("dev=%u",
|
|
__entry->dev)
|
|
);
|
|
|
|
TRACE_EVENT(v3d_reset_end,
|
|
TP_PROTO(struct drm_device *dev),
|
|
TP_ARGS(dev),
|
|
|
|
TP_STRUCT__entry(
|
|
__field(u32, dev)
|
|
),
|
|
|
|
TP_fast_assign(
|
|
__entry->dev = dev->primary->index;
|
|
),
|
|
|
|
TP_printk("dev=%u",
|
|
__entry->dev)
|
|
);
|
|
|
|
#endif /* _V3D_TRACE_H_ */
|
|
|
|
/* This part must be outside protection */
|
|
#undef TRACE_INCLUDE_PATH
|
|
#define TRACE_INCLUDE_PATH .
|
|
#include <trace/define_trace.h>
|