Donate to e Foundation | Murena handsets with /e/OS | Own a part of Murena! Learn more

Commit b4716185 authored by Chris Wilson's avatar Chris Wilson Committed by Daniel Vetter
Browse files

drm/i915: Implement inter-engine read-read optimisations



Currently, we only track the last request globally across all engines.
This prevents us from issuing concurrent read requests on e.g. the RCS
and BCS engines (or more likely the render and media engines). Without
semaphores, we incur costly stalls as we synchronise between rings -
greatly impacting the current performance of Broadwell versus Haswell in
certain workloads (like video decode). With the introduction of
reference counted requests, it is much easier to track the last request
per ring, as well as the last global write request so that we can
optimise inter-engine read read requests (as well as better optimise
certain CPU waits).

v2: Fix inverted readonly condition for nonblocking waits.
v3: Handle non-contiguous engine array after waits
v4: Rebase, tidy, rewrite ring list debugging
v5: Use obj->active as a bitfield, it looks cool
v6: Micro-optimise, mostly involving moving code around
v7: Fix retire-requests-upto for execlists (and multiple rq->ringbuf)
v8: Rebase
v9: Refactor i915_gem_object_sync() to allow the compiler to better
optimise it.

Benchmark: igt/gem_read_read_speed
hsw:gt3e (with semaphores):
Before: Time to read-read 1024k:		275.794µs
After:  Time to read-read 1024k:		123.260µs

hsw:gt3e (w/o semaphores):
Before: Time to read-read 1024k:		230.433µs
After:  Time to read-read 1024k:		124.593µs

bdw-u (w/o semaphores):             Before          After
Time to read-read 1x1:            26.274µs       10.350µs
Time to read-read 128x128:        40.097µs       21.366µs
Time to read-read 256x256:        77.087µs       42.608µs
Time to read-read 512x512:       281.999µs      181.155µs
Time to read-read 1024x1024:    1196.141µs     1118.223µs
Time to read-read 2048x2048:    5639.072µs     5225.837µs
Time to read-read 4096x4096:   22401.662µs    21137.067µs
Time to read-read 8192x8192:   89617.735µs    85637.681µs

Testcase: igt/gem_concurrent_blit (read-read and friends)
Cc: Lionel Landwerlin <lionel.g.landwerlin@linux.intel.com>
Signed-off-by: default avatarChris Wilson <chris@chris-wilson.co.uk>
Cc: Tvrtko Ursulin <tvrtko.ursulin@intel.com>
Reviewed-by: Tvrtko Ursulin <tvrtko.ursulin@intel.com> [v8]
[danvet: s/\<rq\>/req/g]
Signed-off-by: default avatarDaniel Vetter <daniel.vetter@ffwll.ch>
parent eed29a5b
Loading
Loading
Loading
Loading
+11 −5
Original line number Original line Diff line number Diff line
@@ -120,10 +120,13 @@ static inline const char *get_global_flag(struct drm_i915_gem_object *obj)
static void
static void
describe_obj(struct seq_file *m, struct drm_i915_gem_object *obj)
describe_obj(struct seq_file *m, struct drm_i915_gem_object *obj)
{
{
	struct drm_i915_private *dev_priv = to_i915(obj->base.dev);
	struct intel_engine_cs *ring;
	struct i915_vma *vma;
	struct i915_vma *vma;
	int pin_count = 0;
	int pin_count = 0;
	int i;


	seq_printf(m, "%pK: %s%s%s%s %8zdKiB %02x %02x %x %x %x%s%s%s",
	seq_printf(m, "%pK: %s%s%s%s %8zdKiB %02x %02x [ ",
		   &obj->base,
		   &obj->base,
		   obj->active ? "*" : " ",
		   obj->active ? "*" : " ",
		   get_pin_flag(obj),
		   get_pin_flag(obj),
@@ -131,8 +134,11 @@ describe_obj(struct seq_file *m, struct drm_i915_gem_object *obj)
		   get_global_flag(obj),
		   get_global_flag(obj),
		   obj->base.size / 1024,
		   obj->base.size / 1024,
		   obj->base.read_domains,
		   obj->base.read_domains,
		   obj->base.write_domain,
		   obj->base.write_domain);
		   i915_gem_request_get_seqno(obj->last_read_req),
	for_each_ring(ring, dev_priv, i)
		seq_printf(m, "%x ",
				i915_gem_request_get_seqno(obj->last_read_req[i]));
	seq_printf(m, "] %x %x%s%s%s",
		   i915_gem_request_get_seqno(obj->last_write_req),
		   i915_gem_request_get_seqno(obj->last_write_req),
		   i915_gem_request_get_seqno(obj->last_fenced_req),
		   i915_gem_request_get_seqno(obj->last_fenced_req),
		   i915_cache_level_str(to_i915(obj->base.dev), obj->cache_level),
		   i915_cache_level_str(to_i915(obj->base.dev), obj->cache_level),
@@ -169,9 +175,9 @@ describe_obj(struct seq_file *m, struct drm_i915_gem_object *obj)
		*t = '\0';
		*t = '\0';
		seq_printf(m, " (%s mappable)", s);
		seq_printf(m, " (%s mappable)", s);
	}
	}
	if (obj->last_read_req != NULL)
	if (obj->last_write_req != NULL)
		seq_printf(m, " (%s)",
		seq_printf(m, " (%s)",
			   i915_gem_request_get_ring(obj->last_read_req)->name);
			   i915_gem_request_get_ring(obj->last_write_req)->name);
	if (obj->frontbuffer_bits)
	if (obj->frontbuffer_bits)
		seq_printf(m, " (frontbuffer: 0x%03x)", obj->frontbuffer_bits);
		seq_printf(m, " (frontbuffer: 0x%03x)", obj->frontbuffer_bits);
}
}
+14 −5
Original line number Original line Diff line number Diff line
@@ -508,7 +508,7 @@ struct drm_i915_error_state {
	struct drm_i915_error_buffer {
	struct drm_i915_error_buffer {
		u32 size;
		u32 size;
		u32 name;
		u32 name;
		u32 rseqno, wseqno;
		u32 rseqno[I915_NUM_RINGS], wseqno;
		u32 gtt_offset;
		u32 gtt_offset;
		u32 read_domains;
		u32 read_domains;
		u32 write_domain;
		u32 write_domain;
@@ -1939,7 +1939,7 @@ struct drm_i915_gem_object {
	struct drm_mm_node *stolen;
	struct drm_mm_node *stolen;
	struct list_head global_list;
	struct list_head global_list;


	struct list_head ring_list;
	struct list_head ring_list[I915_NUM_RINGS];
	/** Used in execbuf to temporarily hold a ref */
	/** Used in execbuf to temporarily hold a ref */
	struct list_head obj_exec_link;
	struct list_head obj_exec_link;


@@ -1950,7 +1950,7 @@ struct drm_i915_gem_object {
	 * rendering and so a non-zero seqno), and is not set if it is on
	 * rendering and so a non-zero seqno), and is not set if it is on
	 * inactive (ready to be unbound) list.
	 * inactive (ready to be unbound) list.
	 */
	 */
	unsigned int active:1;
	unsigned int active:I915_NUM_RINGS;


	/**
	/**
	 * This is set if the object has been written to since last bound
	 * This is set if the object has been written to since last bound
@@ -2021,8 +2021,17 @@ struct drm_i915_gem_object {
	void *dma_buf_vmapping;
	void *dma_buf_vmapping;
	int vmapping_count;
	int vmapping_count;


	/** Breadcrumb of last rendering to the buffer. */
	/** Breadcrumb of last rendering to the buffer.
	struct drm_i915_gem_request *last_read_req;
	 * There can only be one writer, but we allow for multiple readers.
	 * If there is a writer that necessarily implies that all other
	 * read requests are complete - but we may only be lazily clearing
	 * the read requests. A read request is naturally the most recent
	 * request on a ring, so we may have two different write and read
	 * requests on one ring where the write request is older than the
	 * read request. This allows for the CPU to read from an active
	 * buffer by only waiting for the write to complete.
	 * */
	struct drm_i915_gem_request *last_read_req[I915_NUM_RINGS];
	struct drm_i915_gem_request *last_write_req;
	struct drm_i915_gem_request *last_write_req;
	/** Breadcrumb of last fenced GPU access to the buffer. */
	/** Breadcrumb of last fenced GPU access to the buffer. */
	struct drm_i915_gem_request *last_fenced_req;
	struct drm_i915_gem_request *last_fenced_req;
+331 −209

File changed.

Preview size limit exceeded, changes collapsed.

+0 −2
Original line number Original line Diff line number Diff line
@@ -753,8 +753,6 @@ static int do_switch(struct intel_engine_cs *ring,
		 * swapped, but there is no way to do that yet.
		 * swapped, but there is no way to do that yet.
		 */
		 */
		from->legacy_hw_ctx.rcs_state->dirty = 1;
		from->legacy_hw_ctx.rcs_state->dirty = 1;
		BUG_ON(i915_gem_request_get_ring(
			from->legacy_hw_ctx.rcs_state->last_read_req) != ring);


		/* obj is kept alive until the next request by its active ref */
		/* obj is kept alive until the next request by its active ref */
		i915_gem_object_ggtt_unpin(from->legacy_hw_ctx.rcs_state);
		i915_gem_object_ggtt_unpin(from->legacy_hw_ctx.rcs_state);
+22 −70

File changed.

Preview size limit exceeded, changes collapsed.

Loading