From ec153d79a5da727ec83c0b2edcc4ee56deac691f Mon Sep 17 00:00:00 2001 From: Asahi Lina Date: Fri, 7 Apr 2023 20:38:42 +0900 Subject: [PATCH] drm/asahi: Identify more Render fields & update to UAPI 10007 Also set the large_tib flag properly (implied from tib size for now, not sure if this should be a separate flag?) Signed-off-by: Asahi Lina --- drivers/gpu/drm/asahi/fw/fragment.rs | 8 +++---- drivers/gpu/drm/asahi/fw/job.rs | 2 +- drivers/gpu/drm/asahi/fw/microseq.rs | 2 +- drivers/gpu/drm/asahi/queue/compute.rs | 6 +++--- drivers/gpu/drm/asahi/queue/render.rs | 29 ++++++++++++++------------ 5 files changed, 25 insertions(+), 22 deletions(-) diff --git a/drivers/gpu/drm/asahi/fw/fragment.rs b/drivers/gpu/drm/asahi/fw/fragment.rs index eca275efb967a4..a01b0d0d7807f8 100644 --- a/drivers/gpu/drm/asahi/fw/fragment.rs +++ b/drivers/gpu/drm/asahi/fw/fragment.rs @@ -132,7 +132,7 @@ pub(crate) mod raw { pub(crate) utiles_per_mtile_x: u16, pub(crate) unk_24: u32, pub(crate) tile_counts: u32, - pub(crate) iogpu_unk_212: u32, + pub(crate) tib_blocks: u32, pub(crate) isp_bgobjdepth: u32, pub(crate) isp_bgobjvals: u32, pub(crate) unk_38: u32, @@ -171,7 +171,7 @@ pub(crate) mod raw { pub(crate) stencil_buffer_ptr3: U64, pub(crate) stencil_meta_buffer_ptr3: U64, pub(crate) unk_2f8: Array<2, U64>, - pub(crate) iogpu_unk_212: u32, + pub(crate) tib_blocks: u32, pub(crate) unk_30c: u32, pub(crate) aux_fb_info: AuxFBInfo::ver, pub(crate) unk_320_padding: Array<0x10, u8>, @@ -179,7 +179,7 @@ pub(crate) mod raw { pub(crate) partial_store_pipeline: StorePipelineBinding, pub(crate) isp_bgobjdepth: u32, pub(crate) isp_bgobjvals: u32, - pub(crate) iogpu_unk_49: u32, + pub(crate) sample_size: u32, pub(crate) unk_37c: u32, pub(crate) unk_380: U64, pub(crate) unk_388: U64, @@ -230,7 +230,7 @@ pub(crate) mod raw { pub(crate) encoder_params: job::raw::EncoderParams<'a>, pub(crate) process_empty_tiles: u32, pub(crate) no_clear_pipeline_textures: u32, - pub(crate) unk_param: u32, + pub(crate) msaa_zs: u32, pub(crate) unk_pointee: u32, pub(crate) meta: job::raw::JobMeta, pub(crate) unk_after_meta: u32, diff --git a/drivers/gpu/drm/asahi/fw/job.rs b/drivers/gpu/drm/asahi/fw/job.rs index 7027a763dffb11..2384b5c1119665 100644 --- a/drivers/gpu/drm/asahi/fw/job.rs +++ b/drivers/gpu/drm/asahi/fw/job.rs @@ -28,7 +28,7 @@ pub(crate) mod raw { #[repr(C)] pub(crate) struct EncoderParams<'a> { pub(crate) unk_8: u32, - pub(crate) unk_c: u32, + pub(crate) large_tib: u32, pub(crate) unk_10: u32, pub(crate) encoder_id: u32, pub(crate) unk_18: u32, diff --git a/drivers/gpu/drm/asahi/fw/microseq.rs b/drivers/gpu/drm/asahi/fw/microseq.rs index 274a2c7f741537..f47740a00fb5d6 100644 --- a/drivers/gpu/drm/asahi/fw/microseq.rs +++ b/drivers/gpu/drm/asahi/fw/microseq.rs @@ -239,7 +239,7 @@ pub(crate) struct StartFragment<'a> { pub(crate) unk_50: u32, pub(crate) event_generation: u32, pub(crate) buffer_slot: u32, - pub(crate) unk_5c: u32, + pub(crate) large_tib: u32, pub(crate) event_seq: U64, pub(crate) unk_68: u32, pub(crate) unk_758_flag: GpuWeakPointer, diff --git a/drivers/gpu/drm/asahi/queue/compute.rs b/drivers/gpu/drm/asahi/queue/compute.rs index 995371470a2584..69039edd3fbf8d 100644 --- a/drivers/gpu/drm/asahi/queue/compute.rs +++ b/drivers/gpu/drm/asahi/queue/compute.rs @@ -287,9 +287,9 @@ impl super::Queue::ver { unk_5c: 0, }, encoder_params: fw::job::raw::EncoderParams { - unk_8: 0x0, // fixed - unk_c: 0x0, // fixed - unk_10: 0x0, // fixed + unk_8: 0x0, // fixed + large_tib: 0x0, // check! + unk_10: 0x0, // fixed encoder_id: cmdbuf.encoder_id, unk_18: 0x0, // fixed iogpu_compute_unk44: cmdbuf.iogpu_unk_44, diff --git a/drivers/gpu/drm/asahi/queue/render.rs b/drivers/gpu/drm/asahi/queue/render.rs index 1a3f6e3438aeb9..0a12473c4ca89f 100644 --- a/drivers/gpu/drm/asahi/queue/render.rs +++ b/drivers/gpu/drm/asahi/queue/render.rs @@ -225,7 +225,9 @@ impl super::Queue::ver { | uapi::ASAHI_RENDER_SET_WHEN_RELOADING_Z_OR_S | uapi::ASAHI_RENDER_MEMORYLESS_RTS_USED | uapi::ASAHI_RENDER_PROCESS_EMPTY_TILES - | uapi::ASAHI_RENDER_NO_VERTEX_CLUSTERING) as u64 + | uapi::ASAHI_RENDER_NO_VERTEX_CLUSTERING + | uapi::ASAHI_RENDER_MSAA_ZS + | uapi::ASAHI_RENDER_UNK_FLAG1) as u64 != 0 { return Err(EINVAL); @@ -395,8 +397,7 @@ impl super::Queue::ver { let timestamps = Arc::try_new(kalloc.shared.new_default::()?)?; - let unk1 = debug_enabled(debug::DebugFlags::Debug1); - let unk2 = debug_enabled(debug::DebugFlags::Debug2); + let unk1 = cmdbuf.flags & uapi::ASAHI_RENDER_UNK_FLAG1 as u64 != 0; let mut tile_config: u64 = 0; if !unk1 { @@ -449,6 +450,8 @@ impl super::Queue::ver { #[ver(V >= V13_0B4)] let count_vtx = count_frag + 1; + let large_tib = cmdbuf.tib_blocks > 8; + mod_dev_dbg!(self.dev, "[Submission {}] Create Frag\n", id); let frag = GpuObject::new_prealloc( kalloc.private.alloc_object()?, @@ -475,7 +478,7 @@ impl super::Queue::ver { unk_50: 0x1, // fixed event_generation: self.id as u32, buffer_slot: scene.slot(), - unk_5c: 0, + large_tib: large_tib as u32, event_seq: U64(ev_frag.event_seq), unk_68: 0, unk_758_flag: inner_weak_ptr!(ptr, unk_758_flag), @@ -671,7 +674,7 @@ impl super::Queue::ver { utiles_per_mtile_x: tile_info.utiles_per_mtile_x as u16, unk_24: 0x0, tile_counts: ((tile_info.tiles_y - 1) << 12) | (tile_info.tiles_x - 1), - iogpu_unk_212: cmdbuf.iogpu_unk_212, + tib_blocks: cmdbuf.tib_blocks, isp_bgobjdepth: cmdbuf.isp_bgobjdepth, // TODO: does this flag need to be exposed to userspace? isp_bgobjvals: cmdbuf.isp_bgobjvals | 0x400, @@ -719,7 +722,7 @@ impl super::Queue::ver { stencil_buffer_ptr3: U64(cmdbuf.stencil_buffer_3), stencil_meta_buffer_ptr3: U64(cmdbuf.stencil_meta_buffer_3), unk_2f8: Default::default(), - iogpu_unk_212: cmdbuf.iogpu_unk_212, + tib_blocks: cmdbuf.tib_blocks, unk_30c: 0x0, aux_fb_info: aux_fb_info, unk_320_padding: Default::default(), @@ -734,7 +737,7 @@ impl super::Queue::ver { ), isp_bgobjdepth: cmdbuf.isp_bgobjdepth, isp_bgobjvals: cmdbuf.isp_bgobjvals, - iogpu_unk_49: cmdbuf.iogpu_unk_49, + sample_size: cmdbuf.sample_size, unk_37c: 0x0, unk_380: U64(0x0), unk_388: U64(0x0), @@ -752,8 +755,8 @@ impl super::Queue::ver { unk_8: (cmdbuf.flags & uapi::ASAHI_RENDER_SET_WHEN_RELOADING_Z_OR_S as u64 != 0) as u32, - unk_c: 0x0, // fixed - unk_10: 0x0, // fixed + large_tib: large_tib as u32, // fixed + unk_10: 0x0, // fixed encoder_id: cmdbuf.encoder_id, unk_18: 0x0, // fixed iogpu_compute_unk44: 0xffffffff, @@ -766,7 +769,7 @@ impl super::Queue::ver { no_clear_pipeline_textures: (cmdbuf.flags & uapi::ASAHI_RENDER_NO_CLEAR_PIPELINE_TEXTURES as u64 != 0) as u32, - unk_param: unk2.into(), // 1 for boot stuff? + msaa_zs: (cmdbuf.flags & uapi::ASAHI_RENDER_MSAA_ZS as u64 != 0) as u32, unk_pointee: 0, meta: fw::job::raw::JobMeta { unk_0: 0, @@ -1077,9 +1080,9 @@ impl super::Queue::ver { unk_520: U64(0x0), // fixed }, encoder_params: fw::job::raw::EncoderParams { - unk_8: 0x0, // fixed - unk_c: 0x0, // fixed - unk_10: 0x0, // fixed + unk_8: 0x0, // fixed + large_tib: 0x0, // fixed + unk_10: 0x0, // fixed encoder_id: cmdbuf.encoder_id, unk_18: 0x0, // fixed iogpu_compute_unk44: 0xffffffff,