1
0
Fork 0
forked from wry/wry

Merge pull request #269 from mahkoh/jorth/fb-explicit-sync

render: use explicit sync for framebuffers, vulkan: use transfer queue if available
This commit is contained in:
mahkoh 2024-09-18 17:22:40 +02:00 committed by GitHub
commit 13f54ff2de
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
20 changed files with 662 additions and 155 deletions

View file

@ -9,7 +9,7 @@ use {
}, },
gfx_api::{ gfx_api::{
create_render_pass, AcquireSync, BufferResv, GfxApiOpt, GfxRenderPass, GfxTexture, create_render_pass, AcquireSync, BufferResv, GfxApiOpt, GfxRenderPass, GfxTexture,
SyncFile, ReleaseSync, SyncFile,
}, },
theme::Color, theme::Color,
time::Time, time::Time,
@ -43,7 +43,8 @@ pub struct DirectScanoutCache {
pub struct DirectScanoutData { pub struct DirectScanoutData {
tex: Rc<dyn GfxTexture>, tex: Rc<dyn GfxTexture>,
acquire_sync: AcquireSync, acquire_sync: AcquireSync,
_resv: Option<Rc<dyn BufferResv>>, release_sync: ReleaseSync,
resv: Option<Rc<dyn BufferResv>>,
fb: Rc<DrmFramebuffer>, fb: Rc<DrmFramebuffer>,
dma_buf_id: DmaBufId, dma_buf_id: DmaBufId,
position: DirectScanoutPosition, position: DirectScanoutPosition,
@ -618,7 +619,8 @@ impl MetalConnector {
return buffer.fb.as_ref().map(|fb| DirectScanoutData { return buffer.fb.as_ref().map(|fb| DirectScanoutData {
tex: buffer.tex.upgrade().unwrap(), tex: buffer.tex.upgrade().unwrap(),
acquire_sync: ct.acquire_sync.clone(), acquire_sync: ct.acquire_sync.clone(),
_resv: ct.buffer_resv.clone(), release_sync: ct.release_sync,
resv: ct.buffer_resv.clone(),
fb: fb.clone(), fb: fb.clone(),
dma_buf_id: dmabuf.id, dma_buf_id: dmabuf.id,
position, position,
@ -643,7 +645,8 @@ impl MetalConnector {
Ok(fb) => Some(DirectScanoutData { Ok(fb) => Some(DirectScanoutData {
tex: ct.tex.clone(), tex: ct.tex.clone(),
acquire_sync: ct.acquire_sync.clone(), acquire_sync: ct.acquire_sync.clone(),
_resv: ct.buffer_resv.clone(), release_sync: ct.release_sync,
resv: ct.buffer_resv.clone(),
fb: Rc::new(fb), fb: Rc::new(fb),
dma_buf_id: dmabuf.id, dma_buf_id: dmabuf.id,
position, position,
@ -708,7 +711,7 @@ impl MetalConnector {
None => { None => {
let sf = buffer let sf = buffer
.render_fb() .render_fb()
.perform_render_pass(pass) .perform_render_pass(AcquireSync::Unnecessary, ReleaseSync::Explicit, pass)
.map_err(MetalError::RenderFrame)?; .map_err(MetalError::RenderFrame)?;
sync_file = buffer.copy_to_dev(sf)?; sync_file = buffer.copy_to_dev(sf)?;
fb = buffer.drm.clone(); fb = buffer.drm.clone();
@ -748,11 +751,23 @@ impl MetalConnector {
let render_hardware_cursor = self.cursor_enabled.get(); let render_hardware_cursor = self.cursor_enabled.get();
match &fb.direct_scanout_data { match &fb.direct_scanout_data {
None => { None => {
output.perform_screencopies(&fb.tex, render_hardware_cursor, 0, 0, None); output.perform_screencopies(
&fb.tex,
None,
&AcquireSync::Unnecessary,
ReleaseSync::None,
render_hardware_cursor,
0,
0,
None,
);
} }
Some(dsd) => { Some(dsd) => {
output.perform_screencopies( output.perform_screencopies(
&dsd.tex, &dsd.tex,
dsd.resv.as_ref(),
&dsd.acquire_sync,
dsd.release_sync,
render_hardware_cursor, render_hardware_cursor,
dsd.position.crtc_x, dsd.position.crtc_x,
dsd.position.crtc_y, dsd.position.crtc_y,

View file

@ -2474,7 +2474,9 @@ impl MetalBackend {
Ok(fb) => fb, Ok(fb) => fb,
Err(e) => return Err(MetalError::ImportFb(e)), Err(e) => return Err(MetalError::ImportFb(e)),
}; };
dev_fb.clear().map_err(MetalError::Clear)?; dev_fb
.clear(AcquireSync::Unnecessary, ReleaseSync::None)
.map_err(MetalError::Clear)?;
let (dev_tex, render_tex, render_fb, render_bo) = if dev.id == render_ctx.dev_id { let (dev_tex, render_tex, render_fb, render_bo) = if dev.id == render_ctx.dev_id {
let render_tex = match dev_img.to_texture() { let render_tex = match dev_img.to_texture() {
Ok(fb) => fb, Ok(fb) => fb,
@ -2526,7 +2528,9 @@ impl MetalBackend {
Ok(fb) => fb, Ok(fb) => fb,
Err(e) => return Err(MetalError::ImportFb(e)), Err(e) => return Err(MetalError::ImportFb(e)),
}; };
render_fb.clear().map_err(MetalError::Clear)?; render_fb
.clear(AcquireSync::Unnecessary, ReleaseSync::None)
.map_err(MetalError::Clear)?;
let render_tex = match render_img.to_texture() { let render_tex = match render_img.to_texture() {
Ok(fb) => fb, Ok(fb) => fb,
Err(e) => return Err(MetalError::ImportTexture(e)), Err(e) => return Err(MetalError::ImportTexture(e)),
@ -2797,9 +2801,17 @@ impl RenderBuffer {
let Some(tex) = &self.dev_tex else { let Some(tex) = &self.dev_tex else {
return Ok(sync_file); return Ok(sync_file);
}; };
let acquire_point = AcquireSync::from_sync_file(sync_file);
self.dev_fb self.dev_fb
.copy_texture(tex, acquire_point, ReleaseSync::Implicit, 0, 0) .copy_texture(
AcquireSync::Unnecessary,
ReleaseSync::Explicit,
tex,
None,
AcquireSync::from_sync_file(sync_file),
ReleaseSync::None,
0,
0,
)
.map_err(MetalError::CopyToOutput) .map_err(MetalError::CopyToOutput)
} }
} }

View file

@ -10,7 +10,7 @@ use {
}, },
fixed::Fixed, fixed::Fixed,
format::XRGB8888, format::XRGB8888,
gfx_api::{GfxContext, GfxError, GfxFramebuffer, GfxTexture}, gfx_api::{AcquireSync, GfxContext, GfxError, GfxFramebuffer, GfxTexture, ReleaseSync},
ifs::wl_output::OutputId, ifs::wl_output::OutputId,
state::State, state::State,
utils::{ utils::{
@ -750,9 +750,14 @@ impl XBackend {
image.last_serial.set(serial); image.last_serial.set(serial);
if let Some(node) = self.state.root.outputs.get(&output.id) { if let Some(node) = self.state.root.outputs.get(&output.id) {
let res = self let res = self.state.present_output(
.state &node,
.present_output(&node, &image.fb.get(), &image.tex.get(), true); &image.fb.get(),
AcquireSync::Implicit,
ReleaseSync::Implicit,
&image.tex.get(),
true,
);
if let Err(e) = res { if let Err(e) = res {
log::error!("Could not render screen: {}", ErrorFmt(e)); log::error!("Could not render screen: {}", ErrorFmt(e));
return; return;

View file

@ -3,6 +3,7 @@ use {
backend::HardwareCursorUpdate, backend::HardwareCursorUpdate,
cursor::{Cursor, KnownCursor, DEFAULT_CURSOR_SIZE}, cursor::{Cursor, KnownCursor, DEFAULT_CURSOR_SIZE},
fixed::Fixed, fixed::Fixed,
gfx_api::{AcquireSync, ReleaseSync},
rect::Rect, rect::Rect,
scale::Scale, scale::Scale,
state::State, state::State,
@ -497,8 +498,14 @@ impl CursorUser {
} }
if render { if render {
let buffer = hc.get_buffer(); let buffer = hc.get_buffer();
let res = let res = buffer.render_hardware_cursor(
buffer.render_hardware_cursor(cursor.deref(), &self.group.state, scale, transform); AcquireSync::Unnecessary,
ReleaseSync::Explicit,
cursor.deref(),
&self.group.state,
scale,
transform,
);
match res { match res {
Ok(sync_file) => { Ok(sync_file) => {
hc.set_sync_file(sync_file); hc.set_sync_file(sync_file);

View file

@ -208,13 +208,13 @@ pub enum AcquireSync {
impl AcquireSync { impl AcquireSync {
pub fn from_sync_file(sync_file: Option<SyncFile>) -> Self { pub fn from_sync_file(sync_file: Option<SyncFile>) -> Self {
match sync_file { match sync_file {
None => Self::Implicit, None => Self::Unnecessary,
Some(sync_file) => Self::SyncFile { sync_file }, Some(sync_file) => Self::SyncFile { sync_file },
} }
} }
} }
#[derive(Copy, Clone, Eq, PartialEq)] #[derive(Copy, Clone, Eq, PartialEq, Debug)]
pub enum ReleaseSync { pub enum ReleaseSync {
None, None,
Implicit, Implicit,
@ -260,6 +260,8 @@ pub trait GfxFramebuffer: Debug {
fn render( fn render(
&self, &self,
acquire_sync: AcquireSync,
release_sync: ReleaseSync,
ops: &[GfxApiOpt], ops: &[GfxApiOpt],
clear: Option<&Color>, clear: Option<&Color>,
) -> Result<Option<SyncFile>, GfxError>; ) -> Result<Option<SyncFile>, GfxError>;
@ -279,12 +281,24 @@ pub trait GfxFramebuffer: Debug {
} }
impl dyn GfxFramebuffer { impl dyn GfxFramebuffer {
pub fn clear(&self) -> Result<Option<SyncFile>, GfxError> { pub fn clear(
self.clear_with(0.0, 0.0, 0.0, 0.0) &self,
acquire_sync: AcquireSync,
release_sync: ReleaseSync,
) -> Result<Option<SyncFile>, GfxError> {
self.clear_with(acquire_sync, release_sync, 0.0, 0.0, 0.0, 0.0)
} }
pub fn clear_with(&self, r: f32, g: f32, b: f32, a: f32) -> Result<Option<SyncFile>, GfxError> { pub fn clear_with(
self.render(&[], Some(&Color { r, g, b, a })) &self,
acquire_sync: AcquireSync,
release_sync: ReleaseSync,
r: f32,
g: f32,
b: f32,
a: f32,
) -> Result<Option<SyncFile>, GfxError> {
self.render(acquire_sync, release_sync, &[], Some(&Color { r, g, b, a }))
} }
pub fn logical_size(&self, transform: Transform) -> (i32, i32) { pub fn logical_size(&self, transform: Transform) -> (i32, i32) {
@ -302,7 +316,10 @@ impl dyn GfxFramebuffer {
pub fn copy_texture( pub fn copy_texture(
&self, &self,
fb_acquire_sync: AcquireSync,
fb_release_sync: ReleaseSync,
texture: &Rc<dyn GfxTexture>, texture: &Rc<dyn GfxTexture>,
resv: Option<&Rc<dyn BufferResv>>,
acquire_sync: AcquireSync, acquire_sync: AcquireSync,
release_sync: ReleaseSync, release_sync: ReleaseSync,
x: i32, x: i32,
@ -320,16 +337,18 @@ impl dyn GfxFramebuffer {
None, None,
scale, scale,
None, None,
None, resv.cloned(),
acquire_sync, acquire_sync,
release_sync, release_sync,
); );
let clear = self.format().has_alpha.then_some(&Color::TRANSPARENT); let clear = self.format().has_alpha.then_some(&Color::TRANSPARENT);
self.render(&ops, clear) self.render(fb_acquire_sync, fb_release_sync, &ops, clear)
} }
pub fn render_custom( pub fn render_custom(
&self, &self,
acquire_sync: AcquireSync,
release_sync: ReleaseSync,
scale: Scale, scale: Scale,
clear: Option<&Color>, clear: Option<&Color>,
f: &mut dyn FnMut(&mut RendererBase), f: &mut dyn FnMut(&mut RendererBase),
@ -337,7 +356,7 @@ impl dyn GfxFramebuffer {
let mut ops = vec![]; let mut ops = vec![];
let mut renderer = self.renderer_base(&mut ops, scale, Transform::None); let mut renderer = self.renderer_base(&mut ops, scale, Transform::None);
f(&mut renderer); f(&mut renderer);
self.render(&ops, clear) self.render(acquire_sync, release_sync, &ops, clear)
} }
pub fn create_render_pass( pub fn create_render_pass(
@ -366,12 +385,19 @@ impl dyn GfxFramebuffer {
) )
} }
pub fn perform_render_pass(&self, pass: &GfxRenderPass) -> Result<Option<SyncFile>, GfxError> { pub fn perform_render_pass(
self.render(&pass.ops, pass.clear.as_ref()) &self,
acquire_sync: AcquireSync,
release_sync: ReleaseSync,
pass: &GfxRenderPass,
) -> Result<Option<SyncFile>, GfxError> {
self.render(acquire_sync, release_sync, &pass.ops, pass.clear.as_ref())
} }
pub fn render_output( pub fn render_output(
&self, &self,
acquire_sync: AcquireSync,
release_sync: ReleaseSync,
node: &OutputNode, node: &OutputNode,
state: &State, state: &State,
cursor_rect: Option<Rect>, cursor_rect: Option<Rect>,
@ -379,6 +405,8 @@ impl dyn GfxFramebuffer {
render_hardware_cursor: bool, render_hardware_cursor: bool,
) -> Result<Option<SyncFile>, GfxError> { ) -> Result<Option<SyncFile>, GfxError> {
self.render_node( self.render_node(
acquire_sync,
release_sync,
node, node,
state, state,
cursor_rect, cursor_rect,
@ -392,6 +420,8 @@ impl dyn GfxFramebuffer {
pub fn render_node( pub fn render_node(
&self, &self,
acquire_sync: AcquireSync,
release_sync: ReleaseSync,
node: &dyn Node, node: &dyn Node,
state: &State, state: &State,
cursor_rect: Option<Rect>, cursor_rect: Option<Rect>,
@ -412,11 +442,13 @@ impl dyn GfxFramebuffer {
transform, transform,
None, None,
); );
self.perform_render_pass(&pass) self.perform_render_pass(acquire_sync, release_sync, &pass)
} }
pub fn render_hardware_cursor( pub fn render_hardware_cursor(
&self, &self,
acquire_sync: AcquireSync,
release_sync: ReleaseSync,
cursor: &dyn Cursor, cursor: &dyn Cursor,
state: &State, state: &State,
scale: Scale, scale: Scale,
@ -433,7 +465,7 @@ impl dyn GfxFramebuffer {
}, },
}; };
cursor.render_hardware_cursor(&mut renderer); cursor.render_hardware_cursor(&mut renderer);
self.render(&ops, Some(&Color::TRANSPARENT)) self.render(acquire_sync, release_sync, &ops, Some(&Color::TRANSPARENT))
} }
} }

View file

@ -73,6 +73,7 @@ use {
ReleaseSync, SyncFile, ReleaseSync, SyncFile,
}, },
gfx_apis::gl::{ gfx_apis::gl::{
egl::image::EglImage,
gl::texture::image_target, gl::texture::image_target,
renderer::{ renderer::{
context::{GlRenderContext, TexCopyType, TexSourceType}, context::{GlRenderContext, TexCopyType, TexSourceType},
@ -328,7 +329,7 @@ fn render_texture(ctx: &GlRenderContext, tex: &CopyTexture) {
assert!(rc_eq(&ctx.ctx, &texture.ctx.ctx)); assert!(rc_eq(&ctx.ctx, &texture.ctx.ctx));
let gles = ctx.ctx.dpy.gles; let gles = ctx.ctx.dpy.gles;
unsafe { unsafe {
handle_explicit_sync(ctx, texture, &tex.acquire_sync); handle_explicit_sync(ctx, texture.gl.img.as_ref(), &tex.acquire_sync);
(gles.glActiveTexture)(GL_TEXTURE0); (gles.glActiveTexture)(GL_TEXTURE0);
@ -395,7 +396,7 @@ fn render_texture(ctx: &GlRenderContext, tex: &CopyTexture) {
} }
} }
fn handle_explicit_sync(ctx: &GlRenderContext, texture: &Texture, sync: &AcquireSync) { fn handle_explicit_sync(ctx: &GlRenderContext, img: Option<&Rc<EglImage>>, sync: &AcquireSync) {
let sync_file = match sync { let sync_file = match sync {
AcquireSync::None | AcquireSync::Implicit | AcquireSync::Unnecessary => return, AcquireSync::None | AcquireSync::Implicit | AcquireSync::Unnecessary => return,
AcquireSync::SyncFile { sync_file } => sync_file, AcquireSync::SyncFile { sync_file } => sync_file,
@ -417,7 +418,7 @@ fn handle_explicit_sync(ctx: &GlRenderContext, texture: &Texture, sync: &Acquire
}; };
sync.wait(); sync.wait();
} else { } else {
if let Some(img) = &texture.gl.img { if let Some(img) = img {
if let Err(e) = img.dmabuf.import_sync_file(DMA_BUF_SYNC_READ, &sync_file) { if let Err(e) = img.dmabuf.import_sync_file(DMA_BUF_SYNC_READ, &sync_file) {
log::error!("Could not import sync file into dmabuf: {}", ErrorFmt(e)); log::error!("Could not import sync file into dmabuf: {}", ErrorFmt(e));
} }

View file

@ -1,12 +1,13 @@
use { use {
crate::{ crate::{
format::Format, format::Format,
gfx_api::{GfxApiOpt, GfxError, GfxFramebuffer, SyncFile}, gfx_api::{AcquireSync, GfxApiOpt, GfxError, GfxFramebuffer, ReleaseSync, SyncFile},
gfx_apis::gl::{ gfx_apis::gl::{
gl::{ gl::{
frame_buffer::GlFrameBuffer, frame_buffer::GlFrameBuffer,
sys::{GL_COLOR_BUFFER_BIT, GL_FRAMEBUFFER}, sys::{GL_COLOR_BUFFER_BIT, GL_FRAMEBUFFER},
}, },
handle_explicit_sync,
renderer::context::GlRenderContext, renderer::context::GlRenderContext,
run_ops, run_ops,
sys::{GL_ONE, GL_ONE_MINUS_SRC_ALPHA}, sys::{GL_ONE, GL_ONE_MINUS_SRC_ALPHA},
@ -69,11 +70,13 @@ impl Framebuffer {
pub fn render( pub fn render(
&self, &self,
acquire_sync: AcquireSync,
ops: &[GfxApiOpt], ops: &[GfxApiOpt],
clear: Option<&Color>, clear: Option<&Color>,
) -> Result<Option<SyncFile>, RenderError> { ) -> Result<Option<SyncFile>, RenderError> {
let gles = self.ctx.ctx.dpy.gles; let gles = self.ctx.ctx.dpy.gles;
self.ctx.ctx.with_current(|| { self.ctx.ctx.with_current(|| {
handle_explicit_sync(&self.ctx, self.gl.rb._img.as_ref(), &acquire_sync);
unsafe { unsafe {
(gles.glBindFramebuffer)(GL_FRAMEBUFFER, self.gl.fbo); (gles.glBindFramebuffer)(GL_FRAMEBUFFER, self.gl.fbo);
(gles.glViewport)(0, 0, self.gl.width, self.gl.height); (gles.glViewport)(0, 0, self.gl.width, self.gl.height);
@ -101,10 +104,12 @@ impl GfxFramebuffer for Framebuffer {
fn render( fn render(
&self, &self,
acquire_sync: AcquireSync,
_release_sync: ReleaseSync,
ops: &[GfxApiOpt], ops: &[GfxApiOpt],
clear: Option<&Color>, clear: Option<&Color>,
) -> Result<Option<SyncFile>, GfxError> { ) -> Result<Option<SyncFile>, GfxError> {
self.render(ops, clear).map_err(|e| e.into()) self.render(acquire_sync, ops, clear).map_err(|e| e.into())
} }
fn copy_to_shm( fn copy_to_shm(

View file

@ -86,8 +86,8 @@ impl VulkanDevice {
drm: &Drm, drm: &Drm,
) -> Result<VulkanBoAllocator, VulkanError> { ) -> Result<VulkanBoAllocator, VulkanError> {
let allocator = self.create_allocator()?; let allocator = self.create_allocator()?;
let pool = self.create_command_pool()?; let pool = self.create_command_pool(self.graphics_queue_idx)?;
let command_buffer = pool.allocate_buffer()?; let command_buffer = pool.allocate()?;
let drm = drm.dup_render().map_err(VulkanError::DupDrm)?; let drm = drm.dup_render().map_err(VulkanError::DupDrm)?;
Ok(VulkanBoAllocator { Ok(VulkanBoAllocator {
data: Rc::new(VulkanBoAllocatorData { data: Rc::new(VulkanBoAllocatorData {

View file

@ -1,5 +1,5 @@
use { use {
crate::gfx_apis::vulkan::{device::VulkanDevice, VulkanError}, crate::gfx_apis::vulkan::{device::VulkanDevice, renderer::CachedCommandBuffers, VulkanError},
ash::vk::{ ash::vk::{
CommandBuffer, CommandBufferAllocateInfo, CommandBufferLevel, CommandPool, CommandBuffer, CommandBufferAllocateInfo, CommandBufferLevel, CommandPool,
CommandPoolCreateFlags, CommandPoolCreateInfo, CommandPoolCreateFlags, CommandPoolCreateInfo,
@ -53,17 +53,24 @@ impl VulkanCommandPool {
} }
impl VulkanDevice { impl VulkanDevice {
pub fn create_command_pool(self: &Rc<Self>) -> Result<Rc<VulkanCommandPool>, VulkanError> { pub fn create_command_pool(
self: &Rc<Self>,
queue: u32,
) -> Result<CachedCommandBuffers, VulkanError> {
let info = CommandPoolCreateInfo::default() let info = CommandPoolCreateInfo::default()
.queue_family_index(self.graphics_queue_idx) .queue_family_index(queue)
.flags( .flags(
CommandPoolCreateFlags::TRANSIENT | CommandPoolCreateFlags::RESET_COMMAND_BUFFER, CommandPoolCreateFlags::TRANSIENT | CommandPoolCreateFlags::RESET_COMMAND_BUFFER,
); );
let pool = unsafe { self.device.create_command_pool(&info, None) }; let pool = unsafe { self.device.create_command_pool(&info, None) };
let pool = pool.map_err(VulkanError::AllocateCommandPool)?; let pool = pool.map_err(VulkanError::AllocateCommandPool)?;
Ok(Rc::new(VulkanCommandPool { Ok(CachedCommandBuffers {
device: self.clone(), pool: Rc::new(VulkanCommandPool {
pool, device: self.clone(),
})) pool,
}),
buffers: Default::default(),
total_buffers: Default::default(),
})
} }
} }

View file

@ -63,6 +63,9 @@ pub struct VulkanDevice {
pub(super) memory_types: ArrayVec<MemoryType, MAX_MEMORY_TYPES>, pub(super) memory_types: ArrayVec<MemoryType, MAX_MEMORY_TYPES>,
pub(super) graphics_queue: Queue, pub(super) graphics_queue: Queue,
pub(super) graphics_queue_idx: u32, pub(super) graphics_queue_idx: u32,
pub(super) transfer_queue: Option<Queue>,
pub(super) distinct_transfer_queue_family_idx: Option<u32>,
pub(super) transfer_granularity_mask: (u32, u32),
} }
impl Drop for VulkanDevice { impl Drop for VulkanDevice {
@ -185,16 +188,59 @@ impl VulkanInstance {
Err(VulkanError::NoDeviceFound(dev)) Err(VulkanError::NoDeviceFound(dev))
} }
fn find_graphics_queue(&self, phy_dev: PhysicalDevice) -> Result<u32, VulkanError> { fn find_queues(
&self,
phy_dev: PhysicalDevice,
) -> Result<(u32, Option<(u32, u32, u32)>), VulkanError> {
let props = unsafe { let props = unsafe {
self.instance self.instance
.get_physical_device_queue_family_properties(phy_dev) .get_physical_device_queue_family_properties(phy_dev)
}; };
props let gfx_queue = props
.iter() .iter()
.position(|p| p.queue_flags.contains(QueueFlags::GRAPHICS)) .position(|p| p.queue_flags.contains(QueueFlags::GRAPHICS))
.map(|v| v as _) .ok_or(VulkanError::NoGraphicsQueue)?;
.ok_or(VulkanError::NoGraphicsQueue) let transfer_queue = 'transfer: {
let mut transfer_only = None;
let mut compute_only = None;
let mut separate_gfx = None;
for (idx, props) in props.iter().enumerate() {
if idx == gfx_queue {
continue;
}
let g = &props.min_image_transfer_granularity;
if g.width == 0 || g.height == 0 {
continue;
}
let f = props.queue_flags;
use QueueFlags as F;
if !f.intersects(F::GRAPHICS | F::COMPUTE) && f.intersects(F::TRANSFER) {
transfer_only = Some(idx);
} else if !f.intersects(F::GRAPHICS) && f.intersects(F::COMPUTE) {
compute_only = Some(idx);
} else if f.intersects(F::GRAPHICS) {
separate_gfx = Some(idx);
}
}
if let Some(idx) = transfer_only.or(compute_only).or(separate_gfx) {
break 'transfer Some(idx);
}
if props[gfx_queue].queue_count > 1 {
break 'transfer Some(gfx_queue);
}
None
};
let mut width_mask = 0;
let mut height_mask = 0;
if let Some(idx) = transfer_queue {
let g = &props[idx].min_image_transfer_granularity;
width_mask = g.width.wrapping_sub(1);
height_mask = g.height.wrapping_sub(1);
}
Ok((
gfx_queue as _,
transfer_queue.map(|v| (v as _, width_mask, height_mask)),
))
} }
fn supports_semaphore_import(&self, phy_dev: PhysicalDevice) -> bool { fn supports_semaphore_import(&self, phy_dev: PhysicalDevice) -> bool {
@ -224,7 +270,15 @@ impl VulkanInstance {
return Err(VulkanError::MissingDeviceExtension(ext)); return Err(VulkanError::MissingDeviceExtension(ext));
} }
} }
let graphics_queue_idx = self.find_graphics_queue(phy_dev)?; let (graphics_queue_family_idx, transfer_queue_family) = self.find_queues(phy_dev)?;
let mut distinct_transfer_queue_family_idx = None;
let mut transfer_granularity_mask = (0, 0);
if let Some((idx, width_mask, height_mask)) = transfer_queue_family {
if idx != graphics_queue_family_idx {
distinct_transfer_queue_family_idx = Some(idx);
}
transfer_granularity_mask = (width_mask, height_mask);
}
if !self.supports_semaphore_import(phy_dev) { if !self.supports_semaphore_import(phy_dev) {
return Err(VulkanError::SyncobjImport); return Err(VulkanError::SyncobjImport);
} }
@ -238,14 +292,24 @@ impl VulkanInstance {
PhysicalDeviceSynchronization2Features::default().synchronization2(true); PhysicalDeviceSynchronization2Features::default().synchronization2(true);
let mut dynamic_rendering_features = let mut dynamic_rendering_features =
PhysicalDeviceDynamicRenderingFeatures::default().dynamic_rendering(true); PhysicalDeviceDynamicRenderingFeatures::default().dynamic_rendering(true);
let queue_create_info = DeviceQueueCreateInfo::default() let mut queue_create_infos = ArrayVec::<_, 2>::new();
.queue_family_index(graphics_queue_idx) queue_create_infos.push(
.queue_priorities(&[1.0]); DeviceQueueCreateInfo::default()
.queue_family_index(graphics_queue_family_idx)
.queue_priorities(&[1.0]),
);
if let Some((tq, _, _)) = transfer_queue_family {
queue_create_infos.push(
DeviceQueueCreateInfo::default()
.queue_family_index(tq)
.queue_priorities(&[1.0]),
);
}
let device_create_info = DeviceCreateInfo::default() let device_create_info = DeviceCreateInfo::default()
.push_next(&mut semaphore_features) .push_next(&mut semaphore_features)
.push_next(&mut synchronization2_features) .push_next(&mut synchronization2_features)
.push_next(&mut dynamic_rendering_features) .push_next(&mut dynamic_rendering_features)
.queue_create_infos(std::slice::from_ref(&queue_create_info)) .queue_create_infos(&queue_create_infos)
.enabled_extension_names(&enabled_extensions); .enabled_extension_names(&enabled_extensions);
let device = unsafe { let device = unsafe {
self.instance self.instance
@ -286,7 +350,14 @@ impl VulkanInstance {
.iter() .iter()
.copied() .copied()
.collect(); .collect();
let graphics_queue = unsafe { device.get_device_queue(graphics_queue_idx, 0) }; let graphics_queue = unsafe { device.get_device_queue(graphics_queue_family_idx, 0) };
let transfer_queue = transfer_queue_family.map(|(family_idx, _, _)| {
let queue_idx = match family_idx == graphics_queue_family_idx {
true => 1,
false => 0,
};
unsafe { device.get_device_queue(family_idx, queue_idx) }
});
Ok(Rc::new(VulkanDevice { Ok(Rc::new(VulkanDevice {
physical_device: phy_dev, physical_device: phy_dev,
render_node, render_node,
@ -302,7 +373,10 @@ impl VulkanInstance {
formats, formats,
memory_types, memory_types,
graphics_queue, graphics_queue,
graphics_queue_idx, graphics_queue_idx: graphics_queue_family_idx,
transfer_queue,
distinct_transfer_queue_family_idx,
transfer_granularity_mask,
})) }))
} }
} }

View file

@ -3,9 +3,9 @@ use {
clientmem::ClientMemOffset, clientmem::ClientMemOffset,
format::Format, format::Format,
gfx_api::{ gfx_api::{
AsyncShmGfxTexture, AsyncShmGfxTextureCallback, AsyncShmGfxTextureUploadCancellable, AcquireSync, AsyncShmGfxTexture, AsyncShmGfxTextureCallback,
GfxApiOpt, GfxError, GfxFramebuffer, GfxImage, GfxTexture, PendingShmUpload, AsyncShmGfxTextureUploadCancellable, GfxApiOpt, GfxError, GfxFramebuffer, GfxImage,
ShmGfxTexture, SyncFile, GfxTexture, PendingShmUpload, ReleaseSync, ShmGfxTexture, SyncFile,
}, },
gfx_apis::vulkan::{ gfx_apis::vulkan::{
allocator::VulkanAllocation, device::VulkanDevice, format::VulkanModifierLimits, allocator::VulkanAllocation, device::VulkanDevice, format::VulkanModifierLimits,
@ -58,10 +58,41 @@ pub struct VulkanImage {
pub(super) image: Image, pub(super) image: Image,
pub(super) is_undefined: Cell<bool>, pub(super) is_undefined: Cell<bool>,
pub(super) contents_are_undefined: Cell<bool>, pub(super) contents_are_undefined: Cell<bool>,
pub(super) queue_state: Cell<QueueState>,
pub(super) ty: VulkanImageMemory, pub(super) ty: VulkanImageMemory,
pub(super) bridge: Option<VulkanFramebufferBridge>, pub(super) bridge: Option<VulkanFramebufferBridge>,
} }
/// Queue-related state of an image, stored per image and consulted through
/// [`QueueState::acquire`] before the image is used on a queue family.
///
/// NOTE(review): presumably mirrors Vulkan queue family ownership of the
/// image; confirm against the code that writes this state.
#[derive(Copy, Clone, Eq, PartialEq, Debug)]
pub enum QueueState {
    /// The image is already acquired by `family`.
    Acquired { family: QueueFamily },
    /// No family can acquire the image while it is in this state.
    Releasing,
    /// The image has been released and can be acquired by `to` only.
    Released { to: QueueFamily },
}

/// The queue families distinguished by [`QueueState`].
#[derive(Copy, Clone, Eq, PartialEq, Debug)]
pub enum QueueFamily {
    Gfx,
    Transfer,
}

impl QueueState {
    /// Reports what it takes for queue family `new` to use an image that is
    /// currently in state `self`.
    ///
    /// * `Acquired` by `new` itself: [`QueueTransfer::Unnecessary`].
    /// * `Released` to `new`: [`QueueTransfer::Possible`].
    /// * Anything else (other family, or `Releasing`):
    ///   [`QueueTransfer::Impossible`].
    pub fn acquire(self, new: QueueFamily) -> QueueTransfer {
        // Struct literals must be parenthesized in `if` conditions.
        if self == (QueueState::Acquired { family: new }) {
            return QueueTransfer::Unnecessary;
        }
        if self == (QueueState::Released { to: new }) {
            return QueueTransfer::Possible;
        }
        QueueTransfer::Impossible
    }
}

/// Outcome of [`QueueState::acquire`].
#[derive(Copy, Clone, Eq, PartialEq, Debug)]
pub enum QueueTransfer {
    /// The requesting family already has the image acquired.
    Unnecessary,
    /// The image was released to the requesting family and can be acquired.
    Possible,
    /// The requesting family cannot acquire the image in its current state.
    Impossible,
}
pub enum VulkanImageMemory { pub enum VulkanImageMemory {
DmaBuf(VulkanDmaBufImage), DmaBuf(VulkanDmaBufImage),
Internal(VulkanShmImage), Internal(VulkanShmImage),
@ -384,6 +415,9 @@ impl VulkanDmaBufImageTemplate {
format: self.dmabuf.format, format: self.dmabuf.format,
is_undefined: Cell::new(true), is_undefined: Cell::new(true),
contents_are_undefined: Cell::new(false), contents_are_undefined: Cell::new(false),
queue_state: Cell::new(QueueState::Acquired {
family: QueueFamily::Gfx,
}),
bridge, bridge,
})) }))
} }
@ -465,11 +499,13 @@ impl GfxFramebuffer for VulkanImage {
fn render( fn render(
&self, &self,
acquire_sync: AcquireSync,
release_sync: ReleaseSync,
ops: &[GfxApiOpt], ops: &[GfxApiOpt],
clear: Option<&Color>, clear: Option<&Color>,
) -> Result<Option<SyncFile>, GfxError> { ) -> Result<Option<SyncFile>, GfxError> {
self.renderer self.renderer
.execute(self, ops, clear) .execute(self, acquire_sync, release_sync, ops, clear)
.map_err(|e| e.into()) .map_err(|e| e.into())
} }

View file

@ -13,7 +13,7 @@ use {
descriptor::VulkanDescriptorSetLayout, descriptor::VulkanDescriptorSetLayout,
device::VulkanDevice, device::VulkanDevice,
fence::VulkanFence, fence::VulkanFence,
image::{VulkanImage, VulkanImageMemory}, image::{QueueFamily, QueueState, QueueTransfer, VulkanImage, VulkanImageMemory},
pipeline::{PipelineCreateInfo, VulkanPipeline}, pipeline::{PipelineCreateInfo, VulkanPipeline},
semaphore::VulkanSemaphore, semaphore::VulkanSemaphore,
shaders::{ shaders::{
@ -60,13 +60,12 @@ pub struct VulkanRenderer {
pub(super) formats: Rc<AHashMap<u32, GfxFormat>>, pub(super) formats: Rc<AHashMap<u32, GfxFormat>>,
pub(super) device: Rc<VulkanDevice>, pub(super) device: Rc<VulkanDevice>,
pub(super) pipelines: CopyHashMap<vk::Format, Rc<VulkanFormatPipelines>>, pub(super) pipelines: CopyHashMap<vk::Format, Rc<VulkanFormatPipelines>>,
pub(super) command_pool: Rc<VulkanCommandPool>, pub(super) gfx_command_buffers: CachedCommandBuffers,
pub(super) command_buffers: Stack<Rc<VulkanCommandBuffer>>, pub(super) transfer_command_buffers: Option<CachedCommandBuffers>,
pub(super) wait_semaphores: Stack<Rc<VulkanSemaphore>>, pub(super) wait_semaphores: Stack<Rc<VulkanSemaphore>>,
pub(super) total_buffers: NumCell<usize>,
pub(super) memory: RefCell<Memory>, pub(super) memory: RefCell<Memory>,
pub(super) pending_frames: CopyHashMap<u64, Rc<PendingFrame>>, pub(super) pending_frames: CopyHashMap<u64, Rc<PendingFrame>>,
pub(super) pending_uploads: CopyHashMap<u64, SpawnedFuture<()>>, pub(super) pending_submits: CopyHashMap<u64, SpawnedFuture<()>>,
pub(super) allocator: Rc<VulkanAllocator>, pub(super) allocator: Rc<VulkanAllocator>,
pub(super) last_point: NumCell<u64>, pub(super) last_point: NumCell<u64>,
pub(super) buffer_resv_user: BufferResvUser, pub(super) buffer_resv_user: BufferResvUser,
@ -84,6 +83,26 @@ pub struct VulkanRenderer {
pub(super) shm_allocator: Rc<VulkanThreadedAllocator>, pub(super) shm_allocator: Rc<VulkanThreadedAllocator>,
} }
/// A command pool together with a stack of command buffers that `allocate`
/// hands out before falling back to the pool.
pub(super) struct CachedCommandBuffers {
/// Pool that `allocate` asks for a new buffer when `buffers` is empty.
pub(super) pool: Rc<VulkanCommandPool>,
/// Buffers that `allocate` pops from first.
/// NOTE(review): presumably buffers are pushed back here once they are no
/// longer in use; the code doing so is not visible here, confirm.
pub(super) buffers: Stack<Rc<VulkanCommandBuffer>>,
/// Incremented by `allocate` each time it requests a new buffer from `pool`.
pub(super) total_buffers: NumCell<usize>,
}
impl CachedCommandBuffers {
    /// Returns a command buffer, preferring one popped from `buffers`.
    ///
    /// When `buffers` is empty, `total_buffers` is incremented and a new
    /// buffer is requested from `pool`.
    ///
    /// # Errors
    ///
    /// Propagates the error from `pool.allocate_buffer()`. The counter has
    /// already been incremented at that point.
    pub(super) fn allocate(&self) -> Result<Rc<VulkanCommandBuffer>, VulkanError> {
        zone!("allocate_command_buffer");
        if let Some(cached) = self.buffers.pop() {
            return Ok(cached);
        }
        // Count the buffer before requesting it, as the original did.
        self.total_buffers.fetch_add(1);
        let fresh = self.pool.allocate_buffer()?;
        Ok(fresh)
    }
}
pub(super) struct UsedTexture { pub(super) struct UsedTexture {
tex: Rc<VulkanImage>, tex: Rc<VulkanImage>,
resv: Option<Rc<dyn BufferResv>>, resv: Option<Rc<dyn BufferResv>>,
@ -105,7 +124,8 @@ pub(super) enum TexSourceType {
#[derive(Default)] #[derive(Default)]
pub(super) struct Memory { pub(super) struct Memory {
sample: Vec<Rc<VulkanImage>>, dmabuf_sample: Vec<Rc<VulkanImage>>,
queue_transfer: Vec<Rc<VulkanImage>>,
textures: Vec<UsedTexture>, textures: Vec<UsedTexture>,
image_barriers: Vec<ImageMemoryBarrier2<'static>>, image_barriers: Vec<ImageMemoryBarrier2<'static>>,
wait_semaphores: Vec<Rc<VulkanSemaphore>>, wait_semaphores: Vec<Rc<VulkanSemaphore>>,
@ -143,7 +163,11 @@ impl VulkanDevice {
let tex_frag_shader = self.create_shader(TEX_FRAG)?; let tex_frag_shader = self.create_shader(TEX_FRAG)?;
let tex_frag_mult_opaque_shader = self.create_shader(TEX_FRAG_MULT_OPAQUE)?; let tex_frag_mult_opaque_shader = self.create_shader(TEX_FRAG_MULT_OPAQUE)?;
let tex_frag_mult_alpha_shader = self.create_shader(TEX_FRAG_MULT_ALPHA)?; let tex_frag_mult_alpha_shader = self.create_shader(TEX_FRAG_MULT_ALPHA)?;
let command_pool = self.create_command_pool()?; let gfx_command_buffers = self.create_command_pool(self.graphics_queue_idx)?;
let transfer_command_buffers = self
.distinct_transfer_queue_family_idx
.map(|idx| self.create_command_pool(idx))
.transpose()?;
let formats: AHashMap<u32, _> = self let formats: AHashMap<u32, _> = self
.formats .formats
.iter() .iter()
@ -181,13 +205,12 @@ impl VulkanDevice {
formats: Rc::new(formats), formats: Rc::new(formats),
device: self.clone(), device: self.clone(),
pipelines: Default::default(), pipelines: Default::default(),
command_pool, gfx_command_buffers,
command_buffers: Default::default(), transfer_command_buffers,
wait_semaphores: Default::default(), wait_semaphores: Default::default(),
total_buffers: Default::default(),
memory: Default::default(), memory: Default::default(),
pending_frames: Default::default(), pending_frames: Default::default(),
pending_uploads: Default::default(), pending_submits: Default::default(),
allocator, allocator,
last_point: Default::default(), last_point: Default::default(),
buffer_resv_user: Default::default(), buffer_resv_user: Default::default(),
@ -276,15 +299,21 @@ impl VulkanRenderer {
fn collect_memory(&self, opts: &[GfxApiOpt]) { fn collect_memory(&self, opts: &[GfxApiOpt]) {
zone!("collect_memory"); zone!("collect_memory");
let mut memory = self.memory.borrow_mut(); let mut memory = self.memory.borrow_mut();
memory.sample.clear(); memory.dmabuf_sample.clear();
memory.queue_transfer.clear();
for cmd in opts { for cmd in opts {
if let GfxApiOpt::CopyTexture(c) = cmd { if let GfxApiOpt::CopyTexture(c) = cmd {
let tex = c.tex.clone().into_vk(&self.device.device); let tex = c.tex.clone().into_vk(&self.device.device);
if tex.contents_are_undefined.get() { if tex.contents_are_undefined.get() {
continue; continue;
} }
match tex.queue_state.get().acquire(QueueFamily::Gfx) {
QueueTransfer::Unnecessary => {}
QueueTransfer::Possible => memory.queue_transfer.push(tex.clone()),
QueueTransfer::Impossible => continue,
}
if let VulkanImageMemory::DmaBuf(_) = &tex.ty { if let VulkanImageMemory::DmaBuf(_) = &tex.ty {
memory.sample.push(tex.clone()) memory.dmabuf_sample.push(tex.clone())
} }
memory.textures.push(UsedTexture { memory.textures.push(UsedTexture {
tex, tex,
@ -340,7 +369,7 @@ impl VulkanRenderer {
}); });
} }
memory.image_barriers.push(fb_image_memory_barrier); memory.image_barriers.push(fb_image_memory_barrier);
for img in &memory.sample { for img in &memory.dmabuf_sample {
let image_memory_barrier = image_barrier() let image_memory_barrier = image_barrier()
.src_queue_family_index(QUEUE_FAMILY_FOREIGN_EXT) .src_queue_family_index(QUEUE_FAMILY_FOREIGN_EXT)
.dst_queue_family_index(self.device.graphics_queue_idx) .dst_queue_family_index(self.device.graphics_queue_idx)
@ -351,6 +380,19 @@ impl VulkanRenderer {
.dst_stage_mask(PipelineStageFlags2::FRAGMENT_SHADER); .dst_stage_mask(PipelineStageFlags2::FRAGMENT_SHADER);
memory.image_barriers.push(image_memory_barrier); memory.image_barriers.push(image_memory_barrier);
} }
if let Some(family_idx) = self.device.distinct_transfer_queue_family_idx {
for img in &memory.queue_transfer {
let image_memory_barrier = image_barrier()
.src_queue_family_index(family_idx)
.dst_queue_family_index(self.device.graphics_queue_idx)
.image(img.image)
.dst_access_mask(AccessFlags2::SHADER_SAMPLED_READ)
.dst_stage_mask(PipelineStageFlags2::FRAGMENT_SHADER)
.old_layout(ImageLayout::TRANSFER_DST_OPTIMAL)
.new_layout(ImageLayout::SHADER_READ_ONLY_OPTIMAL);
memory.image_barriers.push(image_memory_barrier);
}
}
let dep_info = DependencyInfoKHR::default().image_memory_barriers(&memory.image_barriers); let dep_info = DependencyInfoKHR::default().image_memory_barriers(&memory.image_barriers);
unsafe { unsafe {
self.device.device.cmd_pipeline_barrier2(buf, &dep_info); self.device.device.cmd_pipeline_barrier2(buf, &dep_info);
@ -471,6 +513,11 @@ impl VulkanRenderer {
log::warn!("Ignoring undefined texture"); log::warn!("Ignoring undefined texture");
continue; continue;
} }
if tex.queue_state.get().acquire(QueueFamily::Gfx) == QueueTransfer::Impossible
{
log::warn!("Ignoring texture owned by different queue");
continue;
}
let copy_type = match c.alpha.is_some() { let copy_type = match c.alpha.is_some() {
true => TexCopyType::Multiply, true => TexCopyType::Multiply,
false => TexCopyType::Identity, false => TexCopyType::Identity,
@ -616,7 +663,7 @@ impl VulkanRenderer {
.src_stage_mask(PipelineStageFlags2::COLOR_ATTACHMENT_OUTPUT); .src_stage_mask(PipelineStageFlags2::COLOR_ATTACHMENT_OUTPUT);
} }
memory.image_barriers.push(fb_image_memory_barrier); memory.image_barriers.push(fb_image_memory_barrier);
for img in &memory.sample { for img in &memory.dmabuf_sample {
let image_memory_barrier = image_barrier() let image_memory_barrier = image_barrier()
.src_queue_family_index(self.device.graphics_queue_idx) .src_queue_family_index(self.device.graphics_queue_idx)
.dst_queue_family_index(QUEUE_FAMILY_FOREIGN_EXT) .dst_queue_family_index(QUEUE_FAMILY_FOREIGN_EXT)
@ -643,7 +690,11 @@ impl VulkanRenderer {
} }
} }
fn create_wait_semaphores(&self, fb: &VulkanImage) -> Result<(), VulkanError> { fn create_wait_semaphores(
&self,
fb: &VulkanImage,
fb_acquire_sync: &AcquireSync,
) -> Result<(), VulkanError> {
zone!("create_wait_semaphores"); zone!("create_wait_semaphores");
let mut memory = self.memory.borrow_mut(); let mut memory = self.memory.borrow_mut();
let memory = &mut *memory; let memory = &mut *memory;
@ -699,13 +750,13 @@ impl VulkanRenderer {
&mut memory.wait_semaphore_infos, &mut memory.wait_semaphore_infos,
&mut memory.wait_semaphores, &mut memory.wait_semaphores,
fb, fb,
&AcquireSync::Implicit, fb_acquire_sync,
DMA_BUF_SYNC_WRITE, DMA_BUF_SYNC_WRITE,
)?; )?;
Ok(()) Ok(())
} }
fn import_release_semaphore(&self, fb: &VulkanImage) { fn import_release_semaphore(&self, fb: &VulkanImage, fb_release_sync: ReleaseSync) {
zone!("import_release_semaphore"); zone!("import_release_semaphore");
let memory = &mut *self.memory.borrow_mut(); let memory = &mut *self.memory.borrow_mut();
let sync_file = match memory.release_sync_file.as_ref() { let sync_file = match memory.release_sync_file.as_ref() {
@ -728,6 +779,8 @@ impl VulkanRenderer {
} }
} }
}; };
let attach_async_shm_sync_file = self.device.transfer_queue.is_some()
&& self.device.distinct_transfer_queue_family_idx.is_none();
for texture in &mut memory.textures { for texture in &mut memory.textures {
import( import(
&texture.tex, &texture.tex,
@ -735,8 +788,15 @@ impl VulkanRenderer {
texture.resv.take(), texture.resv.take(),
DMA_BUF_SYNC_READ, DMA_BUF_SYNC_READ,
); );
if attach_async_shm_sync_file {
if let VulkanImageMemory::Internal(shm) = &texture.tex.ty {
if let Some(data) = &shm.async_data {
data.last_sample.set(Some(sync_file.clone()));
}
}
}
} }
import(fb, ReleaseSync::Implicit, None, DMA_BUF_SYNC_WRITE); import(fb, fb_release_sync, None, DMA_BUF_SYNC_WRITE);
} }
fn submit(&self, buf: CommandBuffer) -> Result<(), VulkanError> { fn submit(&self, buf: CommandBuffer) -> Result<(), VulkanError> {
@ -773,6 +833,12 @@ impl VulkanRenderer {
fn store_layouts(&self, fb: &VulkanImage) { fn store_layouts(&self, fb: &VulkanImage) {
fb.is_undefined.set(false); fb.is_undefined.set(false);
let memory = self.memory.borrow();
for img in &*memory.queue_transfer {
img.queue_state.set(QueueState::Acquired {
family: QueueFamily::Gfx,
});
}
} }
fn create_pending_frame(self: &Rc<Self>, buf: Rc<VulkanCommandBuffer>) { fn create_pending_frame(self: &Rc<Self>, buf: Rc<VulkanCommandBuffer>) {
@ -838,7 +904,10 @@ impl VulkanRenderer {
)?; )?;
(&*tmp_tex as &dyn GfxFramebuffer) (&*tmp_tex as &dyn GfxFramebuffer)
.copy_texture( .copy_texture(
AcquireSync::None,
ReleaseSync::None,
&(tex.clone() as _), &(tex.clone() as _),
None,
AcquireSync::None, AcquireSync::None,
ReleaseSync::None, ReleaseSync::None,
x, x,
@ -925,7 +994,7 @@ impl VulkanRenderer {
final_barriers = final_barriers =
final_barriers.image_memory_barriers(slice::from_ref(&final_tex_barrier)); final_barriers.image_memory_barriers(slice::from_ref(&final_tex_barrier));
} }
let buf = self.allocate_command_buffer()?; let buf = self.gfx_command_buffers.allocate()?;
let mut semaphores = vec![]; let mut semaphores = vec![];
let mut semaphore_infos = vec![]; let mut semaphore_infos = vec![];
if let VulkanImageMemory::DmaBuf(buf) = &tex.ty { if let VulkanImageMemory::DmaBuf(buf) = &tex.ty {
@ -979,7 +1048,7 @@ impl VulkanRenderer {
.map_err(VulkanError::Submit)?; .map_err(VulkanError::Submit)?;
} }
self.block(); self.block();
self.command_buffers.push(buf); self.gfx_command_buffers.buffers.push(buf);
for semaphore in semaphores { for semaphore in semaphores {
self.wait_semaphores.push(semaphore); self.wait_semaphores.push(semaphore);
} }
@ -992,15 +1061,18 @@ impl VulkanRenderer {
pub fn execute( pub fn execute(
self: &Rc<Self>, self: &Rc<Self>,
fb: &VulkanImage, fb: &VulkanImage,
fb_acquire_sync: AcquireSync,
fb_release_sync: ReleaseSync,
opts: &[GfxApiOpt], opts: &[GfxApiOpt],
clear: Option<&Color>, clear: Option<&Color>,
) -> Result<Option<SyncFile>, VulkanError> { ) -> Result<Option<SyncFile>, VulkanError> {
zone!("execute"); zone!("execute");
let res = self.try_execute(fb, opts, clear); let res = self.try_execute(fb, fb_acquire_sync, fb_release_sync, opts, clear);
let sync_file = { let sync_file = {
let mut memory = self.memory.borrow_mut(); let mut memory = self.memory.borrow_mut();
memory.textures.clear(); memory.textures.clear();
memory.sample.clear(); memory.dmabuf_sample.clear();
memory.queue_transfer.clear();
memory.wait_semaphores.clear(); memory.wait_semaphores.clear();
memory.release_fence.take(); memory.release_fence.take();
memory.release_sync_file.take() memory.release_sync_file.take()
@ -1008,18 +1080,6 @@ impl VulkanRenderer {
res.map(|_| sync_file) res.map(|_| sync_file)
} }
/// Hands out a command buffer for recording.
///
/// A buffer previously returned to `self.command_buffers` is reused when one
/// is available. Otherwise `total_buffers` is incremented and a new buffer is
/// requested from `self.command_pool`.
///
/// # Errors
///
/// Propagates the error of `command_pool.allocate_buffer()` when a new buffer
/// has to be created and that call fails.
pub(super) fn allocate_command_buffer(&self) -> Result<Rc<VulkanCommandBuffer>, VulkanError> {
    zone!("allocate_command_buffer");
    // Fast path: recycle an idle buffer.
    if let Some(recycled) = self.command_buffers.pop() {
        return Ok(recycled);
    }
    // Slow path: the counter is bumped before the allocation is attempted.
    self.total_buffers.fetch_add(1);
    let fresh = self.command_pool.allocate_buffer()?;
    Ok(fresh)
}
fn allocate_semaphore(&self) -> Result<Rc<VulkanSemaphore>, VulkanError> { fn allocate_semaphore(&self) -> Result<Rc<VulkanSemaphore>, VulkanError> {
zone!("allocate_semaphore"); zone!("allocate_semaphore");
let semaphore = match self.wait_semaphores.pop() { let semaphore = match self.wait_semaphores.pop() {
@ -1032,11 +1092,13 @@ impl VulkanRenderer {
fn try_execute( fn try_execute(
self: &Rc<Self>, self: &Rc<Self>,
fb: &VulkanImage, fb: &VulkanImage,
fb_acquire_sync: AcquireSync,
fb_release_sync: ReleaseSync,
opts: &[GfxApiOpt], opts: &[GfxApiOpt],
clear: Option<&Color>, clear: Option<&Color>,
) -> Result<(), VulkanError> { ) -> Result<(), VulkanError> {
self.check_defunct()?; self.check_defunct()?;
let buf = self.allocate_command_buffer()?; let buf = self.gfx_command_buffers.allocate()?;
self.collect_memory(opts); self.collect_memory(opts);
self.begin_command_buffer(buf.buffer)?; self.begin_command_buffer(buf.buffer)?;
self.initial_barriers(buf.buffer, fb); self.initial_barriers(buf.buffer, fb);
@ -1047,9 +1109,9 @@ impl VulkanRenderer {
self.copy_bridge_to_dmabuf(buf.buffer, fb); self.copy_bridge_to_dmabuf(buf.buffer, fb);
self.final_barriers(buf.buffer, fb); self.final_barriers(buf.buffer, fb);
self.end_command_buffer(buf.buffer)?; self.end_command_buffer(buf.buffer)?;
self.create_wait_semaphores(fb)?; self.create_wait_semaphores(fb, &fb_acquire_sync)?;
self.submit(buf.buffer)?; self.submit(buf.buffer)?;
self.import_release_semaphore(fb); self.import_release_semaphore(fb, fb_release_sync);
self.store_layouts(fb); self.store_layouts(fb);
self.create_pending_frame(buf); self.create_pending_frame(buf);
Ok(()) Ok(())
@ -1067,7 +1129,7 @@ impl VulkanRenderer {
pub fn on_drop(&self) { pub fn on_drop(&self) {
self.defunct.set(true); self.defunct.set(true);
let mut pending_frames = self.pending_frames.lock(); let mut pending_frames = self.pending_frames.lock();
let mut pending_uploads = self.pending_uploads.lock(); let mut pending_uploads = self.pending_submits.lock();
if pending_frames.is_not_empty() || pending_uploads.is_not_empty() { if pending_frames.is_not_empty() || pending_uploads.is_not_empty() {
log::warn!("Context dropped with pending frames."); log::warn!("Context dropped with pending frames.");
self.block(); self.block();
@ -1153,7 +1215,7 @@ async fn await_release(
frame.renderer.block(); frame.renderer.block();
} }
if let Some(buf) = frame.cmd.take() { if let Some(buf) = frame.cmd.take() {
frame.renderer.command_buffers.push(buf); frame.renderer.gfx_command_buffers.buffers.push(buf);
} }
for wait_semaphore in frame.wait_semaphores.take() { for wait_semaphore in frame.wait_semaphores.take() {
frame.renderer.wait_semaphores.push(wait_semaphore); frame.renderer.wait_semaphores.push(wait_semaphore);

View file

@ -14,7 +14,7 @@ use {
allocator::VulkanAllocation, allocator::VulkanAllocation,
command::VulkanCommandBuffer, command::VulkanCommandBuffer,
fence::VulkanFence, fence::VulkanFence,
image::{VulkanImage, VulkanImageMemory}, image::{QueueFamily, QueueState, QueueTransfer, VulkanImage, VulkanImageMemory},
renderer::{image_barrier, VulkanRenderer}, renderer::{image_barrier, VulkanRenderer},
staging::VulkanStagingBuffer, staging::VulkanStagingBuffer,
VulkanError, VulkanError,
@ -22,9 +22,10 @@ use {
rect::{Rect, Region}, rect::{Rect, Region},
utils::{clonecell::CloneCell, errorfmt::ErrorFmt, on_drop::OnDrop}, utils::{clonecell::CloneCell, errorfmt::ErrorFmt, on_drop::OnDrop},
}, },
arrayvec::ArrayVec,
ash::vk::{ ash::vk::{
AccessFlags2, BufferImageCopy2, BufferMemoryBarrier2, CommandBufferBeginInfo, AccessFlags2, BufferImageCopy2, BufferMemoryBarrier2, CommandBufferBeginInfo,
CommandBufferSubmitInfo, CommandBufferUsageFlags, CopyBufferToImageInfo2, CommandBufferSubmitInfo, CommandBufferUsageFlags, CopyBufferToImageInfo2, DependencyInfo,
DependencyInfoKHR, DeviceSize, Extent3D, ImageAspectFlags, ImageCreateInfo, ImageLayout, DependencyInfoKHR, DeviceSize, Extent3D, ImageAspectFlags, ImageCreateInfo, ImageLayout,
ImageSubresourceLayers, ImageSubresourceRange, ImageTiling, ImageType, ImageUsageFlags, ImageSubresourceLayers, ImageSubresourceRange, ImageTiling, ImageType, ImageUsageFlags,
ImageViewCreateInfo, ImageViewType, Offset3D, PipelineStageFlags2, SampleCountFlags, ImageViewCreateInfo, ImageViewType, Offset3D, PipelineStageFlags2, SampleCountFlags,
@ -58,6 +59,8 @@ pub struct VulkanShmImageAsyncData {
pub(super) callback_id: Cell<u64>, pub(super) callback_id: Cell<u64>,
pub(super) regions: RefCell<Vec<BufferImageCopy2<'static>>>, pub(super) regions: RefCell<Vec<BufferImageCopy2<'static>>>,
pub(super) cpu: Rc<CpuWorker>, pub(super) cpu: Rc<CpuWorker>,
pub(super) last_sample: Cell<Option<SyncFile>>,
pub(super) data_copied: Cell<bool>,
} }
impl VulkanShmImage { impl VulkanShmImage {
@ -160,7 +163,7 @@ impl VulkanShmImage {
} }
})?; })?;
let Some((cmd, fence, sync_file, point)) = let Some((cmd, fence, sync_file, point)) =
self.submit_buffer_to_image_copy(img, &staging, cpy)? self.submit_buffer_to_image_copy(img, &staging, cpy, false)?
else { else {
return Ok(()); return Ok(());
}; };
@ -168,7 +171,7 @@ impl VulkanShmImage {
"await upload", "await upload",
await_upload(point, img.clone(), cmd, sync_file, fence, staging), await_upload(point, img.clone(), cmd, sync_file, fence, staging),
); );
img.renderer.pending_uploads.set(point, future); img.renderer.pending_submits.set(point, future);
Ok(()) Ok(())
} }
@ -177,6 +180,7 @@ impl VulkanShmImage {
img: &Rc<VulkanImage>, img: &Rc<VulkanImage>,
staging: &VulkanStagingBuffer, staging: &VulkanStagingBuffer,
regions: &[BufferImageCopy2], regions: &[BufferImageCopy2],
use_transfer_queue: bool,
) -> Result<Option<(Rc<VulkanCommandBuffer>, Rc<VulkanFence>, SyncFile, u64)>, VulkanError> ) -> Result<Option<(Rc<VulkanCommandBuffer>, Rc<VulkanFence>, SyncFile, u64)>, VulkanError>
{ {
let memory_barrier = |sam, ssm, dam, dsm| { let memory_barrier = |sam, ssm, dam, dsm| {
@ -189,18 +193,29 @@ impl VulkanShmImage {
.dst_access_mask(dam) .dst_access_mask(dam)
.dst_stage_mask(dsm) .dst_stage_mask(dsm)
}; };
let initial_image_barrier = image_barrier() let mut transfer_queue_family_idx = img.renderer.device.graphics_queue_idx;
if use_transfer_queue {
if let Some(idx) = img.renderer.device.distinct_transfer_queue_family_idx {
transfer_queue_family_idx = idx;
}
}
let mut initial_image_barrier = image_barrier()
.image(img.image) .image(img.image)
.src_access_mask(AccessFlags2::SHADER_SAMPLED_READ) .src_queue_family_index(img.renderer.device.graphics_queue_idx)
.src_stage_mask(PipelineStageFlags2::FRAGMENT_SHADER) .dst_queue_family_index(transfer_queue_family_idx)
.dst_access_mask(AccessFlags2::TRANSFER_WRITE)
.dst_stage_mask(PipelineStageFlags2::TRANSFER)
.old_layout(if img.is_undefined.get() { .old_layout(if img.is_undefined.get() {
ImageLayout::UNDEFINED ImageLayout::UNDEFINED
} else { } else {
ImageLayout::SHADER_READ_ONLY_OPTIMAL ImageLayout::SHADER_READ_ONLY_OPTIMAL
}) })
.new_layout(ImageLayout::TRANSFER_DST_OPTIMAL) .new_layout(ImageLayout::TRANSFER_DST_OPTIMAL);
.dst_access_mask(AccessFlags2::TRANSFER_WRITE) if transfer_queue_family_idx == img.renderer.device.graphics_queue_idx {
.dst_stage_mask(PipelineStageFlags2::TRANSFER); initial_image_barrier = initial_image_barrier
.src_access_mask(AccessFlags2::SHADER_SAMPLED_READ)
.src_stage_mask(PipelineStageFlags2::FRAGMENT_SHADER)
}
let initial_buffer_barrier = memory_barrier( let initial_buffer_barrier = memory_barrier(
AccessFlags2::HOST_WRITE, AccessFlags2::HOST_WRITE,
PipelineStageFlags2::HOST, PipelineStageFlags2::HOST,
@ -210,14 +225,19 @@ impl VulkanShmImage {
let initial_dep_info = DependencyInfoKHR::default() let initial_dep_info = DependencyInfoKHR::default()
.buffer_memory_barriers(slice::from_ref(&initial_buffer_barrier)) .buffer_memory_barriers(slice::from_ref(&initial_buffer_barrier))
.image_memory_barriers(slice::from_ref(&initial_image_barrier)); .image_memory_barriers(slice::from_ref(&initial_image_barrier));
let final_image_barrier = image_barrier() let mut final_image_barrier = image_barrier()
.image(img.image) .image(img.image)
.src_queue_family_index(transfer_queue_family_idx)
.dst_queue_family_index(img.renderer.device.graphics_queue_idx)
.src_access_mask(AccessFlags2::TRANSFER_WRITE) .src_access_mask(AccessFlags2::TRANSFER_WRITE)
.src_stage_mask(PipelineStageFlags2::TRANSFER) .src_stage_mask(PipelineStageFlags2::TRANSFER)
.old_layout(ImageLayout::TRANSFER_DST_OPTIMAL) .old_layout(ImageLayout::TRANSFER_DST_OPTIMAL)
.new_layout(ImageLayout::SHADER_READ_ONLY_OPTIMAL) .new_layout(ImageLayout::SHADER_READ_ONLY_OPTIMAL);
.dst_access_mask(AccessFlags2::SHADER_SAMPLED_READ) if transfer_queue_family_idx == img.renderer.device.graphics_queue_idx {
.dst_stage_mask(PipelineStageFlags2::FRAGMENT_SHADER); final_image_barrier = final_image_barrier
.dst_access_mask(AccessFlags2::SHADER_SAMPLED_READ)
.dst_stage_mask(PipelineStageFlags2::FRAGMENT_SHADER);
}
let final_buffer_barrier = memory_barrier( let final_buffer_barrier = memory_barrier(
AccessFlags2::TRANSFER_READ, AccessFlags2::TRANSFER_READ,
PipelineStageFlags2::TRANSFER, PipelineStageFlags2::TRANSFER,
@ -232,7 +252,10 @@ impl VulkanShmImage {
.dst_image(img.image) .dst_image(img.image)
.dst_image_layout(ImageLayout::TRANSFER_DST_OPTIMAL) .dst_image_layout(ImageLayout::TRANSFER_DST_OPTIMAL)
.regions(regions); .regions(regions);
let cmd = img.renderer.allocate_command_buffer()?; let cmd = match &img.renderer.transfer_command_buffers {
Some(b) if use_transfer_queue => b.allocate()?,
_ => img.renderer.gfx_command_buffers.allocate()?,
};
let dev = &img.renderer.device.device; let dev = &img.renderer.device.device;
let command_buffer_info = CommandBufferSubmitInfo::default().command_buffer(cmd.buffer); let command_buffer_info = CommandBufferSubmitInfo::default().command_buffer(cmd.buffer);
let submit_info = let submit_info =
@ -249,7 +272,10 @@ impl VulkanShmImage {
dev.end_command_buffer(cmd.buffer) dev.end_command_buffer(cmd.buffer)
.map_err(VulkanError::EndCommandBuffer)?; .map_err(VulkanError::EndCommandBuffer)?;
dev.queue_submit2( dev.queue_submit2(
img.renderer.device.graphics_queue, match img.renderer.device.transfer_queue {
Some(q) if use_transfer_queue => q,
_ => img.renderer.device.graphics_queue,
},
slice::from_ref(&submit_info), slice::from_ref(&submit_info),
release_fence.fence, release_fence.fence,
) )
@ -286,8 +312,8 @@ async fn await_upload(
); );
img.renderer.block(); img.renderer.block();
} }
img.renderer.command_buffers.push(buf); img.renderer.gfx_command_buffers.buffers.push(buf);
img.renderer.pending_uploads.remove(&id); img.renderer.pending_submits.remove(&id);
} }
impl VulkanShmImageAsyncData { impl VulkanShmImageAsyncData {
@ -334,8 +360,9 @@ impl VulkanShmImage {
return Err(VulkanError::InvalidBufferSize); return Err(VulkanError::InvalidBufferSize);
} }
data.busy.set(true); data.busy.set(true);
data.data_copied.set(false);
if img.contents_are_undefined.get() { if img.contents_are_undefined.get() {
damage = Region::new2(Rect::new_sized(0, 0, img.width as _, img.height as _).unwrap()) damage = Region::new2(Rect::new_sized(0, 0, img.width as _, img.height as _).unwrap());
} }
let copies = &mut *data.regions.borrow_mut(); let copies = &mut *data.regions.borrow_mut();
@ -361,13 +388,18 @@ impl VulkanShmImage {
.buffer_row_length(img.stride / self.shm_info.bpp); .buffer_row_length(img.stride / self.shm_info.bpp);
copies.push(copy); copies.push(copy);
}; };
let (width_mask, height_mask) = img.renderer.device.transfer_granularity_mask;
let width_mask = width_mask as i32;
let height_mask = height_mask as i32;
for damage in damage.rects() { for damage in damage.rects() {
let Some(damage) = Rect::new( if damage.x2() < 0 || damage.y2() < 0 {
damage.x1().max(0), continue;
damage.y1().max(0), }
damage.x2().min(img.width as i32), let x1 = damage.x1().max(0) & !width_mask;
damage.y2().min(img.height as i32), let y1 = damage.y1().max(0) & !height_mask;
) else { let x2 = ((damage.x2() + width_mask) & !width_mask).min(img.width as i32);
let y2 = ((damage.y2() + height_mask) & !height_mask).min(img.height as i32);
let Some(damage) = Rect::new(x1, y1, x2, y2) else {
continue; continue;
}; };
if damage.is_empty() { if damage.is_empty() {
@ -381,6 +413,8 @@ impl VulkanShmImage {
); );
} }
self.async_release_from_gfx_queue(img, data)?;
if let Some(staging) = data.staging.get() { if let Some(staging) = data.staging.get() {
return self.async_upload_initiate_copy(img, data, &staging, copies, client_mem); return self.async_upload_initiate_copy(img, data, &staging, copies, client_mem);
} }
@ -404,6 +438,95 @@ impl VulkanShmImage {
) )
} }
/// Starts handing `img` over from the graphics queue to the transfer side so
/// that a later buffer-to-image copy can acquire it for `QueueFamily::Transfer`.
///
/// Two paths exist, selected by `device.distinct_transfer_queue_family_idx`:
///
/// * **No distinct transfer queue family.** No barrier is recorded. If
///   `data.last_sample` holds a sync file, the image becomes `Releasing` and
///   `await_gfx_queue_release` is spawned to wait on that sync file. Otherwise
///   the image is marked `Released { to: Transfer }` immediately.
/// * **Distinct transfer queue family.** A one-time-submit command buffer with
///   the gfx -> transfer release barrier (new layout `TRANSFER_DST_OPTIMAL`) is
///   submitted to the graphics queue. The image becomes `Releasing` and
///   `await_gfx_queue_release` is spawned on the sync file exported from the
///   submission's fence.
///
/// In both asynchronous cases the spawned future is stored in
/// `renderer.pending_submits` under a freshly allocated point id.
///
/// # Errors
///
/// Returns an error if the renderer is defunct, if the fence or command buffer
/// cannot be created, if beginning/ending/submitting the command buffer fails
/// (`BeginCommandBuffer`, `EndCommandBuffer`, `Submit`), or if the fence cannot
/// be exported as a sync file.
///
/// # Panics
///
/// In the distinct-family path, panics if the image is currently `Releasing`,
/// is acquired by a family other than `Gfx`, or was released to a family other
/// than `Gfx`.
fn async_release_from_gfx_queue(
    &self,
    img: &Rc<VulkanImage>,
    data: &VulkanShmImageAsyncData,
) -> Result<(), VulkanError> {
    img.renderer.check_defunct()?;
    let Some(transfer_queue_idx) = img.renderer.device.distinct_transfer_queue_family_idx
    else {
        // Same queue family on both sides: nothing to record, only wait for
        // the last recorded sample (if any) to finish.
        let Some(sync_file) = data.last_sample.take() else {
            // Nothing to wait for; the image is available right away.
            img.queue_state.set(QueueState::Released {
                to: QueueFamily::Transfer,
            });
            return Ok(());
        };
        let id = img.renderer.allocate_point();
        // No command buffer and no fence are involved on this path, hence the
        // two `None` arguments.
        let pending = img.renderer.eng.spawn(
            "await_transfer_to_transfer",
            await_gfx_queue_release(id, img.clone(), None, None, sync_file),
        );
        img.renderer.pending_submits.set(id, pending);
        img.queue_state.set(QueueState::Releasing);
        return Ok(());
    };
    // At most two barriers: an optional acquire for gfx followed by the
    // release to the transfer family.
    let mut barriers = ArrayVec::<_, 2>::new();
    match img.queue_state.get() {
        QueueState::Acquired { family } => {
            assert_eq!(family, QueueFamily::Gfx);
        }
        QueueState::Releasing => {
            unreachable!();
        }
        QueueState::Released { to } => {
            assert_eq!(to, QueueFamily::Gfx);
            // The image was released towards gfx but the state was never
            // switched to `Acquired`; record the transfer -> gfx barrier here
            // before releasing the image again.
            let barrier = image_barrier()
                .image(img.image)
                .src_queue_family_index(transfer_queue_idx)
                .dst_queue_family_index(img.renderer.device.graphics_queue_idx)
                .dst_stage_mask(PipelineStageFlags2::ALL_COMMANDS)
                .old_layout(ImageLayout::TRANSFER_DST_OPTIMAL)
                .new_layout(ImageLayout::SHADER_READ_ONLY_OPTIMAL);
            barriers.push(barrier);
        }
    }
    // Release barrier: gfx -> transfer, leaving the image in the layout the
    // copy expects as its destination.
    let barrier = image_barrier()
        .image(img.image)
        .src_queue_family_index(img.renderer.device.graphics_queue_idx)
        .dst_queue_family_index(transfer_queue_idx)
        .src_access_mask(AccessFlags2::SHADER_SAMPLED_READ)
        .src_stage_mask(PipelineStageFlags2::ALL_COMMANDS)
        .old_layout(if img.is_undefined.get() {
            ImageLayout::UNDEFINED
        } else {
            ImageLayout::SHADER_READ_ONLY_OPTIMAL
        })
        .new_layout(ImageLayout::TRANSFER_DST_OPTIMAL);
    barriers.push(barrier);
    let dep_info = DependencyInfo::default().image_memory_barriers(&barriers);
    let release_fence = img.renderer.device.create_fence()?;
    let dev = &img.renderer.device.device;
    let begin_info =
        CommandBufferBeginInfo::default().flags(CommandBufferUsageFlags::ONE_TIME_SUBMIT);
    let cmd = img.renderer.gfx_command_buffers.allocate()?;
    let command_buffer_info = CommandBufferSubmitInfo::default().command_buffer(cmd.buffer);
    let submit_info =
        SubmitInfo2::default().command_buffer_infos(slice::from_ref(&command_buffer_info));
    // The command buffer contains nothing but the pipeline barrier; the fence
    // is signaled by this submission.
    unsafe {
        dev.begin_command_buffer(cmd.buffer, &begin_info)
            .map_err(VulkanError::BeginCommandBuffer)?;
        dev.cmd_pipeline_barrier2(cmd.buffer, &dep_info);
        dev.end_command_buffer(cmd.buffer)
            .map_err(VulkanError::EndCommandBuffer)?;
        dev.queue_submit2(
            img.renderer.device.graphics_queue,
            slice::from_ref(&submit_info),
            release_fence.fence,
        )
        .map_err(VulkanError::Submit)?;
    }
    let sync_file = release_fence.export_sync_file()?;
    let id = img.renderer.allocate_point();
    // The command buffer and fence are handed to the waiting task together
    // with the exported sync file.
    let pending = img.renderer.eng.spawn(
        "await_transfer_to_transfer",
        await_gfx_queue_release(id, img.clone(), Some(cmd), Some(release_fence), sync_file),
    );
    img.renderer.pending_submits.set(id, pending);
    img.queue_state.set(QueueState::Releasing);
    Ok(())
}
fn async_upload_after_allocation( fn async_upload_after_allocation(
&self, &self,
img: &Rc<VulkanImage>, img: &Rc<VulkanImage>,
@ -501,25 +624,28 @@ impl VulkanShmImage {
&self, &self,
img: &Rc<VulkanImage>, img: &Rc<VulkanImage>,
data: &VulkanShmImageAsyncData, data: &VulkanShmImageAsyncData,
res: Result<(), ReadWriteJobError>,
) -> Result<(), VulkanError> { ) -> Result<(), VulkanError> {
if let Err(e) = res { if !data.data_copied.get() {
return Err(VulkanError::AsyncCopyToStaging(e)); return Ok(());
}
if img.queue_state.get().acquire(QueueFamily::Transfer) == QueueTransfer::Impossible {
return Ok(());
} }
img.renderer.check_defunct()?; img.renderer.check_defunct()?;
let regions = &*data.regions.borrow(); let regions = &*data.regions.borrow();
let staging = data.staging.get().unwrap(); let staging = data.staging.get().unwrap();
staging.upload(|_, _| ())?; staging.upload(|_, _| ())?;
let Some((cmd, fence, sync_file, point)) = let Some((cmd, fence, sync_file, point)) =
self.submit_buffer_to_image_copy(img, &staging, regions)? self.submit_buffer_to_image_copy(img, &staging, regions, true)?
else { else {
return Ok(()); return Ok(());
}; };
img.queue_state.set(QueueState::Releasing);
let future = img.renderer.eng.spawn( let future = img.renderer.eng.spawn(
"await async upload", "await async upload",
await_async_upload(point, img.clone(), cmd, fence, sync_file), await_async_upload(point, img.clone(), cmd, fence, sync_file),
); );
img.renderer.pending_uploads.set(point, future); img.renderer.pending_submits.set(point, future);
Ok(()) Ok(())
} }
} }
@ -577,7 +703,42 @@ fn complete_async_upload(
}; };
let data = shm.async_data.as_ref().unwrap(); let data = shm.async_data.as_ref().unwrap();
store(data); store(data);
if let Err(e) = shm.async_upload_copy_buffer_to_image(img, data, res) { if let Err(e) = res {
data.complete(Err(VulkanError::AsyncCopyToStaging(e)));
}
data.data_copied.set(true);
if let Err(e) = shm.async_upload_copy_buffer_to_image(img, data) {
data.complete(Err(e));
}
}
async fn await_gfx_queue_release(
id: u64,
img: Rc<VulkanImage>,
buf: Option<Rc<VulkanCommandBuffer>>,
_fence: Option<Rc<VulkanFence>>,
sync_file: SyncFile,
) {
let res = img.renderer.ring.readable(&sync_file.0).await;
if let Err(e) = res {
log::error!(
"Could not wait for sync file to become readable: {}",
ErrorFmt(e)
);
img.renderer.block();
}
if let Some(buf) = buf {
img.renderer.gfx_command_buffers.buffers.push(buf);
}
img.renderer.pending_submits.remove(&id);
img.queue_state.set(QueueState::Released {
to: QueueFamily::Transfer,
});
let VulkanImageMemory::Internal(shm) = &img.ty else {
unreachable!();
};
let data = shm.async_data.as_ref().unwrap();
if let Err(e) = shm.async_upload_copy_buffer_to_image(&img, data) {
data.complete(Err(e)); data.complete(Err(e));
} }
} }
@ -597,8 +758,14 @@ async fn await_async_upload(
); );
img.renderer.block(); img.renderer.block();
} }
img.renderer.command_buffers.push(buf); match &img.renderer.transfer_command_buffers {
img.renderer.pending_uploads.remove(&id); Some(b) => b.buffers.push(buf),
None => img.renderer.gfx_command_buffers.buffers.push(buf),
}
img.queue_state.set(QueueState::Released {
to: QueueFamily::Gfx,
});
img.renderer.pending_submits.remove(&id);
let VulkanImageMemory::Internal(shm) = &img.ty else { let VulkanImageMemory::Internal(shm) = &img.ty else {
unreachable!(); unreachable!();
}; };
@ -701,6 +868,8 @@ impl VulkanRenderer {
callback_id: Cell::new(0), callback_id: Cell::new(0),
regions: Default::default(), regions: Default::default(),
cpu: cpu.clone(), cpu: cpu.clone(),
last_sample: Default::default(),
data_copied: Default::default(),
}); });
} }
let shm = VulkanShmImage { let shm = VulkanShmImage {
@ -722,6 +891,9 @@ impl VulkanRenderer {
image, image,
is_undefined: Cell::new(true), is_undefined: Cell::new(true),
contents_are_undefined: Cell::new(true), contents_are_undefined: Cell::new(true),
queue_state: Cell::new(QueueState::Acquired {
family: QueueFamily::Gfx,
}),
ty: VulkanImageMemory::Internal(shm), ty: VulkanImageMemory::Internal(shm),
bridge: None, bridge: None,
}); });

View file

@ -3,7 +3,9 @@ use {
allocator::{AllocatorError, BufferObject, BO_USE_LINEAR, BO_USE_RENDERING}, allocator::{AllocatorError, BufferObject, BO_USE_LINEAR, BO_USE_RENDERING},
client::{Client, ClientError}, client::{Client, ClientError},
format::XRGB8888, format::XRGB8888,
gfx_api::{GfxContext, GfxError, GfxFramebuffer, GfxTexture}, gfx_api::{
AcquireSync, BufferResv, GfxContext, GfxError, GfxFramebuffer, GfxTexture, ReleaseSync,
},
ifs::{jay_output::JayOutput, jay_toplevel::JayToplevel, wl_buffer::WlBufferStorage}, ifs::{jay_output::JayOutput, jay_toplevel::JayToplevel, wl_buffer::WlBufferStorage},
leaks::Tracker, leaks::Tracker,
object::{Object, Version}, object::{Object, Version},
@ -189,6 +191,8 @@ impl JayScreencast {
for (idx, buffer) in buffer.deref_mut().iter_mut().enumerate() { for (idx, buffer) in buffer.deref_mut().iter_mut().enumerate() {
if buffer.free { if buffer.free {
let res = buffer.fb.render_node( let res = buffer.fb.render_node(
AcquireSync::Implicit,
ReleaseSync::Implicit,
tl.tl_as_node(), tl.tl_as_node(),
&self.client.state, &self.client.state,
Some(tl.node_absolute_position()), Some(tl.node_absolute_position()),
@ -298,6 +302,9 @@ impl JayScreencast {
&self, &self,
on: &OutputNode, on: &OutputNode,
texture: &Rc<dyn GfxTexture>, texture: &Rc<dyn GfxTexture>,
resv: Option<&Rc<dyn BufferResv>>,
acquire_sync: &AcquireSync,
release_sync: ReleaseSync,
render_hardware_cursors: bool, render_hardware_cursors: bool,
x_off: i32, x_off: i32,
y_off: i32, y_off: i32,
@ -320,7 +327,12 @@ impl JayScreencast {
if buffer.free { if buffer.free {
let res = self.client.state.perform_screencopy( let res = self.client.state.perform_screencopy(
texture, texture,
resv,
acquire_sync,
release_sync,
&buffer.fb, &buffer.fb,
AcquireSync::Implicit,
ReleaseSync::Implicit,
on.global.pos.get(), on.global.pos.get(),
render_hardware_cursors, render_hardware_cursors,
x_off, x_off,

View file

@ -5,9 +5,10 @@ use {
cpu_worker::CpuWorker, cpu_worker::CpuWorker,
format::{Format, ARGB8888, XRGB8888}, format::{Format, ARGB8888, XRGB8888},
gfx_api::{ gfx_api::{
AsyncShmGfxTexture, AsyncShmGfxTextureCallback, CopyTexture, FillRect, FramebufferRect, AcquireSync, AsyncShmGfxTexture, AsyncShmGfxTextureCallback, CopyTexture, FillRect,
GfxApiOpt, GfxContext, GfxError, GfxFormat, GfxFramebuffer, GfxImage, GfxTexture, FramebufferRect, GfxApiOpt, GfxContext, GfxError, GfxFormat, GfxFramebuffer, GfxImage,
GfxWriteModifier, PendingShmUpload, ResetStatus, ShmGfxTexture, SyncFile, GfxTexture, GfxWriteModifier, PendingShmUpload, ReleaseSync, ResetStatus,
ShmGfxTexture, SyncFile,
}, },
rect::{Rect, Region}, rect::{Rect, Region},
theme::Color, theme::Color,
@ -413,6 +414,8 @@ impl GfxFramebuffer for TestGfxFb {
fn render( fn render(
&self, &self,
_acquire_sync: AcquireSync,
_release_sync: ReleaseSync,
ops: &[GfxApiOpt], ops: &[GfxApiOpt],
clear: Option<&Color>, clear: Option<&Color>,
) -> Result<Option<SyncFile>, GfxError> { ) -> Result<Option<SyncFile>, GfxError> {

View file

@ -635,13 +635,17 @@ impl WindowData {
return; return;
}; };
let res = buf let res = buf.fb.render_custom(
.fb AcquireSync::Implicit,
.render_custom(self.scale.get(), Some(&Color::from_gray(0)), &mut |r| { ReleaseSync::Implicit,
self.scale.get(),
Some(&Color::from_gray(0)),
&mut |r| {
if let Some(content) = self.content.get() { if let Some(content) = self.content.get() {
content.render_at(r, 0.0, 0.0) content.render_at(r, 0.0, 0.0)
} }
}); },
);
if let Err(e) = res { if let Err(e) = res {
log::error!("Could not render frame: {}", ErrorFmt(e)); log::error!("Could not render frame: {}", ErrorFmt(e));
return; return;

View file

@ -2,7 +2,7 @@ use {
crate::{ crate::{
allocator::{AllocatorError, BufferObject, BufferUsage, BO_USE_RENDERING}, allocator::{AllocatorError, BufferObject, BufferUsage, BO_USE_RENDERING},
format::XRGB8888, format::XRGB8888,
gfx_api::{needs_render_usage, GfxError}, gfx_api::{needs_render_usage, AcquireSync, GfxError, ReleaseSync},
scale::Scale, scale::Scale,
state::State, state::State,
video::drm::DrmError, video::drm::DrmError,
@ -77,6 +77,8 @@ pub fn take_screenshot(
)?; )?;
let fb = ctx.clone().dmabuf_fb(bo.dmabuf())?; let fb = ctx.clone().dmabuf_fb(bo.dmabuf())?;
fb.render_node( fb.render_node(
AcquireSync::Unnecessary,
ReleaseSync::Implicit,
state.root.deref(), state.root.deref(),
state, state,
Some(state.root.extents.get()), Some(state.root.extents.get()),

View file

@ -27,8 +27,8 @@ use {
forker::ForkerProxy, forker::ForkerProxy,
format::Format, format::Format,
gfx_api::{ gfx_api::{
AcquireSync, GfxContext, GfxError, GfxFramebuffer, GfxTexture, ReleaseSync, SampleRect, AcquireSync, BufferResv, GfxContext, GfxError, GfxFramebuffer, GfxTexture, ReleaseSync,
SyncFile, SampleRect, SyncFile,
}, },
gfx_apis::create_gfx_context, gfx_apis::create_gfx_context,
globals::{Globals, GlobalsError, RemovableWaylandGlobal, WaylandGlobal}, globals::{Globals, GlobalsError, RemovableWaylandGlobal, WaylandGlobal},
@ -900,10 +900,14 @@ impl State {
&self, &self,
output: &OutputNode, output: &OutputNode,
fb: &Rc<dyn GfxFramebuffer>, fb: &Rc<dyn GfxFramebuffer>,
acquire_sync: AcquireSync,
release_sync: ReleaseSync,
tex: &Rc<dyn GfxTexture>, tex: &Rc<dyn GfxTexture>,
render_hw_cursor: bool, render_hw_cursor: bool,
) -> Result<Option<SyncFile>, GfxError> { ) -> Result<Option<SyncFile>, GfxError> {
let sync_file = fb.render_output( let sync_file = fb.render_output(
acquire_sync,
release_sync,
output, output,
self, self,
Some(output.global.pos.get()), Some(output.global.pos.get()),
@ -911,14 +915,28 @@ impl State {
render_hw_cursor, render_hw_cursor,
)?; )?;
output.latched(); output.latched();
output.perform_screencopies(tex, !render_hw_cursor, 0, 0, None); output.perform_screencopies(
tex,
None,
&AcquireSync::Unnecessary,
ReleaseSync::None,
!render_hw_cursor,
0,
0,
None,
);
Ok(sync_file) Ok(sync_file)
} }
pub fn perform_screencopy( pub fn perform_screencopy(
&self, &self,
src: &Rc<dyn GfxTexture>, src: &Rc<dyn GfxTexture>,
resv: Option<&Rc<dyn BufferResv>>,
acquire_sync: &AcquireSync,
release_sync: ReleaseSync,
target: &Rc<dyn GfxFramebuffer>, target: &Rc<dyn GfxFramebuffer>,
target_acquire_sync: AcquireSync,
target_release_sync: ReleaseSync,
position: Rect, position: Rect,
render_hardware_cursors: bool, render_hardware_cursors: bool,
x_off: i32, x_off: i32,
@ -947,9 +965,9 @@ impl State {
size, size,
Scale::from_int(1), Scale::from_int(1),
None, None,
None, resv.cloned(),
AcquireSync::None, acquire_sync.clone(),
ReleaseSync::Implicit, release_sync,
); );
if render_hardware_cursors { if render_hardware_cursors {
if let Some(cursor_user_group) = self.cursor_user_group_hardware_cursor.get() { if let Some(cursor_user_group) = self.cursor_user_group_hardware_cursor.get() {
@ -963,7 +981,12 @@ impl State {
} }
} }
} }
target.render(&ops, Some(&Color::SOLID_BLACK)) target.render(
target_acquire_sync,
target_release_sync,
&ops,
Some(&Color::SOLID_BLACK),
)
} }
fn have_hardware_cursor(&self) -> bool { fn have_hardware_cursor(&self) -> bool {
@ -980,6 +1003,7 @@ impl State {
pub fn perform_shm_screencopy( pub fn perform_shm_screencopy(
&self, &self,
src: &Rc<dyn GfxTexture>, src: &Rc<dyn GfxTexture>,
acquire_sync: &AcquireSync,
position: Rect, position: Rect,
x_off: i32, x_off: i32,
y_off: i32, y_off: i32,
@ -1011,7 +1035,12 @@ impl State {
.map_err(ShmScreencopyError::CreateTemporaryFb)?; .map_err(ShmScreencopyError::CreateTemporaryFb)?;
self.perform_screencopy( self.perform_screencopy(
src, src,
None,
acquire_sync,
ReleaseSync::None,
&fb, &fb,
AcquireSync::Unnecessary,
ReleaseSync::None,
position, position,
true, true,
x_off - capture.rect.x1(), x_off - capture.rect.x1(),

View file

@ -28,7 +28,7 @@ struct ZoneNameData {
unsafe impl Sync for ZoneNameData {} unsafe impl Sync for ZoneNameData {}
unsafe impl Send for ZoneNameData {} unsafe impl Send for ZoneNameData {}
static CACHE: LazyLock<Mutex<AHashMap<String, ZoneName>>> = LazyLock::new(|| Default::default()); static CACHE: LazyLock<Mutex<AHashMap<String, ZoneName>>> = LazyLock::new(Default::default);
impl ZoneName { impl ZoneName {
pub fn __get(name: &str) -> Self { pub fn __get(name: &str) -> Self {
@ -120,8 +120,7 @@ pub struct FrameName {
name: &'static CString, name: &'static CString,
} }
static FRAME_CACHE: LazyLock<Mutex<AHashMap<String, FrameName>>> = static FRAME_CACHE: LazyLock<Mutex<AHashMap<String, FrameName>>> = LazyLock::new(Default::default);
LazyLock::new(|| Default::default());
impl FrameName { impl FrameName {
pub fn get(name: &str) -> Self { pub fn get(name: &str) -> Self {
@ -177,7 +176,6 @@ impl Drop for RenderingFrame {
} }
#[no_mangle] #[no_mangle]
#[allow(static_mut_refs)]
unsafe extern "C" fn ___tracy_demangle( unsafe extern "C" fn ___tracy_demangle(
mangled: *const std::ffi::c_char, mangled: *const std::ffi::c_char,
) -> *const std::ffi::c_char { ) -> *const std::ffi::c_char {
@ -191,7 +189,7 @@ unsafe extern "C" fn ___tracy_demangle(
let demangled = rustc_demangle::demangle(mangled); let demangled = rustc_demangle::demangle(mangled);
static mut BUF: Vec<u8> = Vec::new(); static mut BUF: Vec<u8> = Vec::new();
BUF.clear(); BUF.clear();
if let Err(_) = write!(BUF, "{demangled:#}\0") { if write!(BUF, "{demangled:#}\0").is_err() {
return ptr::null(); return ptr::null();
} }
BUF.as_ptr().cast() BUF.as_ptr().cast()

View file

@ -4,7 +4,7 @@ use {
client::ClientId, client::ClientId,
cursor::KnownCursor, cursor::KnownCursor,
fixed::Fixed, fixed::Fixed,
gfx_api::GfxTexture, gfx_api::{AcquireSync, BufferResv, GfxTexture, ReleaseSync},
ifs::{ ifs::{
jay_output::JayOutput, jay_output::JayOutput,
jay_screencast::JayScreencast, jay_screencast::JayScreencast,
@ -186,6 +186,9 @@ impl OutputNode {
pub fn perform_screencopies( pub fn perform_screencopies(
&self, &self,
tex: &Rc<dyn GfxTexture>, tex: &Rc<dyn GfxTexture>,
resv: Option<&Rc<dyn BufferResv>>,
acquire_sync: &AcquireSync,
release_sync: ReleaseSync,
render_hardware_cursor: bool, render_hardware_cursor: bool,
x_off: i32, x_off: i32,
y_off: i32, y_off: i32,
@ -196,15 +199,37 @@ impl OutputNode {
return; return;
} }
} }
self.perform_wlr_screencopies(tex, render_hardware_cursor, x_off, y_off, size); self.perform_wlr_screencopies(
tex,
resv,
acquire_sync,
release_sync,
render_hardware_cursor,
x_off,
y_off,
size,
);
for sc in self.screencasts.lock().values() { for sc in self.screencasts.lock().values() {
sc.copy_texture(self, tex, render_hardware_cursor, x_off, y_off, size); sc.copy_texture(
self,
tex,
resv,
acquire_sync,
release_sync,
render_hardware_cursor,
x_off,
y_off,
size,
);
} }
} }
pub fn perform_wlr_screencopies( pub fn perform_wlr_screencopies(
&self, &self,
tex: &Rc<dyn GfxTexture>, tex: &Rc<dyn GfxTexture>,
resv: Option<&Rc<dyn BufferResv>>,
acquire_sync: &AcquireSync,
release_sync: ReleaseSync,
render_hardware_cursors: bool, render_hardware_cursors: bool,
x_off: i32, x_off: i32,
y_off: i32, y_off: i32,
@ -232,6 +257,7 @@ impl OutputNode {
WlBufferStorage::Shm { mem, stride } => { WlBufferStorage::Shm { mem, stride } => {
let res = self.state.perform_shm_screencopy( let res = self.state.perform_shm_screencopy(
tex, tex,
acquire_sync,
self.global.pos.get(), self.global.pos.get(),
x_off, x_off,
y_off, y_off,
@ -259,7 +285,12 @@ impl OutputNode {
}; };
let res = self.state.perform_screencopy( let res = self.state.perform_screencopy(
tex, tex,
resv,
acquire_sync,
release_sync,
&fb, &fb,
AcquireSync::Implicit,
ReleaseSync::Implicit,
self.global.pos.get(), self.global.pos.get(),
render_hardware_cursors, render_hardware_cursors,
x_off - capture.rect.x1(), x_off - capture.rect.x1(),