157 GLSLC(0,
layout(push_constant, scalar) uniform pushConstants { );
158 GLSLC(1, u8buf slice_state; );
159 GLSLC(1, u8buf scratch_data; );
160 GLSLC(1, u8buf out_data; );
162 GLSLC(1, ivec2 sar; );
163 GLSLC(1, uvec2 chroma_shift; );
165 GLSLC(1, uint plane_state_size; );
166 GLSLC(1, uint context_count; );
167 GLSLC(1, uint32_t crcref; );
168 GLSLC(1, uint32_t slice_size_max; );
170 GLSLC(1, uint8_t bits_per_raw_sample; );
171 GLSLC(1, uint8_t context_model; );
173 GLSLC(1, uint8_t micro_version; );
174 GLSLC(1, uint8_t force_pcm; );
175 GLSLC(1, uint8_t key_frame; );
177 GLSLC(1, uint8_t codec_planes; );
178 GLSLC(1, uint8_t transparency; );
179 GLSLC(1, uint8_t colorspace; );
180 GLSLC(1, uint8_t pic_mode; );
181 GLSLC(1, uint8_t ec; );
182 GLSLC(1, uint8_t ppi; );
183 GLSLC(1, uint8_t chunks; );
184 GLSLC(1, uint8_t padding[2]; );
187 VK_SHADER_STAGE_COMPUTE_BIT);
191 AVFrame *enc_in, VkImageView *enc_in_views,
192 AVFrame **intermediate_frame, VkImageView *intermediate_views,
193 VkImageMemoryBarrier2 *img_bar,
int *nb_img_bar,
194 VkBufferMemoryBarrier2 *buf_bar,
int *nb_buf_bar,
195 FFVkBuffer *slice_data_buf, uint32_t slice_data_size)
206 if (!(*intermediate_frame))
210 *intermediate_frame, 0));
213 VK_PIPELINE_STAGE_2_ALL_COMMANDS_BIT,
214 VK_PIPELINE_STAGE_2_COMPUTE_SHADER_BIT));
223 0, slice_data_size*
f->slice_count,
224 VK_FORMAT_UNDEFINED);
226 enc_in, enc_in_views,
228 VK_IMAGE_LAYOUT_GENERAL,
231 *intermediate_frame, intermediate_views,
233 VK_IMAGE_LAYOUT_GENERAL,
237 VK_PIPELINE_STAGE_2_ALL_COMMANDS_BIT,
238 VK_PIPELINE_STAGE_2_COMPUTE_SHADER_BIT,
239 VK_ACCESS_SHADER_WRITE_BIT,
240 VK_IMAGE_LAYOUT_GENERAL,
241 VK_QUEUE_FAMILY_IGNORED);
244 vk->CmdPipelineBarrier2(exec->
buf, &(VkDependencyInfo) {
245 .sType = VK_STRUCTURE_TYPE_DEPENDENCY_INFO,
246 .pImageMemoryBarriers = img_bar,
247 .imageMemoryBarrierCount = *nb_img_bar,
248 .pBufferMemoryBarriers = buf_bar,
249 .bufferMemoryBarrierCount = *nb_buf_bar,
253 slice_data_buf->
stage = buf_bar[0].dstStageMask;
254 slice_data_buf->
access = buf_bar[0].dstAccessMask;
261 .offset = 1 <<
f->bits_per_raw_sample,
262 .bits =
f->bits_per_raw_sample,
265 .transparency =
f->transparency,
272 memcpy(pd.fmt_lut, (
int [4]) { 2, 1, 0, 3 }, 4*
sizeof(
int));
277 VK_SHADER_STAGE_COMPUTE_BIT,
284 VK_PIPELINE_STAGE_2_ALL_COMMANDS_BIT,
285 VK_PIPELINE_STAGE_2_COMPUTE_SHADER_BIT,
286 VK_ACCESS_SHADER_READ_BIT,
287 VK_IMAGE_LAYOUT_GENERAL,
288 VK_QUEUE_FAMILY_IGNORED);
309 size_t tmp_data_size;
316 uint32_t plane_state_size;
317 uint32_t slice_state_size;
318 uint32_t slice_data_size;
327 int has_inter = avctx->
gop_size > 1;
328 uint32_t context_count =
f->context_count[
f->context_model];
334 VkImageView *enc_in_views = in_views;
336 VkImageMemoryBarrier2 img_bar[37];
338 VkBufferMemoryBarrier2 buf_bar[8];
345 f->cur_enc_frame = pict;
354 f->slice_count =
f->max_slice_count;
360 VK_BUFFER_USAGE_STORAGE_BUFFER_BIT |
361 VK_BUFFER_USAGE_SHADER_DEVICE_ADDRESS_BIT,
363 VK_MEMORY_PROPERTY_DEVICE_LOCAL_BIT));
369 plane_state_size = 8;
373 plane_state_size *= context_count;
374 slice_state_size = plane_state_size*
f->plane_count;
376 slice_data_size = 256;
377 slice_state_size += slice_data_size;
378 slice_state_size =
FFALIGN(slice_state_size, 8);
382 if (!slice_data_ref) {
385 VK_BUFFER_USAGE_STORAGE_BUFFER_BIT |
386 VK_BUFFER_USAGE_SHADER_DEVICE_ADDRESS_BIT,
387 NULL, slice_state_size*
f->slice_count,
388 VK_MEMORY_PROPERTY_DEVICE_LOCAL_BIT));
400 VK_BUFFER_USAGE_STORAGE_BUFFER_BIT |
401 VK_BUFFER_USAGE_SHADER_DEVICE_ADDRESS_BIT,
402 NULL, 2*
f->slice_count*
sizeof(uint64_t),
403 VK_MEMORY_PROPERTY_DEVICE_LOCAL_BIT |
404 VK_MEMORY_PROPERTY_HOST_VISIBLE_BIT));
415 VK_BUFFER_USAGE_TRANSFER_SRC_BIT |
416 VK_BUFFER_USAGE_STORAGE_BUFFER_BIT |
417 VK_BUFFER_USAGE_SHADER_DEVICE_ADDRESS_BIT,
419 maxsize < fv->max_heap_size ?
420 VK_MEMORY_PROPERTY_DEVICE_LOCAL_BIT : 0x0));
426 VK_PIPELINE_STAGE_2_ALL_COMMANDS_BIT,
427 VK_PIPELINE_STAGE_2_COMPUTE_SHADER_BIT));
432 VK_PIPELINE_STAGE_2_ALL_COMMANDS_BIT,
433 VK_PIPELINE_STAGE_2_COMPUTE_SHADER_BIT,
434 VK_ACCESS_SHADER_READ_BIT,
435 VK_IMAGE_LAYOUT_GENERAL,
436 VK_QUEUE_FAMILY_IGNORED);
442 0, slice_data_size*
f->slice_count,
443 VK_FORMAT_UNDEFINED);
445 enc_in, enc_in_views,
447 VK_IMAGE_LAYOUT_GENERAL,
452 buf_bar[nb_buf_bar++] = (VkBufferMemoryBarrier2) {
453 .sType = VK_STRUCTURE_TYPE_BUFFER_MEMORY_BARRIER_2,
454 .srcStageMask = slice_data_buf->
stage,
455 .dstStageMask = VK_PIPELINE_STAGE_2_COMPUTE_SHADER_BIT,
456 .srcAccessMask = slice_data_buf->
access,
457 .dstAccessMask = VK_ACCESS_2_SHADER_STORAGE_READ_BIT |
458 VK_ACCESS_2_SHADER_STORAGE_WRITE_BIT,
459 .srcQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED,
460 .dstQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED,
461 .buffer = slice_data_buf->
buf,
462 .size = VK_WHOLE_SIZE,
467 vk->CmdPipelineBarrier2(exec->
buf, &(VkDependencyInfo) {
468 .sType = VK_STRUCTURE_TYPE_DEPENDENCY_INFO,
469 .pImageMemoryBarriers = img_bar,
470 .imageMemoryBarrierCount = nb_img_bar,
471 .pBufferMemoryBarriers = buf_bar,
472 .bufferMemoryBarrierCount = nb_buf_bar,
476 slice_data_buf->
stage = buf_bar[0].dstStageMask;
477 slice_data_buf->
access = buf_bar[0].dstAccessMask;
485 .scratch_data = tmp_data_buf->
address,
486 .out_data = out_data_buf->
address,
487 .bits_per_raw_sample =
f->bits_per_raw_sample,
490 .chroma_shift[0] =
f->chroma_h_shift,
491 .chroma_shift[1] =
f->chroma_v_shift,
492 .plane_state_size = plane_state_size,
493 .context_count = context_count,
495 .slice_size_max = out_data_buf->
size /
f->slice_count,
497 .version =
f->version,
498 .micro_version =
f->micro_version,
500 .key_frame =
f->key_frame,
502 .codec_planes =
f->plane_count,
503 .transparency =
f->transparency,
504 .colorspace =
f->colorspace,
512 VK_SHADER_STAGE_COMPUTE_BIT,
517 buf_bar[nb_buf_bar++] = (VkBufferMemoryBarrier2) {
518 .sType = VK_STRUCTURE_TYPE_BUFFER_MEMORY_BARRIER_2,
519 .srcStageMask = slice_data_buf->
stage,
520 .dstStageMask = VK_PIPELINE_STAGE_2_COMPUTE_SHADER_BIT,
521 .srcAccessMask = slice_data_buf->
access,
522 .dstAccessMask = VK_ACCESS_2_SHADER_STORAGE_READ_BIT |
523 VK_ACCESS_2_SHADER_STORAGE_WRITE_BIT,
524 .srcQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED,
525 .dstQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED,
526 .buffer = slice_data_buf->
buf,
527 .size = slice_data_size*
f->slice_count,
531 if (
f->key_frame ||
f->version > 3) {
537 0, slice_data_size*
f->slice_count,
538 VK_FORMAT_UNDEFINED);
544 .plane_state_size = plane_state_size,
545 .context_count = context_count,
546 .codec_planes =
f->plane_count,
547 .key_frame =
f->key_frame,
550 VK_SHADER_STAGE_COMPUTE_BIT,
551 0,
sizeof(pd_reset), &pd_reset);
554 vk->CmdPipelineBarrier2(exec->
buf, &(VkDependencyInfo) {
555 .sType = VK_STRUCTURE_TYPE_DEPENDENCY_INFO,
556 .pBufferMemoryBarriers = buf_bar,
557 .bufferMemoryBarrierCount = nb_buf_bar,
559 slice_data_buf->
stage = buf_bar[0].dstStageMask;
560 slice_data_buf->
access = buf_bar[0].dstAccessMask;
570 enc_in, enc_in_views,
571 &intermediate_frame, intermediate_views,
572 img_bar, &nb_img_bar, buf_bar, &nb_buf_bar,
573 slice_data_buf, slice_data_size));
576 enc_in = intermediate_frame;
577 enc_in_views = intermediate_views;
581 if (
f->key_frame ||
f->version > 3) {
583 buf_bar[nb_buf_bar++] = (VkBufferMemoryBarrier2) {
584 .sType = VK_STRUCTURE_TYPE_BUFFER_MEMORY_BARRIER_2,
585 .srcStageMask = slice_data_buf->
stage,
586 .dstStageMask = VK_PIPELINE_STAGE_2_COMPUTE_SHADER_BIT,
587 .srcAccessMask = slice_data_buf->
access,
588 .dstAccessMask = VK_ACCESS_2_SHADER_STORAGE_READ_BIT |
589 VK_ACCESS_2_SHADER_STORAGE_WRITE_BIT,
590 .srcQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED,
591 .dstQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED,
592 .buffer = slice_data_buf->
buf,
593 .size = slice_data_buf->
size - slice_data_size*
f->slice_count,
594 .offset = slice_data_size*
f->slice_count,
599 vk->CmdPipelineBarrier2(exec->
buf, &(VkDependencyInfo) {
600 .sType = VK_STRUCTURE_TYPE_DEPENDENCY_INFO,
601 .pImageMemoryBarriers = img_bar,
602 .imageMemoryBarrierCount = nb_img_bar,
603 .pBufferMemoryBarriers = buf_bar,
604 .bufferMemoryBarrierCount = nb_buf_bar,
608 slice_data_buf->
stage = buf_bar[0].dstStageMask;
609 slice_data_buf->
access = buf_bar[0].dstAccessMask;
617 0, slice_data_size*
f->slice_count,
618 VK_FORMAT_UNDEFINED);
620 enc_in, enc_in_views,
622 VK_IMAGE_LAYOUT_GENERAL,
627 0, results_data_buf->
size,
628 VK_FORMAT_UNDEFINED);
632 VK_SHADER_STAGE_COMPUTE_BIT,
656 VkBufferCopy *buf_regions,
int nb_regions,
668 VkBufferMemoryBarrier2 buf_bar[8];
681 buf_bar[nb_buf_bar++] = (VkBufferMemoryBarrier2) {
682 .sType = VK_STRUCTURE_TYPE_BUFFER_MEMORY_BARRIER_2,
683 .srcStageMask = out_data_buf->
stage,
684 .dstStageMask = VK_PIPELINE_STAGE_2_TRANSFER_BIT,
685 .srcAccessMask = out_data_buf->
access,
686 .dstAccessMask = VK_ACCESS_2_TRANSFER_READ_BIT,
687 .srcQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED,
688 .dstQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED,
689 .buffer = out_data_buf->
buf,
690 .size = VK_WHOLE_SIZE,
693 vk->CmdPipelineBarrier2(exec->
buf, &(VkDependencyInfo) {
694 .sType = VK_STRUCTURE_TYPE_DEPENDENCY_INFO,
695 .pBufferMemoryBarriers = buf_bar,
696 .bufferMemoryBarrierCount = nb_buf_bar,
698 out_data_buf->
stage = buf_bar[0].dstStageMask;
699 out_data_buf->
access = buf_bar[0].dstAccessMask;
702 vk->CmdCopyBuffer(exec->
buf,
703 out_data_buf->
buf, pkt_data_buf->buf,
704 nb_regions, buf_regions);
715 if (!(pkt_data_buf->flags & VK_MEMORY_PROPERTY_HOST_COHERENT_BIT)) {
716 VkMappedMemoryRange invalidate_data = {
717 .sType = VK_STRUCTURE_TYPE_MAPPED_MEMORY_RANGE,
718 .memory = pkt_data_buf->mem,
720 .size = VK_WHOLE_SIZE,
723 1, &invalidate_data);
750 if (!(results_data_buf->
flags & VK_MEMORY_PROPERTY_HOST_COHERENT_BIT)) {
751 VkMappedMemoryRange invalidate_data = {
752 .sType = VK_STRUCTURE_TYPE_MAPPED_MEMORY_RANGE,
753 .memory = results_data_buf->
mem,
755 .size = VK_WHOLE_SIZE,
758 1, &invalidate_data);
763 for (
int i = 0;
i <
f->slice_count;
i++) {
764 sc = &((uint64_t *)results_data_buf->
mapped_mem)[
i*2];
766 "src offset = %"PRIu64
"\n",
782 VK_BUFFER_USAGE_TRANSFER_DST_BIT,
784 VK_MEMORY_PROPERTY_HOST_CACHED_BIT |
785 VK_MEMORY_PROPERTY_HOST_VISIBLE_BIT);
880 vk_frames = frames_ctx->
hwctx;
881 vk_frames->
tiling = VK_IMAGE_TILING_OPTIMAL;
882 vk_frames->
usage = VK_IMAGE_USAGE_STORAGE_BIT;
883 vk_frames->
img_flags = VK_IMAGE_CREATE_MUTABLE_FORMAT_BIT;
958 GLSLF(0, #define
TYPE int%i_t ,smp_bits);
959 GLSLF(0, #define VTYPE2
i%ivec2 ,smp_bits);
960 GLSLF(0, #define VTYPE3
i%ivec3 ,smp_bits);
978 void *spv_opaque =
NULL;
981 VK_SHADER_STAGE_COMPUTE_BIT,
982 (
const char *[]) {
"GL_EXT_buffer_reference",
983 "GL_EXT_buffer_reference2" }, 2,
997 .
name =
"rangecoder_static_buf",
998 .type = VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER,
999 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
1000 .mem_layout =
"scalar",
1001 .buf_content =
"uint8_t zero_one_state[512];",
1004 .name =
"quant_buf",
1005 .type = VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER,
1006 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
1007 .mem_layout =
"scalar",
1008 .buf_content =
"int16_t quant_table[MAX_QUANT_TABLES]"
1009 "[MAX_CONTEXT_INPUTS][MAX_QUANT_TABLE_SIZE];",
1018 .
name =
"slice_data_buf",
1019 .type = VK_DESCRIPTOR_TYPE_STORAGE_BUFFER,
1020 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
1021 .buf_content =
"SliceContext slice_ctx[1024];",
1025 .type = VK_DESCRIPTOR_TYPE_STORAGE_IMAGE,
1030 .mem_quali =
"readonly",
1031 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
1060 void *spv_opaque =
NULL;
1061 int wg_dim =
FFMIN(fv->
s.
props.properties.limits.maxComputeWorkGroupSize[0], 1024);
1064 VK_SHADER_STAGE_COMPUTE_BIT,
1065 (
const char *[]) {
"GL_EXT_buffer_reference",
1066 "GL_EXT_buffer_reference2" }, 2,
1073 GLSLC(0,
layout(push_constant, scalar) uniform pushConstants { );
1074 GLSLC(1, u8buf slice_state; );
1075 GLSLC(1, uint plane_state_size; );
1076 GLSLC(1, uint context_count; );
1077 GLSLC(1, uint8_t codec_planes; );
1078 GLSLC(1, uint8_t key_frame; );
1080 GLSLC(1, uint8_t micro_version; );
1081 GLSLC(1, uint8_t padding[1]; );
1084 VK_SHADER_STAGE_COMPUTE_BIT);
1092 .
name =
"rangecoder_static_buf",
1093 .type = VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER,
1094 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
1095 .mem_layout =
"scalar",
1096 .buf_content =
"uint8_t zero_one_state[512];",
1099 .name =
"quant_buf",
1100 .type = VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER,
1101 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
1102 .mem_layout =
"scalar",
1103 .buf_content =
"int16_t quant_table[MAX_QUANT_TABLES]"
1104 "[MAX_CONTEXT_INPUTS][MAX_QUANT_TABLE_SIZE];",
1113 .
name =
"slice_data_buf",
1114 .type = VK_DESCRIPTOR_TYPE_STORAGE_BUFFER,
1115 .mem_quali =
"readonly",
1116 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
1117 .buf_content =
"SliceContext slice_ctx[1024];",
1146 void *spv_opaque =
NULL;
1147 int wg_count = sqrt(fv->
s.
props.properties.limits.maxComputeWorkGroupInvocations);
1152 "pixel format for RCT buffer!\n");
1159 VK_SHADER_STAGE_COMPUTE_BIT,
1160 (
const char *[]) {
"GL_EXT_buffer_reference",
1161 "GL_EXT_buffer_reference2" }, 2,
1162 wg_count, wg_count, 1,
1168 GLSLC(0,
layout(push_constant, scalar) uniform pushConstants { );
1169 GLSLC(1, ivec4 fmt_lut; );
1172 GLSLC(1, uint8_t planar_rgb; );
1173 GLSLC(1, uint8_t color_planes; );
1174 GLSLC(1, uint8_t transparency; );
1176 GLSLC(1, uint8_t micro_version; );
1177 GLSLC(1, uint8_t padding[2]; );
1180 VK_SHADER_STAGE_COMPUTE_BIT);
1188 .
name =
"rangecoder_static_buf",
1189 .type = VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER,
1190 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
1191 .mem_layout =
"scalar",
1192 .buf_content =
"uint8_t zero_one_state[512];",
1195 .name =
"quant_buf",
1196 .type = VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER,
1197 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
1198 .mem_layout =
"scalar",
1199 .buf_content =
"int16_t quant_table[MAX_QUANT_TABLES]"
1200 "[MAX_CONTEXT_INPUTS][MAX_QUANT_TABLE_SIZE];",
1209 .
name =
"slice_data_buf",
1210 .type = VK_DESCRIPTOR_TYPE_STORAGE_BUFFER,
1211 .mem_quali =
"readonly",
1212 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
1213 .buf_content =
"SliceContext slice_ctx[1024];",
1217 .type = VK_DESCRIPTOR_TYPE_STORAGE_IMAGE,
1222 .mem_quali =
"readonly",
1223 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
1227 .type = VK_DESCRIPTOR_TYPE_STORAGE_IMAGE,
1232 .mem_quali =
"writeonly",
1233 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
1267 void *spv_opaque =
NULL;
1270 VK_SHADER_STAGE_COMPUTE_BIT,
1271 (
const char *[]) {
"GL_EXT_buffer_reference",
1272 "GL_EXT_buffer_reference2" }, 2,
1287 .
name =
"rangecoder_static_buf",
1288 .type = VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER,
1289 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
1290 .mem_layout =
"scalar",
1291 .buf_content =
"uint8_t zero_one_state[512];",
1294 .name =
"quant_buf",
1295 .type = VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER,
1296 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
1297 .mem_layout =
"scalar",
1298 .buf_content =
"int16_t quant_table[MAX_QUANT_TABLES]"
1299 "[MAX_CONTEXT_INPUTS][MAX_QUANT_TABLE_SIZE];",
1302 .name =
"crc_ieee_buf",
1303 .type = VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER,
1304 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
1305 .mem_layout =
"scalar",
1306 .buf_content =
"uint32_t crc_ieee[256];",
1316 .
name =
"slice_data_buf",
1317 .type = VK_DESCRIPTOR_TYPE_STORAGE_BUFFER,
1318 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
1319 .buf_content =
"SliceContext slice_ctx[1024];",
1323 .type = VK_DESCRIPTOR_TYPE_STORAGE_IMAGE,
1328 .mem_quali =
"readonly",
1329 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
1332 .name =
"results_data_buf",
1333 .type = VK_DESCRIPTOR_TYPE_STORAGE_BUFFER,
1334 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
1335 .mem_quali =
"writeonly",
1336 .buf_content =
"uint64_t slice_results[2048];",
1370 size_t maxsize, max_heap_size, max_host_size;
1393 if (
f->bits_per_raw_sample > (
f->version > 3 ? 16 : 8)) {
1396 "forcing range coder\n");
1401 if (
f->version < 4 && avctx->
gop_size > 1) {
1412 if (
f->version == 4 &&
f->micro_version > 4)
1413 f->micro_version = 3;
1441 f->num_h_slices = w_sl;
1442 f->num_v_slices = h_sl;
1450 if (
f->num_h_slices <= 0 &&
f->num_v_slices <= 0) {
1456 f->num_h_slices = 32;
1457 f->num_v_slices = 32;
1459 }
else if (
f->num_h_slices &&
f->num_v_slices <= 0) {
1460 f->num_v_slices = 1024 /
f->num_h_slices;
1461 }
else if (
f->num_v_slices &&
f->num_h_slices <= 0) {
1462 f->num_h_slices = 1024 /
f->num_v_slices;
1465 f->num_h_slices =
FFMIN(
f->num_h_slices, avctx->
width);
1468 if (
f->num_h_slices *
f->num_v_slices > 1024) {
1470 "by the standard is 1024\n",
1471 f->num_h_slices *
f->num_v_slices);
1479 if (
f->version < 4) {
1480 if (((
f->chroma_h_shift > 0) && (avctx->
width % (64 <<
f->chroma_h_shift))) ||
1481 ((
f->chroma_v_shift > 0) && (avctx->
height % (64 <<
f->chroma_v_shift)))) {
1483 "dimensions is only supported in version 4 (-level 4)\n");
1489 if (
f->version < 4) {
1512 for (
int i = 0;
i < fv->
s.
mprops.memoryHeapCount;
i++) {
1513 if (fv->
s.
mprops.memoryHeaps[
i].flags & VK_MEMORY_HEAP_DEVICE_LOCAL_BIT)
1516 if (!(fv->
s.
mprops.memoryHeaps[
i].flags & VK_MEMORY_HEAP_DEVICE_LOCAL_BIT))
1517 max_host_size =
FFMAX(max_host_size,
1523 if (maxsize > fv->
s.
props_11.maxMemoryAllocationSize) {
1525 "than maximum device allocation (%zu), clipping\n",
1526 maxsize, fv->
s.
props_11.maxMemoryAllocationSize);
1527 maxsize = fv->
s.
props_11.maxMemoryAllocationSize;
1530 if (max_heap_size < maxsize) {
1532 "using host memory (slower)\n",
1536 max_heap_size = max_host_size - (max_host_size >> 1);
1539 max_heap_size = max_heap_size - (max_heap_size >> 3);
1542 av_log(avctx,
AV_LOG_INFO,
"Async buffers: %zuMiB per context, %zuMiB total, depth: %i\n",
1543 maxsize / (1024*1024),
1565 spv = ff_vk_spirv_init();
1578 if (!fv->
is_rgb &&
f->bits_per_raw_sample > 8)
1636 &fv->
setup, 0, 0, 0,
1639 VK_FORMAT_UNDEFINED));
1646 VK_FORMAT_UNDEFINED));
1651 VK_FORMAT_UNDEFINED));
1656 VK_FORMAT_UNDEFINED));
1671 f->max_slice_count =
f->num_h_slices *
f->num_v_slices;
1724 #define OFFSET(x) offsetof(VulkanEncodeFFv1Context, x)
1725 #define VE AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_ENCODING_PARAM
1728 { .i64 = -1 }, -1, 1,
VE },
1730 { .i64 = 0 }, 0, 1,
VE },
1740 { .i64 = -1 }, -1, 2,
VE , .unit =
"qtable"},
1744 { .i64 =
QTABLE_8BIT }, INT_MIN, INT_MAX,
VE, .unit =
"qtable" },
1749 { .i64 = -1 }, -1, 1024,
VE },
1751 { .i64 = -1 }, -1, 1024,
VE },
1754 { .i64 = 0 }, 0, 1,
VE },
1757 { .i64 = 1 }, 1, INT_MAX,
VE },
1780 .
p.
name =
"ffv1_vulkan",
1798 .p.wrapper_name =
"vulkan",