On Thu, Apr 28, 2022 at 05:18:13PM +0200, Thierry Reding wrote:
On Tue, Apr 26, 2022 at 02:07:59PM +0800, Cai Huoqing wrote: [...]
diff --git a/drivers/gpu/drm/nvdla/nvdla_drv.c b/drivers/gpu/drm/nvdla/nvdla_drv.c
I'll look at this from an architectural level and leave it to other experts to review the more technical things.
[...]
+static struct nvdla_config nvdla_config_os_initial = {
+	.atom_size = 32,
+	.bdma_enable = true,
+	.rubik_enable = true,
+	.weight_compress_support = true,
+};
+static struct nvdla_config nvdla_config_small = {
+	//.atom_size = 8,
+	.atom_size = 32, // nv_large config
+	.bdma_enable = false,
+	.rubik_enable = false,
+	.weight_compress_support = false,
+};
[...]
+static union nvdla_operation_container operation_desc[NVDLA_OP_NUM][NVDLA_NUM_GROUPS];
+static union nvdla_surface_container surface_desc[NVDLA_OP_NUM][NVDLA_NUM_GROUPS];
+static struct nvdla_task_desc global_task;
+static struct nvdla_engine engine = {
- .processors[NVDLA_OP_BDMA] = {
.name = "BDMA",.op_type = NVDLA_OP_BDMA,.program = nvdla_bdma_program,.enable = nvdla_bdma_enable,.set_producer = nvdla_bdma_set_producer,.is_ready = nvdla_bdma_is_ready,.dump_config = nvdla_bdma_dump_config,.rdma_check = nvdla_bdma_rdma_check,.consumer_ptr = 0,.roi_index = 0,.group_status = 0,.rdma_status = 0,.last_group = 1,.groups[0] = {.id = 0,.rdma_id = 0,.active = 0,.events = 0,.roi_index = 0,.is_rdma_needed = 0,.lut_index = -1,.operation_desc = &operation_desc[NVDLA_OP_BDMA][0],.surface_desc = &surface_desc[NVDLA_OP_BDMA][0],},.groups[1] = {.id = 1,.rdma_id = 0,.active = 0,.events = 0,.roi_index = 0,.is_rdma_needed = 0,.lut_index = -1,.operation_desc = &operation_desc[NVDLA_OP_BDMA][1],.surface_desc = &surface_desc[NVDLA_OP_BDMA][1],},- },
- .processors[NVDLA_OP_CONV] = {
.name = "Convolution",.op_type = NVDLA_OP_CONV,.program = nvdla_conv_program,.enable = nvdla_conv_enable,.set_producer = nvdla_conv_set_producer,.is_ready = nvdla_conv_is_ready,.dump_config = nvdla_conv_dump_config,.rdma_check = nvdla_conv_rdma_check,.consumer_ptr = 0,.roi_index = 0,.group_status = 0,.rdma_status = 0,.last_group = 1,.groups[0] = {.id = 0,.rdma_id = 0,.active = 0,.events = 0,.roi_index = 0,.is_rdma_needed = 0,.lut_index = -1,.operation_desc = &operation_desc[NVDLA_OP_CONV][0],.surface_desc = &surface_desc[NVDLA_OP_CONV][0],},.groups[1] = {.id = 1,.rdma_id = 0,.active = 0,.events = 0,.roi_index = 0,.is_rdma_needed = 0,.lut_index = -1,.operation_desc = &operation_desc[NVDLA_OP_CONV][1],.surface_desc = &surface_desc[NVDLA_OP_CONV][1],},- },
- .processors[NVDLA_OP_SDP] = {
.name = "SDP",.op_type = NVDLA_OP_SDP,.program = nvdla_sdp_program,.enable = nvdla_sdp_enable,.set_producer = nvdla_sdp_set_producer,.is_ready = nvdla_sdp_is_ready,.dump_config = nvdla_sdp_dump_config,.rdma_check = nvdla_sdp_rdma_check,.consumer_ptr = 0,.roi_index = 0,.group_status = 0,.rdma_status = 0,.last_group = 1,.groups[0] = {.id = 0,.rdma_id = 0,.active = 0,.events = 0,.roi_index = 0,.is_rdma_needed = 0,.lut_index = -1,.operation_desc = &operation_desc[NVDLA_OP_SDP][0],.surface_desc = &surface_desc[NVDLA_OP_SDP][0],},.groups[1] = {.id = 1,.rdma_id = 0,.active = 0,.events = 0,.roi_index = 0,.is_rdma_needed = 0,.lut_index = -1,.operation_desc = &operation_desc[NVDLA_OP_SDP][1],.surface_desc = &surface_desc[NVDLA_OP_SDP][1],},- },
- .processors[NVDLA_OP_PDP] = {
.name = "PDP",.op_type = NVDLA_OP_PDP,.program = nvdla_pdp_program,.enable = nvdla_pdp_enable,.set_producer = nvdla_pdp_set_producer,.is_ready = nvdla_pdp_is_ready,.dump_config = nvdla_pdp_dump_config,.rdma_check = nvdla_pdp_rdma_check,.consumer_ptr = 0,.roi_index = 0,.group_status = 0,.rdma_status = 0,.last_group = 1,.groups[0] = {.id = 0,.rdma_id = 0,.active = 0,.events = 0,.roi_index = 0,.is_rdma_needed = 0,.lut_index = -1,.operation_desc = &operation_desc[NVDLA_OP_PDP][0],.surface_desc = &surface_desc[NVDLA_OP_PDP][0],},.groups[1] = {.id = 1,.rdma_id = 0,.active = 0,.events = 0,.roi_index = 0,.is_rdma_needed = 0,.lut_index = -1,.operation_desc = &operation_desc[NVDLA_OP_PDP][1],.surface_desc = &surface_desc[NVDLA_OP_PDP][1],},- },
- .processors[NVDLA_OP_CDP] = {
.name = "CDP",.op_type = NVDLA_OP_CDP,.program = nvdla_cdp_program,.enable = nvdla_cdp_enable,.set_producer = nvdla_cdp_set_producer,.is_ready = nvdla_cdp_is_ready,.dump_config = nvdla_cdp_dump_config,.rdma_check = nvdla_cdp_rdma_check,.consumer_ptr = 0,.roi_index = 0,.group_status = 0,.rdma_status = 0,.last_group = 1,.groups[0] = {.id = 0,.rdma_id = 0,.active = 0,.events = 0,.roi_index = 0,.is_rdma_needed = 0,.lut_index = -1,.operation_desc = &operation_desc[NVDLA_OP_CDP][0],.surface_desc = &surface_desc[NVDLA_OP_CDP][0],},.groups[1] = {.id = 1,.rdma_id = 0,.active = 0,.events = 0,.roi_index = 0,.is_rdma_needed = 0,.lut_index = -1,.operation_desc = &operation_desc[NVDLA_OP_CDP][1],.surface_desc = &surface_desc[NVDLA_OP_CDP][1],},- },
- .processors[NVDLA_OP_RUBIK] = {
.name = "RUBIK",.op_type = NVDLA_OP_RUBIK,.program = nvdla_rubik_program,.enable = nvdla_rubik_enable,.set_producer = nvdla_rubik_set_producer,.is_ready = nvdla_rubik_is_ready,.dump_config = nvdla_rubik_dump_config,.rdma_check = nvdla_rubik_rdma_check,.consumer_ptr = 0,.roi_index = 0,.group_status = 0,.rdma_status = 0,.last_group = 1,.groups[0] = {.id = 0,.rdma_id = 0,.active = 0,.events = 0,.roi_index = 0,.is_rdma_needed = 0,.lut_index = -1,.operation_desc = &operation_desc[NVDLA_OP_RUBIK][0],.surface_desc = &surface_desc[NVDLA_OP_RUBIK][0],},.groups[1] = {.id = 1,.rdma_id = 0,.active = 0,.events = 0,.roi_index = 0,.is_rdma_needed = 0,.lut_index = -1,.operation_desc = &operation_desc[NVDLA_OP_RUBIK][1],.surface_desc = &surface_desc[NVDLA_OP_RUBIK][1],},- },
+};
These global variables aren't going to work because Tegra234 (Tegra194's successor) has two instances of NVDLA, and each instance needs its own copy of this state rather than sharing a single file-scope one.
Small correction: I just recalled that even Tegra194 has two DLA instances, so if we want both supported we'll need to get rid of those global variables for that chip already.
Thierry