From: Kieran Bingham <kieran.bingham+rene...@ideasonboard.com>

We are now able to configure a pipeline directly into a local display
list body. Take advantage of this fact, and create a cacheable body to
store the configuration of the pipeline in the video object.

vsp1_video_pipeline_run() is now the last user of the pipe->dl object.
Convert this function to use the cached video->config body and obtain a
local display list reference.

Attach the video->stream_config body to the display list when needed
before committing to hardware.

Use a flag 'configured' to know when we should attach our stream_config
to the next outgoing display list to reconfigure the hardware in the
event of our first frame, or the first frame following a suspend/resume
cycle.

Our video DL usage now looks like the below output:

dl->body0 contains our disposable runtime configuration. Max 41.
dl_child->body0 is our partition specific configuration. Max 12.
dl->bodies shows our constant configuration and LUTs.

  These two are LUT/CLU:
     * dl->bodies[x]->num_entries 256 / max 256
     * dl->bodies[x]->num_entries 4914 / max 4914

Which shows that our 'constant' configuration cache is currently
utilised to a maximum of 64 entries.

trace-cmd report | \
    grep max | sed 's/.*vsp1_dl_list_commit://g' | sort | uniq;

  dl->body0->num_entries 13 / max 128
  dl->body0->num_entries 14 / max 128
  dl->body0->num_entries 16 / max 128
  dl->body0->num_entries 20 / max 128
  dl->body0->num_entries 27 / max 128
  dl->body0->num_entries 34 / max 128
  dl->body0->num_entries 41 / max 128
  dl_child->body0->num_entries 10 / max 128
  dl_child->body0->num_entries 12 / max 128
  dl->bodies[x]->num_entries 15 / max 128
  dl->bodies[x]->num_entries 16 / max 128
  dl->bodies[x]->num_entries 17 / max 128
  dl->bodies[x]->num_entries 18 / max 128
  dl->bodies[x]->num_entries 20 / max 128
  dl->bodies[x]->num_entries 21 / max 128
  dl->bodies[x]->num_entries 256 / max 256
  dl->bodies[x]->num_entries 31 / max 128
  dl->bodies[x]->num_entries 32 / max 128
  dl->bodies[x]->num_entries 39 / max 128
  dl->bodies[x]->num_entries 40 / max 128
  dl->bodies[x]->num_entries 47 / max 128
  dl->bodies[x]->num_entries 48 / max 128
  dl->bodies[x]->num_entries 4914 / max 4914
  dl->bodies[x]->num_entries 55 / max 128
  dl->bodies[x]->num_entries 56 / max 128
  dl->bodies[x]->num_entries 63 / max 128
  dl->bodies[x]->num_entries 64 / max 128

Signed-off-by: Kieran Bingham <kieran.bingham+rene...@ideasonboard.com>
---
v11:
 - Remove dlbs pool from video object.
   Utilise the DLM pool for video->stream_config
 - Improve comments
 - clear the video->stream_config after it is released
   object.
 - stream_config and configured flag return to the pipe object.

v10:
 - Removed pipe->configured flag, and use
   pipe->state == VSP1_PIPELINE_STOPPED instead.

v8:
 - Fix comments
 - Rename video->pipe_config -> video->stream_config

v4:
 - Adjust pipe configured flag to be reset on resume rather than suspend
 - rename dl_child, dl_next

v3:
 - 's/fragment/body/', 's/fragments/bodies/'
 - video dlb cache allocation increased from 2 to 3 dlbs

 drivers/media/platform/vsp1/vsp1_dl.c    | 10 +++-
 drivers/media/platform/vsp1/vsp1_dl.h    |  1 +-
 drivers/media/platform/vsp1/vsp1_pipe.h  |  6 +-
 drivers/media/platform/vsp1/vsp1_video.c | 69 +++++++++++++++----------
 4 files changed, 56 insertions(+), 30 deletions(-)

diff --git a/drivers/media/platform/vsp1/vsp1_dl.c 
b/drivers/media/platform/vsp1/vsp1_dl.c
index c7fa1cb088cd..0f97305de965 100644
--- a/drivers/media/platform/vsp1/vsp1_dl.c
+++ b/drivers/media/platform/vsp1/vsp1_dl.c
@@ -813,6 +813,11 @@ void vsp1_dlm_reset(struct vsp1_dl_manager *dlm)
        dlm->pending = NULL;
 }
 
+struct vsp1_dl_body *vsp1_dlm_dl_body_get(struct vsp1_dl_manager *dlm)
+{
+       return vsp1_dl_body_get(dlm->pool);
+}
+
 struct vsp1_dl_manager *vsp1_dlm_create(struct vsp1_device *vsp1,
                                        unsigned int index,
                                        unsigned int prealloc)
@@ -838,13 +843,14 @@ struct vsp1_dl_manager *vsp1_dlm_create(struct 
vsp1_device *vsp1,
         * Initialize the display list body and allocate DMA memory for the body
         * and the optional header. Both are allocated together to avoid memory
         * fragmentation, with the header located right after the body in
-        * memory.
+        * memory. An extra body is allocated on top of the prealloc to account
+        * for the cached body used by the vsp1_video object.
         */
        header_size = dlm->mode == VSP1_DL_MODE_HEADER
                    ? ALIGN(sizeof(struct vsp1_dl_header), 8)
                    : 0;
 
-       dlm->pool = vsp1_dl_body_pool_create(vsp1, prealloc,
+       dlm->pool = vsp1_dl_body_pool_create(vsp1, prealloc + 1,
                                             VSP1_DL_NUM_ENTRIES, header_size);
        if (!dlm->pool)
                return NULL;
diff --git a/drivers/media/platform/vsp1/vsp1_dl.h 
b/drivers/media/platform/vsp1/vsp1_dl.h
index 216bd23029dd..7dba0469c92e 100644
--- a/drivers/media/platform/vsp1/vsp1_dl.h
+++ b/drivers/media/platform/vsp1/vsp1_dl.h
@@ -28,6 +28,7 @@ struct vsp1_dl_manager *vsp1_dlm_create(struct vsp1_device 
*vsp1,
 void vsp1_dlm_destroy(struct vsp1_dl_manager *dlm);
 void vsp1_dlm_reset(struct vsp1_dl_manager *dlm);
 unsigned int vsp1_dlm_irq_frame_end(struct vsp1_dl_manager *dlm);
+struct vsp1_dl_body *vsp1_dlm_dl_body_get(struct vsp1_dl_manager *dlm);
 
 struct vsp1_dl_list *vsp1_dl_list_get(struct vsp1_dl_manager *dlm);
 void vsp1_dl_list_put(struct vsp1_dl_list *dl);
diff --git a/drivers/media/platform/vsp1/vsp1_pipe.h 
b/drivers/media/platform/vsp1/vsp1_pipe.h
index f1155d20fa2d..743d8f0db45c 100644
--- a/drivers/media/platform/vsp1/vsp1_pipe.h
+++ b/drivers/media/platform/vsp1/vsp1_pipe.h
@@ -102,7 +102,8 @@ struct vsp1_partition {
  * @uds: UDS entity, if present
  * @uds_input: entity at the input of the UDS, if the UDS is present
  * @entities: list of entities in the pipeline
- * @dl: display list associated with the pipeline
+ * @stream_config: cached stream configuration for video pipelines
+ * @configured: when false the @stream_config shall be written to the hardware
  * @partitions: The number of partitions used to process one frame
  * @partition: The current partition for configuration to process
  * @part_table: The pre-calculated partitions used by the pipeline
@@ -139,7 +140,8 @@ struct vsp1_pipeline {
         */
        struct list_head entities;
 
-       struct vsp1_dl_list *dl;
+       struct vsp1_dl_body *stream_config;
+       bool configured;
 
        unsigned int partitions;
        struct vsp1_partition *partition;
diff --git a/drivers/media/platform/vsp1/vsp1_video.c 
b/drivers/media/platform/vsp1/vsp1_video.c
index c46291ff9e6b..81d47a09d7bc 100644
--- a/drivers/media/platform/vsp1/vsp1_video.c
+++ b/drivers/media/platform/vsp1/vsp1_video.c
@@ -392,42 +392,51 @@ static void vsp1_video_pipeline_run(struct vsp1_pipeline 
*pipe)
        struct vsp1_device *vsp1 = pipe->output->entity.vsp1;
        struct vsp1_entity *entity;
        struct vsp1_dl_body *dlb;
+       struct vsp1_dl_list *dl;
        unsigned int partition;
 
-       if (!pipe->dl)
-               pipe->dl = vsp1_dl_list_get(pipe->output->dlm);
+       dl = vsp1_dl_list_get(pipe->output->dlm);
 
-       dlb = vsp1_dl_list_get_body0(pipe->dl);
+       /*
+        * If the VSP hardware isn't configured yet (which occurs either when
+        * processing the first frame or after a system suspend/resume), add the
+        * cached stream configuration to the display list to perform a full
+        * initialisation.
+        */
+       if (!pipe->configured)
+               vsp1_dl_list_add_body(dl, pipe->stream_config);
+
+       dlb = vsp1_dl_list_get_body0(dl);
 
        list_for_each_entry(entity, &pipe->entities, list_pipe)
-               vsp1_entity_configure_frame(entity, pipe, pipe->dl, dlb);
+               vsp1_entity_configure_frame(entity, pipe, dl, dlb);
 
        /* Run the first partition. */
-       vsp1_video_pipeline_run_partition(pipe, pipe->dl, 0);
+       vsp1_video_pipeline_run_partition(pipe, dl, 0);
 
        /* Process consecutive partitions as necessary. */
        for (partition = 1; partition < pipe->partitions; ++partition) {
-               struct vsp1_dl_list *dl;
+               struct vsp1_dl_list *dl_next;
 
-               dl = vsp1_dl_list_get(pipe->output->dlm);
+               dl_next = vsp1_dl_list_get(pipe->output->dlm);
 
                /*
                 * An incomplete chain will still function, but output only
                 * the partitions that had a dl available. The frame end
                 * interrupt will be marked on the last dl in the chain.
                 */
-               if (!dl) {
+               if (!dl_next) {
                        dev_err(vsp1->dev, "Failed to obtain a dl list. Frame 
will be incomplete\n");
                        break;
                }
 
-               vsp1_video_pipeline_run_partition(pipe, dl, partition);
-               vsp1_dl_list_add_chain(pipe->dl, dl);
+               vsp1_video_pipeline_run_partition(pipe, dl_next, partition);
+               vsp1_dl_list_add_chain(dl, dl_next);
        }
 
        /* Complete, and commit the head display list. */
-       vsp1_dl_list_commit(pipe->dl, false);
-       pipe->dl = NULL;
+       vsp1_dl_list_commit(dl, false);
+       pipe->configured = true;
 
        vsp1_pipeline_run(pipe);
 }
@@ -791,7 +800,6 @@ static void vsp1_video_buffer_queue(struct vb2_buffer *vb)
 static int vsp1_video_setup_pipeline(struct vsp1_pipeline *pipe)
 {
        struct vsp1_entity *entity;
-       struct vsp1_dl_body *dlb;
        int ret;
 
        /* Determine this pipelines sizes for image partitioning support. */
@@ -799,14 +807,6 @@ static int vsp1_video_setup_pipeline(struct vsp1_pipeline 
*pipe)
        if (ret < 0)
                return ret;
 
-       /* Prepare the display list. */
-       pipe->dl = vsp1_dl_list_get(pipe->output->dlm);
-       if (!pipe->dl)
-               return -ENOMEM;
-
-       /* Retrieve the default DLB from the list. */
-       dlb = vsp1_dl_list_get_body0(pipe->dl);
-
        if (pipe->uds) {
                struct vsp1_uds *uds = to_uds(&pipe->uds->subdev);
 
@@ -828,9 +828,18 @@ static int vsp1_video_setup_pipeline(struct vsp1_pipeline 
*pipe)
                }
        }
 
+       /*
+        * Compute and cache the stream configuration into a body. The cached
+        * body will be added to the display list by vsp1_video_pipeline_run()
+        * whenever the pipeline needs to be fully reconfigured.
+        */
+       pipe->stream_config = vsp1_dlm_dl_body_get(pipe->output->dlm);
+       if (!pipe->stream_config)
+               return -ENOMEM;
+
        list_for_each_entry(entity, &pipe->entities, list_pipe) {
-               vsp1_entity_route_setup(entity, pipe, dlb);
-               vsp1_entity_configure_stream(entity, pipe, dlb);
+               vsp1_entity_route_setup(entity, pipe, pipe->stream_config);
+               vsp1_entity_configure_stream(entity, pipe, pipe->stream_config);
        }
 
        return 0;
@@ -853,12 +862,14 @@ static void vsp1_video_cleanup_pipeline(struct 
vsp1_pipeline *pipe)
 {
        lockdep_assert_held(&pipe->lock);
 
+       /* Release any cached configuration from our output video. */
+       vsp1_dl_body_put(pipe->stream_config);
+       pipe->stream_config = NULL;
+       pipe->configured = false;
+
        /* Release our partition table allocation */
        kfree(pipe->part_table);
        pipe->part_table = NULL;
-
-       vsp1_dl_list_put(pipe->dl);
-       pipe->dl = NULL;
 }
 
 static int vsp1_video_start_streaming(struct vb2_queue *vq, unsigned int count)
@@ -1232,6 +1243,12 @@ void vsp1_video_resume(struct vsp1_device *vsp1)
                if (pipe == NULL)
                        continue;
 
+               /*
+                * The hardware may have been reset during a suspend and will
+                * need a full reconfiguration.
+                */
+               pipe->configured = false;
+
                spin_lock_irqsave(&pipe->irqlock, flags);
                if (vsp1_pipeline_ready(pipe))
                        vsp1_video_pipeline_run(pipe);
-- 
git-series 0.9.1

Reply via email to