Re: [RESEND PATCH v2 07/15] ASoC: qcom: q6asm: Add support to memory map and unmap
From: Bjorn Andersson
Date: Tue Jan 02 2018 - 00:49:08 EST
On Thu 14 Dec 09:33 PST 2017, srinivas.kandagatla@xxxxxxxxxx wrote:
> From: Srinivas Kandagatla <srinivas.kandagatla@xxxxxxxxxx>
>
> This patch adds support to memory map and unmap regions commands in
> q6asm module.
>
> Signed-off-by: Srinivas Kandagatla <srinivas.kandagatla@xxxxxxxxxx>
> ---
> sound/soc/qcom/qdsp6/q6asm.c | 343 ++++++++++++++++++++++++++++++++++++++++++-
> sound/soc/qcom/qdsp6/q6asm.h | 5 +
> 2 files changed, 347 insertions(+), 1 deletion(-)
>
> diff --git a/sound/soc/qcom/qdsp6/q6asm.c b/sound/soc/qcom/qdsp6/q6asm.c
> index 9cc583afef4d..4be92441f524 100644
> --- a/sound/soc/qcom/qdsp6/q6asm.c
> +++ b/sound/soc/qcom/qdsp6/q6asm.c
> @@ -14,9 +14,46 @@
> #include "q6asm.h"
> #include "common.h"
>
> +#define ASM_CMD_SHARED_MEM_MAP_REGIONS 0x00010D92
> +#define ASM_CMDRSP_SHARED_MEM_MAP_REGIONS 0x00010D93
> +#define ASM_CMD_SHARED_MEM_UNMAP_REGIONS 0x00010D94
> +
> #define TUN_READ_IO_MODE 0x0004 /* tunnel read write mode */
> #define SYNC_IO_MODE 0x0001
> #define ASYNC_IO_MODE 0x0002
> +#define ASM_SHIFT_GAPLESS_MODE_FLAG 31
> +#define ADSP_MEMORY_MAP_SHMEM8_4K_POOL 3
> +
> +struct avs_cmd_shared_mem_map_regions {
> + struct apr_hdr hdr;
> + u16 mem_pool_id;
> + u16 num_regions;
> + u32 property_flag;
> +} __packed;
> +
> +struct avs_shared_map_region_payload {
> + u32 shm_addr_lsw;
> + u32 shm_addr_msw;
> + u32 mem_size_bytes;
> +} __packed;
> +
> +struct avs_cmd_shared_mem_unmap_regions {
> + struct apr_hdr hdr;
> + u32 mem_map_handle;
> +} __packed;
> +
> +struct audio_buffer {
> + dma_addr_t phys;
> + uint32_t used;
> + uint32_t size; /* size of buffer */
> +};
> +
> +struct audio_port_data {
> + struct audio_buffer *buf;
> + uint32_t max_buf_cnt;
This seems to denote the number of audio_buffers in the buf array, so
I'm not sure about the meaning of "max_".
> + uint32_t dsp_buf;
> + uint32_t mem_map_handle;
> +};
>
> struct audio_client {
> int session;
> @@ -27,6 +64,8 @@ struct audio_client {
> uint64_t time_stamp;
> struct apr_device *adev;
> struct mutex cmd_lock;
> + /* idx:1 out port, 0: in port */
> + struct audio_port_data port[2];
> wait_queue_head_t cmd_wait;
> int perf_mode;
> int stream_id;
> @@ -86,6 +125,260 @@ static void q6asm_session_free(struct audio_client *ac)
> mutex_unlock(&a->session_lock);
> }
>
> +static inline void q6asm_add_mmaphdr(struct audio_client *ac,
> + struct apr_hdr *hdr, u32 pkt_size,
> + bool cmd_flg, u32 token)
cmd_flg is true in both callers, so this function ends up simply
assigning hdr_field, pkt_size and token. Inlining these assignments
would make for cleaner call sites as well.
> +{
> + hdr->hdr_field = APR_SEQ_CMD_HDR_FIELD;
> + hdr->src_port = 0;
> + hdr->dest_port = 0;
> + hdr->pkt_size = pkt_size;
> + if (cmd_flg)
> + hdr->token = token;
> +}
> +
> +static inline void q6asm_add_hdr(struct audio_client *ac, struct apr_hdr *hdr,
This is unused.
> + uint32_t pkt_size, bool cmd_flg,
> + uint32_t stream_id)
> +{
> + hdr->hdr_field = APR_SEQ_CMD_HDR_FIELD;
> + hdr->src_svc = ac->adev->svc_id;
> + hdr->src_domain = APR_DOMAIN_APPS;
> + hdr->dest_svc = APR_SVC_ASM;
> + hdr->dest_domain = APR_DOMAIN_ADSP;
> + hdr->src_port = ((ac->session << 8) & 0xFF00) | (stream_id);
> + hdr->dest_port = ((ac->session << 8) & 0xFF00) | (stream_id);
> + hdr->pkt_size = pkt_size;
> + if (cmd_flg)
> + hdr->token = ac->session;
> +}
> +
> +static int __q6asm_memory_unmap(struct audio_client *ac,
> + phys_addr_t buf_add, int dir)
> +{
> + struct avs_cmd_shared_mem_unmap_regions mem_unmap;
If you name this "cmd" you will declutter below code a bit.
> + struct q6asm *a = dev_get_drvdata(ac->dev->parent);
> + int rc;
> +
> + if (!a)
> + return -ENODEV;
Does this NULL check add any real value?
> +
> + q6asm_add_mmaphdr(ac, &mem_unmap.hdr, sizeof(mem_unmap), true,
> + ((ac->session << 8) | dir));
> + a->mem_state = -1;
> +
> + mem_unmap.hdr.opcode = ASM_CMD_SHARED_MEM_UNMAP_REGIONS;
> + mem_unmap.mem_map_handle = ac->port[dir].mem_map_handle;
> +
> + if (mem_unmap.mem_map_handle == 0) {
Start the function by checking for !ac->port[dir].mem_map_handle
> + dev_err(ac->dev, "invalid mem handle\n");
> + return -EINVAL;
> + }
> +
> + rc = apr_send_pkt(a->adev, (uint32_t *) &mem_unmap);
> + if (rc < 0)
> + return rc;
> +
> + rc = wait_event_timeout(a->mem_wait, (a->mem_state >= 0),
> + 5 * HZ);
> + if (!rc) {
> + dev_err(ac->dev, "CMD timeout for memory_unmap 0x%x\n",
> + mem_unmap.mem_map_handle);
> + return -ETIMEDOUT;
> + } else if (a->mem_state > 0) {
> + return adsp_err_get_lnx_err_code(a->mem_state);
> + }
> + ac->port[dir].mem_map_handle = 0;
Does all errors indicate that the region is left mapped?
> +
> + return 0;
> +}
> +
> +/**
> + * q6asm_unmap_memory_regions() - unmap memory regions in the dsp.
> + *
> + * @dir: direction of audio stream
> + * @ac: audio client instanace
> + *
> + * Return: Will be an negative value on failure or zero on success
> + */
> +int q6asm_unmap_memory_regions(unsigned int dir, struct audio_client *ac)
> +{
> + struct audio_port_data *port;
> + int cnt = 0;
> + int rc = 0;
> +
> + mutex_lock(&ac->cmd_lock);
> + port = &ac->port[dir];
> + if (!port->buf) {
> + mutex_unlock(&ac->cmd_lock);
> + return 0;
Put a label right before the mutex_unlock below and return rc instead of
0, then you can replace these two lines with "goto unlock"
> + }
> + cnt = port->max_buf_cnt - 1;
What if we mapped 1 period? Why shouldn't we enter the unmap path?
> + if (cnt >= 0) {
> + rc = __q6asm_memory_unmap(ac, port->buf[dir].phys, dir);
> + if (rc < 0) {
> + dev_err(ac->dev, "%s: Memory_unmap_regions failed %d\n",
> + __func__, rc);
Most of the code paths through __q6asm_memory_unmap() will print an
error, make this consistent and print the warning once.
> + mutex_unlock(&ac->cmd_lock);
> + return rc;
Same here.
> + }
> + }
> +
> + port->max_buf_cnt = 0;
> + kfree(port->buf);
> + port->buf = NULL;
> + mutex_unlock(&ac->cmd_lock);
I think however that if you rearrange this function somewhat you can
start off by doing:
mutex_lock(&ac->cmd_lock);
port = &ac->port[dir];
bufs = port->buf;
cnt = port->max_buf_cnt;
port->max_buf_cnt = 0;
port->buf = NULL;
mutex_unlock(&ac->cmd_lock);
And then you can do the rest without locks.
> +
> + return 0;
> +}
> +EXPORT_SYMBOL_GPL(q6asm_unmap_memory_regions);
> +
> +static int __q6asm_memory_map_regions(struct audio_client *ac, int dir,
> + uint32_t period_sz, uint32_t periods,
period_sz is typical size_t material.
> + bool is_contiguous)
> +{
> + struct avs_cmd_shared_mem_map_regions *mmap_regions = NULL;
Calling this "cmd" would declutter the function.
> + struct avs_shared_map_region_payload *mregions = NULL;
> + struct q6asm *a = dev_get_drvdata(ac->dev->parent);
> + struct audio_port_data *port = NULL;
> + struct audio_buffer *ab = NULL;
> + void *mmap_region_cmd = NULL;
No need to initialize this.
Also, this really is a avs_cmd_shared_mem_map_regions with some extra
data at the end, not a void *.
> + void *payload = NULL;
> + int rc = 0;
> + int i = 0;
> + int cmd_size = 0;
Most of these can be left uninitialized.
> + uint32_t num_regions;
> + uint32_t buf_sz;
> +
> + if (!a)
> + return -ENODEV;
> + num_regions = is_contiguous ? 1 : periods;
> + buf_sz = is_contiguous ? (period_sz * periods) : period_sz;
> + buf_sz = PAGE_ALIGN(buf_sz);
> +
> + cmd_size = sizeof(*mmap_regions) + (sizeof(*mregions) * num_regions);
> +
> + mmap_region_cmd = kzalloc(cmd_size, GFP_KERNEL);
> + if (!mmap_region_cmd)
> + return -ENOMEM;
> +
> + mmap_regions = (struct avs_cmd_shared_mem_map_regions *)mmap_region_cmd;
> + q6asm_add_mmaphdr(ac, &mmap_regions->hdr, cmd_size, true,
> + ((ac->session << 8) | dir));
> + a->mem_state = -1;
> +
> + mmap_regions->hdr.opcode = ASM_CMD_SHARED_MEM_MAP_REGIONS;
> + mmap_regions->mem_pool_id = ADSP_MEMORY_MAP_SHMEM8_4K_POOL;
> + mmap_regions->num_regions = num_regions;
> + mmap_regions->property_flag = 0x00;
> +
> + payload = ((u8 *) mmap_region_cmd +
> + sizeof(struct avs_cmd_shared_mem_map_regions));
mmap_region_cmd is void *, so no need to type cast.
> +
> + mregions = (struct avs_shared_map_region_payload *)payload;
Payload is void *, so no need to type cast. But there's also no benefit
of having "payload", as this line can be written as:
mregions = mmap_region_cmd + sizeof(*mmap_regions);
But adding a flexible array member to the avs_cmd_shared_mem_map_regions
struct would make things even clearer, in particular you would be able
to read the struct definition and see that there's a payload following
the command.
> +
> + ac->port[dir].mem_map_handle = 0;
Isn't this already 0?
> + port = &ac->port[dir];
> +
> + for (i = 0; i < num_regions; i++) {
> + ab = &port->buf[i];
> + mregions->shm_addr_lsw = lower_32_bits(ab->phys);
> + mregions->shm_addr_msw = upper_32_bits(ab->phys);
> + mregions->mem_size_bytes = buf_sz;
Here you're dereferencing port->buf without holding cmd_lock.
> + ++mregions;
> + }
> +
> + rc = apr_send_pkt(a->adev, (uint32_t *) mmap_region_cmd);
> + if (rc < 0)
> + goto fail_cmd;
> +
> + rc = wait_event_timeout(a->mem_wait, (a->mem_state >= 0),
> + 5 * HZ);
> + if (!rc) {
> + dev_err(ac->dev, "timeout. waited for memory_map\n");
> + rc = -ETIMEDOUT;
> + goto fail_cmd;
> + }
> +
> + if (a->mem_state > 0) {
> + rc = adsp_err_get_lnx_err_code(a->mem_state);
> + goto fail_cmd;
> + }
> + rc = 0;
> +fail_cmd:
> + kfree(mmap_region_cmd);
> + return rc;
> +}
> +
> +/**
> + * q6asm_map_memory_regions() - map memory regions in the dsp.
> + *
> + * @dir: direction of audio stream
This sounds boolean, perhaps worth mentioning here if true means rx or
tx.
And it's idiomatic to have such a parameter later in the list, it would
probably be more natural to read the call sight if the order was:
q6asm_map_memory_regions(ac, phys, periods, size, true);
> + * @ac: audio client instanace
> + * @phys: physcial address that needs mapping.
> + * @period_sz: audio period size
> + * @periods: number of periods
> + *
> + * Return: Will be an negative value on failure or zero on success
> + */
> +int q6asm_map_memory_regions(unsigned int dir, struct audio_client *ac,
> + dma_addr_t phys,
> + unsigned int period_sz, unsigned int periods)
period_sz could with benefit be of type size_t.
> +{
> + struct audio_buffer *buf;
> + int cnt;
> + int rc;
> +
> + if (ac->port[dir].buf) {
> + dev_err(ac->dev, "Buffer already allocated\n");
> + return 0;
> + }
> +
> + mutex_lock(&ac->cmd_lock);
I believe this lock should cover above check.
> +
> + buf = kzalloc(((sizeof(struct audio_buffer)) * periods), GFP_KERNEL);
Loose a few of those parenthesis and use *buf in the sizeof.
> + if (!buf) {
> + mutex_unlock(&ac->cmd_lock);
> + return -ENOMEM;
> + }
> +
> +
> + ac->port[dir].buf = buf;
> +
> + buf[0].phys = phys;
> + buf[0].used = dir ^ 1;
Why would this be called "used", and it's probably cleaner to just use
!!dir.
> + buf[0].size = period_sz;
> + cnt = 1;
> + while (cnt < periods) {
cnt goes from 1 to periods and is incremented 1 each step, this would be
more succinct as a for loop.
> + if (period_sz > 0) {
> + buf[cnt].phys = buf[0].phys + (cnt * period_sz);
> + buf[cnt].used = dir ^ 1;
> + buf[cnt].size = period_sz;
> + }
> + cnt++;
> + }
> +
> + ac->port[dir].max_buf_cnt = periods;
> + mutex_unlock(&ac->cmd_lock);
The only possible purpose of taking cmd_lock here is to protect
ac->port[dir].buf, but
> +
> + rc = __q6asm_memory_map_regions(ac, dir, period_sz, periods, 1);
The last parameter should be "true".
> + if (rc < 0) {
> + dev_err(ac->dev,
> + "CMD Memory_map_regions failed %d for size %d\n", rc,
> + period_sz);
> +
> +
> + ac->port[dir].max_buf_cnt = 0;
> + kfree(buf);
> + ac->port[dir].buf = NULL;
These operations are done without holding cmd_lock.
> +
> + return rc;
> + }
> +
> + return 0;
> +}
> +EXPORT_SYMBOL_GPL(q6asm_map_memory_regions);
> +
> /**
> * q6asm_audio_client_free() - Freee allocated audio client
> *
> @@ -117,8 +410,10 @@ static struct audio_client *q6asm_get_audio_client(struct q6asm *a,
>
> static int q6asm_srvc_callback(struct apr_device *adev, struct apr_client_data *data)
> {
> - struct q6asm *q6asm = dev_get_drvdata(&adev->dev);
> + struct q6asm *a, *q6asm = dev_get_drvdata(&adev->dev);
> struct audio_client *ac = NULL;
> + struct audio_port_data *port;
> + uint32_t dir = 0;
> uint32_t sid = 0;
> uint32_t *payload;
>
> @@ -135,6 +430,52 @@ static int q6asm_srvc_callback(struct apr_device *adev, struct apr_client_data *
> return 0;
> }
>
> + a = dev_get_drvdata(ac->dev->parent);
> + if (data->opcode == APR_BASIC_RSP_RESULT) {
This is a case in below switch statement.
> + switch (payload[0]) {
> + case ASM_CMD_SHARED_MEM_MAP_REGIONS:
> + case ASM_CMD_SHARED_MEM_UNMAP_REGIONS:
> + if (payload[1] != 0) {
> + dev_err(ac->dev,
> + "cmd = 0x%x returned error = 0x%x sid:%d\n",
> + payload[0], payload[1], sid);
> + a->mem_state = payload[1];
> + } else {
> + a->mem_state = 0;
Just assign a->mem_state = payload[1] outside the conditional, as it
will be the same value.
> + }
> +
> + wake_up(&a->mem_wait);
> + break;
> + default:
> + dev_err(&adev->dev, "command[0x%x] not expecting rsp\n",
> + payload[0]);
> + break;
> + }
> + return 0;
> + }
Regards,
Bjorn