[v2,26/37] ml/cnxk: dequeue a burst of inference requests

Message ID 20221208201806.21893-27-syalavarthi@marvell.com (mailing list archive)
State Superseded, archived
Delegated to: Thomas Monjalon
Series: Implementation of ML CNXK driver

Checks

Context: ci/checkpatch
Check: success
Description: coding style OK

Commit Message

Srikanth Yalavarthi Dec. 8, 2022, 8:17 p.m. UTC
  Enabled driver support to dequeue inference requests from the
internal queue. Dequeue checks for request completion by polling
the status field of the job request.

Signed-off-by: Srikanth Yalavarthi <syalavarthi@marvell.com>
---
 drivers/ml/cnxk/cn10k_ml_ops.c | 61 ++++++++++++++++++++++++++++++++++
 drivers/ml/cnxk/cn10k_ml_ops.h |  2 ++
 2 files changed, 63 insertions(+)
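
The dequeue path added below pairs with the enqueue path from the previous
patch in the series: the application enqueues rte_ml_op objects on a queue
pair and later polls the same queue pair for completions. The following is a
minimal application-side sketch of that polling loop, assuming the rte_mldev
fast-path API (rte_ml_dequeue_burst()) from the companion mldev series;
drain_completions() and BURST_SZ are illustrative names, not part of this
patch.

#include <inttypes.h>
#include <stdio.h>

#include <rte_mldev.h>

#define BURST_SZ 32

/* Illustrative helper: poll a queue pair until all previously enqueued
 * inference ops have been dequeued. Error handling is elided.
 */
static void
drain_completions(int16_t dev_id, uint16_t qp_id, uint16_t pending)
{
	struct rte_ml_op *ops[BURST_SZ];
	uint16_t nb_deq;
	uint16_t i;

	while (pending > 0) {
		/* Only ops whose status polls as finished are returned. */
		nb_deq = rte_ml_dequeue_burst(dev_id, qp_id, ops, BURST_SZ);

		for (i = 0; i < nb_deq; i++) {
			if (ops[i]->status != RTE_ML_OP_STATUS_SUCCESS)
				/* impl_opaque carries the device error code. */
				printf("op failed, error code 0x%" PRIx64 "\n",
				       (uint64_t)ops[i]->impl_opaque);
		}

		pending -= nb_deq;
	}
}

Because the driver stops at the first request whose status has not reached
ML_CN10K_POLL_JOB_FINISH, completions are always handed back in enqueue
order.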
  

Patch

diff --git a/drivers/ml/cnxk/cn10k_ml_ops.c b/drivers/ml/cnxk/cn10k_ml_ops.c
index 6f2d1adac8..83ec064c82 100644
--- a/drivers/ml/cnxk/cn10k_ml_ops.c
+++ b/drivers/ml/cnxk/cn10k_ml_ops.c
@@ -473,6 +473,7 @@  cn10k_ml_dev_configure(struct rte_ml_dev *dev, const struct rte_ml_dev_config *c
 	rte_spinlock_init(&ocm->lock);
 
 	dev->enqueue_burst = cn10k_ml_enqueue_burst;
+	dev->dequeue_burst = cn10k_ml_dequeue_burst;
 
 	mldev->nb_models_loaded = 0;
 	mldev->state = ML_CN10K_DEV_STATE_CONFIGURED;
@@ -1421,6 +1422,23 @@  queue_free_count(uint64_t head, uint64_t tail, uint64_t nb_desc)
 	return nb_desc - queue_pending_count(head, tail, nb_desc) - 1;
 }
 
+static __rte_always_inline void
+cn10k_ml_result_update(struct rte_ml_dev *dev, int qp_id, struct cn10k_ml_result *result,
+		       struct rte_ml_op *op)
+{
+	PLT_SET_USED(dev);
+	PLT_SET_USED(qp_id);
+
+	op->impl_opaque = result->error_code;
+
+	if (likely(result->error_code == 0))
+		op->status = RTE_ML_OP_STATUS_SUCCESS;
+	else
+		op->status = RTE_ML_OP_STATUS_ERROR;
+
+	op->user_ptr = result->user_ptr;
+}
+
 __rte_hot uint16_t
 cn10k_ml_enqueue_burst(struct rte_ml_dev *dev, uint16_t qp_id, struct rte_ml_op **ops,
 		       uint16_t nb_ops)
@@ -1475,6 +1493,49 @@  cn10k_ml_enqueue_burst(struct rte_ml_dev *dev, uint16_t qp_id, struct rte_ml_op
 	return count;
 }
 
+__rte_hot uint16_t
+cn10k_ml_dequeue_burst(struct rte_ml_dev *dev, uint16_t qp_id, struct rte_ml_op **ops,
+		       uint16_t nb_ops)
+{
+	struct cn10k_ml_queue *queue;
+	struct cn10k_ml_req *req;
+	struct cn10k_ml_qp *qp;
+
+	uint64_t status;
+	uint16_t count;
+	uint64_t tail;
+
+	qp = dev->data->queue_pairs[qp_id];
+	queue = &qp->queue;
+
+	tail = queue->tail;
+	nb_ops = PLT_MIN(nb_ops, queue_pending_count(queue->head, tail, qp->nb_desc));
+	count = 0;
+
+	if (unlikely(nb_ops == 0))
+		goto empty_or_active;
+
+dequeue_req:
+	req = &queue->reqs[tail];
+	status = plt_read64(&req->status);
+	if (unlikely(status != ML_CN10K_POLL_JOB_FINISH))
+		goto empty_or_active;
+
+	cn10k_ml_result_update(dev, qp_id, &req->result, req->op);
+	ops[count] = req->op;
+
+	queue_index_advance(&tail, qp->nb_desc);
+	count++;
+
+	if (count < nb_ops)
+		goto dequeue_req;
+
+empty_or_active:
+	queue->tail = tail;
+
+	return count;
+}
+
 struct rte_ml_dev_ops cn10k_ml_ops = {
 	/* Device control ops */
 	.dev_info_get = cn10k_ml_dev_info_get,
diff --git a/drivers/ml/cnxk/cn10k_ml_ops.h b/drivers/ml/cnxk/cn10k_ml_ops.h
index e3f61beeab..3c5342dcc7 100644
--- a/drivers/ml/cnxk/cn10k_ml_ops.h
+++ b/drivers/ml/cnxk/cn10k_ml_ops.h
@@ -73,5 +73,7 @@  int cn10k_ml_model_stop(struct rte_ml_dev *dev, int16_t model_id);
 /* Fast-path ops */
 __rte_hot uint16_t cn10k_ml_enqueue_burst(struct rte_ml_dev *dev, uint16_t qp_id,
 					  struct rte_ml_op **ops, uint16_t nb_ops);
+__rte_hot uint16_t cn10k_ml_dequeue_burst(struct rte_ml_dev *dev, uint16_t qp_id,
+					  struct rte_ml_op **ops, uint16_t nb_ops);
 
 #endif /* _CN10K_ML_OPS_H_ */
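
For reference, the dequeue loop above bounds nb_ops with queue_pending_count()
and advances the tail with queue_index_advance(), both introduced by the
enqueue patch earlier in this series; only queue_free_count() is visible in
the diff context. Below is a standalone sketch of the ring arithmetic those
helpers are assumed to implement; the names match the driver, but the bodies
here are assumptions inferred from how the dequeue loop uses them.

#include <stdint.h>

/* Assumed circular-queue index helpers; one slot is kept unused so that
 * head == tail always means empty and a full ring is still detectable.
 */
static inline uint64_t
queue_pending_count(uint64_t head, uint64_t tail, uint64_t nb_desc)
{
	/* Requests enqueued (producer index head) but not yet dequeued (tail). */
	return (nb_desc + head - tail) % nb_desc;
}

static inline void
queue_index_advance(uint64_t *index, uint64_t nb_desc)
{
	/* Move the index forward by one descriptor, wrapping at nb_desc. */
	*index = (*index + 1) % nb_desc;
}

With this layout the dequeue loop never reads past head, and writing
queue->tail only once on exit keeps per-descriptor stores to the shared
index off the fast path.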