We need the synchronous way for multi-process communication,
i.e., blockingly waiting for reply message when we send a request
to the peer process.

We add two APIs rte_eal_mp_request() and rte_eal_mp_reply() for
such use case. By invoking rte_eal_mp_request(), a request message
is sent out, and then it waits there for a reply message. The
timeout is hard-coded 5 Sec. And the replied message will be copied
in the parameters of this API so that the caller can decide how
to translate those information (including params and fds). Note
if a primary process owns multiple secondary processes, this API
will fail.

The API rte_eal_mp_reply() is always called by an mp action handler.
Here we add another parameter for rte_eal_mp_t so that the action
handler knows which peer address to reply.

We use mutex in rte_eal_mp_request() to guarantee that only one
request is on the fly for one pair of processes.

Suggested-by: Anatoly Burakov <anatoly.bura...@intel.com>
Signed-off-by: Jianfeng Tan <jianfeng....@intel.com>
---
 lib/librte_eal/common/eal_common_proc.c | 144 +++++++++++++++++++++++++++++---
 lib/librte_eal/common/include/rte_eal.h |  73 +++++++++++++++-
 lib/librte_eal/rte_eal_version.map      |   2 +
 3 files changed, 206 insertions(+), 13 deletions(-)

diff --git a/lib/librte_eal/common/eal_common_proc.c 
b/lib/librte_eal/common/eal_common_proc.c
index 70519cc..f194a52 100644
--- a/lib/librte_eal/common/eal_common_proc.c
+++ b/lib/librte_eal/common/eal_common_proc.c
@@ -32,6 +32,7 @@
 static int mp_fd = -1;
 static char *mp_sec_sockets[MAX_SECONDARY_PROCS];
 static pthread_mutex_t mp_mutex_action = PTHREAD_MUTEX_INITIALIZER;
+static pthread_mutex_t mp_mutex_request = PTHREAD_MUTEX_INITIALIZER;
 
 struct action_entry {
        TAILQ_ENTRY(action_entry) next;      /**< Next attached action entry */
@@ -49,6 +50,10 @@ static struct action_entry_list action_entry_list =
 
 struct mp_msghdr {
        char action_name[MAX_ACTION_NAME_LEN];
+#define MP_MSG 0 /* Share message with peers, will not block */
+#define MP_REQ 1 /* Request for information, Will block for a reply */
+#define MP_REP 2 /* Reply to previously-received request */
+       int type;
        int fds_num;
        int len_params;
        char params[0];
@@ -138,7 +143,8 @@ rte_eal_mp_action_unregister(const char *name)
 }
 
 static int
-read_msg(int fd, char *buf, int buflen, int *fds, int fds_num)
+read_msg(int fd, char *buf, int buflen,
+        int *fds, int fds_num, struct sockaddr_un *s)
 {
        int ret;
        struct iovec iov;
@@ -151,6 +157,8 @@ read_msg(int fd, char *buf, int buflen, int *fds, int 
fds_num)
        iov.iov_base = buf;
        iov.iov_len  = buflen;
 
+       msgh.msg_name = s;
+       msgh.msg_namelen = sizeof(*s);
        msgh.msg_iov = &iov;
        msgh.msg_iovlen = 1;
        msgh.msg_control = control;
@@ -181,7 +189,7 @@ read_msg(int fd, char *buf, int buflen, int *fds, int 
fds_num)
 }
 
 static int
-process_msg(struct mp_msghdr *hdr, int len, int fds[])
+process_msg(struct mp_msghdr *hdr, int len, int fds[], struct sockaddr_un *s)
 {
        int ret;
        int params_len;
@@ -199,10 +207,10 @@ process_msg(struct mp_msghdr *hdr, int len, int fds[])
        }
 
        params_len = len - sizeof(struct mp_msghdr);
-       ret = entry->action(hdr->params, params_len, fds, hdr->fds_num);
+       ret = entry->action(hdr->params, params_len,
+                           fds, hdr->fds_num, s->sun_path);
        pthread_mutex_unlock(&mp_mutex_action);
        return ret;
-
 }
 
 static void *
@@ -211,11 +219,12 @@ mp_handle(void *arg __rte_unused)
        int len;
        int fds[SCM_MAX_FD];
        char buf[MAX_MSG_LENGTH];
+       struct sockaddr_un sa;
 
        while (1) {
-               len = read_msg(mp_fd, buf, MAX_MSG_LENGTH, fds, SCM_MAX_FD);
+               len = read_msg(mp_fd, buf, MAX_MSG_LENGTH, fds, SCM_MAX_FD, 
&sa);
                if (len > 0)
-                       process_msg((struct mp_msghdr *)buf, len, fds);
+                       process_msg((struct mp_msghdr *)buf, len, fds, &sa);
        }
 
        return NULL;
@@ -255,7 +264,8 @@ static int
 mp_primary_proc(const void *params,
                int len __rte_unused,
                int fds[] __rte_unused,
-               int fds_num __rte_unused)
+               int fds_num __rte_unused,
+               const void *peer __rte_unused)
 {
        const struct proc_request *r = (const struct proc_request *)params;
 
@@ -362,7 +372,8 @@ rte_eal_mp_channel_init(void)
 }
 
 static inline struct mp_msghdr *
-format_msg(const char *act_name, const void *p, int len_params, int fds_num)
+format_msg(const char *act_name, const void *p,
+          int len_params, int fds_num, int type)
 {
        int len_msg;
        struct mp_msghdr *msg;
@@ -384,6 +395,7 @@ format_msg(const char *act_name, const void *p, int 
len_params, int fds_num)
        strcpy(msg->action_name, act_name);
        msg->fds_num = fds_num;
        msg->len_params = len_params;
+       msg->type = type;
        memcpy(msg->params, p, len_params);
        return msg;
 }
@@ -455,7 +467,9 @@ mp_send(const char *action_name,
        const void *params,
        int len_params,
        int fds[],
-       int fds_num)
+       int fds_num,
+       int type,
+       const void *peer)
 {
        int i;
        int n = 0;
@@ -468,7 +482,7 @@ mp_send(const char *action_name,
                return 0;
        }
 
-       msg = format_msg(action_name, params, len_params, fds_num);
+       msg = format_msg(action_name, params, len_params, fds_num, type);
        if (msg == NULL)
                return 0;
 
@@ -477,6 +491,11 @@ mp_send(const char *action_name,
                return 0;
        }
 
+       if (peer) {
+               n += send_msg(sockfd, peer, msg, fds);
+               goto ret;
+       }
+
        if (rte_eal_process_type() == RTE_PROC_PRIMARY) {
                /* broadcast to all secondaries */
                for (i = 0; i < MAX_SECONDARY_PROCS; ++i) {
@@ -488,6 +507,7 @@ mp_send(const char *action_name,
        } else
                n += send_msg(sockfd, eal_mp_unix_path(), msg, fds);
 
+ret:
        free(msg);
        close(sockfd);
        return n;
@@ -501,5 +521,107 @@ rte_eal_mp_sendmsg(const char *action_name,
                   int fds_num)
 {
        RTE_LOG(DEBUG, EAL, "sendmsg: %s\n", action_name);
-       return mp_send(action_name, params, len_params, fds, fds_num);
+       return mp_send(action_name, params, len_params,
+                       fds, fds_num, MP_MSG, NULL);
+}
+
+int
+rte_eal_mp_request(const char *action_name,
+                  void *params,
+                  int len_p,
+                  int fds[],
+                  int fds_in,
+                  int fds_out)
+{
+       int i, j;
+       int sockfd;
+       int nprocs;
+       int ret = 0;
+       struct mp_msghdr *req;
+       struct timeval tv;
+       char buf[MAX_MSG_LENGTH];
+       struct mp_msghdr *hdr;
+
+       RTE_LOG(DEBUG, EAL, "request: %s\n", action_name);
+
+       if (fds_in > SCM_MAX_FD || fds_out > SCM_MAX_FD) {
+               RTE_LOG(ERR, EAL, "Cannot send more than %d FDs\n", SCM_MAX_FD);
+               rte_errno = -E2BIG;
+               return 0;
+       }
+
+       req = format_msg(action_name, params, len_p, fds_in, MP_REQ);
+       if (req == NULL)
+               return 0;
+
+       if ((sockfd = open_unix_fd(0)) < 0) {
+               free(req);
+               return 0;
+       }
+
+       tv.tv_sec = 5;  /* 5 Secs Timeout */
+       tv.tv_usec = 0;
+       if (setsockopt(sockfd, SOL_SOCKET, SO_RCVTIMEO,
+                       (const void *)&tv, sizeof(struct timeval)) < 0)
+               RTE_LOG(INFO, EAL, "Failed to set recv timeout\n");
+
+       /* Only allow one req at a time */
+       pthread_mutex_lock(&mp_mutex_request);
+
+       if (rte_eal_process_type() == RTE_PROC_PRIMARY) {
+               nprocs = 0;
+               for (i = 0; i < MAX_SECONDARY_PROCS; ++i)
+                       if (!mp_sec_sockets[i]) {
+                               j = i;
+                               nprocs++;
+                       }
+
+               if (nprocs > 1) {
+                       RTE_LOG(ERR, EAL,
+                               "multi secondary processes not supported\n");
+                       goto free_and_ret;
+               }
+
+               ret = send_msg(sockfd, mp_sec_sockets[j], req, fds);
+       } else
+               ret = send_msg(sockfd, eal_mp_unix_path(), req, fds);
+
+       if (ret == 0) {
+               RTE_LOG(ERR, EAL, "failed to send request: %s\n", action_name);
+               ret = -1;
+               goto free_and_ret;
+       }
+
+       ret = read_msg(sockfd, buf, MAX_MSG_LENGTH, fds, fds_out, NULL);
+       if (ret > 0) {
+               hdr = (struct mp_msghdr *)buf;
+               if (hdr->len_params == len_p)
+                       memcpy(params, hdr->params, len_p);
+               else {
+                       RTE_LOG(ERR, EAL, "invalid reply\n");
+                       ret = 0;
+               }
+       }
+
+free_and_ret:
+       free(req);
+       close(sockfd);
+       pthread_mutex_unlock(&mp_mutex_request);
+       return ret;
+}
+
+int
+rte_eal_mp_reply(const char *action_name,
+                const void *params,
+                int len_p,
+                int fds[],
+                int fds_in,
+                const void *peer)
+{
+       RTE_LOG(DEBUG, EAL, "reply: %s\n", action_name);
+       if (peer == NULL) {
+               RTE_LOG(ERR, EAL, "peer is not specified\n");
+               return 0;
+       }
+       return mp_send(action_name, params, len_p, fds, fds_in, MP_REP, peer);
 }
diff --git a/lib/librte_eal/common/include/rte_eal.h 
b/lib/librte_eal/common/include/rte_eal.h
index 9884c0b..2690a77 100644
--- a/lib/librte_eal/common/include/rte_eal.h
+++ b/lib/librte_eal/common/include/rte_eal.h
@@ -192,7 +192,7 @@ int rte_eal_primary_proc_alive(const char 
*config_file_path);
  * this function typedef to register action for coming messages.
  */
 typedef int (*rte_eal_mp_t)(const void *params, int len,
-                           int fds[], int fds_num);
+                           int fds[], int fds_num, const void *peer);
 
 /**
  * Register an action function for primary/secondary communication.
@@ -245,7 +245,7 @@ void rte_eal_mp_action_unregister(const char *name);
  *   The fds argument is an array of fds sent with sendmsg.
  *
  * @param fds_num
- *   The fds_num argument is number of fds to be sent with sendmsg.
+ *   The number of fds to be sent with sendmsg.
  *
  * @return
  *  - Returns the number of messages being sent successfully.
@@ -255,6 +255,75 @@ rte_eal_mp_sendmsg(const char *action_name, const void 
*params,
                   int len_params, int fds[], int fds_num);
 
 /**
+ * Send a request to the peer process and expect a reply.
+ *
+ * This function sends a request message to the peer process, and will
+ * block until receiving reply message from the peer process. Note:
+ * this does not work for the primary process sending requests to its
+ * multiple (>1) secondary processes.
+ *
+ * @param action_name
+ *   The action_name argument is used to identify which action will be used.
+ *
+ * @param params
+ *   The params argument contains the customized message; as the reply is
+ *   received, the replied params will be copied to this pointer. 
+ *
+ * @param len_p
+ *   The length of the customized message.
+ *
+ * @param fds
+ *   The fds argument is an array of fds sent with sendmsg; as the reply
+ *   is received, the replied fds will be copied into this array.
+ *
+ * @param fds_in
+ *   The number of fds to be sent.
+ *
+ * @param fds_out
+ *   The number of fds to be received.
+ *
+ * @return
+ *  - (1) on success;
+ *  - (0) on sending request successfully but no valid reply received.
+ *  - (<0) on failing to sending request.
+ */
+int
+rte_eal_mp_request(const char *action_name, void *params,
+                  int len_p, int fds[], int fds_in, int fds_out);
+
+/**
+ * Send a reply to the peer process.
+ *
+ * This function will send a reply message in response to a request message
+ * received previously.
+ *
+ * @param action_name
+ *   The action_name argument is used to identify which action will be used.
+ *
+ * @param params
+ *   The params argument contains the customized message.
+ *
+ * @param len_p
+ *   The length of the customized message.
+ *
+ * @param fds
+ *   The fds argument is an array of fds sent with sendmsg.
+ *
+ * @param fds_in
+ *   The number of fds to be sent with sendmsg.
+ *
+ * @param peer
+ *   The fds_num argument is number of fds to be sent with sendmsg.
+ *
+ * @return
+ *  - (1) on success;
+ *  - (0) on failure.
+ */
+int
+rte_eal_mp_reply(const char *action_name, const void *params,
+                int len_p, int fds[], int fds_in, const void *peer);
+
+/**
  * Usage function typedef used by the application usage function.
  *
  * Use this function typedef to define and call 
rte_set_application_usage_hook()
diff --git a/lib/librte_eal/rte_eal_version.map 
b/lib/librte_eal/rte_eal_version.map
index 5dacde5..068ac0b 100644
--- a/lib/librte_eal/rte_eal_version.map
+++ b/lib/librte_eal/rte_eal_version.map
@@ -243,5 +243,7 @@ DPDK_18.02 {
        rte_eal_mp_action_register;
        rte_eal_mp_action_unregister;
        rte_eal_mp_sendmsg;
+       rte_eal_mp_request;
+       rte_eal_mp_reply;
 
 } DPDK_17.11;
-- 
2.7.4

Reply via email to