Re: [dpdk-dev] [PATCH v4 3/5] vhost: add apis for datapath configuration

2018-03-31 Thread Maxime Coquelin



On 03/10/2018 11:01 AM, Zhihong Wang wrote:

This patch adds APIs for datapath configuration.

The did of the vhost-user socket can be set to identify the backend device,
in this case each vhost-user socket can have only 1 connection. The did is
set to -1 by default when the software datapath is used.

Signed-off-by: Zhihong Wang 
---
Changes in v4:

  1. Remove the "engine" concept in the lib.

  lib/librte_vhost/rte_vhost.h   | 35 +
  lib/librte_vhost/rte_vhost_version.map |  3 +++
  lib/librte_vhost/socket.c  | 36 ++
  lib/librte_vhost/vhost.c   | 25 +++
  lib/librte_vhost/vhost.h   |  9 +
  5 files changed, 108 insertions(+)

diff --git a/lib/librte_vhost/rte_vhost.h b/lib/librte_vhost/rte_vhost.h
index 671ea5053..d50f4c67d 100644
--- a/lib/librte_vhost/rte_vhost.h
+++ b/lib/librte_vhost/rte_vhost.h
@@ -200,6 +200,30 @@ int rte_vhost_driver_register(const char *path, uint64_t 
flags);
  int rte_vhost_driver_unregister(const char *path);
  
  /**

+ * Set the device id, enforce single connection per socket
+ *
+ * @param path
+ *  The vhost-user socket file path
+ * @param did
+ *  Device id
+ * @return
+ *  0 on success, -1 on failure
+ */
+int __rte_experimental
+rte_vhost_driver_set_vdpa_did(const char *path, int did);


IIUC, we call this to attach a VDPA device to a Vhost-user port?

What about having this named explicitly? Something like:

rte_vhost_driver_attach_vdpa_did(const char *path, int did)
rte_vhost_driver_detach_vdpa_did(const char *path)

The later would set to did -1

This is not mandatory though


+
+/**
+ * Get the device id
+ *
+ * @param path
+ *  The vhost-user socket file path
+ * @return
+ *  Device id, -1 on failure
+ */
+int __rte_experimental
+rte_vhost_driver_get_vdpa_did(const char *path);
+
+/**
   * Set the feature bits the vhost-user driver supports.
   *
   * @param path
@@ -464,6 +488,17 @@ int rte_vhost_vring_call(int vid, uint16_t vring_idx);
   */
  uint32_t rte_vhost_rx_queue_count(int vid, uint16_t qid);
  
+/**

+ * Get vdpa device id for vhost device.
+ *
+ * @param vid
+ *  vhost device ID
+ * @return
+ *  device id
+ */
+int __rte_experimental
+rte_vhost_get_vdpa_did(int vid);
+
  #ifdef __cplusplus
  }
  #endif
diff --git a/lib/librte_vhost/rte_vhost_version.map 
b/lib/librte_vhost/rte_vhost_version.map
index 7bcffb490..6e2d5364a 100644
--- a/lib/librte_vhost/rte_vhost_version.map
+++ b/lib/librte_vhost/rte_vhost_version.map
@@ -64,4 +64,7 @@ EXPERIMENTAL {
rte_vdpa_register_device;
rte_vdpa_unregister_device;
rte_vdpa_find_device_id;
+   rte_vhost_driver_set_vdpa_did;
+   rte_vhost_driver_get_vdpa_did;
+   rte_vhost_get_vdpa_did;
  } DPDK_18.02;
diff --git a/lib/librte_vhost/socket.c b/lib/librte_vhost/socket.c
index cfc31e179..3d58da94e 100644
--- a/lib/librte_vhost/socket.c
+++ b/lib/librte_vhost/socket.c
@@ -52,6 +52,13 @@ struct vhost_user_socket {
uint64_t supported_features;
uint64_t features;
  
+	/*

+* Device id to identify a specific backend device.
+* It's set to -1 for the default software implementation.
+* If valid, one socket can have 1 connection only.
+*/
+   int did;

I would rename it to something like vdpa_did or even better,
vdpa_dev_id. At least prefix it with vdpa not to confuse the user.


+
struct vhost_device_ops const *notify_ops;
  };
  
@@ -545,6 +552,35 @@ find_vhost_user_socket(const char *path)

  }
  
  int

+rte_vhost_driver_set_vdpa_did(const char *path, int did)
+{
+   struct vhost_user_socket *vsocket;
+
+   pthread_mutex_lock(&vhost_user.mutex);
+   vsocket = find_vhost_user_socket(path);
+   if (vsocket)
+   vsocket->did = did;


I guess it is possible to know whether the did exists
at that time. Maybe we could check this?


+   pthread_mutex_unlock(&vhost_user.mutex);
+
+   return vsocket ? 0 : -1;
+}
+
+int
+rte_vhost_driver_get_vdpa_did(const char *path)
+{
+   struct vhost_user_socket *vsocket;
+   int did = -1;
+
+   pthread_mutex_lock(&vhost_user.mutex);
+   vsocket = find_vhost_user_socket(path);
+   if (vsocket)
+   did = vsocket->did;
+   pthread_mutex_unlock(&vhost_user.mutex);
+
+   return did;
+}
+
+int
  rte_vhost_driver_disable_features(const char *path, uint64_t features)
  {
struct vhost_user_socket *vsocket;
diff --git a/lib/librte_vhost/vhost.c b/lib/librte_vhost/vhost.c
index f6f12a03b..1740cc1ab 100644
--- a/lib/librte_vhost/vhost.c
+++ b/lib/librte_vhost/vhost.c
@@ -283,6 +283,7 @@ vhost_new_device(void)
dev->vid = i;
dev->flags = VIRTIO_DEV_BUILTIN_VIRTIO_NET;
dev->slave_req_fd = -1;
+   dev->did = -1;
  
  	return i;

  }
@@ -311,6 +312,20 @@ vhost_destroy_device(int vid)
  }
  
  void

+vhost_set_vdpa_did(int vid, int did)
+{
+   struct virtio_net *dev

Re: [dpdk-dev] [PATCH v4 4/5] vhost: adapt vhost lib for selective datapath

2018-03-31 Thread Maxime Coquelin



On 03/10/2018 11:01 AM, Zhihong Wang wrote:

This patch adapts vhost lib for selective datapath by calling device ops
at the corresponding stage.

Signed-off-by: Zhihong Wang 
---
Changes in v4:

  1. Remove the "engine" concept in the lib.

---
Changes in v2:

  1. Ensure negotiated capabilities are supported in vhost-user lib.

  2. Configure the data path at the right time.

  lib/librte_vhost/rte_vhost.h   | 27 ++
  lib/librte_vhost/rte_vhost_version.map |  2 +
  lib/librte_vhost/socket.c  | 94 --
  lib/librte_vhost/vhost.c   |  3 ++
  lib/librte_vhost/vhost.h   |  2 +
  lib/librte_vhost/vhost_user.c  | 54 +--
  6 files changed, 172 insertions(+), 10 deletions(-)

diff --git a/lib/librte_vhost/rte_vhost.h b/lib/librte_vhost/rte_vhost.h
index d50f4c67d..3c3334d3e 100644
--- a/lib/librte_vhost/rte_vhost.h
+++ b/lib/librte_vhost/rte_vhost.h
@@ -279,6 +279,33 @@ int rte_vhost_driver_disable_features(const char *path, 
uint64_t features);
  int rte_vhost_driver_get_features(const char *path, uint64_t *features);
  
  /**

+ * Get the protocol feature bits before feature negotiation.
+ *
+ * @param path
+ *  The vhost-user socket file path
+ * @param protocol_features
+ *  A pointer to store the queried protocol feature bits
+ * @return
+ *  0 on success, -1 on failure
+ */
+int __rte_experimental
+rte_vhost_driver_get_protocol_features(const char *path,
+   uint64_t *protocol_features);
+
+/**
+ * Get the queue number bits before feature negotiation.
+ *
+ * @param path
+ *  The vhost-user socket file path
+ * @param queue_num
+ *  A pointer to store the queried queue number bits
+ * @return
+ *  0 on success, -1 on failure
+ */
+int __rte_experimental
+rte_vhost_driver_get_queue_num(const char *path, uint32_t *queue_num);
+
+/**
   * Get the feature bits after negotiation
   *
   * @param vid
diff --git a/lib/librte_vhost/rte_vhost_version.map 
b/lib/librte_vhost/rte_vhost_version.map
index 6e2d5364a..812ccd72b 100644
--- a/lib/librte_vhost/rte_vhost_version.map
+++ b/lib/librte_vhost/rte_vhost_version.map
@@ -67,4 +67,6 @@ EXPERIMENTAL {
rte_vhost_driver_set_vdpa_did;
rte_vhost_driver_get_vdpa_did;
rte_vhost_get_vdpa_did;
+   rte_vhost_driver_get_protocol_features;
+   rte_vhost_driver_get_queue_num;
  } DPDK_18.02;
diff --git a/lib/librte_vhost/socket.c b/lib/librte_vhost/socket.c
index 3d58da94e..ba7b422a0 100644
--- a/lib/librte_vhost/socket.c
+++ b/lib/librte_vhost/socket.c
@@ -216,6 +216,8 @@ vhost_user_add_connection(int fd, struct vhost_user_socket 
*vsocket)
  
  	vhost_set_builtin_virtio_net(vid, vsocket->use_builtin_virtio_net);
  
+	vhost_set_vdpa_did(vid, vsocket->did);

+
if (vsocket->dequeue_zero_copy)
vhost_enable_dequeue_zero_copy(vid);
  
@@ -648,20 +650,102 @@ int

  rte_vhost_driver_get_features(const char *path, uint64_t *features)
  {
struct vhost_user_socket *vsocket;
+   uint64_t vdpa_features;
+   int did = -1;
+   int ret = 0;
  
  	pthread_mutex_lock(&vhost_user.mutex);

vsocket = find_vhost_user_socket(path);
-   if (vsocket)
-   *features = vsocket->features;
+   if (vsocket) {
+   did = vsocket->did;
+   if (did < 0 || vdpa_devices[did]->ops->feature_get == NULL)
+   *features = vsocket->features;
+   else if (vdpa_devices[did]->ops->feature_get(did,
+   &vdpa_features) < 0) {
+   RTE_LOG(ERR, VHOST_CONFIG,
+   "failed to get vdpa features "
+   "for socket file %s.\n", path);
+   ret = -1;
+   } else
+   *features = vsocket->features & vdpa_features;


It seems correct but it is not very intuitive.
Also, you have to put braces everywhere if one of the if/else if/else
have some.

What about something like this:

rte_vhost_driver_get_features(const char *path, uint64_t *features)
{
struct vhost_user_socket *vsocket;
uint64_t vdpa_features;
int did = -1;
int ret = 0;
struct rte_vdpa_device *vdpa_dev;

pthread_mutex_lock(&vhost_user.mutex);
vsocket = find_vhost_user_socket(path);
if (!vsocket) {
RTE_LOG(ERR, VHOST_CONFIG,
"socket file %s is not registered yet.\n"
, path);
ret = -1;
goto out_unlock;
}

did = vsocket->did;
vdpa_dev = rte_vdpa_device_get(did);
if (!vdpa_dev || !vdpa->ops->feature_get) {
*features = vsocket->features;
goto out_unlock;
}

if (vdpa_dev->ops->feature_get(did, &vdpa_features) < 0) {
RTE_LOG(ERR, VHOST_CONFIG,
"failed 

Re: [dpdk-dev] [PATCH v4 2/5] vhost: support selective datapath

2018-03-31 Thread Maxime Coquelin



On 03/10/2018 11:01 AM, Zhihong Wang wrote:

+   uint64_t *size);
+/* Device ops */
+struct rte_vdpa_dev_ops {
+   vdpa_dev_queue_num_get_t  queue_num_get;
+   vdpa_dev_feature_get_tfeature_get;
+   vdpa_dev_feature_get_tprotocol_feature_get;


I would prefer them to be named as in Vhost-user spec:

get_queue_num
get_features
get_protocol_features

Thanks,
Maxime


Re: [dpdk-dev] [PATCH v4 5/5] vhost: add apis for live migration

2018-03-31 Thread Maxime Coquelin



On 03/10/2018 11:01 AM, Zhihong Wang wrote:

This patch adds APIs to enable live migration for non-builtin data paths.

At src side, last_avail/used_idx from the device need to be set into the
virtio_net structure, and the log_base and log_size from the virtio_net
structure need to be set into the device.

At dst side, last_avail/used_idx need to be read from the virtio_net
structure and set into the device.

Signed-off-by: Zhihong Wang 
---
  lib/librte_vhost/rte_vhost.h   | 51 +++
  lib/librte_vhost/rte_vhost_version.map |  3 ++
  lib/librte_vhost/vhost.c   | 63 ++
  3 files changed, 117 insertions(+)



Reviewed-by: Maxime Coquelin 

Thanks,
Maxime


[dpdk-dev] [PATCH v4 3/7] crypto/virtio: core code of virtio crypto PMD

2018-03-31 Thread Jay Zhou
The virtio crypto device has two types of queues, data
queue and control queue. It has one data queue at least and has one and
only one control queue. For example, if a virtio crypto device has
N queues, then [0, N-2] is the data queue index, N-1 is the control
queue index.
The virtio crypto PMD provides poll mode driver support for the
virtio crypto device.
The cryptodev is created at the virtio crypto pci device probing stage.
For now, it only supports the session-oriented API implementation, the
supported symmetrical algorithms are AES-CBC ciphering and AES-CBC with
HMAC-SHA1 algorithm-chaining. The function
virtio_crypto_sym_configure_session() is used to create a session, then
virtio_crypto_pkt_tx_burst() can be used to burst transfer packets and
virtio_crypto_pkt_rx_burst() can be used to burst receive packets.

Signed-off-by: Jay Zhou 
Reviewed-by: Fan Zhang 
Acked-by: Fan Zhang 
---
 drivers/crypto/virtio/virtio_crypto_capabilities.h |   51 +
 drivers/crypto/virtio/virtio_cryptodev.c   | 1508 
 drivers/crypto/virtio/virtio_cryptodev.h   |   66 +
 drivers/crypto/virtio/virtio_rxtx.c|  541 +++
 4 files changed, 2166 insertions(+)
 create mode 100644 drivers/crypto/virtio/virtio_crypto_capabilities.h
 create mode 100644 drivers/crypto/virtio/virtio_cryptodev.c
 create mode 100644 drivers/crypto/virtio/virtio_cryptodev.h
 create mode 100644 drivers/crypto/virtio/virtio_rxtx.c

diff --git a/drivers/crypto/virtio/virtio_crypto_capabilities.h 
b/drivers/crypto/virtio/virtio_crypto_capabilities.h
new file mode 100644
index 000..03c30de
--- /dev/null
+++ b/drivers/crypto/virtio/virtio_crypto_capabilities.h
@@ -0,0 +1,51 @@
+/* SPDX-License-Identifier: BSD-3-Clause
+ * Copyright(c) 2018 HUAWEI TECHNOLOGIES CO., LTD.
+ */
+
+#ifndef _VIRTIO_CRYPTO_CAPABILITIES_H_
+#define _VIRTIO_CRYPTO_CAPABILITIES_H_
+
+#define VIRTIO_SYM_CAPABILITIES\
+   {   /* SHA1 HMAC */ \
+   .op = RTE_CRYPTO_OP_TYPE_SYMMETRIC, \
+   {.sym = {   \
+   .xform_type = RTE_CRYPTO_SYM_XFORM_AUTH,\
+   {.auth = {  \
+   .algo = RTE_CRYPTO_AUTH_SHA1_HMAC,  \
+   .block_size = 64,   \
+   .key_size = {   \
+   .min = 1,   \
+   .max = 64,  \
+   .increment = 1  \
+   },  \
+   .digest_size = {\
+   .min = 1,   \
+   .max = 20,  \
+   .increment = 1  \
+   },  \
+   .iv_size = { 0 }\
+   }, }\
+   }, }\
+   },  \
+   {   /* AES CBC */   \
+   .op = RTE_CRYPTO_OP_TYPE_SYMMETRIC, \
+   {.sym = {   \
+   .xform_type = RTE_CRYPTO_SYM_XFORM_CIPHER,  \
+   {.cipher = {\
+   .algo = RTE_CRYPTO_CIPHER_AES_CBC,  \
+   .block_size = 16,   \
+   .key_size = {   \
+   .min = 16,  \
+   .max = 32,  \
+   .increment = 8  \
+   },  \
+   .iv_size = {\
+   .min = 16,  \
+   .max = 16,  \
+   .increment = 0  \
+   }   \
+   }, }\
+   }, }\
+   }
+
+#endif /* _VIRTIO_CRYPTO_CAPABILITIES_H_ */
diff --git a/dr

[dpdk-dev] [PATCH v4 5/7] doc: add virtio crypto PMD guide

2018-03-31 Thread Jay Zhou
Signed-off-by: Jay Zhou 
Reviewed-by: Fan Zhang 
Acked-by: Fan Zhang 
---
 doc/guides/cryptodevs/features/virtio.ini |  26 +++
 doc/guides/cryptodevs/index.rst   |   1 +
 doc/guides/cryptodevs/virtio.rst  | 117 ++
 3 files changed, 144 insertions(+)
 create mode 100644 doc/guides/cryptodevs/features/virtio.ini
 create mode 100644 doc/guides/cryptodevs/virtio.rst

diff --git a/doc/guides/cryptodevs/features/virtio.ini 
b/doc/guides/cryptodevs/features/virtio.ini
new file mode 100644
index 000..168fc17
--- /dev/null
+++ b/doc/guides/cryptodevs/features/virtio.ini
@@ -0,0 +1,26 @@
+; Supported features of the 'virtio' crypto driver.
+;
+; Refer to default.ini for the full list of available PMD features.
+;
+[Features]
+Symmetric crypto   = Y
+Sym operation chaining = Y
+
+;
+; Supported crypto algorithms of the 'virtio' crypto driver.
+;
+[Cipher]
+AES CBC (128)  = Y
+AES CBC (192)  = Y
+AES CBC (256)  = Y
+
+;
+; Supported authentication algorithms of the 'virtio' crypto driver.
+;
+[Auth]
+SHA1 HMAC  = Y
+
+;
+; Supported AEAD algorithms of the 'virtio' crypto driver.
+;
+[AEAD]
diff --git a/doc/guides/cryptodevs/index.rst b/doc/guides/cryptodevs/index.rst
index 558c926..ef16ab3 100644
--- a/doc/guides/cryptodevs/index.rst
+++ b/doc/guides/cryptodevs/index.rst
@@ -22,4 +22,5 @@ Crypto Device Drivers
 scheduler
 snow3g
 qat
+virtio
 zuc
diff --git a/doc/guides/cryptodevs/virtio.rst b/doc/guides/cryptodevs/virtio.rst
new file mode 100644
index 000..f3aa7c6
--- /dev/null
+++ b/doc/guides/cryptodevs/virtio.rst
@@ -0,0 +1,117 @@
+..  SPDX-License-Identifier: BSD-3-Clause
+Copyright(c) 2018 HUAWEI TECHNOLOGIES CO., LTD.
+
+Virtio Crypto Poll Mode Driver
+==
+
+The virtio crypto PMD provides poll mode driver support for the virtio crypto
+device.
+
+Features
+
+
+The virtio crypto PMD has support for:
+
+Cipher algorithms:
+
+* ``RTE_CRYPTO_CIPHER_AES_CBC``
+
+Hash algorithms:
+
+* ``RTE_CRYPTO_AUTH_SHA1_HMAC``
+
+Limitations
+---
+
+*  Only supports the session-oriented API implementation (session-less APIs are
+   not supported).
+*  Only supports modern mode since virtio crypto conforms to virtio-1.0.
+*  Only has two types of queues: data queue and control queue. These two queues
+   only support indirect buffers to communication with the virtio backend.
+*  Only supports AES_CBC cipher only algorithm and AES_CBC with HMAC_SHA1
+   chaining algorithm since the vhost crypto backend only these algorithms
+   are supported.
+*  Does not support Link State interrupt.
+*  Does not support runtime configuration.
+
+Virtio crypto PMD Rx/Tx Callbacks
+-
+
+Rx callbacks:
+
+* ``virtio_crypto_pkt_rx_burst``
+
+Tx callbacks:
+
+* ``virtio_crypto_pkt_tx_burst``
+
+Installation
+
+
+Quick instructions are as follows:
+
+Firstly run DPDK vhost crypto sample as a server side and build QEMU with
+vhost crypto enabled.
+QEMU can then be started using the following parameters:
+
+.. code-block:: console
+
+qemu-system-x86_64 \
+[...] \
+-chardev socket,id=charcrypto0,path=/path/to/your/socket \
+-object cryptodev-vhost-user,id=cryptodev0,chardev=charcrypto0 \
+-device virtio-crypto-pci,id=crypto0,cryptodev=cryptodev0
+[...]
+
+Secondly bind the uio_generic driver for the virtio-crypto device.
+For example, :00:04.0 is the domain, bus, device and function
+number of the virtio-crypto device:
+
+.. code-block:: console
+
+modprobe uio_pci_generic
+echo -n :00:04.0 > /sys/bus/pci/drivers/virtio-pci/unbind
+echo "1af4 1054" > /sys/bus/pci/drivers/uio_pci_generic/new_id
+
+Finally the front-end virtio crypto PMD driver can be installed:
+
+.. code-block:: console
+
+cd to the top-level DPDK directory
+sed -i 's,\(CONFIG_RTE_LIBRTE_PMD_VIRTIO_CRYPTO\)=n,\1=y,' 
config/common_base
+make config T=x86_64-native-linuxapp-gcc
+make install T=x86_64-native-linuxapp-gcc
+
+Tests
+-
+
+The unit test cases can be tested as below:
+
+.. code-block:: console
+
+reserve enough huge pages
+cd to the top-level DPDK directory
+export RTE_TARGET=x86_64-native-linuxapp-gcc
+export RTE_SDK=`pwd`
+cd to test/test
+type the command "make" to compile
+run the tests with "./test"
+type the command "cryptodev_virtio_autotest" to test
+
+The performance can be tested as below:
+
+.. code-block:: console
+
+reserve enough huge pages
+cd to the top-level DPDK directory
+export RTE_TARGET=x86_64-native-linuxapp-gcc
+export RTE_SDK=`pwd`
+cd to app/test-crypto-perf
+type the command "make" to compile
+run the tests with the following command:
+
+./dpdk-test-crypto-perf -l 0,1 -- --devtype crypto_virtio \
+--ptest throughput --optype cipher-then-auth --cipher-algo aes-cbc \
+--cipher-op encrypt --cipher-key-sz 16 --auth-algo sha1-hmac \

[dpdk-dev] [PATCH v4 0/7] crypto: add virtio poll mode driver

2018-03-31 Thread Jay Zhou
This patch series introduce virtio crypto poll mode driver.

Since it is limited by the vhost crypto backend of the virtio-crypto,
this patch series only supports a limited subset of crypto services.
Only the following algorithms are tested:

Cipher algorithms:
  - RTE_CRYPTO_CIPHER_AES_CBC (128-bit, 192-bit and 256-bit keys)

Cipher then hash algorithms:
  - RTE_CRYPTO_CIPHER_AES_CBC with RTE_CRYPTO_AUTH_SHA1_HMAC

The qemu side has supported vhost crypto and the vhost user crypto server
side patches had been sent to DPDK community, pls see

[PATCH v2 00/10] lib/librte_vhost: introduce new vhost user crypto backend
support
https://dpdk.org/ml/archives/dev/2018-February/091594.html

Firstly run DPDK vhost crypto sample as a server side and build QEMU with
vhost crypto enabled. 
QEMU can then be started using the following parameters:

qemu-system-x86_64 \
[...] \
-chardev socket,id=charcrypto0,path=/path/to/your/socket \
-object cryptodev-vhost-user,id=cryptodev0,chardev=charcrypto0 \
-device virtio-crypto-pci,id=crypto0,cryptodev=cryptodev0
[...]

Bind the uio_generic driver for the virtio-crypto device.
For example, :00:04.0 is the domain, bus, device and function
number of the virtio-crypto device:
modprobe uio_pci_generic
echo -n :00:04.0 > /sys/bus/pci/drivers/virtio-pci/unbind
echo "1af4 1054" > /sys/bus/pci/drivers/uio_pci_generic/new_id

The front-end virtio crypto PMD driver can be installed:
cd to the top-level DPDK directory
sed -i 's,\(CONFIG_RTE_LIBRTE_PMD_VIRTIO_CRYPTO\)=n,\1=y,' 
config/common_base
make config T=x86_64-native-linuxapp-gcc
make install T=x86_64-native-linuxapp-gcc

The unit test cases can be compiled as below:
cd to the top-level DPDK directory
export RTE_TARGET=x86_64-native-linuxapp-gcc
export RTE_SDK=`pwd`
cd to test/test
make
./test (MUST reserve enough huge pages memory)
type the command "cryptodev_virtio_autotest" to test

The result should be like this:
RTE>>cryptodev_virtio_autotest
 + --- +
 + Test Suite : Crypto VIRTIO Unit Test Suite
 + --- +
  0) TestCase AES-128-CBC Encryption PASS
  1) TestCase AES-128-CBC Decryption PASS
  2) TestCase AES-192-CBC Encryption PASS
  3) TestCase AES-192-CBC Decryption PASS
  4) TestCase AES-256-CBC Encryption PASS
  5) TestCase AES-256-CBC Decryption PASS
  6) TestCase AES-256-CBC OOP Encryption PASS
  7) TestCase AES-256-CBC OOP Decryption PASS
  8) TestCase AES-128-CTR Encryption PASS
  9) TestCase AES-128-CTR Decryption PASS
  10) TestCase AES-192-CTR Encryption PASS
  11) TestCase AES-192-CTR Decryption PASS
  12) TestCase AES-256-CTR Encryption PASS
  13) TestCase AES-256-CTR Decryption PASS
 + TestCase [ 0] : test_AES_cipheronly_virtio_all succeeded
 + --- +
 + Test Suite Summary
 + Tests Total :1
 + Tests Skipped :  0
 + Tests Executed : 1
 + Tests Unsupported:   0
 + Tests Passed :   1
 + Tests Failed :   0
 + --- +
Test OK

The performance can be tested as below:

reserve enough huge pages
cd to the top-level DPDK directory
export RTE_TARGET=x86_64-native-linuxapp-gcc
export RTE_SDK=`pwd`
cd to app/test-crypto-perf
type the command "make" to compile
run the tests with the following command:

./dpdk-test-crypto-perf -l 0,1 -- --devtype crypto_virtio \
--ptest throughput --optype cipher-then-auth --cipher-algo aes-cbc \
--cipher-op encrypt --cipher-key-sz 16 --auth-algo sha1-hmac \
--auth-op generate --auth-key-sz 64 --digest-sz 12 \
--total-ops 1 --burst-sz 64 --buffer-sz 2048

Please help to review, thanks!

Changes in v4:
 - using dynamic logging [Pablo]
 - elaborate on the core code [Pablo]
 - delete algorithms which can not be tested [Pablo]
 - rebased on dpdk-next-crypto [Pablo]
 - fix doc compilation error [Pablo]
 - add release note for this PMD [Pablo]
 - add R-b from Fan Zhang
 - fix some typos

Changes in v3:
 - set up capabilities for virtio crypto PMD [Fan]
 - delete AES-CTR unit test cases since vhost_user crypto backend does not
   support [Fan]
 - fix a variable uninitialized in virtio_crypto_queue_setup() [Xin, Fan]
 - fix a bug in virtqueue_dequeue_burst_rx()

Changes in v2:
 - using pre-allocated mempool instead of rte_malloc to improve performance 
[Fan]
 - split the patch into a patchset [Fan]
 - using linux/virtio_crypto.h instead of creating a copy of the file [Fan]
 - update doc/guides/cryptodevs for describing virtio crypto PMD [Fan]
 - update copyright
 - delete virtio legacy mode code since virtio-crypto conforms to virtio-1.0
 - refine the function and variable names
 - fix errors and warnings reported by checkpatch

Jay Zhou (7):
  crypto/virtio: add virtio related fundamental functions
  crypto/virtio:

[dpdk-dev] [PATCH v4 1/7] crypto/virtio: add virtio related fundamental functions

2018-03-31 Thread Jay Zhou
Since there does not have the common virtio library, we have to put
these files here. They are basically the same with virtio net related files
with some minor changes.

Meanwhile, adding virtio crypto PMD related release note for 18.05.

Signed-off-by: Jay Zhou 
Reviewed-by: Fan Zhang 
Acked-by: Fan Zhang 
---
 config/common_base |  14 +
 doc/guides/rel_notes/release_18_05.rst |   4 +
 drivers/crypto/virtio/virtio_logs.h|  91 +++
 drivers/crypto/virtio/virtio_pci.c | 460 +
 drivers/crypto/virtio/virtio_pci.h | 253 ++
 drivers/crypto/virtio/virtio_ring.h| 137 ++
 drivers/crypto/virtio/virtqueue.c  |  43 +++
 drivers/crypto/virtio/virtqueue.h  | 172 
 8 files changed, 1174 insertions(+)
 create mode 100644 drivers/crypto/virtio/virtio_logs.h
 create mode 100644 drivers/crypto/virtio/virtio_pci.c
 create mode 100644 drivers/crypto/virtio/virtio_pci.h
 create mode 100644 drivers/crypto/virtio/virtio_ring.h
 create mode 100644 drivers/crypto/virtio/virtqueue.c
 create mode 100644 drivers/crypto/virtio/virtqueue.h

diff --git a/config/common_base b/config/common_base
index ee10b44..91d3102 100644
--- a/config/common_base
+++ b/config/common_base
@@ -486,6 +486,20 @@ CONFIG_RTE_LIBRTE_PMD_QAT_DEBUG_DRIVER=n
 CONFIG_RTE_QAT_PMD_MAX_NB_SESSIONS=2048
 
 #
+# Compile PMD for virtio crypto devices
+#
+CONFIG_RTE_LIBRTE_PMD_VIRTIO_CRYPTO=n
+#
+# Number of maximum virtio crypto devices
+#
+CONFIG_RTE_MAX_VIRTIO_CRYPTO=32
+#
+# Number of sessions to create in the session memory pool
+# on a single virtio crypto device.
+#
+CONFIG_RTE_VIRTIO_CRYPTO_PMD_MAX_NB_SESSIONS=1024
+
+#
 # Compile PMD for AESNI backed device
 #
 CONFIG_RTE_LIBRTE_PMD_AESNI_MB=n
diff --git a/doc/guides/rel_notes/release_18_05.rst 
b/doc/guides/rel_notes/release_18_05.rst
index 3923dc2..32c39d5 100644
--- a/doc/guides/rel_notes/release_18_05.rst
+++ b/doc/guides/rel_notes/release_18_05.rst
@@ -41,6 +41,10 @@ New Features
  Also, make sure to start the actual text at the margin.
  =
 
+* **Added Virtio Crypto PMD.**
+
+  Added new Virtio Crypto PMD, which provides AES-CBC ciphering and AES-CBC
+  with HMAC-SHA1 algorithm-chaining.
 
 API Changes
 ---
diff --git a/drivers/crypto/virtio/virtio_logs.h 
b/drivers/crypto/virtio/virtio_logs.h
new file mode 100644
index 000..26a286c
--- /dev/null
+++ b/drivers/crypto/virtio/virtio_logs.h
@@ -0,0 +1,91 @@
+/* SPDX-License-Identifier: BSD-3-Clause
+ * Copyright(c) 2018 HUAWEI TECHNOLOGIES CO., LTD.
+ */
+
+#ifndef _VIRTIO_LOGS_H_
+#define _VIRTIO_LOGS_H_
+
+#include 
+
+#define PMD_INIT_LOG(level, fmt, args...) \
+   rte_log(RTE_LOG_ ## level, RTE_LOGTYPE_PMD, \
+   "PMD: %s(): " fmt "\n", __func__, ##args)
+
+#define PMD_INIT_FUNC_TRACE() PMD_INIT_LOG(DEBUG, " >>")
+
+extern int virtio_crypto_logtype_init;
+
+#define VIRTIO_CRYPTO_INIT_LOG_IMPL(level, fmt, args...) \
+   rte_log(RTE_LOG_ ## level, virtio_crypto_logtype_init, \
+   "INIT: %s(): " fmt "\n", __func__, ##args)
+
+#define VIRTIO_CRYPTO_INIT_LOG_INFO(fmt, args...) \
+   VIRTIO_CRYPTO_INIT_LOG_IMPL(INFO, fmt, ## args)
+
+#define VIRTIO_CRYPTO_INIT_LOG_DBG(fmt, args...) \
+   VIRTIO_CRYPTO_INIT_LOG_IMPL(DEBUG, fmt, ## args)
+
+#define VIRTIO_CRYPTO_INIT_LOG_ERR(fmt, args...) \
+   VIRTIO_CRYPTO_INIT_LOG_IMPL(ERR, fmt, ## args)
+
+extern int virtio_crypto_logtype_session;
+
+#define VIRTIO_CRYPTO_SESSION_LOG_IMPL(level, fmt, args...) \
+   rte_log(RTE_LOG_ ## level, virtio_crypto_logtype_session, \
+   "SESSION: %s(): " fmt "\n", __func__, ##args)
+
+#define VIRTIO_CRYPTO_SESSION_LOG_INFO(fmt, args...) \
+   VIRTIO_CRYPTO_SESSION_LOG_IMPL(INFO, fmt, ## args)
+
+#define VIRTIO_CRYPTO_SESSION_LOG_DBG(fmt, args...) \
+   VIRTIO_CRYPTO_SESSION_LOG_IMPL(DEBUG, fmt, ## args)
+
+#define VIRTIO_CRYPTO_SESSION_LOG_ERR(fmt, args...) \
+   VIRTIO_CRYPTO_SESSION_LOG_IMPL(ERR, fmt, ## args)
+
+extern int virtio_crypto_logtype_rx;
+
+#define VIRTIO_CRYPTO_RX_LOG_IMPL(level, fmt, args...) \
+   rte_log(RTE_LOG_ ## level, virtio_crypto_logtype_rx, \
+   "RX: %s(): " fmt "\n", __func__, ##args)
+
+#define VIRTIO_CRYPTO_RX_LOG_INFO(fmt, args...) \
+   VIRTIO_CRYPTO_RX_LOG_IMPL(INFO, fmt, ## args)
+
+#define VIRTIO_CRYPTO_RX_LOG_DBG(fmt, args...) \
+   VIRTIO_CRYPTO_RX_LOG_IMPL(DEBUG, fmt, ## args)
+
+#define VIRTIO_CRYPTO_RX_LOG_ERR(fmt, args...) \
+   VIRTIO_CRYPTO_RX_LOG_IMPL(ERR, fmt, ## args)
+
+extern int virtio_crypto_logtype_tx;
+
+#define VIRTIO_CRYPTO_TX_LOG_IMPL(level, fmt, args...) \
+   rte_log(RTE_LOG_ ## level, virtio_crypto_logtype_tx, \
+   "TX: %s(): " fmt "\n", __func__, ##args)
+
+#define VIRTIO_CRYPTO_TX_LOG_INFO(fmt, args...) \
+   VIRTIO_CRYPTO_TX_LOG_IMPL(INFO, fmt, ## args)
+
+#define VIRTIO_CRYPTO_TX_LOG_DBG(fmt, args...) \
+   VIRT

[dpdk-dev] [PATCH v4 2/7] crypto/virtio: add crypto related session structure

2018-03-31 Thread Jay Zhou
This structure will be used in the following patches, especially
at creating and destroying crypto sessions.

Signed-off-by: Jay Zhou 
Reviewed-by: Fan Zhang 
Acked-by: Fan Zhang 
---
 drivers/crypto/virtio/virtio_crypto_algs.h | 27 +++
 1 file changed, 27 insertions(+)
 create mode 100644 drivers/crypto/virtio/virtio_crypto_algs.h

diff --git a/drivers/crypto/virtio/virtio_crypto_algs.h 
b/drivers/crypto/virtio/virtio_crypto_algs.h
new file mode 100644
index 000..5f1e9df
--- /dev/null
+++ b/drivers/crypto/virtio/virtio_crypto_algs.h
@@ -0,0 +1,27 @@
+/* SPDX-License-Identifier: BSD-3-Clause
+ * Copyright(c) 2018 HUAWEI TECHNOLOGIES CO., LTD.
+ */
+
+#ifndef _VIRTIO_CRYPTO_ALGS_H_
+#define _VIRTIO_CRYPTO_ALGS_H_
+
+#include 
+#include 
+
+struct virtio_crypto_session {
+   uint64_t session_id;
+
+   struct {
+   uint16_t offset;
+   uint16_t length;
+   } iv;
+
+   struct {
+   uint32_t length;
+   phys_addr_t phys_addr;
+   } aad;
+
+   struct virtio_crypto_op_ctrl_req ctrl;
+};
+
+#endif /* _VIRTIO_CRYPTO_ALGS_H_ */
-- 
1.8.3.1




[dpdk-dev] [PATCH v4 6/7] test/crypto: add function tests for virtio crypto PMD

2018-03-31 Thread Jay Zhou
Only RTE_CRYPTO_CIPHER_AES_CBC cipher
algorithm are tested as unit test, it is supported both by the
cryptodev-backend-builtin and cryptodev-vhost-user of qemu side.

Signed-off-by: Jay Zhou 
Reviewed-by: Fan Zhang 
Acked-by: Fan Zhang 
---
 test/test/test_cryptodev.c  | 49 +
 test/test/test_cryptodev.h  |  1 +
 test/test/test_cryptodev_aes_test_vectors.h | 24 +-
 test/test/test_cryptodev_blockcipher.c  |  9 +-
 test/test/test_cryptodev_blockcipher.h  |  1 +
 5 files changed, 75 insertions(+), 9 deletions(-)

diff --git a/test/test/test_cryptodev.c b/test/test/test_cryptodev.c
index 1417482..357e1df 100644
--- a/test/test/test_cryptodev.c
+++ b/test/test/test_cryptodev.c
@@ -1765,6 +1765,26 @@ struct crypto_unittest_params {
 }
 
 static int
+test_AES_cipheronly_virtio_all(void)
+{
+   struct crypto_testsuite_params *ts_params = &testsuite_params;
+   int status;
+
+   status = test_blockcipher_all_tests(ts_params->mbuf_pool,
+   ts_params->op_mpool,
+   ts_params->session_mpool,
+   ts_params->valid_devs[0],
+   rte_cryptodev_driver_id_get(
+   RTE_STR(CRYPTODEV_NAME_VIRTIO_PMD)),
+   BLKCIPHER_AES_CIPHERONLY_TYPE);
+
+   TEST_ASSERT_EQUAL(status, 0, "Test failed");
+
+   return TEST_SUCCESS;
+}
+
+
+static int
 test_AES_chain_dpaa_sec_all(void)
 {
struct crypto_testsuite_params *ts_params = &testsuite_params;
@@ -8767,6 +8787,18 @@ struct test_crypto_vector {
}
 };
 
+static struct unit_test_suite cryptodev_virtio_testsuite  = {
+   .suite_name = "Crypto VIRTIO Unit Test Suite",
+   .setup = testsuite_setup,
+   .teardown = testsuite_teardown,
+   .unit_test_cases = {
+   TEST_CASE_ST(ut_setup, ut_teardown,
+   test_AES_cipheronly_virtio_all),
+
+   TEST_CASES_END() /**< NULL terminate unit test array */
+   }
+};
+
 static struct unit_test_suite cryptodev_aesni_mb_testsuite  = {
.suite_name = "Crypto Device AESNI MB Unit Test Suite",
.setup = testsuite_setup,
@@ -9664,6 +9696,22 @@ struct test_crypto_vector {
 }
 
 static int
+test_cryptodev_virtio(void /*argv __rte_unused, int argc __rte_unused*/)
+{
+   gbl_driver_id = rte_cryptodev_driver_id_get(
+   RTE_STR(CRYPTODEV_NAME_VIRTIO_PMD));
+
+   if (gbl_driver_id == -1) {
+   RTE_LOG(ERR, USER1, "VIRTIO PMD must be loaded. Check if "
+   "CONFIG_RTE_LIBRTE_PMD_VIRTIO_CRYPTO is enabled 
"
+   "in config file to run this testsuite.\n");
+   return TEST_FAILED;
+   }
+
+   return unit_test_suite_runner(&cryptodev_virtio_testsuite);
+}
+
+static int
 test_cryptodev_aesni_mb(void /*argv __rte_unused, int argc __rte_unused*/)
 {
gbl_driver_id = rte_cryptodev_driver_id_get(
@@ -9879,3 +9927,4 @@ struct test_crypto_vector {
 REGISTER_TEST_COMMAND(cryptodev_sw_mrvl_autotest, test_cryptodev_mrvl);
 REGISTER_TEST_COMMAND(cryptodev_dpaa2_sec_autotest, test_cryptodev_dpaa2_sec);
 REGISTER_TEST_COMMAND(cryptodev_dpaa_sec_autotest, test_cryptodev_dpaa_sec);
+REGISTER_TEST_COMMAND(cryptodev_virtio_autotest, test_cryptodev_virtio);
diff --git a/test/test/test_cryptodev.h b/test/test/test_cryptodev.h
index 8cdc087..c311277 100644
--- a/test/test/test_cryptodev.h
+++ b/test/test/test_cryptodev.h
@@ -61,6 +61,7 @@
 #define CRYPTODEV_NAME_DPAA2_SEC_PMD   crypto_dpaa2_sec
 #define CRYPTODEV_NAME_SCHEDULER_PMD   crypto_scheduler
 #define CRYPTODEV_NAME_MRVL_PMDcrypto_mrvl
+#define CRYPTODEV_NAME_VIRTIO_PMD   crypto_virtio
 
 /**
  * Write (spread) data from buffer to mbuf data
diff --git a/test/test/test_cryptodev_aes_test_vectors.h 
b/test/test/test_cryptodev_aes_test_vectors.h
index 3577ef4..cac7cda 100644
--- a/test/test/test_cryptodev_aes_test_vectors.h
+++ b/test/test/test_cryptodev_aes_test_vectors.h
@@ -1526,7 +1526,8 @@
BLOCKCIPHER_TEST_TARGET_PMD_SCHEDULER |
BLOCKCIPHER_TEST_TARGET_PMD_DPAA2_SEC |
BLOCKCIPHER_TEST_TARGET_PMD_DPAA_SEC |
-   BLOCKCIPHER_TEST_TARGET_PMD_MRVL
+   BLOCKCIPHER_TEST_TARGET_PMD_MRVL |
+   BLOCKCIPHER_TEST_TARGET_PMD_VIRTIO
},
{
.test_descr = "AES-128-CBC Decryption",
@@ -1538,7 +1539,8 @@
BLOCKCIPHER_TEST_TARGET_PMD_SCHEDULER |
BLOCKCIPHER_TEST_TARGET_PMD_DPAA2_SEC |
BLOCKCIPHER_TEST_TARGET_PMD_DPAA_SEC |
-   BLOCKCIPHER_TEST_TARGET_PMD_MRVL
+   BLOCKCIPHER_TEST_TARGET_PMD_MRVL |
+   BLOCKCIPHER_TEST_TARGET_PMD_VIRTIO
},
{
.test_descr = "AES-192-CBC Encryption",
@@ -1549,7 +1551,8 @@

[dpdk-dev] [PATCH v4 4/7] crypto/virtio: add makefile

2018-03-31 Thread Jay Zhou
The virtio crypto PMD driver can be compiled now.

Signed-off-by: Jay Zhou 
Reviewed-by: Fan Zhang 
Acked-by: Fan Zhang 
---
 drivers/crypto/Makefile|  1 +
 drivers/crypto/virtio/Makefile | 31 ++
 .../virtio/rte_pmd_virtio_crypto_version.map   |  3 +++
 mk/rte.app.mk  |  1 +
 4 files changed, 36 insertions(+)
 create mode 100644 drivers/crypto/virtio/Makefile
 create mode 100644 drivers/crypto/virtio/rte_pmd_virtio_crypto_version.map

diff --git a/drivers/crypto/Makefile b/drivers/crypto/Makefile
index 26e503e..e48bbdd 100644
--- a/drivers/crypto/Makefile
+++ b/drivers/crypto/Makefile
@@ -20,5 +20,6 @@ endif
 ifeq ($(CONFIG_RTE_LIBRTE_DPAA_BUS),y)
 DIRS-$(CONFIG_RTE_LIBRTE_PMD_DPAA_SEC) += dpaa_sec
 endif
+DIRS-$(CONFIG_RTE_LIBRTE_PMD_VIRTIO_CRYPTO) += virtio
 
 include $(RTE_SDK)/mk/rte.subdir.mk
diff --git a/drivers/crypto/virtio/Makefile b/drivers/crypto/virtio/Makefile
new file mode 100644
index 000..c4727ea
--- /dev/null
+++ b/drivers/crypto/virtio/Makefile
@@ -0,0 +1,31 @@
+# SPDX-License-Identifier: BSD-3-Clause
+# Copyright(c) 2018 HUAWEI TECHNOLOGIES CO., LTD.
+
+include $(RTE_SDK)/mk/rte.vars.mk
+
+#
+# library name
+#
+LIB = librte_pmd_virtio_crypto.a
+
+CFLAGS += -O3
+CFLAGS += $(WERROR_FLAGS)
+
+EXPORT_MAP := rte_pmd_virtio_crypto_version.map
+
+LIBABIVER := 1
+
+#
+# all source are stored in SRCS-y
+#
+SRCS-$(CONFIG_RTE_LIBRTE_PMD_VIRTIO_CRYPTO) += virtqueue.c
+SRCS-$(CONFIG_RTE_LIBRTE_PMD_VIRTIO_CRYPTO) += virtio_pci.c
+SRCS-$(CONFIG_RTE_LIBRTE_PMD_VIRTIO_CRYPTO) += virtio_rxtx.c
+SRCS-$(CONFIG_RTE_LIBRTE_PMD_VIRTIO_CRYPTO) += virtio_cryptodev.c
+
+# this lib depends upon:
+DEPDIRS-$(CONFIG_RTE_LIBRTE_PMD_VIRTIO_CRYPTO) += lib/librte_eal
+DEPDIRS-$(CONFIG_RTE_LIBRTE_PMD_VIRTIO_CRYPTO) += lib/librte_mempool 
lib/librte_mbuf
+DEPDIRS-$(CONFIG_RTE_LIBRTE_PMD_VIRTIO_CRYPTO) += lib/librte_cryptodev
+
+include $(RTE_SDK)/mk/rte.lib.mk
diff --git a/drivers/crypto/virtio/rte_pmd_virtio_crypto_version.map 
b/drivers/crypto/virtio/rte_pmd_virtio_crypto_version.map
new file mode 100644
index 000..de8e412
--- /dev/null
+++ b/drivers/crypto/virtio/rte_pmd_virtio_crypto_version.map
@@ -0,0 +1,3 @@
+DPDK_18.05 {
+   local: *;
+};
diff --git a/mk/rte.app.mk b/mk/rte.app.mk
index 94525dc..d7ddda4 100644
--- a/mk/rte.app.mk
+++ b/mk/rte.app.mk
@@ -204,6 +204,7 @@ _LDLIBS-$(CONFIG_RTE_LIBRTE_PMD_AESNI_GCM)   += 
-L$(AESNI_MULTI_BUFFER_LIB_PATH)
 _LDLIBS-$(CONFIG_RTE_LIBRTE_PMD_OPENSSL) += -lrte_pmd_openssl -lcrypto
 _LDLIBS-$(CONFIG_RTE_LIBRTE_PMD_NULL_CRYPTO) += -lrte_pmd_null_crypto
 _LDLIBS-$(CONFIG_RTE_LIBRTE_PMD_QAT) += -lrte_pmd_qat -lcrypto
+_LDLIBS-$(CONFIG_RTE_LIBRTE_PMD_VIRTIO_CRYPTO) += -lrte_pmd_virtio_crypto 
-lcrypto
 _LDLIBS-$(CONFIG_RTE_LIBRTE_PMD_SNOW3G)  += -lrte_pmd_snow3g
 _LDLIBS-$(CONFIG_RTE_LIBRTE_PMD_SNOW3G)  += -L$(LIBSSO_SNOW3G_PATH)/build 
-lsso_snow3g
 _LDLIBS-$(CONFIG_RTE_LIBRTE_PMD_KASUMI)  += -lrte_pmd_kasumi
-- 
1.8.3.1




[dpdk-dev] [PATCH v4 7/7] MAINTAINERS: add myself as virtio crypto PMD maintainer

2018-03-31 Thread Jay Zhou
Signed-off-by: Jay Zhou 
Reviewed-by: Fan Zhang 
Acked-by: Fan Zhang 
---
 MAINTAINERS | 6 ++
 1 file changed, 6 insertions(+)

diff --git a/MAINTAINERS b/MAINTAINERS
index 75d3e92..24c5af8 100644
--- a/MAINTAINERS
+++ b/MAINTAINERS
@@ -718,6 +718,12 @@ F: drivers/crypto/snow3g/
 F: doc/guides/cryptodevs/snow3g.rst
 F: doc/guides/cryptodevs/features/snow3g.ini
 
+Virtio
+M: Jay Zhou 
+F: drivers/crypto/virtio/
+F: doc/guides/cryptodevs/virtio.rst
+F: doc/guides/cryptodevs/features/virtio.ini
+
 ZUC
 M: Pablo de Lara 
 F: drivers/crypto/zuc/
-- 
1.8.3.1




Re: [dpdk-dev] [PATCH v4 0/7] crypto: add virtio poll mode driver

2018-03-31 Thread Zhoujian (jay)
I find that my dpdk-next-crypto repo is not the newest, I'll send a new version.
Sorry about that.

Regards,
Jay

> -Original Message-
> From: Zhoujian (jay)
> Sent: Saturday, March 31, 2018 3:49 PM
> To: dev@dpdk.org
> Cc: pablo.de.lara.gua...@intel.com; roy.fan.zh...@intel.com;
> tho...@monjalon.net; Gonglei (Arei) ;
> xin.z...@intel.com; Huangweidong (C) ; wangxin (U)
> ; longpeng ; Zhoujian (jay)
> 
> Subject: [PATCH v4 0/7] crypto: add virtio poll mode driver
> 
> This patch series introduce virtio crypto poll mode driver.
> 
> Since it is limited by the vhost crypto backend of the virtio-crypto, this
> patch series only supports a limited subset of crypto services.
> Only the following algorithms are tested:
> 
> Cipher algorithms:
>   - RTE_CRYPTO_CIPHER_AES_CBC (128-bit, 192-bit and 256-bit keys)
> 
> Cipher then hash algorithms:
>   - RTE_CRYPTO_CIPHER_AES_CBC with RTE_CRYPTO_AUTH_SHA1_HMAC
> 
> The qemu side has supported vhost crypto and the vhost user crypto server
> side patches had been sent to DPDK community, pls see
> 
> [PATCH v2 00/10] lib/librte_vhost: introduce new vhost user crypto backend
> support https://dpdk.org/ml/archives/dev/2018-February/091594.html
> 
> Firstly run DPDK vhost crypto sample as a server side and build QEMU with
> vhost crypto enabled.
> QEMU can then be started using the following parameters:
> 
> qemu-system-x86_64 \
> [...] \
> -chardev socket,id=charcrypto0,path=/path/to/your/socket \
> -object cryptodev-vhost-user,id=cryptodev0,chardev=charcrypto0 \
> -device virtio-crypto-pci,id=crypto0,cryptodev=cryptodev0
> [...]
> 
> Bind the uio_generic driver for the virtio-crypto device.
> For example, :00:04.0 is the domain, bus, device and function number of
> the virtio-crypto device:
> modprobe uio_pci_generic
> echo -n :00:04.0 > /sys/bus/pci/drivers/virtio-pci/unbind
> echo "1af4 1054" > /sys/bus/pci/drivers/uio_pci_generic/new_id
> 
> The front-end virtio crypto PMD driver can be installed:
> cd to the top-level DPDK directory
> sed -i 's,\(CONFIG_RTE_LIBRTE_PMD_VIRTIO_CRYPTO\)=n,\1=y,'
> config/common_base
> make config T=x86_64-native-linuxapp-gcc
> make install T=x86_64-native-linuxapp-gcc
> 
> The unit test cases can be compiled as below:
> cd to the top-level DPDK directory
> export RTE_TARGET=x86_64-native-linuxapp-gcc
> export RTE_SDK=`pwd`
> cd to test/test
> make
> ./test (MUST reserve enough huge pages memory)
> type the command "cryptodev_virtio_autotest" to test
> 
> The result should be like this:
> RTE>>cryptodev_virtio_autotest
>  + --- +  + Test Suite :
> Crypto VIRTIO Unit Test Suite  + 
> --- +
>   0) TestCase AES-128-CBC Encryption PASS
>   1) TestCase AES-128-CBC Decryption PASS
>   2) TestCase AES-192-CBC Encryption PASS
>   3) TestCase AES-192-CBC Decryption PASS
>   4) TestCase AES-256-CBC Encryption PASS
>   5) TestCase AES-256-CBC Decryption PASS
>   6) TestCase AES-256-CBC OOP Encryption PASS
>   7) TestCase AES-256-CBC OOP Decryption PASS
>   8) TestCase AES-128-CTR Encryption PASS
>   9) TestCase AES-128-CTR Decryption PASS
>   10) TestCase AES-192-CTR Encryption PASS
>   11) TestCase AES-192-CTR Decryption PASS
>   12) TestCase AES-256-CTR Encryption PASS
>   13) TestCase AES-256-CTR Decryption PASS  + TestCase [ 0] :
> test_AES_cipheronly_virtio_all succeeded  + -
> -- +  + Test Suite Summary
>  + Tests Total :1
>  + Tests Skipped :  0
>  + Tests Executed : 1
>  + Tests Unsupported:   0
>  + Tests Passed :   1
>  + Tests Failed :   0
>  + --- + Test OK
> 
> The performance can be tested as below:
> 
> reserve enough huge pages
> cd to the top-level DPDK directory
> export RTE_TARGET=x86_64-native-linuxapp-gcc
> export RTE_SDK=`pwd`
> cd to app/test-crypto-perf
> type the command "make" to compile
> run the tests with the following command:
> 
> ./dpdk-test-crypto-perf -l 0,1 -- --devtype crypto_virtio \
> --ptest throughput --optype cipher-then-auth --cipher-algo aes-cbc \
> --cipher-op encrypt --cipher-key-sz 16 --auth-algo sha1-hmac \
> --auth-op generate --auth-key-sz 64 --digest-sz 12 \
> --total-ops 1 --burst-sz 64 --buffer-sz 2048
> 
> Please help to review, thanks!
> 
> Changes in v4:
>  - using dynamic logging [Pablo]
>  - elaborate on the core code [Pablo]
>  - delete algorithms which can not be tested [Pablo]
>  - rebased on dpdk-next-crypto [Pablo]
>  - fix doc compilation error [Pablo]
>  - add release note for this PMD [Pablo]
>  - add R-b from Fan Zhang
>  - fix some typos
> 
> Changes in v3:
>  - set up capabilities for virtio crypto PMD [Fan]
>  - delete AES-CTR unit test cases since vhost_user crypto backend does n

[dpdk-dev] [PATCH v5 0/7] crypto: add virtio poll mode driver

2018-03-31 Thread Jay Zhou
This patch series introduce virtio crypto poll mode driver.

Since it is limited by the vhost crypto backend of the virtio-crypto,
this patch series only supports a limited subset of crypto services.
Only the following algorithms are tested:

Cipher algorithms:
  - RTE_CRYPTO_CIPHER_AES_CBC (128-bit, 192-bit and 256-bit keys)

Cipher then hash algorithms:
  - RTE_CRYPTO_CIPHER_AES_CBC with RTE_CRYPTO_AUTH_SHA1_HMAC

The qemu side has supported vhost crypto and the vhost user crypto server
side patches had been sent to DPDK community, pls see

[PATCH v2 00/10] lib/librte_vhost: introduce new vhost user crypto backend
support
https://dpdk.org/ml/archives/dev/2018-February/091594.html

Firstly run DPDK vhost crypto sample as a server side and build QEMU with
vhost crypto enabled. 
QEMU can then be started using the following parameters:

qemu-system-x86_64 \
[...] \
-chardev socket,id=charcrypto0,path=/path/to/your/socket \
-object cryptodev-vhost-user,id=cryptodev0,chardev=charcrypto0 \
-device virtio-crypto-pci,id=crypto0,cryptodev=cryptodev0
[...]

Bind the uio_generic driver for the virtio-crypto device.
For example, :00:04.0 is the domain, bus, device and function
number of the virtio-crypto device:
modprobe uio_pci_generic
echo -n :00:04.0 > /sys/bus/pci/drivers/virtio-pci/unbind
echo "1af4 1054" > /sys/bus/pci/drivers/uio_pci_generic/new_id

The front-end virtio crypto PMD driver can be installed:
cd to the top-level DPDK directory
sed -i 's,\(CONFIG_RTE_LIBRTE_PMD_VIRTIO_CRYPTO\)=n,\1=y,' 
config/common_base
make config T=x86_64-native-linuxapp-gcc
make install T=x86_64-native-linuxapp-gcc

The unit test cases can be compiled as below:
cd to the top-level DPDK directory
export RTE_TARGET=x86_64-native-linuxapp-gcc
export RTE_SDK=`pwd`
cd to test/test
make
./test (MUST reserve enough huge pages memory)
type the command "cryptodev_virtio_autotest" to test

The result should be like this:
RTE>>cryptodev_virtio_autotest
 + --- +
 + Test Suite : Crypto VIRTIO Unit Test Suite
 + --- +
  0) TestCase AES-128-CBC Encryption PASS
  1) TestCase AES-128-CBC Decryption PASS
  2) TestCase AES-192-CBC Encryption PASS
  3) TestCase AES-192-CBC Decryption PASS
  4) TestCase AES-256-CBC Encryption PASS
  5) TestCase AES-256-CBC Decryption PASS
  6) TestCase AES-256-CBC OOP Encryption PASS
  7) TestCase AES-256-CBC OOP Decryption PASS
 + TestCase [ 0] : test_AES_cipheronly_virtio_all succeeded
 + --- +
 + Test Suite Summary
 + Tests Total :1
 + Tests Skipped :  0
 + Tests Executed : 1
 + Tests Unsupported:   0
 + Tests Passed :   1
 + Tests Failed :   0
 + --- +
Test OK

The performance can be tested as below:

reserve enough huge pages
cd to the top-level DPDK directory
export RTE_TARGET=x86_64-native-linuxapp-gcc
export RTE_SDK=`pwd`
cd to app/test-crypto-perf
type the command "make" to compile
run the tests with the following command:

./dpdk-test-crypto-perf -l 0,1 -- --devtype crypto_virtio \
--ptest throughput --optype cipher-then-auth --cipher-algo aes-cbc \
--cipher-op encrypt --cipher-key-sz 16 --auth-algo sha1-hmac \
--auth-op generate --auth-key-sz 64 --digest-sz 12 \
--total-ops 1 --burst-sz 64 --buffer-sz 2048

Please help to review, thanks!

Changes in v5:
 - rebased on the newest dpdk-next-crypto

Changes in v4:
 - using dynamic logging [Pablo]
 - elaborate on the core code [Pablo]
 - delete algorithms which can not be tested [Pablo]
 - rebased on dpdk-next-crypto [Pablo]
 - fix doc compilation error [Pablo]
 - add release note for this PMD [Pablo]
 - add R-b from Fan Zhang
 - fix some typos

Changes in v3:
 - set up capabilities for virtio crypto PMD [Fan]
 - delete AES-CTR unit test cases since vhost_user crypto backend does not
   support [Fan]
 - fix a variable uninitialized in virtio_crypto_queue_setup() [Xin, Fan]
 - fix a bug in virtqueue_dequeue_burst_rx()

Changes in v2:
 - using pre-allocated mempool instead of rte_malloc to improve performance 
[Fan]
 - split the patch into a patchset [Fan]
 - using linux/virtio_crypto.h instead of creating a copy of the file [Fan]
 - update doc/guides/cryptodevs for describing virtio crypto PMD [Fan]
 - update copyright
 - delete virtio legacy mode code since virtio-crypto conforms to virtio-1.0
 - refine the function and variable names
 - fix errors and warnings reported by checkpatch

Jay Zhou (7):
  crypto/virtio: add virtio related fundamental functions
  crypto/virtio: add crypto related session structure
  crypto/virtio: core code of virtio crypto PMD
  crypto/virtio: add makefile
  doc: add virtio crypto PMD guide
  test/crypto: add function tests for virtio cr

[dpdk-dev] [PATCH v5 1/7] crypto/virtio: add virtio related fundamental functions

2018-03-31 Thread Jay Zhou
Since there does not have the common virtio library, we have to put
these files here. They are basically the same with virtio net related files
with some minor changes.

Meanwhile, adding virtio crypto PMD related release note for 18.05.

Signed-off-by: Jay Zhou 
Reviewed-by: Fan Zhang 
Acked-by: Fan Zhang 
---
 config/common_base |  14 +
 doc/guides/rel_notes/release_18_05.rst |   6 +
 drivers/crypto/virtio/virtio_logs.h|  91 +++
 drivers/crypto/virtio/virtio_pci.c | 460 +
 drivers/crypto/virtio/virtio_pci.h | 253 ++
 drivers/crypto/virtio/virtio_ring.h| 137 ++
 drivers/crypto/virtio/virtqueue.c  |  43 +++
 drivers/crypto/virtio/virtqueue.h  | 172 
 8 files changed, 1176 insertions(+)
 create mode 100644 drivers/crypto/virtio/virtio_logs.h
 create mode 100644 drivers/crypto/virtio/virtio_pci.c
 create mode 100644 drivers/crypto/virtio/virtio_pci.h
 create mode 100644 drivers/crypto/virtio/virtio_ring.h
 create mode 100644 drivers/crypto/virtio/virtqueue.c
 create mode 100644 drivers/crypto/virtio/virtqueue.h

diff --git a/config/common_base b/config/common_base
index a842478..bf6bbc7 100644
--- a/config/common_base
+++ b/config/common_base
@@ -486,6 +486,20 @@ CONFIG_RTE_LIBRTE_PMD_QAT_DEBUG_DRIVER=n
 CONFIG_RTE_QAT_PMD_MAX_NB_SESSIONS=2048
 
 #
+# Compile PMD for virtio crypto devices
+#
+CONFIG_RTE_LIBRTE_PMD_VIRTIO_CRYPTO=n
+#
+# Number of maximum virtio crypto devices
+#
+CONFIG_RTE_MAX_VIRTIO_CRYPTO=32
+#
+# Number of sessions to create in the session memory pool
+# on a single virtio crypto device.
+#
+CONFIG_RTE_VIRTIO_CRYPTO_PMD_MAX_NB_SESSIONS=1024
+
+#
 # Compile PMD for AESNI backed device
 #
 CONFIG_RTE_LIBRTE_PMD_AESNI_MB=n
diff --git a/doc/guides/rel_notes/release_18_05.rst 
b/doc/guides/rel_notes/release_18_05.rst
index 0eeabf5..a90c25e 100644
--- a/doc/guides/rel_notes/release_18_05.rst
+++ b/doc/guides/rel_notes/release_18_05.rst
@@ -53,6 +53,12 @@ New Features
   :doc:`../cryptodevs/ccp` crypto driver guide for more details on
   this new driver.
 
+* **Added the virtio crypto PMD.**
+
+  Added a new virtio crypto PMD, which provides AES-CBC ciphering and
+  AES-CBC with HMAC-SHA1 algorithm-chaining. See the
+  :doc:`../cryptodevs/virtio` crypto driver guide for more details on
+  this new driver.
 
 API Changes
 ---
diff --git a/drivers/crypto/virtio/virtio_logs.h 
b/drivers/crypto/virtio/virtio_logs.h
new file mode 100644
index 000..26a286c
--- /dev/null
+++ b/drivers/crypto/virtio/virtio_logs.h
@@ -0,0 +1,91 @@
+/* SPDX-License-Identifier: BSD-3-Clause
+ * Copyright(c) 2018 HUAWEI TECHNOLOGIES CO., LTD.
+ */
+
+#ifndef _VIRTIO_LOGS_H_
+#define _VIRTIO_LOGS_H_
+
+#include 
+
+#define PMD_INIT_LOG(level, fmt, args...) \
+   rte_log(RTE_LOG_ ## level, RTE_LOGTYPE_PMD, \
+   "PMD: %s(): " fmt "\n", __func__, ##args)
+
+#define PMD_INIT_FUNC_TRACE() PMD_INIT_LOG(DEBUG, " >>")
+
+extern int virtio_crypto_logtype_init;
+
+#define VIRTIO_CRYPTO_INIT_LOG_IMPL(level, fmt, args...) \
+   rte_log(RTE_LOG_ ## level, virtio_crypto_logtype_init, \
+   "INIT: %s(): " fmt "\n", __func__, ##args)
+
+#define VIRTIO_CRYPTO_INIT_LOG_INFO(fmt, args...) \
+   VIRTIO_CRYPTO_INIT_LOG_IMPL(INFO, fmt, ## args)
+
+#define VIRTIO_CRYPTO_INIT_LOG_DBG(fmt, args...) \
+   VIRTIO_CRYPTO_INIT_LOG_IMPL(DEBUG, fmt, ## args)
+
+#define VIRTIO_CRYPTO_INIT_LOG_ERR(fmt, args...) \
+   VIRTIO_CRYPTO_INIT_LOG_IMPL(ERR, fmt, ## args)
+
+extern int virtio_crypto_logtype_session;
+
+#define VIRTIO_CRYPTO_SESSION_LOG_IMPL(level, fmt, args...) \
+   rte_log(RTE_LOG_ ## level, virtio_crypto_logtype_session, \
+   "SESSION: %s(): " fmt "\n", __func__, ##args)
+
+#define VIRTIO_CRYPTO_SESSION_LOG_INFO(fmt, args...) \
+   VIRTIO_CRYPTO_SESSION_LOG_IMPL(INFO, fmt, ## args)
+
+#define VIRTIO_CRYPTO_SESSION_LOG_DBG(fmt, args...) \
+   VIRTIO_CRYPTO_SESSION_LOG_IMPL(DEBUG, fmt, ## args)
+
+#define VIRTIO_CRYPTO_SESSION_LOG_ERR(fmt, args...) \
+   VIRTIO_CRYPTO_SESSION_LOG_IMPL(ERR, fmt, ## args)
+
+extern int virtio_crypto_logtype_rx;
+
+#define VIRTIO_CRYPTO_RX_LOG_IMPL(level, fmt, args...) \
+   rte_log(RTE_LOG_ ## level, virtio_crypto_logtype_rx, \
+   "RX: %s(): " fmt "\n", __func__, ##args)
+
+#define VIRTIO_CRYPTO_RX_LOG_INFO(fmt, args...) \
+   VIRTIO_CRYPTO_RX_LOG_IMPL(INFO, fmt, ## args)
+
+#define VIRTIO_CRYPTO_RX_LOG_DBG(fmt, args...) \
+   VIRTIO_CRYPTO_RX_LOG_IMPL(DEBUG, fmt, ## args)
+
+#define VIRTIO_CRYPTO_RX_LOG_ERR(fmt, args...) \
+   VIRTIO_CRYPTO_RX_LOG_IMPL(ERR, fmt, ## args)
+
+extern int virtio_crypto_logtype_tx;
+
+#define VIRTIO_CRYPTO_TX_LOG_IMPL(level, fmt, args...) \
+   rte_log(RTE_LOG_ ## level, virtio_crypto_logtype_tx, \
+   "TX: %s(): " fmt "\n", __func__, ##args)
+
+#define VIRTIO_CRYPTO_TX_LOG_INFO(fmt, args...) \
+   VIRTIO_CRYPTO_TX_LOG_IMPL(INFO, fmt, ## arg

[dpdk-dev] [PATCH v5 6/7] test/crypto: add function tests for virtio crypto PMD

2018-03-31 Thread Jay Zhou
Only RTE_CRYPTO_CIPHER_AES_CBC cipher
algorithm are tested as unit test, it is supported both by the
cryptodev-backend-builtin and cryptodev-vhost-user of qemu side.

Signed-off-by: Jay Zhou 
Reviewed-by: Fan Zhang 
Acked-by: Fan Zhang 
---
 test/test/test_cryptodev.c  | 48 +
 test/test/test_cryptodev.h  |  1 +
 test/test/test_cryptodev_aes_test_vectors.h | 24 ++-
 test/test/test_cryptodev_blockcipher.c  |  9 +-
 test/test/test_cryptodev_blockcipher.h  |  1 +
 5 files changed, 74 insertions(+), 9 deletions(-)

diff --git a/test/test/test_cryptodev.c b/test/test/test_cryptodev.c
index d1d7925..2f31ec9 100644
--- a/test/test/test_cryptodev.c
+++ b/test/test/test_cryptodev.c
@@ -1820,6 +1820,25 @@ struct crypto_unittest_params {
 }
 
 static int
+test_AES_cipheronly_virtio_all(void)
+{
+   struct crypto_testsuite_params *ts_params = &testsuite_params;
+   int status;
+
+   status = test_blockcipher_all_tests(ts_params->mbuf_pool,
+   ts_params->op_mpool,
+   ts_params->session_mpool,
+   ts_params->valid_devs[0],
+   rte_cryptodev_driver_id_get(
+   RTE_STR(CRYPTODEV_NAME_VIRTIO_PMD)),
+   BLKCIPHER_AES_CIPHERONLY_TYPE);
+
+   TEST_ASSERT_EQUAL(status, 0, "Test failed");
+
+   return TEST_SUCCESS;
+}
+
+static int
 test_AES_chain_dpaa_sec_all(void)
 {
struct crypto_testsuite_params *ts_params = &testsuite_params;
@@ -8879,6 +8898,18 @@ struct test_crypto_vector {
}
 };
 
+static struct unit_test_suite cryptodev_virtio_testsuite = {
+   .suite_name = "Crypto VIRTIO Unit Test Suite",
+   .setup = testsuite_setup,
+   .teardown = testsuite_teardown,
+   .unit_test_cases = {
+   TEST_CASE_ST(ut_setup, ut_teardown,
+   test_AES_cipheronly_virtio_all),
+
+   TEST_CASES_END() /**< NULL terminate unit test array */
+   }
+};
+
 static struct unit_test_suite cryptodev_aesni_mb_testsuite  = {
.suite_name = "Crypto Device AESNI MB Unit Test Suite",
.setup = testsuite_setup,
@@ -9808,6 +9839,22 @@ struct test_crypto_vector {
 }
 
 static int
+test_cryptodev_virtio(void /*argv __rte_unused, int argc __rte_unused*/)
+{
+   gbl_driver_id = rte_cryptodev_driver_id_get(
+   RTE_STR(CRYPTODEV_NAME_VIRTIO_PMD));
+
+   if (gbl_driver_id == -1) {
+   RTE_LOG(ERR, USER1, "VIRTIO PMD must be loaded. Check if "
+   "CONFIG_RTE_LIBRTE_PMD_VIRTIO_CRYPTO is enabled 
"
+   "in config file to run this testsuite.\n");
+   return TEST_FAILED;
+   }
+
+   return unit_test_suite_runner(&cryptodev_virtio_testsuite);
+}
+
+static int
 test_cryptodev_aesni_mb(void /*argv __rte_unused, int argc __rte_unused*/)
 {
gbl_driver_id = rte_cryptodev_driver_id_get(
@@ -10040,3 +10087,4 @@ struct test_crypto_vector {
 REGISTER_TEST_COMMAND(cryptodev_dpaa2_sec_autotest, test_cryptodev_dpaa2_sec);
 REGISTER_TEST_COMMAND(cryptodev_dpaa_sec_autotest, test_cryptodev_dpaa_sec);
 REGISTER_TEST_COMMAND(cryptodev_ccp_autotest, test_cryptodev_ccp);
+REGISTER_TEST_COMMAND(cryptodev_virtio_autotest, test_cryptodev_virtio);
diff --git a/test/test/test_cryptodev.h b/test/test/test_cryptodev.h
index d45fb7b..a7acad8 100644
--- a/test/test/test_cryptodev.h
+++ b/test/test/test_cryptodev.h
@@ -62,6 +62,7 @@
 #define CRYPTODEV_NAME_SCHEDULER_PMD   crypto_scheduler
 #define CRYPTODEV_NAME_MRVL_PMDcrypto_mrvl
 #define CRYPTODEV_NAME_CCP_PMD crypto_ccp
+#define CRYPTODEV_NAME_VIRTIO_PMD  crypto_virtio
 
 /**
  * Write (spread) data from buffer to mbuf data
diff --git a/test/test/test_cryptodev_aes_test_vectors.h 
b/test/test/test_cryptodev_aes_test_vectors.h
index 6f2422a..724c1e0 100644
--- a/test/test/test_cryptodev_aes_test_vectors.h
+++ b/test/test/test_cryptodev_aes_test_vectors.h
@@ -1544,7 +1544,8 @@
BLOCKCIPHER_TEST_TARGET_PMD_DPAA2_SEC |
BLOCKCIPHER_TEST_TARGET_PMD_DPAA_SEC |
BLOCKCIPHER_TEST_TARGET_PMD_MRVL |
-   BLOCKCIPHER_TEST_TARGET_PMD_CCP
+   BLOCKCIPHER_TEST_TARGET_PMD_CCP |
+   BLOCKCIPHER_TEST_TARGET_PMD_VIRTIO
},
{
.test_descr = "AES-128-CBC Decryption",
@@ -1557,7 +1558,8 @@
BLOCKCIPHER_TEST_TARGET_PMD_DPAA2_SEC |
BLOCKCIPHER_TEST_TARGET_PMD_DPAA_SEC |
BLOCKCIPHER_TEST_TARGET_PMD_MRVL |
-   BLOCKCIPHER_TEST_TARGET_PMD_CCP
+   BLOCKCIPHER_TEST_TARGET_PMD_CCP |
+   BLOCKCIPHER_TEST_TARGET_PMD_VIRTIO
},
{
.test_descr = "AES-192-CBC Encryption",
@@ -1569,7 +1571,8 @@
BLOCKCIPHER_TEST_TARGE

[dpdk-dev] [PATCH v5 4/7] crypto/virtio: add makefile

2018-03-31 Thread Jay Zhou
The virtio crypto PMD driver can be compiled now.

Signed-off-by: Jay Zhou 
Reviewed-by: Fan Zhang 
Acked-by: Fan Zhang 
---
 drivers/crypto/Makefile|  1 +
 drivers/crypto/virtio/Makefile | 31 ++
 .../virtio/rte_pmd_virtio_crypto_version.map   |  3 +++
 mk/rte.app.mk  |  1 +
 4 files changed, 36 insertions(+)
 create mode 100644 drivers/crypto/virtio/Makefile
 create mode 100644 drivers/crypto/virtio/rte_pmd_virtio_crypto_version.map

diff --git a/drivers/crypto/Makefile b/drivers/crypto/Makefile
index 9fbd986..e9e8b1f 100644
--- a/drivers/crypto/Makefile
+++ b/drivers/crypto/Makefile
@@ -21,5 +21,6 @@ ifeq ($(CONFIG_RTE_LIBRTE_DPAA_BUS),y)
 DIRS-$(CONFIG_RTE_LIBRTE_PMD_DPAA_SEC) += dpaa_sec
 endif
 DIRS-$(CONFIG_RTE_LIBRTE_PMD_CCP) += ccp
+DIRS-$(CONFIG_RTE_LIBRTE_PMD_VIRTIO_CRYPTO) += virtio
 
 include $(RTE_SDK)/mk/rte.subdir.mk
diff --git a/drivers/crypto/virtio/Makefile b/drivers/crypto/virtio/Makefile
new file mode 100644
index 000..c4727ea
--- /dev/null
+++ b/drivers/crypto/virtio/Makefile
@@ -0,0 +1,31 @@
+# SPDX-License-Identifier: BSD-3-Clause
+# Copyright(c) 2018 HUAWEI TECHNOLOGIES CO., LTD.
+
+include $(RTE_SDK)/mk/rte.vars.mk
+
+#
+# library name
+#
+LIB = librte_pmd_virtio_crypto.a
+
+CFLAGS += -O3
+CFLAGS += $(WERROR_FLAGS)
+
+EXPORT_MAP := rte_pmd_virtio_crypto_version.map
+
+LIBABIVER := 1
+
+#
+# all source are stored in SRCS-y
+#
+SRCS-$(CONFIG_RTE_LIBRTE_PMD_VIRTIO_CRYPTO) += virtqueue.c
+SRCS-$(CONFIG_RTE_LIBRTE_PMD_VIRTIO_CRYPTO) += virtio_pci.c
+SRCS-$(CONFIG_RTE_LIBRTE_PMD_VIRTIO_CRYPTO) += virtio_rxtx.c
+SRCS-$(CONFIG_RTE_LIBRTE_PMD_VIRTIO_CRYPTO) += virtio_cryptodev.c
+
+# this lib depends upon:
+DEPDIRS-$(CONFIG_RTE_LIBRTE_PMD_VIRTIO_CRYPTO) += lib/librte_eal
+DEPDIRS-$(CONFIG_RTE_LIBRTE_PMD_VIRTIO_CRYPTO) += lib/librte_mempool 
lib/librte_mbuf
+DEPDIRS-$(CONFIG_RTE_LIBRTE_PMD_VIRTIO_CRYPTO) += lib/librte_cryptodev
+
+include $(RTE_SDK)/mk/rte.lib.mk
diff --git a/drivers/crypto/virtio/rte_pmd_virtio_crypto_version.map 
b/drivers/crypto/virtio/rte_pmd_virtio_crypto_version.map
new file mode 100644
index 000..de8e412
--- /dev/null
+++ b/drivers/crypto/virtio/rte_pmd_virtio_crypto_version.map
@@ -0,0 +1,3 @@
+DPDK_18.05 {
+   local: *;
+};
diff --git a/mk/rte.app.mk b/mk/rte.app.mk
index 8071aa6..c2767b0 100644
--- a/mk/rte.app.mk
+++ b/mk/rte.app.mk
@@ -204,6 +204,7 @@ _LDLIBS-$(CONFIG_RTE_LIBRTE_PMD_AESNI_GCM)   +=  -lIPSec_MB
 _LDLIBS-$(CONFIG_RTE_LIBRTE_PMD_OPENSSL) += -lrte_pmd_openssl -lcrypto
 _LDLIBS-$(CONFIG_RTE_LIBRTE_PMD_NULL_CRYPTO) += -lrte_pmd_null_crypto
 _LDLIBS-$(CONFIG_RTE_LIBRTE_PMD_QAT) += -lrte_pmd_qat -lcrypto
+_LDLIBS-$(CONFIG_RTE_LIBRTE_PMD_VIRTIO_CRYPTO) += -lrte_pmd_virtio_crypto 
-lcrypto
 _LDLIBS-$(CONFIG_RTE_LIBRTE_PMD_SNOW3G)  += -lrte_pmd_snow3g
 _LDLIBS-$(CONFIG_RTE_LIBRTE_PMD_SNOW3G)  += -L$(LIBSSO_SNOW3G_PATH)/build 
-lsso_snow3g
 _LDLIBS-$(CONFIG_RTE_LIBRTE_PMD_KASUMI)  += -lrte_pmd_kasumi
-- 
1.8.3.1




[dpdk-dev] [PATCH v5 7/7] MAINTAINERS: add myself as virtio crypto PMD maintainer

2018-03-31 Thread Jay Zhou
Signed-off-by: Jay Zhou 
Reviewed-by: Fan Zhang 
Acked-by: Fan Zhang 
---
 MAINTAINERS | 6 ++
 1 file changed, 6 insertions(+)

diff --git a/MAINTAINERS b/MAINTAINERS
index b262e55..5424e74 100644
--- a/MAINTAINERS
+++ b/MAINTAINERS
@@ -724,6 +724,12 @@ F: drivers/crypto/snow3g/
 F: doc/guides/cryptodevs/snow3g.rst
 F: doc/guides/cryptodevs/features/snow3g.ini
 
+Virtio
+M: Jay Zhou 
+F: drivers/crypto/virtio/
+F: doc/guides/cryptodevs/virtio.rst
+F: doc/guides/cryptodevs/features/virtio.ini
+
 ZUC
 M: Pablo de Lara 
 F: drivers/crypto/zuc/
-- 
1.8.3.1




[dpdk-dev] [PATCH v5 2/7] crypto/virtio: add crypto related session structure

2018-03-31 Thread Jay Zhou
This structure will be used in the following patches, especially
at creating and destroying crypto sessions.

Signed-off-by: Jay Zhou 
Reviewed-by: Fan Zhang 
Acked-by: Fan Zhang 
---
 drivers/crypto/virtio/virtio_crypto_algs.h | 27 +++
 1 file changed, 27 insertions(+)
 create mode 100644 drivers/crypto/virtio/virtio_crypto_algs.h

diff --git a/drivers/crypto/virtio/virtio_crypto_algs.h 
b/drivers/crypto/virtio/virtio_crypto_algs.h
new file mode 100644
index 000..5f1e9df
--- /dev/null
+++ b/drivers/crypto/virtio/virtio_crypto_algs.h
@@ -0,0 +1,27 @@
+/* SPDX-License-Identifier: BSD-3-Clause
+ * Copyright(c) 2018 HUAWEI TECHNOLOGIES CO., LTD.
+ */
+
+#ifndef _VIRTIO_CRYPTO_ALGS_H_
+#define _VIRTIO_CRYPTO_ALGS_H_
+
+#include 
+#include 
+
+struct virtio_crypto_session {
+   uint64_t session_id;
+
+   struct {
+   uint16_t offset;
+   uint16_t length;
+   } iv;
+
+   struct {
+   uint32_t length;
+   phys_addr_t phys_addr;
+   } aad;
+
+   struct virtio_crypto_op_ctrl_req ctrl;
+};
+
+#endif /* _VIRTIO_CRYPTO_ALGS_H_ */
-- 
1.8.3.1




[dpdk-dev] [PATCH v5 3/7] crypto/virtio: core code of virtio crypto PMD

2018-03-31 Thread Jay Zhou
The virtio crypto device has two types of queues, data
queue and control queue. It has one data queue at least and has one and
only one control queue. For example, if a virtio crypto device has
N queues, then [0, N-2] is the data queue index, N-1 is the control
queue index.
The virtio crypto PMD provides poll mode driver support for the
virtio crypto device.
The cryptodev is created at the virtio crypto pci device probing stage.
For now, it only supports the session-oriented API implementation, the
supported symmetrical algorithms are AES-CBC ciphering and AES-CBC with
HMAC-SHA1 algorithm-chaining. The function
virtio_crypto_sym_configure_session() is used to create a session, then
virtio_crypto_pkt_tx_burst() can be used to burst transfer packets and
virtio_crypto_pkt_rx_burst() can be used to burst receive packets.

Signed-off-by: Jay Zhou 
Reviewed-by: Fan Zhang 
Acked-by: Fan Zhang 
---
 drivers/crypto/virtio/virtio_crypto_capabilities.h |   51 +
 drivers/crypto/virtio/virtio_cryptodev.c   | 1508 
 drivers/crypto/virtio/virtio_cryptodev.h   |   66 +
 drivers/crypto/virtio/virtio_rxtx.c|  541 +++
 4 files changed, 2166 insertions(+)
 create mode 100644 drivers/crypto/virtio/virtio_crypto_capabilities.h
 create mode 100644 drivers/crypto/virtio/virtio_cryptodev.c
 create mode 100644 drivers/crypto/virtio/virtio_cryptodev.h
 create mode 100644 drivers/crypto/virtio/virtio_rxtx.c

diff --git a/drivers/crypto/virtio/virtio_crypto_capabilities.h 
b/drivers/crypto/virtio/virtio_crypto_capabilities.h
new file mode 100644
index 000..03c30de
--- /dev/null
+++ b/drivers/crypto/virtio/virtio_crypto_capabilities.h
@@ -0,0 +1,51 @@
+/* SPDX-License-Identifier: BSD-3-Clause
+ * Copyright(c) 2018 HUAWEI TECHNOLOGIES CO., LTD.
+ */
+
+#ifndef _VIRTIO_CRYPTO_CAPABILITIES_H_
+#define _VIRTIO_CRYPTO_CAPABILITIES_H_
+
+#define VIRTIO_SYM_CAPABILITIES\
+   {   /* SHA1 HMAC */ \
+   .op = RTE_CRYPTO_OP_TYPE_SYMMETRIC, \
+   {.sym = {   \
+   .xform_type = RTE_CRYPTO_SYM_XFORM_AUTH,\
+   {.auth = {  \
+   .algo = RTE_CRYPTO_AUTH_SHA1_HMAC,  \
+   .block_size = 64,   \
+   .key_size = {   \
+   .min = 1,   \
+   .max = 64,  \
+   .increment = 1  \
+   },  \
+   .digest_size = {\
+   .min = 1,   \
+   .max = 20,  \
+   .increment = 1  \
+   },  \
+   .iv_size = { 0 }\
+   }, }\
+   }, }\
+   },  \
+   {   /* AES CBC */   \
+   .op = RTE_CRYPTO_OP_TYPE_SYMMETRIC, \
+   {.sym = {   \
+   .xform_type = RTE_CRYPTO_SYM_XFORM_CIPHER,  \
+   {.cipher = {\
+   .algo = RTE_CRYPTO_CIPHER_AES_CBC,  \
+   .block_size = 16,   \
+   .key_size = {   \
+   .min = 16,  \
+   .max = 32,  \
+   .increment = 8  \
+   },  \
+   .iv_size = {\
+   .min = 16,  \
+   .max = 16,  \
+   .increment = 0  \
+   }   \
+   }, }\
+   }, }\
+   }
+
+#endif /* _VIRTIO_CRYPTO_CAPABILITIES_H_ */
diff --git a/dr

[dpdk-dev] [PATCH v5 5/7] doc: add virtio crypto PMD guide

2018-03-31 Thread Jay Zhou
Signed-off-by: Jay Zhou 
Reviewed-by: Fan Zhang 
Acked-by: Fan Zhang 
---
 doc/guides/cryptodevs/features/virtio.ini |  26 +++
 doc/guides/cryptodevs/index.rst   |   1 +
 doc/guides/cryptodevs/virtio.rst  | 117 ++
 3 files changed, 144 insertions(+)
 create mode 100644 doc/guides/cryptodevs/features/virtio.ini
 create mode 100644 doc/guides/cryptodevs/virtio.rst

diff --git a/doc/guides/cryptodevs/features/virtio.ini 
b/doc/guides/cryptodevs/features/virtio.ini
new file mode 100644
index 000..168fc17
--- /dev/null
+++ b/doc/guides/cryptodevs/features/virtio.ini
@@ -0,0 +1,26 @@
+; Supported features of the 'virtio' crypto driver.
+;
+; Refer to default.ini for the full list of available PMD features.
+;
+[Features]
+Symmetric crypto   = Y
+Sym operation chaining = Y
+
+;
+; Supported crypto algorithms of the 'virtio' crypto driver.
+;
+[Cipher]
+AES CBC (128)  = Y
+AES CBC (192)  = Y
+AES CBC (256)  = Y
+
+;
+; Supported authentication algorithms of the 'virtio' crypto driver.
+;
+[Auth]
+SHA1 HMAC  = Y
+
+;
+; Supported AEAD algorithms of the 'virtio' crypto driver.
+;
+[AEAD]
diff --git a/doc/guides/cryptodevs/index.rst b/doc/guides/cryptodevs/index.rst
index 8a921dd..0529583 100644
--- a/doc/guides/cryptodevs/index.rst
+++ b/doc/guides/cryptodevs/index.rst
@@ -23,4 +23,5 @@ Crypto Device Drivers
 scheduler
 snow3g
 qat
+virtio
 zuc
diff --git a/doc/guides/cryptodevs/virtio.rst b/doc/guides/cryptodevs/virtio.rst
new file mode 100644
index 000..f3aa7c6
--- /dev/null
+++ b/doc/guides/cryptodevs/virtio.rst
@@ -0,0 +1,117 @@
+..  SPDX-License-Identifier: BSD-3-Clause
+Copyright(c) 2018 HUAWEI TECHNOLOGIES CO., LTD.
+
+Virtio Crypto Poll Mode Driver
+==
+
+The virtio crypto PMD provides poll mode driver support for the virtio crypto
+device.
+
+Features
+
+
+The virtio crypto PMD has support for:
+
+Cipher algorithms:
+
+* ``RTE_CRYPTO_CIPHER_AES_CBC``
+
+Hash algorithms:
+
+* ``RTE_CRYPTO_AUTH_SHA1_HMAC``
+
+Limitations
+---
+
+*  Only supports the session-oriented API implementation (session-less APIs are
+   not supported).
+*  Only supports modern mode since virtio crypto conforms to virtio-1.0.
+*  Only has two types of queues: data queue and control queue. These two queues
+   only support indirect buffers to communication with the virtio backend.
+*  Only supports AES_CBC cipher only algorithm and AES_CBC with HMAC_SHA1
+   chaining algorithm since the vhost crypto backend only these algorithms
+   are supported.
+*  Does not support Link State interrupt.
+*  Does not support runtime configuration.
+
+Virtio crypto PMD Rx/Tx Callbacks
+-
+
+Rx callbacks:
+
+* ``virtio_crypto_pkt_rx_burst``
+
+Tx callbacks:
+
+* ``virtio_crypto_pkt_tx_burst``
+
+Installation
+
+
+Quick instructions are as follows:
+
+Firstly run DPDK vhost crypto sample as a server side and build QEMU with
+vhost crypto enabled.
+QEMU can then be started using the following parameters:
+
+.. code-block:: console
+
+qemu-system-x86_64 \
+[...] \
+-chardev socket,id=charcrypto0,path=/path/to/your/socket \
+-object cryptodev-vhost-user,id=cryptodev0,chardev=charcrypto0 \
+-device virtio-crypto-pci,id=crypto0,cryptodev=cryptodev0
+[...]
+
+Secondly bind the uio_generic driver for the virtio-crypto device.
+For example, :00:04.0 is the domain, bus, device and function
+number of the virtio-crypto device:
+
+.. code-block:: console
+
+modprobe uio_pci_generic
+echo -n :00:04.0 > /sys/bus/pci/drivers/virtio-pci/unbind
+echo "1af4 1054" > /sys/bus/pci/drivers/uio_pci_generic/new_id
+
+Finally the front-end virtio crypto PMD driver can be installed:
+
+.. code-block:: console
+
+cd to the top-level DPDK directory
+sed -i 's,\(CONFIG_RTE_LIBRTE_PMD_VIRTIO_CRYPTO\)=n,\1=y,' 
config/common_base
+make config T=x86_64-native-linuxapp-gcc
+make install T=x86_64-native-linuxapp-gcc
+
+Tests
+-
+
+The unit test cases can be tested as below:
+
+.. code-block:: console
+
+reserve enough huge pages
+cd to the top-level DPDK directory
+export RTE_TARGET=x86_64-native-linuxapp-gcc
+export RTE_SDK=`pwd`
+cd to test/test
+type the command "make" to compile
+run the tests with "./test"
+type the command "cryptodev_virtio_autotest" to test
+
+The performance can be tested as below:
+
+.. code-block:: console
+
+reserve enough huge pages
+cd to the top-level DPDK directory
+export RTE_TARGET=x86_64-native-linuxapp-gcc
+export RTE_SDK=`pwd`
+cd to app/test-crypto-perf
+type the command "make" to compile
+run the tests with the following command:
+
+./dpdk-test-crypto-perf -l 0,1 -- --devtype crypto_virtio \
+--ptest throughput --optype cipher-then-auth --cipher-algo aes-cbc \
+--cipher-op encrypt --cipher-key-sz 16 --auth-algo sha1-hmac \

Re: [dpdk-dev] [PATCH v3 1/4] eal/vfio: add support for multiple container

2018-03-31 Thread Maxime Coquelin



On 03/31/2018 04:29 AM, Xiao Wang wrote:

From: Junjie Chen 

Currently eal vfio framework binds vfio group fd to the default
container fd, while in some cases, e.g. vDPA (vhost data path
acceleration), we want to set vfio group to a new container and
program DMA mapping via this new container, so this patch adds
APIs to support multiple container.

Signed-off-by: Junjie Chen 
Signed-off-by: Xiao Wang 
---
  config/common_base   |   1 +
  lib/librte_eal/bsdapp/eal/eal.c  |  51 ++-
  lib/librte_eal/common/include/rte_vfio.h | 116 +++
  lib/librte_eal/linuxapp/eal/eal_vfio.c   | 552 +--
  lib/librte_eal/linuxapp/eal/eal_vfio.h   |   1 +
  lib/librte_eal/rte_eal_version.map   |   7 +
  6 files changed, 627 insertions(+), 101 deletions(-)



FWIW:

Reviewed-by: Maxime Coquelin 

Thanks,
Maxime


Re: [dpdk-dev] [PATCH v3 2/4] net/virtio: skip device probe in vdpa mode

2018-03-31 Thread Maxime Coquelin

Hi Xiao,

On 03/31/2018 04:29 AM, Xiao Wang wrote:

If we want a virtio device to work in vDPA (vhost data path acceleration)
mode, we could add a "vdpa=1" devarg for this device to specify the mode.

This patch let virtio pmd skip device probe when detecting this parameter.

Signed-off-by: Xiao Wang 
---
  drivers/net/virtio/virtio_ethdev.c | 43 ++
  1 file changed, 43 insertions(+)



As we discussed, I would prefer a generic solution at EAL level.
But as a start, I agree with this solution:

Reviewed-by: Maxime Coquelin 

Thanks!
Maxime


Re: [dpdk-dev] [PATCH v3 3/4] net/ifcvf: add ifcvf vdpa driver

2018-03-31 Thread Maxime Coquelin



On 03/31/2018 04:29 AM, Xiao Wang wrote:

The IFCVF vDPA (vhost data path acceleration) driver provides support for
the Intel FPGA 100G VF (IFCVF). IFCVF's datapath is virtio ring compatible,
it works as a HW vhost backend which can send/receive packets to/from
virtio directly by DMA.

Different VF devices serve different virtio frontends which are in
different VMs, so each VF needs to have its own DMA address translation
service. During the driver probe a new container is created, with this
container vDPA driver can program DMA remapping table with the VM's memory
region information.

Key vDPA driver ops implemented:

- ifcvf_dev_config:
   Enable VF data path with virtio information provided by vhost lib,
   including IOMMU programming to enable VF DMA to VM's memory, VFIO
   interrupt setup to route HW interrupt to virtio driver, create notify
   relay thread to translate virtio driver's kick to a MMIO write onto HW,
   HW queues configuration.

- ifcvf_dev_close:
   Revoke all the setup in ifcvf_dev_config.

Live migration feature is supported by IFCVF and this driver enables
it. For the dirty page logging, VF helps to log for packet buffer write,
driver helps to make the used ring as dirty when device stops.

Because vDPA driver needs to set up MSI-X vector to interrupt the
guest, only vfio-pci is supported currently.

Signed-off-by: Xiao Wang 
Signed-off-by: Rosen Xu 
---
  config/common_base|   7 +
  config/common_linuxapp|   1 +
  drivers/net/Makefile  |   3 +
  drivers/net/ifc/Makefile  |  36 ++
  drivers/net/ifc/base/ifcvf.c  | 329 +
  drivers/net/ifc/base/ifcvf.h  | 160 +++
  drivers/net/ifc/base/ifcvf_osdep.h|  52 +++
  drivers/net/ifc/ifcvf_vdpa.c  | 842 ++
  drivers/net/ifc/rte_ifcvf_version.map |   4 +
  mk/rte.app.mk |   3 +
  10 files changed, 1437 insertions(+)
  create mode 100644 drivers/net/ifc/Makefile
  create mode 100644 drivers/net/ifc/base/ifcvf.c
  create mode 100644 drivers/net/ifc/base/ifcvf.h
  create mode 100644 drivers/net/ifc/base/ifcvf_osdep.h
  create mode 100644 drivers/net/ifc/ifcvf_vdpa.c
  create mode 100644 drivers/net/ifc/rte_ifcvf_version.map


Thanks for having handled the changes, please see minor comments below.

Feel free to add my:
Reviewed-by: Maxime Coquelin 

Thanks!
Maxime


+static uint64_t
+qva_to_gpa(int vid, uint64_t qva)


We might want to have this in vhost-lib to avoid duplication,
but that can be done later.


+{
+   struct rte_vhost_memory *mem = NULL;
+   struct rte_vhost_mem_region *reg;
+   uint32_t i;
+   uint64_t gpa = 0;
+
+   if (rte_vhost_get_mem_table(vid, &mem) < 0)
+   goto exit;
+
+   for (i = 0; i < mem->nregions; i++) {
+   reg = &mem->regions[i];
+
+   if (qva >= reg->host_user_addr &&
+   qva < reg->host_user_addr + reg->size) {
+   gpa = qva - reg->host_user_addr + reg->guest_phys_addr;
+   break;
+   }
+   }
+
+exit:
+   if (gpa == 0)
+   rte_panic("failed to get gpa\n");
+   if (mem)
+   free(mem);
+   return gpa;
+}
+
+static int
+vdpa_ifcvf_start(struct ifcvf_internal *internal)
+{
+   struct ifcvf_hw *hw = &internal->hw;
+   int i, nr_vring;
+   int vid;
+   struct rte_vhost_vring vq;
+
+   vid = internal->vid;
+   nr_vring = rte_vhost_get_vring_num(vid);
+   rte_vhost_get_negotiated_features(vid, &hw->req_features);
+
+   for (i = 0; i < nr_vring; i++) {
+   rte_vhost_get_vhost_vring(vid, i, &vq);
+   hw->vring[i].desc = qva_to_gpa(vid, (uint64_t)vq.desc);
+   hw->vring[i].avail = qva_to_gpa(vid, (uint64_t)vq.avail);
+   hw->vring[i].used = qva_to_gpa(vid, (uint64_t)vq.used);
+   hw->vring[i].size = vq.size;
+   rte_vhost_get_vring_base(vid, i, &hw->vring[i].last_avail_idx,
+   &hw->vring[i].last_used_idx);
+   }
+   hw->nr_vring = i;
+
+   return ifcvf_start_hw(&internal->hw);
+}
+
+static void
+vdpa_ifcvf_stop(struct ifcvf_internal *internal)
+{
+   struct ifcvf_hw *hw = &internal->hw;
+   int i, j;
+   int vid;
+   uint64_t features, pfn;
+   uint64_t log_base, log_size;
+   uint8_t *log_buf;
+
+   vid = internal->vid;
+   ifcvf_stop_hw(hw);
+
+   for (i = 0; i < hw->nr_vring; i++)
+   rte_vhost_set_vring_base(vid, i, hw->vring[i].last_avail_idx,
+   hw->vring[i].last_used_idx);
+
+   rte_vhost_get_negotiated_features(vid, &features);
+   if (RTE_VHOST_NEED_LOG(features)) {
+   ifcvf_disable_logging(hw);
+   rte_vhost_get_log_base(internal->vid, &log_base, &log_size);
+   /*
+* IFCVF marks dirty memory page

Re: [dpdk-dev] [PATCH v3 4/4] net/ifcvf: add driver document and release note

2018-03-31 Thread Maxime Coquelin



On 03/31/2018 04:29 AM, Xiao Wang wrote:

Signed-off-by: Xiao Wang 
---
  doc/guides/nics/features/ifcvf.ini |  8 
  doc/guides/nics/ifcvf.rst  | 85 ++
  doc/guides/nics/index.rst  |  1 +
  doc/guides/rel_notes/release_18_05.rst |  9 
  4 files changed, 103 insertions(+)
  create mode 100644 doc/guides/nics/features/ifcvf.ini
  create mode 100644 doc/guides/nics/ifcvf.rst



Reviewed-by: Maxime Coquelin 

Thanks!
Maxime


Re: [dpdk-dev] [PATCH v3 2/4] net/virtio: skip device probe in vdpa mode

2018-03-31 Thread Thomas Monjalon
Hi,

31/03/2018 13:13, Maxime Coquelin:
> On 03/31/2018 04:29 AM, Xiao Wang wrote:
> > If we want a virtio device to work in vDPA (vhost data path acceleration)
> > mode, we could add a "vdpa=1" devarg for this device to specify the mode.
> > 
> > This patch let virtio pmd skip device probe when detecting this parameter.
> 
> As we discussed, I would prefer a generic solution at EAL level.

Please could you explain the requirement and the context?
Can we use RTE_ETH_DEV_DEFERRED state and device ownership?

Without knowing what's behind, I would say that a PMD should
never skip a device by itself, but let other entities decide
what to do with the probed device (thanks to probe notifications).




Re: [dpdk-dev] Build is broken in dpdk-next-net

2018-03-31 Thread Neil Horman
On Fri, Mar 30, 2018 at 10:47:09PM +0800, Tonghao Zhang wrote:
> I rebuild it on ubuntu 17.10 and cash it. I use the 'RTE_SET_USED' to fix it.
> 
> 
> diff --git a/lib/librte_vhost/fd_man.c b/lib/librte_vhost/fd_man.c
> index 771675718..f11803191 100644
> --- a/lib/librte_vhost/fd_man.c
> +++ b/lib/librte_vhost/fd_man.c
> @@ -279,7 +279,8 @@ fdset_pipe_read_cb(int readfd, void *dat __rte_unused,
>int *remove __rte_unused)
>  {
> char charbuf[16];
> -   read(readfd, charbuf, sizeof(charbuf));
> +   int r = read(readfd, charbuf, sizeof(charbuf));
> +   RTE_SET_USED(r);
>  }
> 
>  void
> @@ -319,5 +320,6 @@ fdset_pipe_init(struct fdset *fdset)
>  void
>  fdset_pipe_notify(struct fdset *fdset)
>  {
> -   write(fdset->u.writefd, "1", 1);
> +   int r = write(fdset->u.writefd, "1", 1);
> +   RTE_SET_USED(r);
>  }
> 

A better option might be to use _Pragma

Something like this perhaps

#define ALLOW_UNUSED(x) \
_Pragma(push) \
_Pragma(diagnostic ignored "-Wunused-result") \
#x;\
_Pragma(pop)

This is of course untested, so it probably needs some tweaking, but this method
avoids the need to declare an additional stack variable, which i don't think can
be eliminated due to the cast.  I believe that this method should also work
accross compilers (the gcc and clang compilers support this, and i think the
intel compiler should as well)

Neil



Re: [dpdk-dev] [PATCH v6] eal: provide API for querying valid socket id's

2018-03-31 Thread Burakov, Anatoly

On 27-Mar-18 5:24 PM, Thomas Monjalon wrote:

22/03/2018 13:36, Anatoly Burakov:

--- a/lib/librte_eal/common/include/rte_eal.h
+++ b/lib/librte_eal/common/include/rte_eal.h
@@ -57,6 +57,9 @@ enum rte_proc_type_t {
  struct rte_config {
uint32_t master_lcore;   /**< Id of the master lcore */
uint32_t lcore_count;/**< Number of available logical cores. */
+   uint32_t numa_node_count;/**< Number of detected NUMA nodes. */
+   uint32_t numa_nodes[RTE_MAX_NUMA_NODES];
+   /**< List of detected numa nodes. */


Please keep this comment on the same line if it's below 99 chars.


If this is allowed, can we fix checkpatch to not report error in these 
cases?


--
Thanks,
Anatoly


Re: [dpdk-dev] Build is broken in dpdk-next-net

2018-03-31 Thread Gaëtan Rivet
On Sat, Mar 31, 2018 at 09:33:43AM -0400, Neil Horman wrote:
> On Fri, Mar 30, 2018 at 10:47:09PM +0800, Tonghao Zhang wrote:
> > I rebuild it on ubuntu 17.10 and cash it. I use the 'RTE_SET_USED' to fix 
> > it.
> > 
> > 
> > diff --git a/lib/librte_vhost/fd_man.c b/lib/librte_vhost/fd_man.c
> > index 771675718..f11803191 100644
> > --- a/lib/librte_vhost/fd_man.c
> > +++ b/lib/librte_vhost/fd_man.c
> > @@ -279,7 +279,8 @@ fdset_pipe_read_cb(int readfd, void *dat __rte_unused,
> >int *remove __rte_unused)
> >  {
> > char charbuf[16];
> > -   read(readfd, charbuf, sizeof(charbuf));
> > +   int r = read(readfd, charbuf, sizeof(charbuf));
> > +   RTE_SET_USED(r);
> >  }
> > 
> >  void
> > @@ -319,5 +320,6 @@ fdset_pipe_init(struct fdset *fdset)
> >  void
> >  fdset_pipe_notify(struct fdset *fdset)
> >  {
> > -   write(fdset->u.writefd, "1", 1);
> > +   int r = write(fdset->u.writefd, "1", 1);
> > +   RTE_SET_USED(r);
> >  }
> > 
> 
> A better option might be to use _Pragma
> 
> Something like this perhaps
> 
> #define ALLOW_UNUSED(x) \
> _Pragma(push) \
> _Pragma(diagnostic ignored "-Wunused-result") \
> #x;\
> _Pragma(pop)
> 
> This is of course untested, so it probably needs some tweaking, but this 
> method
> avoids the need to declare an additional stack variable, which i don't think 
> can
> be eliminated due to the cast.  I believe that this method should also work
> accross compilers (the gcc and clang compilers support this, and i think the
> intel compiler should as well)
> 
> Neil
> 

It would be nice to avoid the definition of a useless variable.
An alternative could be

   if (read() < 0) {
   /* Failure here is acceptable for such and such reason. */
   }

to ensure all-around compatibility, and the definition or another macro.
Just a suggestion.

-- 
Gaëtan Rivet
6WIND


Re: [dpdk-dev] Build is broken in dpdk-next-net

2018-03-31 Thread Neil Horman
On Sat, Mar 31, 2018 at 05:09:47PM +0200, Gaëtan Rivet wrote:
> On Sat, Mar 31, 2018 at 09:33:43AM -0400, Neil Horman wrote:
> > On Fri, Mar 30, 2018 at 10:47:09PM +0800, Tonghao Zhang wrote:
> > > I rebuild it on ubuntu 17.10 and cash it. I use the 'RTE_SET_USED' to fix 
> > > it.
> > > 
> > > 
> > > diff --git a/lib/librte_vhost/fd_man.c b/lib/librte_vhost/fd_man.c
> > > index 771675718..f11803191 100644
> > > --- a/lib/librte_vhost/fd_man.c
> > > +++ b/lib/librte_vhost/fd_man.c
> > > @@ -279,7 +279,8 @@ fdset_pipe_read_cb(int readfd, void *dat __rte_unused,
> > >int *remove __rte_unused)
> > >  {
> > > char charbuf[16];
> > > -   read(readfd, charbuf, sizeof(charbuf));
> > > +   int r = read(readfd, charbuf, sizeof(charbuf));
> > > +   RTE_SET_USED(r);
> > >  }
> > > 
> > >  void
> > > @@ -319,5 +320,6 @@ fdset_pipe_init(struct fdset *fdset)
> > >  void
> > >  fdset_pipe_notify(struct fdset *fdset)
> > >  {
> > > -   write(fdset->u.writefd, "1", 1);
> > > +   int r = write(fdset->u.writefd, "1", 1);
> > > +   RTE_SET_USED(r);
> > >  }
> > > 
> > 
> > A better option might be to use _Pragma
> > 
> > Something like this perhaps
> > 
> > #define ALLOW_UNUSED(x) \
> > _Pragma(push) \
> > _Pragma(diagnostic ignored "-Wunused-result") \
> > #x;\
> > _Pragma(pop)
> > 
> > This is of course untested, so it probably needs some tweaking, but this 
> > method
> > avoids the need to declare an additional stack variable, which i don't 
> > think can
> > be eliminated due to the cast.  I believe that this method should also work
> > accross compilers (the gcc and clang compilers support this, and i think the
> > intel compiler should as well)
> > 
> > Neil
> > 
> 
> It would be nice to avoid the definition of a useless variable.
> An alternative could be
> 
>if (read() < 0) {
>/* Failure here is acceptable for such and such reason. */
>}
> 
> to ensure all-around compatibility, and the definition or another macro.
> Just a suggestion.
> 
That would be a good alternative, but I think its effectiveness is dependent on
when the compiler does with the return value check. Without any code inside the
conditional, the compiler may optimize the check out, meaning the warning will
still be asserted.  If it doesn't optimize the check out, then you have a
useless compare and jump instruction left in the code path.

Best
Neil



Re: [dpdk-dev] [PATCH v4 09/20] eal/dev: implement device iteration initialization

2018-03-31 Thread Gaëtan Rivet
On Fri, Mar 30, 2018 at 04:22:15PM +, Wiles, Keith wrote:
> 
> 
> > On Mar 30, 2018, at 10:53 AM, Gaëtan Rivet  wrote:
> > 
> > Hello Keith,
> 
> Hello Gaëtan,
> 
> >>> + layers[i].kvlist = rte_kvargs_parse(copy, NULL);
> >>> + free(copy);
> >> 
> >> I am sorry this method of not adding blank lines is a bit silly and we 
> >> need to rethink at least adding a few blank lines to help with grouping 
> >> the code. This style will cause problems for new readers (old readers) to 
> >> understand the code. This to me is a maintenance problem for the future 
> >> and we need to fix this now.
> >> 
> >> Blank lines after if statements (with possible more comments) can help 
> >> along with adding blank lines to group code is really the minimum amount 
> >> of lines required. I have never seen someone state you have to many blanks 
> >> lines in the code except two or more blank lines in a row. This is akin to 
> >> having a single paragraph in a novel or letter and it makes it very hard 
> >> to read. It is not hard to add some blank lines to the code for 
> >> readability.
> >> 
> > 
> > I understand. What I dislike is having inconsistencies in the layout of
> > the code.
> > 
> > "Paragraphs", for lack of a better word, are high subjective and a
> > matter of taste.
> 
> I bet your teacher(s) would disagree with that statement with one single 
> paragraph in your book reports :-)

The utility of using paragraph is not a matter of subjectivity.
How to use them and how to structure information is what I deemed
subjective.

> > 
> > Given that subjectivity is not helpful in review and taste is hard to
> > debate, I prefer to have a single terse rule, that is to avoid any
> > additional bytes beside the bare minimum to respect checkpatch.
> 
> Taste is hard to debate, but you have gone the extreme route with only the 
> bare minimum blank lines and that is not good as well. A silly script does 
> not read code or understand code we the humans have to make the code readable.
> > 
> > When I feel the need to have a new "conceptual group", then I am forced
> > to add a comment to explain what is happening. By not allowing blank
> > lines, I thus feel the pressure for space and explanation more acutely.
> 
> A blank can give somewhat convey the same information without a comment, but 
> not in all cases. Even a blank before a group of lines can convey this is a 
> new logic section. I do not buy the point for needing the same terse rule 
> here as most of the coding style is free form and allows for reading between 
> the lines a bit.
> 
> We can make a rule here, but no blank lines in a function this size and the 
> patch of this size is making DPDK not as professional looking as it could be.
> 

I think one of the main issue anyway is that this function is simply too
large as it is.

As it turns out, I am working on the second side of this work, which is
revamping the device declaration path.

This function will be split in different parts, that will be shorter and
more palatable.

This is a big work, still in progress (the device declaration, not the
split of this function).

-- 
Gaëtan Rivet
6WIND


[dpdk-dev] [PATCH v4 2/3] Add Intel FPGA BUS Rawdev Driver

2018-03-31 Thread Rosen Xu
Signed-off-by: Rosen Xu 
Signed-off-by: Yanglong Wu  
---
 config/common_base |   1 +
 drivers/raw/Makefile   |   1 +
 drivers/raw/ifpga_rawdev/Makefile  |  34 ++
 drivers/raw/ifpga_rawdev/ifpga_rawdev.c| 594 +
 drivers/raw/ifpga_rawdev/ifpga_rawdev.h|  37 ++
 .../raw/ifpga_rawdev/rte_ifpga_rawdev_version.map  |   4 +
 mk/rte.app.mk  |   1 +
 7 files changed, 672 insertions(+)
 create mode 100644 drivers/raw/ifpga_rawdev/Makefile
 create mode 100644 drivers/raw/ifpga_rawdev/ifpga_rawdev.c
 create mode 100644 drivers/raw/ifpga_rawdev/ifpga_rawdev.h
 create mode 100644 drivers/raw/ifpga_rawdev/rte_ifpga_rawdev_version.map

diff --git a/config/common_base b/config/common_base
index 49f6b09..08b7cce 100644
--- a/config/common_base
+++ b/config/common_base
@@ -137,6 +137,7 @@ CONFIG_RTE_LIBRTE_VDEV_BUS=y
 # Compile the Intel FPGA bus
 #
 CONFIG_RTE_LIBRTE_IFPGA_BUS=y
+CONFIG_RTE_LIBRTE_IFPGA_RAWDEV=y
 
 #
 # Compile ARK PMD
diff --git a/drivers/raw/Makefile b/drivers/raw/Makefile
index da7c8b4..6fc8f2f 100644
--- a/drivers/raw/Makefile
+++ b/drivers/raw/Makefile
@@ -5,5 +5,6 @@ include $(RTE_SDK)/mk/rte.vars.mk
 
 # DIRS-$() += 
 DIRS-$(CONFIG_RTE_LIBRTE_PMD_SKELETON_RAWDEV) += skeleton_rawdev
+DIRS-$(CONFIG_RTE_LIBRTE_IFPGA_RAWDEV) += ifpga_rawdev
 
 include $(RTE_SDK)/mk/rte.subdir.mk
diff --git a/drivers/raw/ifpga_rawdev/Makefile 
b/drivers/raw/ifpga_rawdev/Makefile
new file mode 100644
index 000..118c729
--- /dev/null
+++ b/drivers/raw/ifpga_rawdev/Makefile
@@ -0,0 +1,34 @@
+# SPDX-License-Identifier: BSD-3-Clause
+# Copyright(c) 2018 Intel Corporation
+
+include $(RTE_SDK)/mk/rte.vars.mk
+
+#
+# library name
+#
+LIB = librte_ifpga_rawdev.a
+
+CFLAGS += -DALLOW_EXPERIMENTAL_API
+CFLAGS += -O3
+CFLAGS += $(WERROR_FLAGS)
+CFLAGS += -I$(RTE_SDK)/drivers/bus/ifpga
+CFLAGS += -I$(RTE_SDK)/drivers/raw/ifpga_rawdev
+LDLIBS += -lrte_eal
+LDLIBS += -lrte_rawdev
+LDLIBS += -lrte_bus_vdev
+LDLIBS += -lrte_kvargs
+
+EXPORT_MAP := rte_ifpga_rawdev_version.map
+
+LIBABIVER := 1
+
+VPATH += $(SRCDIR)/base
+
+include $(RTE_SDK)/drivers/raw/ifpga_rawdev/base/Makefile
+
+#
+# all source are stored in SRCS-y
+#
+SRCS-$(CONFIG_RTE_LIBRTE_IFPGA_RAWDEV) += ifpga_rawdev.c
+
+include $(RTE_SDK)/mk/rte.lib.mk
diff --git a/drivers/raw/ifpga_rawdev/ifpga_rawdev.c 
b/drivers/raw/ifpga_rawdev/ifpga_rawdev.c
new file mode 100644
index 000..e46c014
--- /dev/null
+++ b/drivers/raw/ifpga_rawdev/ifpga_rawdev.c
@@ -0,0 +1,594 @@
+/* SPDX-License-Identifier: BSD-3-Clause
+ * Copyright(c) 2010-2018 Intel Corporation
+ */
+
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+
+#include "base/opae_hw_api.h"
+#include "rte_rawdev.h"
+#include "rte_rawdev_pmd.h"
+#include "rte_bus_ifpga.h"
+#include "ifpga_common.h"
+#include "ifpga_logs.h"
+#include "ifpga_rawdev.h"
+
+int ifpga_rawdev_logtype;
+
+#define PCI_VENDOR_ID_INTEL  0x8086
+/* PCI Device ID */
+#define PCIE_DEVICE_ID_PF_INT_5_X0xBCBD
+#define PCIE_DEVICE_ID_PF_INT_6_X0xBCC0
+#define PCIE_DEVICE_ID_PF_DSC_1_X0x09C4
+/* VF Device */
+#define PCIE_DEVICE_ID_VF_INT_5_X0xBCBF
+#define PCIE_DEVICE_ID_VF_INT_6_X0xBCC1
+#define PCIE_DEVICE_ID_VF_DSC_1_X0x09C5
+#define RTE_MAX_RAW_DEVICE   10
+
+static const struct rte_pci_id pci_ifpga_map[] = {
+   { RTE_PCI_DEVICE(PCI_VENDOR_ID_INTEL, PCIE_DEVICE_ID_PF_INT_5_X) },
+   { RTE_PCI_DEVICE(PCI_VENDOR_ID_INTEL, PCIE_DEVICE_ID_VF_INT_5_X) },
+   { RTE_PCI_DEVICE(PCI_VENDOR_ID_INTEL, PCIE_DEVICE_ID_PF_INT_6_X) },
+   { RTE_PCI_DEVICE(PCI_VENDOR_ID_INTEL, PCIE_DEVICE_ID_VF_INT_6_X) },
+   { RTE_PCI_DEVICE(PCI_VENDOR_ID_INTEL, PCIE_DEVICE_ID_PF_DSC_1_X) },
+   { RTE_PCI_DEVICE(PCI_VENDOR_ID_INTEL, PCIE_DEVICE_ID_VF_DSC_1_X) },
+   { .vendor_id = 0, /* sentinel */ },
+};
+
+static int ifpga_fill_afu_dev(struct opae_accelerator *acc,
+   struct rte_afu_device *afu_dev)
+{
+   struct rte_mem_resource *res = afu_dev->mem_resource;
+   struct opae_acc_region_info region_info;
+   struct opae_acc_info info;
+   unsigned long i;
+   int ret;
+
+   ret = opae_acc_get_info(acc, &info);
+   if (ret)
+   return ret;
+
+   if (info.num_regions > PCI_MAX_RESOURCE)
+   return -EFAULT;
+
+   afu_dev->num_region = info.num_regions;
+
+   for (i = 0; i < info.num_regions; i++) {
+   region_info.index = i;
+   ret = opae_acc_get_region_info(acc, ®ion_info);
+   if (ret)
+   return ret;
+
+   if ((region_info.flags & ACC_REGION_MMIO) &&
+   (region_info.flags & ACC_REGION_READ

[dpdk-dev] [PATCH v4 0/3] Introduce Intel FPGA BUS

2018-03-31 Thread Rosen Xu
Intel FPGA BUS in DPDK
-

This patch set introduces Intel FPGA BUS support in DPDK.

v4 updates:
===
 - Remove all modifications from eal
 - Create vdev to take IFPGA parameters configuration
 - AFU Device Driver bind to AFU Device by uuid
 - Take more test in scenario of Multi-FPGA System
 
v3 updates:
===
 - Remove all modifications of bus scan and probe
 - FPGA BUS Scan is trigged by hotplug of Rawdev
 - Took Modifications of comments
 - Move AFU Device to IFPGA
 - FPGA BUS Scan depend on it??s IFPGA Rawdev
 - Add Build Macros for FPGA BUS and IFPGA Rawdev

Questions
=
Why not PCI Bus?
All of the AFUs of one FPGA may share same PCI BDF.
Why not vdev Bus?
Because AFUs depend on Rawdev, and it's hardware specpic.

Motivation
==
FPGA is used more and more widely in Cloud and NFV, one primary reason is
that FPGA not only provide ASIC performance but also it's more flexible 
than ASIC. FPGA use Partial Reconfigure(PR) Parts of Bitstream to achieve 
its flexibility. Another reason is that one FPGA can be shared 
by different Users, and each User can use some of AFUs of One FPGA.

That means One FPGA Device Bitstream is divided into many Parts of 
Bitstream(each Part of Bitstream is defined as AFU-Accelerated 
Function Unit), and each AFU is a Hardware Acceleration Unit and 
it can dynamically Reload respectively.

Proposed Solution
=
 - Involve Rawdev to take FPGA Partial Configuration(Download/PR)
 - Defined FPGA-BUS for Acceleration Drivers of AFUs
   - FPGA PCI Scan(1st Scan) follows DPDK UIO/VFIO PCI Scan Process, 
 probe Intel FPGA Rawdev Driver. FPGA-BUS scan is called, but AFU
 depend on Rawdev, so this scan doesn't trig AFU device create.
   - AFU Scan(2nd Scan) bind DPDK Driver to FPGA Partial-Bitstream.
 This scan is trigged by hotplug of IFPGA Rawdev probe, in this
 scan the AFUs will be created and their dirves are also probed.

Scope
=
The Intel FPGA BUS implementation is target towards various FPGA Devices 
use PR to provide many Acceleration Function. Specific PMDs may also 
bind to its AFU. And Applications don't care they are using ASIC 
Acceleration or FPGA AFU Acceleration.


Status
=
With integrating Intel PSG FPGA Software Stack OPAE(Open Programmable 
Acceleration Engine) Share Code, Intel FPGA BUS runs well in 
Intel PSG FPGA Cards.

Rosen Xu (3):
  Add Intel FPGA BUS Lib Code
  Add Intel FPGA BUS Rawdev Driver
  Add Intel FPGA OPAE Share Code

 config/common_base |6 +
 drivers/bus/Makefile   |1 +
 drivers/bus/ifpga/Makefile |   33 +
 drivers/bus/ifpga/ifpga_bus.c  |  517 ++
 drivers/bus/ifpga/ifpga_common.c   |  141 ++
 drivers/bus/ifpga/ifpga_common.h   |   22 +
 drivers/bus/ifpga/ifpga_logs.h |   31 +
 drivers/bus/ifpga/rte_bus_ifpga.h  |  175 ++
 drivers/bus/ifpga/rte_bus_ifpga_version.map|8 +
 drivers/raw/Makefile   |1 +
 drivers/raw/ifpga_rawdev/Makefile  |   34 +
 drivers/raw/ifpga_rawdev/base/Makefile |   54 +
 drivers/raw/ifpga_rawdev/base/ifpga_api.c  |  529 ++
 drivers/raw/ifpga_rawdev/base/ifpga_api.h  |   73 +
 drivers/raw/ifpga_rawdev/base/ifpga_compat.h   |   84 +
 drivers/raw/ifpga_rawdev/base/ifpga_defines.h  | 1688 
 drivers/raw/ifpga_rawdev/base/ifpga_enumerate.c|  851 ++
 drivers/raw/ifpga_rawdev/base/ifpga_enumerate.h|   38 +
 drivers/raw/ifpga_rawdev/base/ifpga_feature_dev.c  |  341 
 drivers/raw/ifpga_rawdev/base/ifpga_feature_dev.h  |  191 +++
 drivers/raw/ifpga_rawdev/base/ifpga_fme.c  |  761 +
 drivers/raw/ifpga_rawdev/base/ifpga_fme_dperf.c|  328 
 drivers/raw/ifpga_rawdev/base/ifpga_fme_error.c|  430 +
 drivers/raw/ifpga_rawdev/base/ifpga_fme_iperf.c|  742 +
 drivers/raw/ifpga_rawdev/base/ifpga_fme_pr.c   |  399 +
 drivers/raw/ifpga_rawdev/base/ifpga_hw.h   |  154 ++
 drivers/raw/ifpga_rawdev/base/ifpga_port.c |  435 +
 drivers/raw/ifpga_rawdev/base/ifpga_port_error.c   |  192 +++
 drivers/raw/ifpga_rawdev/base/opae_debug.c |  126 ++
 drivers/raw/ifpga_rawdev/base/opae_debug.h |   46 +
 drivers/raw/ifpga_rawdev/base/opae_hw_api.c|  408 +
 drivers/raw/ifpga_rawdev/base/opae_hw_api.h|  280 
 drivers/raw/ifpga_rawdev/base/opae_ifpga_hw_api.c  |  172 ++
 drivers/raw/ifpga_rawdev/base/opae_ifpga_hw_api.h  |  306 
 drivers/raw/ifpga_rawdev/base/opae_osdep.h |  115 ++
 .../ifpga_rawdev/base/osdep_raw/osdep_generic.h|  104 ++
 .../ifpga_rawdev/base/osdep_rte/osdep_generic.h|   72 +
 drivers/raw/ifpga_rawdev/ifpga_rawdev.c|  594 +++
 drivers/raw/ifpga_rawdev/ifpga_rawdev.h|   37 +
 .../raw/ifpga_raw

[dpdk-dev] [PATCH v4 1/3] Add Intel FPGA BUS Lib Code

2018-03-31 Thread Rosen Xu
Signed-off-by: Rosen Xu 
---
 config/common_base  |   5 +
 drivers/bus/Makefile|   1 +
 drivers/bus/ifpga/Makefile  |  33 ++
 drivers/bus/ifpga/ifpga_bus.c   | 517 
 drivers/bus/ifpga/ifpga_common.c| 141 
 drivers/bus/ifpga/ifpga_common.h|  22 ++
 drivers/bus/ifpga/ifpga_logs.h  |  31 ++
 drivers/bus/ifpga/rte_bus_ifpga.h   | 175 ++
 drivers/bus/ifpga/rte_bus_ifpga_version.map |   8 +
 mk/rte.app.mk   |   2 +
 10 files changed, 935 insertions(+)
 create mode 100644 drivers/bus/ifpga/Makefile
 create mode 100644 drivers/bus/ifpga/ifpga_bus.c
 create mode 100644 drivers/bus/ifpga/ifpga_common.c
 create mode 100644 drivers/bus/ifpga/ifpga_common.h
 create mode 100644 drivers/bus/ifpga/ifpga_logs.h
 create mode 100644 drivers/bus/ifpga/rte_bus_ifpga.h
 create mode 100644 drivers/bus/ifpga/rte_bus_ifpga_version.map

diff --git a/config/common_base b/config/common_base
index ad03cf4..49f6b09 100644
--- a/config/common_base
+++ b/config/common_base
@@ -134,6 +134,11 @@ CONFIG_RTE_LIBRTE_PCI_BUS=y
 CONFIG_RTE_LIBRTE_VDEV_BUS=y
 
 #
+# Compile the Intel FPGA bus
+#
+CONFIG_RTE_LIBRTE_IFPGA_BUS=y
+
+#
 # Compile ARK PMD
 #
 CONFIG_RTE_LIBRTE_ARK_PMD=y
diff --git a/drivers/bus/Makefile b/drivers/bus/Makefile
index 7ef2593..55d2dfe 100644
--- a/drivers/bus/Makefile
+++ b/drivers/bus/Makefile
@@ -7,5 +7,6 @@ DIRS-$(CONFIG_RTE_LIBRTE_DPAA_BUS) += dpaa
 DIRS-$(CONFIG_RTE_LIBRTE_FSLMC_BUS) += fslmc
 DIRS-$(CONFIG_RTE_LIBRTE_PCI_BUS) += pci
 DIRS-$(CONFIG_RTE_LIBRTE_VDEV_BUS) += vdev
+DIRS-$(CONFIG_RTE_LIBRTE_IFPGA_BUS) += ifpga
 
 include $(RTE_SDK)/mk/rte.subdir.mk
diff --git a/drivers/bus/ifpga/Makefile b/drivers/bus/ifpga/Makefile
new file mode 100644
index 000..1b569af
--- /dev/null
+++ b/drivers/bus/ifpga/Makefile
@@ -0,0 +1,33 @@
+# SPDX-License-Identifier: BSD-3-Clause
+# Copyright(c) 2018 Intel Corporation
+
+include $(RTE_SDK)/mk/rte.vars.mk
+
+#
+# library name
+#
+LIB = librte_bus_ifpga.a
+
+CFLAGS += -O3
+CFLAGS += $(WERROR_FLAGS)
+
+# versioning export map
+EXPORT_MAP := rte_bus_ifpga_version.map
+
+# library version
+LIBABIVER := 1
+
+VPATH += $(SRCDIR)/base
+
+SRCS-y += \
+ifpga_bus.c \
+ifpga_common.c
+
+LDLIBS += -lrte_eal
+
+#
+# Export include files
+#
+SYMLINK-y-include += rte_bus_ifpga.h
+
+include $(RTE_SDK)/mk/rte.lib.mk
diff --git a/drivers/bus/ifpga/ifpga_bus.c b/drivers/bus/ifpga/ifpga_bus.c
new file mode 100644
index 000..eba2615
--- /dev/null
+++ b/drivers/bus/ifpga/ifpga_bus.c
@@ -0,0 +1,517 @@
+/* SPDX-License-Identifier: BSD-3-Clause
+ * Copyright(c) 2010-2018 Intel Corporation
+ */
+
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+
+#include 
+#include 
+#include 
+#include 
+#include 
+
+#include "rte_rawdev.h"
+#include "rte_rawdev_pmd.h"
+#include "rte_bus_ifpga.h"
+#include "ifpga_logs.h"
+#include "ifpga_common.h"
+
+int ifpga_bus_logtype;
+
+/* register a ifpga bus based driver */
+void rte_ifpga_driver_register(struct rte_afu_driver *driver)
+{
+   RTE_VERIFY(driver);
+
+   TAILQ_INSERT_TAIL(&rte_ifpga_bus.driver_list, driver, next);
+}
+
+/* un-register a fpga bus based driver */
+void rte_ifpga_driver_unregister(struct rte_afu_driver *driver)
+{
+   TAILQ_REMOVE(&rte_ifpga_bus.driver_list, driver, next);
+}
+
+static struct rte_ifpga_device *
+ifpga_find_ifpga_dev(const struct rte_pci_addr *pci_addr)
+{
+   struct rte_ifpga_device *ifpga_dev = NULL;
+
+   TAILQ_FOREACH(ifpga_dev, &rte_ifpga_bus.ifpga_list, next) {
+   if (!rte_pci_addr_cmp(&ifpga_dev->pci_addr, pci_addr))
+   return ifpga_dev;
+   }
+   return NULL;
+}
+
+static struct rte_afu_device *
+ifpga_find_afu_dev(const struct rte_ifpga_device *ifpga_dev,
+   const struct rte_afu_id *afu_id)
+{
+   struct rte_afu_device *afu_dev = NULL;
+
+   TAILQ_FOREACH(afu_dev, &ifpga_dev->afu_list, next) {
+   if (!ifpga_afu_id_cmp(&afu_dev->id, afu_id))
+   return afu_dev;
+   }
+   return NULL;
+}
+
+static const char * const valid_args[] = {
+#define IFPGA_ARG_BDF  "bdf"
+   IFPGA_ARG_BDF,
+#define IFPGA_ARG_PORT "port"
+   IFPGA_ARG_PORT,
+#define IFPGA_AFU_BTS  "afu_bts"
+   IFPGA_AFU_BTS,
+   NULL
+};
+
+/*
+ * Scan the content of the FPGA bus, and the devices in the devices
+ * list
+ */
+static struct rte_afu_device *
+rte_ifpga_scan_one(struct rte_devargs *devargs,
+   struct rte_ifpga_device *ifpga_dev)
+{
+   struct rte_kvargs *kvlist = NULL;
+   struct rte_rawdev *rawdev = NULL;
+   struct rte_afu_device *afu_dev = NULL;
+   struct rte_afu_pr_conf afu_pr_conf;
+   int ret = 0;
+   char *path = NU

Re: [dpdk-dev] Build is broken in dpdk-next-net

2018-03-31 Thread Gaëtan Rivet
On Sat, Mar 31, 2018 at 11:27:55AM -0400, Neil Horman wrote:
> On Sat, Mar 31, 2018 at 05:09:47PM +0200, Gaëtan Rivet wrote:
> > On Sat, Mar 31, 2018 at 09:33:43AM -0400, Neil Horman wrote:
> > > On Fri, Mar 30, 2018 at 10:47:09PM +0800, Tonghao Zhang wrote:
> > > > I rebuild it on ubuntu 17.10 and cash it. I use the 'RTE_SET_USED' to 
> > > > fix it.
> > > > 
> > > > 
> > > > diff --git a/lib/librte_vhost/fd_man.c b/lib/librte_vhost/fd_man.c
> > > > index 771675718..f11803191 100644
> > > > --- a/lib/librte_vhost/fd_man.c
> > > > +++ b/lib/librte_vhost/fd_man.c
> > > > @@ -279,7 +279,8 @@ fdset_pipe_read_cb(int readfd, void *dat 
> > > > __rte_unused,
> > > >int *remove __rte_unused)
> > > >  {
> > > > char charbuf[16];
> > > > -   read(readfd, charbuf, sizeof(charbuf));
> > > > +   int r = read(readfd, charbuf, sizeof(charbuf));
> > > > +   RTE_SET_USED(r);
> > > >  }
> > > > 
> > > >  void
> > > > @@ -319,5 +320,6 @@ fdset_pipe_init(struct fdset *fdset)
> > > >  void
> > > >  fdset_pipe_notify(struct fdset *fdset)
> > > >  {
> > > > -   write(fdset->u.writefd, "1", 1);
> > > > +   int r = write(fdset->u.writefd, "1", 1);
> > > > +   RTE_SET_USED(r);
> > > >  }
> > > > 
> > > 
> > > A better option might be to use _Pragma
> > > 
> > > Something like this perhaps
> > > 
> > > #define ALLOW_UNUSED(x) \
> > > _Pragma(push) \
> > > _Pragma(diagnostic ignored "-Wunused-result") \
> > > #x;\
> > > _Pragma(pop)
> > > 
> > > This is of course untested, so it probably needs some tweaking, but this 
> > > method
> > > avoids the need to declare an additional stack variable, which i don't 
> > > think can
> > > be eliminated due to the cast.  I believe that this method should also 
> > > work
> > > accross compilers (the gcc and clang compilers support this, and i think 
> > > the
> > > intel compiler should as well)
> > > 
> > > Neil
> > > 
> > 
> > It would be nice to avoid the definition of a useless variable.
> > An alternative could be
> > 
> >if (read() < 0) {
> >/* Failure here is acceptable for such and such reason. */
> >}
> > 
> > to ensure all-around compatibility, and the definition or another macro.
> > Just a suggestion.
> > 
> That would be a good alternative, but I think its effectiveness is dependent 
> on
> when the compiler does with the return value check. Without any code inside 
> the
> conditional, the compiler may optimize the check out, meaning the warning will
> still be asserted.  If it doesn't optimize the check out, then you have a
> useless compare and jump instruction left in the code path.
> 
> Best
> Neil
> 

I tested quickly, I see no difference with the three methods:

#include 

__attribute__((warn_unused_result))
int wur(void)
{
return read(0, NULL, 0);
}

void with_void(void)
{
int ret;

ret = wur();
(void) ret;
}

void with_pragma(void)
{
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wunused-result"
wur();
#pragma GCC diagnostic pop
}

void with_if(void)
{
if (wur() < 0) {
/* I do not care for errors. */
}
}

int main(void)
{
return 0;
}



gcc -D_FORTIFY_SOURCE=2 -Wunused-result -Werror -O3 _wur.c -o wur_O3.out
gcc -D_FORTIFY_SOURCE=2 -Wunused-result -Werror -O0 _wur.c -o wur_O0.out
diff -Napy <(gdb -batch -ex 'file ./wur_O0.out' -ex 'disassemble with_void') 
<(gdb -batch -ex 'file ./wur_O3.out' -ex 'disassemble with_void') || true
Dump of assembler code for function with_void:  Dump of 
assembler code for function with_void:
   0x06ca <+0>: push   %rbp   |
0x06e0 <+0>: xor%edx,%edx
   0x06cb <+1>: mov%rsp,%rbp  |
0x06e2 <+2>: xor%esi,%esi
   0x06ce <+4>: sub$0x10,%rsp |
0x06e4 <+4>: xor%edi,%edi
   0x06d2 <+8>: callq  0x6b0 |
0x06e6 <+6>: jmpq   0x560 
   0x06d7 <+13>:mov%eax,-0x4(%rbp)<
   0x06da <+16>:nop   <
   0x06db <+17>:leaveq<
   0x06dc <+18>:retq  <
End of assembler dump.  End of 
assembler dump.
diff -Napy <(gdb -batch -ex 'file ./wur_O0.out' -ex 'disassemble with_pragma') 
<(gdb -batch -ex 'file ./wur_O3.out' -ex 'disassemble with_pragma') || true
Dump of assembler code for function with_pragma:Dump of 
assembler code for function with_pragma:
   0x06dd <+0>: push   %rbp   |
0x06f0 <+0>: xor%edx,%edx
   0x06de <+1>: mov%rsp,%rbp  |
0x06f2 <+2>: xor%esi,%esi
   0x06e1 <+4>: callq  0x6b0 |
0x06f4 <

Re: [dpdk-dev] [PATCH v3 1/6] Add Intel FPGA BUS Command Parse Code

2018-03-31 Thread Xu, Rosen


> -Original Message-
> From: Gaëtan Rivet [mailto:gaetan.ri...@6wind.com]
> Sent: Wednesday, March 28, 2018 21:26
> To: Xu, Rosen 
> Cc: dev@dpdk.org; Doherty, Declan ;
> Richardson, Bruce ; shreyansh.j...@nxp.com;
> Zhang, Tianfei ; Wu, Hao 
> Subject: Re: [PATCH v3 1/6] Add Intel FPGA BUS Command Parse Code
> 
> On Wed, Mar 28, 2018 at 05:29:51PM +0800, Rosen Xu wrote:
> > Signed-off-by: Rosen Xu 
> > ---
> >  lib/librte_eal/common/eal_common_options.c | 8 +++-
> >  lib/librte_eal/common/eal_options.h| 2 ++
> >  2 files changed, 9 insertions(+), 1 deletion(-)
> >
> > diff --git a/lib/librte_eal/common/eal_common_options.c
> > b/lib/librte_eal/common/eal_common_options.c
> > index 9f2f8d2..4fe0875 100644
> > --- a/lib/librte_eal/common/eal_common_options.c
> > +++ b/lib/librte_eal/common/eal_common_options.c
> > @@ -73,6 +73,7 @@
> > {OPT_VDEV,  1, NULL, OPT_VDEV_NUM },
> > {OPT_VFIO_INTR, 1, NULL, OPT_VFIO_INTR_NUM},
> > {OPT_VMWARE_TSC_MAP,0, NULL,
> OPT_VMWARE_TSC_MAP_NUM   },
> > +   {OPT_IFPGA, 1, NULL, OPT_IFPGA_NUM},
> > {0, 0, NULL, 0}
> >  };
> >
> > @@ -1160,7 +1161,12 @@ static int xdigit2val(unsigned char c)
> >
> > core_parsed = LCORE_OPT_MAP;
> > break;
> > -
> > +   case OPT_IFPGA_NUM:
> > +   if (eal_option_device_add(RTE_DEVTYPE_VIRTUAL,
> > +   optarg) < 0) {
> > +   return -1;
> > +   }
> > +   break;
> 
> why do you need to add a new option if you only insert a virtual devargs?
> 
> Why wouldn't --vdev option work instead? and for that matter, I was
> expecting you to provide a PCI address. Can you give a command line
> showing how you create your device? The devtype is essentially ignored
> currently (at option stage, maybe there are still cruft left in PCI bus), 
> instead
> the devargs parsing will detect the bus from the given optarg.
> 
> This part of EAL will change rather soon, I'd prefer not to deal with 
> additional
> options unless necessary.

For PATCH v4, I have removed all the modification from eal library. 
Create vdev to take IFPGA parameters configuration.

The command line for PATCH v4 is(just take 2 AFU for example):
testpmd -c 0x3 -n 4 --socket-mem 1024,0 --huge-dir=/mnt/huge \
--vdev 'net_ifpga_cfg0,bdf=5e:00.0,port=0,afu_bts=./xxx.gbs'  \
--vdev 'net_ifpga_cfg1,bdf=be:00.0,port=0,afu_bts=./xxx.gbs'  -- -i --no-numa
Note: the parameter of "port" is used by OPAE for download bitstream.

> > /* don't know what to do, leave this to caller */
> > default:
> > return 1;
> > diff --git a/lib/librte_eal/common/eal_options.h
> > b/lib/librte_eal/common/eal_options.h
> > index e86c711..bdbb2c4 100644
> > --- a/lib/librte_eal/common/eal_options.h
> > +++ b/lib/librte_eal/common/eal_options.h
> > @@ -55,6 +55,8 @@ enum {
> > OPT_VFIO_INTR_NUM,
> >  #define OPT_VMWARE_TSC_MAP"vmware-tsc-map"
> > OPT_VMWARE_TSC_MAP_NUM,
> > +#define OPT_IFPGA  "ifpga"
> > +   OPT_IFPGA_NUM,
> > OPT_LONG_MAX_NUM
> >  };
> >
> > --
> > 1.8.3.1
> >
> 
> --
> Gaëtan Rivet
> 6WIND


Re: [dpdk-dev] [PATCH v3 2/6] config/common_base: Add Intel FPGA Build Configuration Macro

2018-03-31 Thread Xu, Rosen


> -Original Message-
> From: Gaëtan Rivet [mailto:gaetan.ri...@6wind.com]
> Sent: Wednesday, March 28, 2018 21:27
> To: Xu, Rosen 
> Cc: dev@dpdk.org; Doherty, Declan ;
> Richardson, Bruce ; shreyansh.j...@nxp.com;
> Zhang, Tianfei ; Wu, Hao 
> Subject: Re: [PATCH v3 2/6] config/common_base: Add Intel FPGA Build
> Configuration Macro
> 
> On Wed, Mar 28, 2018 at 05:29:52PM +0800, Rosen Xu wrote:
> > Signed-off-by: Rosen Xu 
> > ---
> >  config/common_base | 6 ++
> >  1 file changed, 6 insertions(+)
> >
> > diff --git a/config/common_base b/config/common_base index
> > ad03cf4..08b7cce 100644
> > --- a/config/common_base
> > +++ b/config/common_base
> > @@ -134,6 +134,12 @@ CONFIG_RTE_LIBRTE_PCI_BUS=y
> > CONFIG_RTE_LIBRTE_VDEV_BUS=y
> >
> >  #
> > +# Compile the Intel FPGA bus
> > +#
> > +CONFIG_RTE_LIBRTE_IFPGA_BUS=y
> > +CONFIG_RTE_LIBRTE_IFPGA_RAWDEV=y
> > +
> > +#
> 
> Please squash this patch with their relevant counterparts.
> As it is, this won't trigger an error but the patch is meaningless.

It's done by PATCH v4.

> >  # Compile ARK PMD
> >  #
> >  CONFIG_RTE_LIBRTE_ARK_PMD=y
> > --
> > 1.8.3.1
> >
> 
> --
> Gaëtan Rivet
> 6WIND


Re: [dpdk-dev] [PATCH v3 3/6] mk/rte.app.mk: Add Intel FPGA Bus Build Configuration Macro To App Script

2018-03-31 Thread Xu, Rosen


> -Original Message-
> From: Gaëtan Rivet [mailto:gaetan.ri...@6wind.com]
> Sent: Wednesday, March 28, 2018 21:29
> To: Xu, Rosen 
> Cc: dev@dpdk.org; Doherty, Declan ;
> Richardson, Bruce ; shreyansh.j...@nxp.com;
> Zhang, Tianfei ; Wu, Hao 
> Subject: Re: [PATCH v3 3/6] mk/rte.app.mk: Add Intel FPGA Bus Build
> Configuration Macro To App Script
> 
> On Wed, Mar 28, 2018 at 05:29:53PM +0800, Rosen Xu wrote:
> > Signed-off-by: Rosen Xu 
> > ---
> >  mk/rte.app.mk | 3 +++
> >  1 file changed, 3 insertions(+)
> >
> > diff --git a/mk/rte.app.mk b/mk/rte.app.mk index 3eb41d1..958b6b5
> > 100644
> > --- a/mk/rte.app.mk
> > +++ b/mk/rte.app.mk
> > @@ -107,6 +107,9 @@ _LDLIBS-$(CONFIG_RTE_LIBRTE_CMDLINE)+= -
> lrte_cmdline
> >  _LDLIBS-$(CONFIG_RTE_LIBRTE_REORDER)+= -lrte_reorder
> >  _LDLIBS-$(CONFIG_RTE_LIBRTE_SCHED)  += -lrte_sched
> >
> > +_LDLIBS-$(CONFIG_RTE_LIBRTE_IFPGA_BUS)  += -lrte_bus_ifpga
> > +_LDLIBS-$(CONFIG_RTE_LIBRTE_IFPGA_RAWDEV)   += -
> lrte_ifpga_rawdev
> > +
> 
> This however, should trigger a link error given that the relevant libraries 
> are
> not yet available. Same as before, please squash with the patch introducing
> the libraries.

It's done by PATCH v4.

> >  ifeq ($(CONFIG_RTE_EXEC_ENV_LINUXAPP),y)
> >  _LDLIBS-$(CONFIG_RTE_LIBRTE_KNI)+= -lrte_kni
> >  endif
> > --
> > 1.8.3.1
> >
> 
> --
> Gaëtan Rivet
> 6WIND


Re: [dpdk-dev] [PATCH v3 4/6] drivers/bus: Add Intel FPGA Bus Lib Code

2018-03-31 Thread Xu, Rosen


> -Original Message-
> From: Gaëtan Rivet [mailto:gaetan.ri...@6wind.com]
> Sent: Wednesday, March 28, 2018 21:52
> To: Xu, Rosen 
> Cc: dev@dpdk.org; Doherty, Declan ;
> Richardson, Bruce ; shreyansh.j...@nxp.com;
> Zhang, Tianfei ; Wu, Hao 
> Subject: Re: [PATCH v3 4/6] drivers/bus: Add Intel FPGA Bus Lib Code
> 
> On Wed, Mar 28, 2018 at 05:29:54PM +0800, Rosen Xu wrote:
> > Signed-off-by: Rosen Xu 
> > ---
> >  drivers/bus/Makefile|   1 +
> >  drivers/bus/ifpga/Makefile  |  33 ++
> >  drivers/bus/ifpga/ifpga_bus.c   | 562
> 
> >  drivers/bus/ifpga/ifpga_common.c| 141 +++
> >  drivers/bus/ifpga/ifpga_common.h|  22 ++
> >  drivers/bus/ifpga/ifpga_logs.h  |  31 ++
> >  drivers/bus/ifpga/rte_bus_ifpga.h   | 140 +++
> >  drivers/bus/ifpga/rte_bus_ifpga_version.map |   8 +
> >  8 files changed, 938 insertions(+)
> >  create mode 100644 drivers/bus/ifpga/Makefile  create mode 100644
> > drivers/bus/ifpga/ifpga_bus.c  create mode 100644
> > drivers/bus/ifpga/ifpga_common.c  create mode 100644
> > drivers/bus/ifpga/ifpga_common.h  create mode 100644
> > drivers/bus/ifpga/ifpga_logs.h  create mode 100644
> > drivers/bus/ifpga/rte_bus_ifpga.h  create mode 100644
> > drivers/bus/ifpga/rte_bus_ifpga_version.map
> >
> > diff --git a/drivers/bus/Makefile b/drivers/bus/Makefile index
> > 7ef2593..55d2dfe 100644
> > --- a/drivers/bus/Makefile
> > +++ b/drivers/bus/Makefile
> > @@ -7,5 +7,6 @@ DIRS-$(CONFIG_RTE_LIBRTE_DPAA_BUS) += dpaa
> >  DIRS-$(CONFIG_RTE_LIBRTE_FSLMC_BUS) += fslmc
> >  DIRS-$(CONFIG_RTE_LIBRTE_PCI_BUS) += pci
> >  DIRS-$(CONFIG_RTE_LIBRTE_VDEV_BUS) += vdev
> > +DIRS-$(CONFIG_RTE_LIBRTE_IFPGA_BUS) += ifpga
> >
> >  include $(RTE_SDK)/mk/rte.subdir.mk
> > diff --git a/drivers/bus/ifpga/Makefile b/drivers/bus/ifpga/Makefile
> > new file mode 100644 index 000..e611950
> > --- /dev/null
> > +++ b/drivers/bus/ifpga/Makefile
> > @@ -0,0 +1,33 @@
> > +# SPDX-License-Identifier: BSD-3-Clause # Copyright(c) 2017 Intel
> > +Corporation
> 
> Copyrigth 2018 (same comment for most SPDX tags, I think I saw 2017 or a
> variation of it everywhere I think).

It's done by PATCH v4.

> > +
> > +include $(RTE_SDK)/mk/rte.vars.mk
> > +
> > +#
> > +# library name
> > +#
> > +LIB = librte_bus_ifpga.a
> > +
> > +CFLAGS += -O3
> > +CFLAGS += $(WERROR_FLAGS)
> > +
> > +# versioning export map
> > +EXPORT_MAP := rte_bus_ifpga_version.map
> > +
> > +# library version
> > +LIBABIVER := 1
> > +
> > +VPATH += $(SRCDIR)/base
> > +
> > +SRCS-y += \
> > +ifpga_bus.c \
> > +ifpga_common.c
> > +
> > +LDLIBS += -lrte_eal
> 
> you should probably load librte_pci.
> You use afterward functions (at least address comparison).
> I haven't tested the SHARED build, but my guess is that it would break.

The FPGA BUS is based PCI(IFPGA is probed by PCI), do you think so users
to add it?

> On that note, you haven't acted on my previous remarks to use the common
> PCI utilities provided.

It's done in PATCH v4.

> > +
> > +#
> > +# Export include files
> > +#
> > +SYMLINK-y-include += rte_bus_ifpga.h
> > +
> > +include $(RTE_SDK)/mk/rte.lib.mk
> > diff --git a/drivers/bus/ifpga/ifpga_bus.c
> > b/drivers/bus/ifpga/ifpga_bus.c new file mode 100644 index
> > 000..092be65
> > --- /dev/null
> > +++ b/drivers/bus/ifpga/ifpga_bus.c
> > @@ -0,0 +1,562 @@
> > +/* SPDX-License-Identifier: BSD-3-Clause
> > + * Copyright(c) 2010-2017 Intel Corporation  */
> > +
> > +#include 
> > +#include 
> > +#include 
> > +#include 
> > +#include 
> > +#include 
> > +#include 
> > +#include 
> > +#include 
> > +#include 
> > +
> > +#include 
> > +#include 
> > +#include 
> > +#include 
> > +#include 
> > +#include 
> > +#include 
> > +
> > +#include 
> > +#include 
> > +#include 
> > +#include 
> > +#include 
> > +
> > +#include "rte_rawdev.h"
> > +#include "rte_rawdev_pmd.h"
> > +#include "rte_bus_ifpga.h"
> > +#include "ifpga_logs.h"
> > +#include "ifpga_common.h"
> > +
> > +int ifpga_bus_logtype;
> > +
> > +/* register a ifpga bus based driver */ void
> > +rte_ifpga_driver_register(struct rte_afu_driver *driver) {
> > +   RTE_VERIFY(driver);
> > +
> > +   TAILQ_INSERT_TAIL(&rte_ifpga_bus.driver_list, driver, next); }
> > +
> > +/* un-register a fpga bus based driver */ void
> > +rte_ifpga_driver_unregister(struct rte_afu_driver *driver) {
> > +   TAILQ_REMOVE(&rte_ifpga_bus.driver_list, driver, next); }
> > +
> > +static struct rte_ifpga_device *
> > +ifpga_find_ifpga_dev(const struct rte_pci_addr *pci_addr) {
> > +   struct rte_ifpga_device *ifpga_dev = NULL;
> > +
> > +   TAILQ_FOREACH(ifpga_dev, &rte_ifpga_bus.ifpga_list, next) {
> > +   if (!rte_pci_addr_cmp(&ifpga_dev->pci_addr, pci_addr))
> > +   return ifpga_dev;
> > +   }
> > +   return NULL;
> > +}
> > +
> > +static struct rte_afu_device *
> > +ifpga_find_afu_dev(const struct rte_ifpga_device *ifpga_dev,
> > +   const stru

Re: [dpdk-dev] [PATCH] net/nfp: support new HW offloads API

2018-03-31 Thread Alejandro Lucero
On Tue, Mar 27, 2018 at 7:25 PM, Ferruh Yigit 
wrote:

> On 3/15/2018 2:30 PM, Alejandro Lucero wrote:
> > In next 18.05 the old hw offload API will be removed. This patch adds
> > support for just the new hw offload API.
> >
> > Signed-off-by: Alejandro Lucero 
>
> <...>
>
> > - if (rxmode->enable_scatter) {
> > + if (!(rxmode->offloads & DEV_RX_OFFLOAD_CRC_STRIP))
> > + PMD_INIT_LOG(INFO, "HW does strip CRC. No configurable!");
>
> Also this behavior is changing, not providing CRC_STRIP will be by default
> stripping [2], this check should be removed.
>
> [2]
> https://dpdk.org/ml/archives/dev/2018-March/093489.
> htmlhttps://dpdk.org/ml/archives/dev/2018-March/093489.html
>
> <...>
>
> > + dev_conf = &dev->data->dev_conf;
> > + rxmode = &dev_conf->rxmode;
> > +
> > + if (rx_conf->offloads != rxmode->offloads) {
> > + RTE_LOG(ERR, PMD, "queue %u rx offloads not as port
> offloads\n",
> > +   queue_idx);
> > + RTE_LOG(ERR, PMD, "\tport: %" PRIx64 "\n",
> rxmode->offloads);
> > + RTE_LOG(ERR, PMD, "\tqueue: %" PRIx64 "\n",
> rx_conf->offloads);
> > + return -EINVAL;
> > + }
>
> The offload API is changing [1], this check is no more valid. If PMD is not
> supporting queue specific offload app will not send port offloads here.
>
> [1]
> https://dpdk.org/ml/archives/dev/2018-March/092978.html
>
> <...>
>
> > + dev_conf = &dev->data->dev_conf;
> > + txmode = &dev_conf->txmode;
> > +
> > + if (tx_conf->offloads != txmode->offloads) {
> > + RTE_LOG(ERR, PMD, "queue %u tx offloads not as port
> offloads",
> > +   queue_idx);
> > + return -EINVAL;
> > + }
> > +
>
> Same as above.
>

Thank you for the review.

I will remove those checks and send a new path version.


Re: [dpdk-dev] [PATCH 1/4] net/nfp: add NFP CPP support

2018-03-31 Thread Alejandro Lucero
On Fri, Mar 30, 2018 at 11:37 AM, Ferruh Yigit 
wrote:

> On 3/23/2018 5:35 PM, Alejandro Lucero wrote:
> > CPP refers to the internal NFP Command Push Pull bus. This patch allows
> > to create CPP commands from user space allowing to access any single
> > part of the chip.
> >
> > This CPP interface is the base for having other functionalities like
> > mutexes when accessing specific chip components, chip resources
> management,
> > firmware upload or using the NSP, an embedded arm processor which can
> > perform tasks on demand.
> >
> > NSP was the previous only way for doing things in the chip by the PMD,
> > where a NSPU interface was used for commands like firmware upload or
> > port link configuration. CPP interface supersedes NSPU, but it is still
> > possible to use NSP through CPP.
> >
> > CPP interface adds a great flexibility for doing things like extended
> > stats, firmware debugging or selecting properly the firmware file to
> > upload.
>
> It can be good to announce this new feature in release notes, what do you
> think?
>
>
Uhmm, not sure about this. It is specific to the NFP PMD and I do not see
it as a new feature, at least DPDK users will not be aware of it.



> Also get some build errors [1], one is about zlib.h, normally we disable
> PMDs by
> default with external dependencies, is nfp depends to libz with this patch?
>
>
I forgot to remove this reference. It is not needed now, but it was with
the initial internal work.

About the other build errors, I do not get them and I have used a couple of
different systems, Ubuntu and Redhat. This is, of course, a serious
concern. Can you give me more information about the system you are using?

I remember I got some build error with other patches, from automatic builds
made just after those patches were sent. I did not get any this time, just
those warning for checkpatch which I was aware of. Is this automatic build
not happening any more?



> [1]
> ...dpdk/drivers/net/nfp/nfpcore/nfp_mutex.c:295:28: error: format
> specifies type
> 'short' but the argument has type 'unsigned int' [-Werror,-Wformat]
> printf("\tusage:%hd\n", mutex->usage);
>
> ~~~ ^~~~
>
>
> %u
>
> ...dpdk/drivers/net/nfp/nfpcore/nfp_cppcore.c:819:1: error: unused
> function
> '__nfp_bytemask_of' [-Werror,-Wunused-function]
> __nfp_bytemask_of(int width, uint64_t addr)
>
>
> ^
>
> ...dpdk/drivers/net/nfp/nfp_net.c:2971:35: error: format specifies type
> 'unsigned char' but the argument has type 'uint32_t' (aka 'unsigned int')
> [-Werror,-Wformat]
> cpp->serial[4], cpp->serial[5], cpp->interface >> 8,
>
>
> ^~~
> ...dpdk/drivers/net/nfp/nfp_net.c:2972:3: error: format specifies type
> 'unsigned
> char' but the argument has type 'unsigned int' [-Werror,-Wformat]
> cpp->interface & 0xff);
> ^
>
> ...dpdk/drivers/net/nfp/nfpcore/nfp_cppcore.c: In function
> ‘nfp_cpp_area_readl’:
> ...dpdk/drivers/net/nfp/nfpcore/nfp_cppcore.c:459:9: error: ‘tmp’ may be
> used
> uninitialized in this function [-Werror=maybe-uninitialized]
>   *value = rte_le_to_cpu_32(tmp);
>
> ...dpdk/drivers/net/nfp/nfpcore/nfp_cppcore.c: In function
> ‘nfp_cpp_area_readq’:
> ...dpdk/drivers/net/nfp/nfpcore/nfp_cppcore.c:483:9: error: ‘tmp’ may be
> used
> uninitialized in this function [-Werror=maybe-uninitialized]
>   *value = rte_le_to_cpu_64(tmp);
>
> ...dpdk/drivers/net/nfp/nfpcore/nfp_resource.c:34:10: fatal error:
> zlib.h: No
> such file or directory
>  #include 
>   ^~~~
>
> >
> > Signed-off-by: Alejandro Lucero 
>
> <...>
>
> > diff --git a/drivers/net/nfp/nfpcore/nfp-common/nfp_cppat.h
> b/drivers/net/nfp/nfpcore/nfp-common/nfp_cppat.h
> > new file mode 100644
> > index 000..fbeec57
> > --- /dev/null
> > +++ b/drivers/net/nfp/nfpcore/nfp-common/nfp_cppat.h
> > @@ -0,0 +1,748 @@
> > +/*
> > + * Copyright (c) 2018 Netronome Systems, Inc.
> > + * All rights reserved.
> > + *
> > + * Redistribution and use in source and binary forms, with or without
> > + * modification, are permitted provided that the following conditions
> are met:
> > + *
> > + * 1. Redistributions of source code must retain the above copyright
> notice,
> > + *  this list of conditions and the following disclaimer.
> > + *
> > + * 2. Redistributions in binary form must reproduce the above copyright
> > + *  notice, this list of conditions and the following disclaimer in the
> > + *  documentation and/or other materials provided with the distribution
> > + *
> > + * 3. Neither the name of the copyright holder nor the names of its
> > + *  contributors may be used to endorse or promote products derived
> from this
> > + *  software without specific prior written permission.
> > + *
> > + * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
> "AS IS"
> > + * AND

Re: [dpdk-dev] [PATCH 3/4] doc: update NFP guide

2018-03-31 Thread Alejandro Lucero
On Fri, Mar 30, 2018 at 11:37 AM, Ferruh Yigit 
wrote:

> On 3/23/2018 5:35 PM, Alejandro Lucero wrote:
> > New CPP interface changes the way firmware upload is managed by
> > the PMD. It also supports different firmware file names for
> > having specific firmware aplications per card.
> >
> > Signed-off-by: Alejandro Lucero 
>
> This conflicts with another nfp doc patch applied in next-net, can you
> please
> rebase this on latest next-net?
>

Yes, sure.

Thanks


[dpdk-dev] [PATCH v7 1/3] eal: rename IPC sync request to pending request

2018-03-31 Thread Anatoly Burakov
Originally, there was only one type of request which was used
for multiprocess synchronization (hence the name - sync request).

However, now that we are going to have two types of requests,
synchronous and asynchronous, having it named "sync request" is
very confusing, so we will rename it to "pending request". This
is internal-only, so no externally visible API changes.

Signed-off-by: Anatoly Burakov 
Suggested-by: Jianfeng Tan 
Acked-by: Jianfeng Tan 
---

Notes:
v7:
- Provide explanation as to why this change is being made

 lib/librte_eal/common/eal_common_proc.c | 38 -
 1 file changed, 19 insertions(+), 19 deletions(-)

diff --git a/lib/librte_eal/common/eal_common_proc.c 
b/lib/librte_eal/common/eal_common_proc.c
index 4131b67..52b6ab2 100644
--- a/lib/librte_eal/common/eal_common_proc.c
+++ b/lib/librte_eal/common/eal_common_proc.c
@@ -60,8 +60,8 @@ struct mp_msg_internal {
struct rte_mp_msg msg;
 };
 
-struct sync_request {
-   TAILQ_ENTRY(sync_request) next;
+struct pending_request {
+   TAILQ_ENTRY(pending_request) next;
int reply_received;
char dst[PATH_MAX];
struct rte_mp_msg *request;
@@ -69,13 +69,13 @@ struct sync_request {
pthread_cond_t cond;
 };
 
-TAILQ_HEAD(sync_request_list, sync_request);
+TAILQ_HEAD(pending_request_list, pending_request);
 
 static struct {
-   struct sync_request_list requests;
+   struct pending_request_list requests;
pthread_mutex_t lock;
-} sync_requests = {
-   .requests = TAILQ_HEAD_INITIALIZER(sync_requests.requests),
+} pending_requests = {
+   .requests = TAILQ_HEAD_INITIALIZER(pending_requests.requests),
.lock = PTHREAD_MUTEX_INITIALIZER
 };
 
@@ -84,12 +84,12 @@ static int
 mp_send(struct rte_mp_msg *msg, const char *peer, int type);
 
 
-static struct sync_request *
+static struct pending_request *
 find_sync_request(const char *dst, const char *act_name)
 {
-   struct sync_request *r;
+   struct pending_request *r;
 
-   TAILQ_FOREACH(r, &sync_requests.requests, next) {
+   TAILQ_FOREACH(r, &pending_requests.requests, next) {
if (!strcmp(r->dst, dst) &&
!strcmp(r->request->name, act_name))
break;
@@ -259,7 +259,7 @@ read_msg(struct mp_msg_internal *m, struct sockaddr_un *s)
 static void
 process_msg(struct mp_msg_internal *m, struct sockaddr_un *s)
 {
-   struct sync_request *sync_req;
+   struct pending_request *sync_req;
struct action_entry *entry;
struct rte_mp_msg *msg = &m->msg;
rte_mp_t action = NULL;
@@ -267,7 +267,7 @@ process_msg(struct mp_msg_internal *m, struct sockaddr_un 
*s)
RTE_LOG(DEBUG, EAL, "msg: %s\n", msg->name);
 
if (m->type == MP_REP || m->type == MP_IGN) {
-   pthread_mutex_lock(&sync_requests.lock);
+   pthread_mutex_lock(&pending_requests.lock);
sync_req = find_sync_request(s->sun_path, msg->name);
if (sync_req) {
memcpy(sync_req->reply, msg, sizeof(*msg));
@@ -276,7 +276,7 @@ process_msg(struct mp_msg_internal *m, struct sockaddr_un 
*s)
pthread_cond_signal(&sync_req->cond);
} else
RTE_LOG(ERR, EAL, "Drop mp reply: %s\n", msg->name);
-   pthread_mutex_unlock(&sync_requests.lock);
+   pthread_mutex_unlock(&pending_requests.lock);
return;
}
 
@@ -607,7 +607,7 @@ mp_request_one(const char *dst, struct rte_mp_msg *req,
 {
int ret;
struct rte_mp_msg msg, *tmp;
-   struct sync_request sync_req, *exist;
+   struct pending_request sync_req, *exist;
 
sync_req.reply_received = 0;
strcpy(sync_req.dst, dst);
@@ -615,14 +615,14 @@ mp_request_one(const char *dst, struct rte_mp_msg *req,
sync_req.reply = &msg;
pthread_cond_init(&sync_req.cond, NULL);
 
-   pthread_mutex_lock(&sync_requests.lock);
+   pthread_mutex_lock(&pending_requests.lock);
exist = find_sync_request(dst, req->name);
if (!exist)
-   TAILQ_INSERT_TAIL(&sync_requests.requests, &sync_req, next);
+   TAILQ_INSERT_TAIL(&pending_requests.requests, &sync_req, next);
if (exist) {
RTE_LOG(ERR, EAL, "A pending request %s:%s\n", dst, req->name);
rte_errno = EEXIST;
-   pthread_mutex_unlock(&sync_requests.lock);
+   pthread_mutex_unlock(&pending_requests.lock);
return -1;
}
 
@@ -638,12 +638,12 @@ mp_request_one(const char *dst, struct rte_mp_msg *req,
 
do {
ret = pthread_cond_timedwait(&sync_req.cond,
-   &sync_requests.lock, ts);
+   &pending_requests.lock, ts);
} while (ret != 0 && ret != ETIMEDOUT);
 
/* We got the lock now */
-   TAILQ_REMOVE(&sync_requests.reque

[dpdk-dev] [PATCH v7 2/3] eal: rename mp_request to mp_request_sync

2018-03-31 Thread Anatoly Burakov
Rename rte_mp_request to rte_mp_request_sync to indicate
that this request will be done synchronously (as opposed to
asynchronous request, which comes in next patch).

Also, fix alphabetical ordering for .map file.

Signed-off-by: Anatoly Burakov 
Suggested-by: Thomas Monjalon 
---

Notes:
v7:
- Added this patch

 lib/librte_eal/common/eal_common_proc.c | 2 +-
 lib/librte_eal/common/include/rte_eal.h | 2 +-
 lib/librte_eal/rte_eal_version.map  | 4 ++--
 3 files changed, 4 insertions(+), 4 deletions(-)

diff --git a/lib/librte_eal/common/eal_common_proc.c 
b/lib/librte_eal/common/eal_common_proc.c
index 52b6ab2..b704f5a 100644
--- a/lib/librte_eal/common/eal_common_proc.c
+++ b/lib/librte_eal/common/eal_common_proc.c
@@ -674,7 +674,7 @@ mp_request_one(const char *dst, struct rte_mp_msg *req,
 }
 
 int __rte_experimental
-rte_mp_request(struct rte_mp_msg *req, struct rte_mp_reply *reply,
+rte_mp_request_sync(struct rte_mp_msg *req, struct rte_mp_reply *reply,
const struct timespec *ts)
 {
int dir_fd, ret = 0;
diff --git a/lib/librte_eal/common/include/rte_eal.h 
b/lib/librte_eal/common/include/rte_eal.h
index 044474e..d1cc89e 100644
--- a/lib/librte_eal/common/include/rte_eal.h
+++ b/lib/librte_eal/common/include/rte_eal.h
@@ -314,7 +314,7 @@ rte_mp_sendmsg(struct rte_mp_msg *msg);
  *  - On failure, return -1, and the reason will be stored in rte_errno.
  */
 int __rte_experimental
-rte_mp_request(struct rte_mp_msg *req, struct rte_mp_reply *reply,
+rte_mp_request_sync(struct rte_mp_msg *req, struct rte_mp_reply *reply,
   const struct timespec *ts);
 
 /**
diff --git a/lib/librte_eal/rte_eal_version.map 
b/lib/librte_eal/rte_eal_version.map
index d123602..7b66c73 100644
--- a/lib/librte_eal/rte_eal_version.map
+++ b/lib/librte_eal/rte_eal_version.map
@@ -223,9 +223,9 @@ EXPERIMENTAL {
rte_eal_mbuf_user_pool_ops;
rte_mp_action_register;
rte_mp_action_unregister;
-   rte_mp_sendmsg;
-   rte_mp_request;
rte_mp_reply;
+   rte_mp_request_sync;
+   rte_mp_sendmsg;
rte_service_attr_get;
rte_service_attr_reset_all;
rte_service_component_register;
-- 
2.7.4


[dpdk-dev] [PATCH v7 3/3] eal: add asynchronous request API to DPDK IPC

2018-03-31 Thread Anatoly Burakov
This API is similar to the blocking API that is already present,
but reply will be received in a separate callback by the caller
(callback specified at the time of request, rather than registering
for it in advance).

Under the hood, we create a separate thread to deal with replies to
asynchronous requests, that will just wait to be notified by the
main thread, or woken up on a timer.

Signed-off-by: Anatoly Burakov 
Acked-by: Jianfeng Tan 
---

Notes:
v6:
  - address review comments from Jianfeng
  - do not add dummy item to queue by default

v5:
  - addressed review comments from Jianfeng
  - split into two patches to avoid rename noise
  - do not mark ignored message as processed
v4:
  - rebase on top of latest IPC Improvements patchset [2]

v3:
  - added support for MP_IGN messages introduced in
IPC improvements v5 patchset
v2:
  - fixed deadlocks and race conditions by not calling
callbacks while iterating over sync request list
  - fixed use-after-free by making a copy of request
  - changed API to also give user a copy of original
request, so that they know to which message the
callback is a reply to
  - fixed missing .map file entries

This patch is dependent upon previously published patchsets
for IPC fixes [1] and improvements [2].

rte_mp_action_unregister and rte_mp_async_reply_unregister
do the same thing - should we perhaps make it one function?

[1] http://dpdk.org/dev/patchwork/bundle/aburakov/IPC_Fixes/
[2] http://dpdk.org/dev/patchwork/bundle/aburakov/IPC_Improvements/

 lib/librte_eal/common/eal_common_proc.c | 458 +++-
 lib/librte_eal/common/include/rte_eal.h |  36 +++
 lib/librte_eal/rte_eal_version.map  |   1 +
 3 files changed, 482 insertions(+), 13 deletions(-)

diff --git a/lib/librte_eal/common/eal_common_proc.c 
b/lib/librte_eal/common/eal_common_proc.c
index b704f5a..f98622f 100644
--- a/lib/librte_eal/common/eal_common_proc.c
+++ b/lib/librte_eal/common/eal_common_proc.c
@@ -26,6 +26,7 @@
 #include 
 #include 
 #include 
+#include 
 
 #include "eal_private.h"
 #include "eal_filesystem.h"
@@ -60,13 +61,32 @@ struct mp_msg_internal {
struct rte_mp_msg msg;
 };
 
+struct async_request_param {
+   rte_mp_async_reply_t clb;
+   struct rte_mp_reply user_reply;
+   struct timespec end;
+   int n_responses_processed;
+};
+
 struct pending_request {
TAILQ_ENTRY(pending_request) next;
-   int reply_received;
+   enum {
+   REQUEST_TYPE_SYNC,
+   REQUEST_TYPE_ASYNC
+   } type;
char dst[PATH_MAX];
struct rte_mp_msg *request;
struct rte_mp_msg *reply;
-   pthread_cond_t cond;
+   int reply_received;
+   RTE_STD_C11
+   union {
+   struct {
+   struct async_request_param *param;
+   } async;
+   struct {
+   pthread_cond_t cond;
+   } sync;
+   };
 };
 
 TAILQ_HEAD(pending_request_list, pending_request);
@@ -74,9 +94,12 @@ TAILQ_HEAD(pending_request_list, pending_request);
 static struct {
struct pending_request_list requests;
pthread_mutex_t lock;
+   pthread_cond_t async_cond;
 } pending_requests = {
.requests = TAILQ_HEAD_INITIALIZER(pending_requests.requests),
-   .lock = PTHREAD_MUTEX_INITIALIZER
+   .lock = PTHREAD_MUTEX_INITIALIZER,
+   .async_cond = PTHREAD_COND_INITIALIZER
+   /**< used in async requests only */
 };
 
 /* forward declarations */
@@ -273,7 +296,12 @@ process_msg(struct mp_msg_internal *m, struct sockaddr_un 
*s)
memcpy(sync_req->reply, msg, sizeof(*msg));
/* -1 indicates that we've been asked to ignore */
sync_req->reply_received = m->type == MP_REP ? 1 : -1;
-   pthread_cond_signal(&sync_req->cond);
+
+   if (sync_req->type == REQUEST_TYPE_SYNC)
+   pthread_cond_signal(&sync_req->sync.cond);
+   else if (sync_req->type == REQUEST_TYPE_ASYNC)
+   pthread_cond_signal(
+   &pending_requests.async_cond);
} else
RTE_LOG(ERR, EAL, "Drop mp reply: %s\n", msg->name);
pthread_mutex_unlock(&pending_requests.lock);
@@ -320,6 +348,189 @@ mp_handle(void *arg __rte_unused)
 }
 
 static int
+timespec_cmp(const struct timespec *a, const struct timespec *b)
+{
+   if (a->tv_sec < b->tv_sec)
+   return -1;
+   if (a->tv_sec > b->tv_sec)
+   return 1;
+   if (a->tv_nsec < b->tv_nsec)
+   return -1;
+   if (a->tv_nsec > b->tv_nsec)
+   return 1;
+   return 0;
+}
+
+enum async_action {
+   ACTION_NONE, /**< don't do anything */
+

[dpdk-dev] [PATCH v7] eal: provide API for querying valid socket id's

2018-03-31 Thread Anatoly Burakov
During lcore scan, find all socket ID's and store them, and
provide public API to query valid socket id's. This will break
the ABI, so bump ABI version.

Also, remove deprecation notice corresponding to this change.

Signed-off-by: Anatoly Burakov 
Acked-by: Gowrishankar Muthukrishnan 
---

Notes:
v7:
- Renamed rte_num_socket_ids() to rte_socket_count()
- Removed deprecation notice associated with this change
- Addressed review comments

v6:
- Fixed meson ABI version header

v5:
- Move API to experimental
- Store list of valid socket id's instead of simply
  recording the biggest one

v4:
- Remove backwards ABI compatibility, bump ABI instead

v3:
- Added ABI compatibility

v2:
- checkpatch changes
- check socket before deciding if the core is not to be used

 doc/guides/rel_notes/deprecation.rst  |  3 --
 lib/librte_eal/bsdapp/eal/Makefile|  2 +-
 lib/librte_eal/common/eal_common_lcore.c  | 75 ++-
 lib/librte_eal/common/include/rte_eal.h   |  2 +
 lib/librte_eal/common/include/rte_lcore.h | 30 +
 lib/librte_eal/linuxapp/eal/Makefile  |  2 +-
 lib/librte_eal/meson.build|  2 +-
 lib/librte_eal/rte_eal_version.map|  2 +
 8 files changed, 100 insertions(+), 18 deletions(-)

diff --git a/doc/guides/rel_notes/deprecation.rst 
b/doc/guides/rel_notes/deprecation.rst
index 74c18ed..80472f5 100644
--- a/doc/guides/rel_notes/deprecation.rst
+++ b/doc/guides/rel_notes/deprecation.rst
@@ -38,9 +38,6 @@ Deprecation Notices
   success and failure, respectively.  This will change to 1 and 0 for true and
   false, respectively, to make use of the function more intuitive.
 
-* eal: new ``numa_node_count`` member will be added to ``rte_config`` structure
-  in v18.05.
-
 * eal: due to internal data layout reorganization, there will be changes to
   several structures and functions as a result of coming changes to support
   memory hotplug in v18.05.
diff --git a/lib/librte_eal/bsdapp/eal/Makefile 
b/lib/librte_eal/bsdapp/eal/Makefile
index dd455e6..ed1d17b 100644
--- a/lib/librte_eal/bsdapp/eal/Makefile
+++ b/lib/librte_eal/bsdapp/eal/Makefile
@@ -21,7 +21,7 @@ LDLIBS += -lgcc_s
 
 EXPORT_MAP := ../../rte_eal_version.map
 
-LIBABIVER := 6
+LIBABIVER := 7
 
 # specific to bsdapp exec-env
 SRCS-$(CONFIG_RTE_EXEC_ENV_BSDAPP) := eal.c
diff --git a/lib/librte_eal/common/eal_common_lcore.c 
b/lib/librte_eal/common/eal_common_lcore.c
index 7724fa4..3167e9d 100644
--- a/lib/librte_eal/common/eal_common_lcore.c
+++ b/lib/librte_eal/common/eal_common_lcore.c
@@ -7,6 +7,7 @@
 #include 
 #include 
 
+#include 
 #include 
 #include 
 #include 
@@ -16,6 +17,19 @@
 #include "eal_private.h"
 #include "eal_thread.h"
 
+static int
+socket_id_cmp(const void *a, const void *b)
+{
+   const int *lcore_id_a = a;
+   const int *lcore_id_b = b;
+
+   if (*lcore_id_a < *lcore_id_b)
+   return -1;
+   if (*lcore_id_a > *lcore_id_b)
+   return 1;
+   return 0;
+}
+
 /*
  * Parse /sys/devices/system/cpu to get the number of physical and logical
  * processors on the machine. The function will fill the cpu_info
@@ -28,6 +42,8 @@ rte_eal_cpu_init(void)
struct rte_config *config = rte_eal_get_configuration();
unsigned lcore_id;
unsigned count = 0;
+   unsigned int socket_id, prev_socket_id;
+   int lcore_to_socket_id[RTE_MAX_LCORE];
 
/*
 * Parse the maximum set of logical cores, detect the subset of running
@@ -39,6 +55,19 @@ rte_eal_cpu_init(void)
/* init cpuset for per lcore config */
CPU_ZERO(&lcore_config[lcore_id].cpuset);
 
+   /* find socket first */
+   socket_id = eal_cpu_socket_id(lcore_id);
+   if (socket_id >= RTE_MAX_NUMA_NODES) {
+#ifdef RTE_EAL_ALLOW_INV_SOCKET_ID
+   socket_id = 0;
+#else
+   RTE_LOG(ERR, EAL, "Socket ID (%u) is greater than 
RTE_MAX_NUMA_NODES (%d)\n",
+   socket_id, RTE_MAX_NUMA_NODES);
+   return -1;
+#endif
+   }
+   lcore_to_socket_id[lcore_id] = socket_id;
+
/* in 1:1 mapping, record related cpu detected state */
lcore_config[lcore_id].detected = eal_cpu_detected(lcore_id);
if (lcore_config[lcore_id].detected == 0) {
@@ -54,18 +83,7 @@ rte_eal_cpu_init(void)
config->lcore_role[lcore_id] = ROLE_RTE;
lcore_config[lcore_id].core_role = ROLE_RTE;
lcore_config[lcore_id].core_id = eal_cpu_core_id(lcore_id);
-   lcore_config[lcore_id].socket_id = eal_cpu_socket_id(lcore_id);
-   if (lcore_config[lcore_id].socket_id >= RTE_MAX_NUMA_NODES) {
-#ifdef RTE_EAL_ALLOW_INV_SOCKET_ID
-   lcore_config[lcore_id].socket_id = 0;
-#else
- 

Re: [dpdk-dev] Build is broken in dpdk-next-net

2018-03-31 Thread Neil Horman
On Sat, Mar 31, 2018 at 06:21:41PM +0200, Gaëtan Rivet wrote:
> On Sat, Mar 31, 2018 at 11:27:55AM -0400, Neil Horman wrote:
> > On Sat, Mar 31, 2018 at 05:09:47PM +0200, Gaëtan Rivet wrote:
> > > On Sat, Mar 31, 2018 at 09:33:43AM -0400, Neil Horman wrote:
> > > > On Fri, Mar 30, 2018 at 10:47:09PM +0800, Tonghao Zhang wrote:
> > > > > I rebuild it on ubuntu 17.10 and cash it. I use the 'RTE_SET_USED' to 
> > > > > fix it.
> > > > > 
> > > > > 
> > > > > diff --git a/lib/librte_vhost/fd_man.c b/lib/librte_vhost/fd_man.c
> > > > > index 771675718..f11803191 100644
> > > > > --- a/lib/librte_vhost/fd_man.c
> > > > > +++ b/lib/librte_vhost/fd_man.c
> > > > > @@ -279,7 +279,8 @@ fdset_pipe_read_cb(int readfd, void *dat 
> > > > > __rte_unused,
> > > > >int *remove __rte_unused)
> > > > >  {
> > > > > char charbuf[16];
> > > > > -   read(readfd, charbuf, sizeof(charbuf));
> > > > > +   int r = read(readfd, charbuf, sizeof(charbuf));
> > > > > +   RTE_SET_USED(r);
> > > > >  }
> > > > > 
> > > > >  void
> > > > > @@ -319,5 +320,6 @@ fdset_pipe_init(struct fdset *fdset)
> > > > >  void
> > > > >  fdset_pipe_notify(struct fdset *fdset)
> > > > >  {
> > > > > -   write(fdset->u.writefd, "1", 1);
> > > > > +   int r = write(fdset->u.writefd, "1", 1);
> > > > > +   RTE_SET_USED(r);
> > > > >  }
> > > > > 
> > > > 
> > > > A better option might be to use _Pragma
> > > > 
> > > > Something like this perhaps
> > > > 
> > > > #define ALLOW_UNUSED(x) \
> > > > _Pragma(push) \
> > > > _Pragma(diagnostic ignored "-Wunused-result") \
> > > > #x;\
> > > > _Pragma(pop)
> > > > 
> > > > This is of course untested, so it probably needs some tweaking, but 
> > > > this method
> > > > avoids the need to declare an additional stack variable, which i don't 
> > > > think can
> > > > be eliminated due to the cast.  I believe that this method should also 
> > > > work
> > > > accross compilers (the gcc and clang compilers support this, and i 
> > > > think the
> > > > intel compiler should as well)
> > > > 
> > > > Neil
> > > > 
> > > 
> > > It would be nice to avoid the definition of a useless variable.
> > > An alternative could be
> > > 
> > >if (read() < 0) {
> > >/* Failure here is acceptable for such and such reason. */
> > >}
> > > 
> > > to ensure all-around compatibility, and the definition or another macro.
> > > Just a suggestion.
> > > 
> > That would be a good alternative, but I think its effectiveness is 
> > dependent on
> > when the compiler does with the return value check. Without any code inside 
> > the
> > conditional, the compiler may optimize the check out, meaning the warning 
> > will
> > still be asserted.  If it doesn't optimize the check out, then you have a
> > useless compare and jump instruction left in the code path.
> > 
> > Best
> > Neil
> > 
> 
> I tested quickly, I see no difference with the three methods:

gcc seems to be sufficiently smart to optimize out the conditional, clang not so
much:

#include 
#include 
#include 

__attribute__((warn_unused_result))
int wur(void)
{
printf("CALLING WUR!\n");
return read(0, NULL, 0);
}

#define UNUSED_RESULT(x) if (x) {}

int main(void)
{
UNUSED_RESULT(wur());
return 0;
}

[nhorman@neilslaptop ~]$ gcc -g -Wunused-result -Werror ./test.c
[nhorman@neilslaptop ~]$ objdump -d -S a.out > ./results
[nhorman@neilslaptop ~]$ cat results
... 
0040054b :

#define UNUSED_RESULT(x) if (x) {}

int main(void)
{
  40054b:   55  push   %rbp
  40054c:   48 89 e5mov%rsp,%rbp
UNUSED_RESULT(wur());
  40054f:   e8 d3 ff ff ff  callq  400527 
return 0;
  400554:   b8 00 00 00 00  mov$0x0,%eax
}
  400559:   5d  pop%rbp
  40055a:   c3  retq
  40055b:   0f 1f 44 00 00  nopl   0x0(%rax,%rax,1)


[nhorman@neilslaptop ~]$ clang -g -Wunused-result -Werror ./test.c
[nhorman@neilslaptop ~]$ objdump -d -S a.out > ./results
[nhorman@neilslaptop ~]$ cat results 
...
00400570 :
}

#define UNUSED_RESULT(x) if (x) {}

int main(void)
{
  400570:   55  push   %rbp
  400571:   48 89 e5mov%rsp,%rbp
  400574:   48 83 ec 10 sub$0x10,%rsp
  400578:   c7 45 fc 00 00 00 00movl   $0x0,-0x4(%rbp)
UNUSED_RESULT(wur());
  40057f:   e8 ac ff ff ff  callq  400530 
  400584:   83 f8 00cmp$0x0,%eax
  400587:   0f 84 05 00 00 00   je 400592 
  40058d:   e9 00 00 00 00  jmpq   400592 
  400592:   31 c0   xor%eax,%eax
return 0;
  400594:   48 83 c4 10 add$0x10,%rsp
  400598:   5d  pop%rbp
  400599:   c3  retq
  40059a:   66 0f 1f 44 00 00   nopw   0x0(%rax,%rax,1)


There is an additional compar

Re: [dpdk-dev] [PATCH v2] net/bnxt: convert to SPDX license tag

2018-03-31 Thread Ferruh Yigit
On 3/30/2018 7:10 PM, Scott Branden wrote:
> Hi Ferruh,
> 
> 
> On 18-03-30 03:35 AM, Ferruh Yigit wrote:
>> On 3/29/2018 5:40 PM, Ajit Khaparde wrote:
>>> From: Scott Branden 
>>>
>>> Update the license header on bnxt files to be the standard
>>> BSD-3-Clause license used for the rest of DPDK,
>>> bring the files in compliance with the DPDK licensing policy.
>>>
>>> Signed-off-by: Scott Branden 
>>> Signed-off-by: Ajit Khaparde 
>>> Cc:hemant.agra...@nxp.com
>>> 
>>> v1->v2: modify first line of SPDX identifer as per review comment.
>>> ---
>>>   doc/guides/nics/bnxt.rst   | 30 ++
>>>   drivers/net/bnxt/bnxt.h| 32 
>>> ++--
>>>   drivers/net/bnxt/bnxt_cpr.c| 32 
>>> ++--
>>>   drivers/net/bnxt/bnxt_cpr.h| 32 
>>> ++--
>>>   drivers/net/bnxt/bnxt_ethdev.c | 32 
>>> ++--
>>>   drivers/net/bnxt/bnxt_filter.c | 32 
>>> ++--
>>>   drivers/net/bnxt/bnxt_filter.h | 32 
>>> ++--
>>>   drivers/net/bnxt/bnxt_hwrm.c   | 32 
>>> ++--
>>>   drivers/net/bnxt/bnxt_hwrm.h   | 32 
>>> ++--
>>>   drivers/net/bnxt/bnxt_irq.c| 32 
>>> ++--
>>>   drivers/net/bnxt/bnxt_irq.h| 32 
>>> ++--
>>>   drivers/net/bnxt/bnxt_nvm_defs.h   | 11 +++
>>>   drivers/net/bnxt/bnxt_ring.c   | 32 
>>> ++--
>>>   drivers/net/bnxt/bnxt_ring.h   | 32 
>>> ++--
>>>   drivers/net/bnxt/bnxt_rxq.c| 32 
>>> ++--
>>>   drivers/net/bnxt/bnxt_rxq.h| 32 
>>> ++--
>>>   drivers/net/bnxt/bnxt_rxr.c| 32 
>>> ++--
>>>   drivers/net/bnxt/bnxt_rxr.h| 32 
>>> ++--
>>>   drivers/net/bnxt/bnxt_stats.c  | 32 
>>> ++--
>>>   drivers/net/bnxt/bnxt_stats.h  | 32 
>>> ++--
>>>   drivers/net/bnxt/bnxt_txq.c| 32 
>>> ++--
>>>   drivers/net/bnxt/bnxt_txq.h| 32 
>>> ++--
>>>   drivers/net/bnxt/bnxt_txr.c| 32 
>>> ++--
>>>   drivers/net/bnxt/bnxt_txr.h| 32 
>>> ++--
>>>   drivers/net/bnxt/bnxt_vnic.c   | 32 
>>> ++--
>>>   drivers/net/bnxt/bnxt_vnic.h   | 32 
>>> ++--
>>>   drivers/net/bnxt/hsi_struct_def_dpdk.h | 32 
>>> ++--
>>>   drivers/net/bnxt/rte_pmd_bnxt.c| 32 
>>> ++--
>>>   drivers/net/bnxt/rte_pmd_bnxt.h| 32 
>>> ++--
>>>   29 files changed, 59 insertions(+), 846 deletions(-)
>> Can you please update Makefile too, but I can see it has multiple coypright, 
>> it
>> can be better to send it as a separate patch to not block this one.
> Yes, Makefile change should be in another patch.
> I don't know how to change the header on that one though.
> Intel and 6WIND shouldn't really have any copyright on the Makefile, though?
> It looks like somebody just cut and paste the license header from 
> another Makefile.
> Please suggest what should be done with this file.

Most probably it is because of copy-paste as you stated, and I don't know what
does it mean to hold the copyright in the makefile indeed J. cc'ed Hemant and
Olivier.

But removing an existing copyright may mean involving legal and may take time,
unfortunately.

It may be easier to just do the SPDX updates with existing coypright, but if you
have motivation I suggest try to fix this.

>>
>> <...>
>>
>>> @@ -1,34 +1,6 @@
>>> -/*-
>>> - *   BSD LICENSE
>>> - *
>>> - *   Copyright(c) Broadcom Limited.
>>> +/* SPDX-License-Identifier: BSD-3-Clause
>>> + *   Copyright(c) 2014-2018 Broadcom
>>>*   All rights reserved.
>> It might be nit-picking but we don't have leading spaces [1] in format, are 
>> they
>> intentional?
>> If not it is easy to fix when introduced otherwise will stay as it is 
>> forever J
> Yes, it was intentional.

Why? What is the practical reason of intentionally diverging from defined 
syntax?

>>
>> [1]
>>   /* SPDX-License-Identifier: BSD-3-Clause
>>* Copyright(c) 2014-2018 Broadcom
>>* All rights reserved.
>>*/
>>
>> <...>
> Thanks,
>   Scott
> 



Re: [dpdk-dev] Survey for final decision about per-port offload API

2018-03-31 Thread Zhang, Qi Z
Hi Thomas:
> -Original Message-
> From: Thomas Monjalon [mailto:tho...@monjalon.net]
> Sent: Friday, March 30, 2018 9:48 PM
> To: dev@dpdk.org
> Cc: Ajit Khaparde ; Jerin Jacob
> ; Shijith Thotton
> ; Santosh Shukla
> ; Rahul Lakkireddy
> ; John Daley ; Lu,
> Wenzhuo ; Ananyev, Konstantin
> ; Xing, Beilei ; Zhang,
> Qi Z ; Wu, Jingjing ; Adrien
> Mazarguil ; Nelio Laranjeiro
> ; Yongseok Koh ; Shahaf
> Shuler ; Tomasz Duszynski ;
> Jianbo Liu ; Alejandro Lucero
> ; Hemant Agrawal
> ; Shreyansh Jain ;
> Harish Patil ; Rasesh Mody
> ; Andrew Rybchenko
> ; Shrikrishna Khare ;
> Maxime Coquelin ; Legacy, Allain (Wind River)
> ; Richardson, Bruce
> ; Gaetan Rivet ;
> Olivier Matz 
> Subject: Survey for final decision about per-port offload API
> 
> There are some discussions about a specific part of the offload API:
>   "To enable per-port offload, the offload should be set on both
>   device configuration and queue setup."
> 
> It means the application must repeat the port offload flags in
> rte_eth_conf.[rt]xmode.offloads and rte_eth_[rt]xconf.offloads, when calling
> respectively rte_eth_dev_configure() and rte_eth_[rt]x_queue_setup for each
> queue.
> 
> The PMD must check if there is mismatch, i.e. a port offload not repeated in
> queue setup.
> There is a proposal to do this check at ethdev level:
>   http://dpdk.org/ml/archives/dev/2018-March/094023.html
> 
> It was also proposed to relax the API and allow "forgetting" port offloads in
> queue offloads:
>   http://dpdk.org/ml/archives/dev/2018-March/092978.html
> 
> It would mean the offloads applied to a queue result of OR operation:
>   rte_eth_conf.[rt]xmode.offloads | rte_eth_[rt]xconf.offloads
> 
> 1/ Do you agree with above API change?
> 
> 
> If we agree with this change, we need to update the documentation and
> remove the checks in PMDs.

Do you mean we will move offload check from PMD to ethdev, 
or just remove specific check in each PMD
or it is not in the scope of this vote?

Thanks
Qi

> Note: no matter what is decided here, 18.05-rc1 should have all PMDs
> switched to the API which was defined in 17.11.
> Given that API is new and not yet adopted by the applications, the sonner it 
> is
> fixed, the better.
> 
> 2/ Should we do this change in 18.05-rc2?

> 
> 
> At the same time, we want to make clear that an offload enabled at port level,
> cannot be disabled at queue level.
> 
> 3/ Do you agree with above statement (to be added in the doc)?
> 
> 
> There is the same kind of confusion in the offload capabilities:
>   rte_eth_dev_info.[rt]x_offload_capa
>   rte_eth_dev_info.[rt]x_queue_offload_capa
> The queue capabilities must be a subset of port capabilities, i.e. every queue
> capabilities must be reported as port capabilities.
> But the port capabilities should be reported at queue level only if it can be
> applied to a specific queue.
> 
> 4/ Do you agree with above statement (to be added in the doc)?

Yes

> 
> 
> Please give your opinion on questions 1, 2, 3 and 4.
> Answering by yes/no may be sufficient in most cases :) Thank you
> 



Re: [dpdk-dev] Survey for final decision about per-port offload API

2018-03-31 Thread Shahaf Shuler
Friday, March 30, 2018 4:48 PM, Thomas Monjalon:
> Subject: Survey for final decision about per-port offload API
> 
> There are some discussions about a specific part of the offload API:
>   "To enable per-port offload, the offload should be set on both
>   device configuration and queue setup."
> 
> It means the application must repeat the port offload flags in
> rte_eth_conf.[rt]xmode.offloads and rte_eth_[rt]xconf.offloads, when
> calling respectively rte_eth_dev_configure() and
> rte_eth_[rt]x_queue_setup for each queue.
> 
> The PMD must check if there is mismatch, i.e. a port offload not repeated in
> queue setup.
> There is a proposal to do this check at ethdev level:
>   https://emea01.safelinks.protection.outlook.com/?url=http%3A%2F
> %2Fdpdk.org%2Fml%2Farchives%2Fdev%2F2018-
> March%2F094023.html&data=02%7C01%7Cshahafs%40mellanox.com%7Cb2a
> e36d768424c9e616308d59644e2a7%7Ca652971c7d2e4d9ba6a4d149256f461b
> %7C0%7C0%7C636580144980414466&sdata=Re2xM9u5jJr4M1PDTn5gE9mp22
> NmBI%2Bwa2GFPmUzq38%3D&reserved=0
> 
> It was also proposed to relax the API and allow "forgetting" port offloads in
> queue offloads:
>   https://emea01.safelinks.protection.outlook.com/?url=http%3A%2F
> %2Fdpdk.org%2Fml%2Farchives%2Fdev%2F2018-
> March%2F092978.html&data=02%7C01%7Cshahafs%40mellanox.com%7Cb2a
> e36d768424c9e616308d59644e2a7%7Ca652971c7d2e4d9ba6a4d149256f461b
> %7C0%7C0%7C636580144980414466&sdata=xaUM8jcVl9gf3e%2By9geZDPpO
> 1RJ5%2FXWJwA%2BpGp54pNs%3D&reserved=0
> 
> It would mean the offloads applied to a queue result of OR operation:
>   rte_eth_conf.[rt]xmode.offloads | rte_eth_[rt]xconf.offloads
> 
> 1/ Do you agree with above API change?

Yes.

> 
> 
> If we agree with this change, we need to update the documentation and
> remove the checks in PMDs.

And to update applications and examples in the tree to set the offloads 
according to above change. 

> Note: no matter what is decided here, 18.05-rc1 should have all PMDs
> switched to the API which was defined in 17.11.
> Given that API is new and not yet adopted by the applications, the sonner it
> is fixed, the better.
> 
> 2/ Should we do this change in 18.05-rc2?
> 
> 
> At the same time, we want to make clear that an offload enabled at port
> level, cannot be disabled at queue level.
> 
> 3/ Do you agree with above statement (to be added in the doc)?

Yes 

> 
> 
> There is the same kind of confusion in the offload capabilities:
>   rte_eth_dev_info.[rt]x_offload_capa
>   rte_eth_dev_info.[rt]x_queue_offload_capa
> The queue capabilities must be a subset of port capabilities, i.e. every queue
> capabilities must be reported as port capabilities.
> But the port capabilities should be reported at queue level only if it can be
> applied to a specific queue.
> 
> 4/ Do you agree with above statement (to be added in the doc)?

No. 

The documentation should describe the API from the application side, and not 
provide guidelines for the PMDs implementation. 
If missing, we should clarify more about what queue and port offload means. 
Something like:
"When port offload is enabled, the offload applies on the port along with all 
of its associated queues"  and
"When queue offload is enabled the offload, the offload applies only on the 
specific queue."

The PMDs then will decide how they report the different offloads they offer. 

> 
> 
> Please give your opinion on questions 1, 2, 3 and 4.
> Answering by yes/no may be sufficient in most cases :) Thank you
> 



[dpdk-dev] [PATCH 00/14] net/qede/base: update PMD version to 2.8.0.1

2018-03-31 Thread Rasesh Mody
Hi,

This patch set updates QEDE base driver to use FW version 8.33.12.0.
It contains some base driver enhancements and fixes. The PMD version
is updated to 2.8.0.1.

Please apply.

Thanks!
-Rasesh

Rasesh Mody (14):
  net/qede/base: use path ID for HW init
  net/qede/base: protect DMAE transactions
  net/qede/base: add DMAE sanity check
  net/qede/base: upgrade FW to 8.33.12.0
  net/qede/base: symantic changes
  net/qede/base: add new chain API
  net/qede/base: allow changing VF MAC address
  net/qede/base: add MFW support for driver load timeout
  net/qede/base: refine error handling
  net/qede/base: add stats counter for link state
  net/qede/base: add APIs for xcvr
  net/qede/base: fix to support OVLAN mode
  net/qede/base: add packet pacing support
  net/qede: update PMD version to 2.8.0.1

 drivers/net/qede/base/common_hsi.h|8 +-
 drivers/net/qede/base/ecore.h |   28 +-
 drivers/net/qede/base/ecore_chain.h   |   49 +-
 drivers/net/qede/base/ecore_cxt.c |   30 +-
 drivers/net/qede/base/ecore_cxt.h |4 +-
 drivers/net/qede/base/ecore_dcbx.c|7 +-
 drivers/net/qede/base/ecore_dcbx_api.h|1 +
 drivers/net/qede/base/ecore_dev.c |  324 ++
 drivers/net/qede/base/ecore_dev_api.h |   20 +-
 drivers/net/qede/base/ecore_hsi_common.h  |  106 -
 drivers/net/qede/base/ecore_hsi_debug_tools.h |  108 +++--
 drivers/net/qede/base/ecore_hsi_eth.h |   29 +-
 drivers/net/qede/base/ecore_hsi_init_func.h   |   36 +-
 drivers/net/qede/base/ecore_hsi_init_tool.h   |  107 ++---
 drivers/net/qede/base/ecore_hw.c  |  119 -
 drivers/net/qede/base/ecore_hw.h  |4 +
 drivers/net/qede/base/ecore_init_fw_funcs.c   |  210 +++--
 drivers/net/qede/base/ecore_init_fw_funcs.h   |   33 +-
 drivers/net/qede/base/ecore_init_ops.c|   32 +-
 drivers/net/qede/base/ecore_int.c |   11 +-
 drivers/net/qede/base/ecore_iov_api.h |   11 +
 drivers/net/qede/base/ecore_iro_values.h  |   64 +--
 drivers/net/qede/base/ecore_l2.c  |   53 ++-
 drivers/net/qede/base/ecore_mcp.c |  220 -
 drivers/net/qede/base/ecore_mcp_api.h |   46 ++
 drivers/net/qede/base/ecore_proto_if.h|3 +
 drivers/net/qede/base/ecore_rt_defs.h |  591 +
 drivers/net/qede/base/ecore_sp_commands.c |   29 +-
 drivers/net/qede/base/ecore_spq.c |   36 +-
 drivers/net/qede/base/ecore_spq.h |   13 +
 drivers/net/qede/base/ecore_sriov.c   |   41 +-
 drivers/net/qede/base/eth_common.h|3 +
 drivers/net/qede/base/mcp_public.h|3 +
 drivers/net/qede/base/reg_addr.h  |2 +
 drivers/net/qede/qede_ethdev.h|2 +-
 drivers/net/qede/qede_main.c  |3 +-
 36 files changed, 1632 insertions(+), 754 deletions(-)

-- 
1.7.10.3



[dpdk-dev] [PATCH 01/14] net/qede/base: use path ID for HW init

2018-03-31 Thread Rasesh Mody
Use the path ID as the phase ID when running the engine phase of the
HW init

Signed-off-by: Rasesh Mody 
---
 drivers/net/qede/base/ecore_dev.c |3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/drivers/net/qede/base/ecore_dev.c 
b/drivers/net/qede/base/ecore_dev.c
index 744d204..cd274c3 100644
--- a/drivers/net/qede/base/ecore_dev.c
+++ b/drivers/net/qede/base/ecore_dev.c
@@ -1658,7 +1658,8 @@ static enum _ecore_status_t ecore_hw_init_common(struct 
ecore_hwfn *p_hwfn,
 
ecore_init_cache_line_size(p_hwfn, p_ptt);
 
-   rc = ecore_init_run(p_hwfn, p_ptt, PHASE_ENGINE, ANY_PHASE_ID, hw_mode);
+   rc = ecore_init_run(p_hwfn, p_ptt, PHASE_ENGINE, ECORE_PATH_ID(p_hwfn),
+   hw_mode);
if (rc != ECORE_SUCCESS)
return rc;
 
-- 
1.7.10.3



[dpdk-dev] [PATCH 02/14] net/qede/base: protect DMAE transactions

2018-03-31 Thread Rasesh Mody
Protect DMAE transactions with a spinlock instead of a mutex

Signed-off-by: Rasesh Mody 
---
 drivers/net/qede/base/ecore.h |6 --
 drivers/net/qede/base/ecore_dev.c |6 +++---
 drivers/net/qede/base/ecore_hw.c  |   30 +++---
 3 files changed, 26 insertions(+), 16 deletions(-)

diff --git a/drivers/net/qede/base/ecore.h b/drivers/net/qede/base/ecore.h
index ce5f3a9..7c642af 100644
--- a/drivers/net/qede/base/ecore.h
+++ b/drivers/net/qede/base/ecore.h
@@ -432,8 +432,10 @@ struct ecore_hw_info {
 #define DMAE_MAX_RW_SIZE   0x2000
 
 struct ecore_dmae_info {
-   /* Mutex for synchronizing access to functions */
-   osal_mutex_tmutex;
+   /* Spinlock for synchronizing access to functions */
+   osal_spinlock_t lock;
+
+   bool b_mem_ready;
 
u8 channel;
 
diff --git a/drivers/net/qede/base/ecore_dev.c 
b/drivers/net/qede/base/ecore_dev.c
index cd274c3..b15af03 100644
--- a/drivers/net/qede/base/ecore_dev.c
+++ b/drivers/net/qede/base/ecore_dev.c
@@ -423,9 +423,9 @@ void ecore_init_struct(struct ecore_dev *p_dev)
p_hwfn->b_active = false;
 
 #ifdef CONFIG_ECORE_LOCK_ALLOC
-   OSAL_MUTEX_ALLOC(p_hwfn, &p_hwfn->dmae_info.mutex);
+   OSAL_SPIN_LOCK_ALLOC(p_hwfn, &p_hwfn->dmae_info.lock);
 #endif
-   OSAL_MUTEX_INIT(&p_hwfn->dmae_info.mutex);
+   OSAL_SPIN_LOCK_INIT(&p_hwfn->dmae_info.lock);
}
 
/* hwfn 0 is always active */
@@ -4238,7 +4238,7 @@ void ecore_hw_remove(struct ecore_dev *p_dev)
ecore_mcp_free(p_hwfn);
 
 #ifdef CONFIG_ECORE_LOCK_ALLOC
-   OSAL_MUTEX_DEALLOC(&p_hwfn->dmae_info.mutex);
+   OSAL_SPIN_LOCK_DEALLOC(&p_hwfn->dmae_info.lock);
 #endif
}
 
diff --git a/drivers/net/qede/base/ecore_hw.c b/drivers/net/qede/base/ecore_hw.c
index 84f273b..34e2e5f 100644
--- a/drivers/net/qede/base/ecore_hw.c
+++ b/drivers/net/qede/base/ecore_hw.c
@@ -592,7 +592,8 @@ enum _ecore_status_t ecore_dmae_info_alloc(struct 
ecore_hwfn *p_hwfn)
goto err;
}
 
-   p_hwfn->dmae_info.channel = p_hwfn->rel_pf_id;
+   p_hwfn->dmae_info.channel = p_hwfn->rel_pf_id;
+   p_hwfn->dmae_info.b_mem_ready = true;
 
return ECORE_SUCCESS;
 err:
@@ -604,8 +605,9 @@ void ecore_dmae_info_free(struct ecore_hwfn *p_hwfn)
 {
dma_addr_t p_phys;
 
-   /* Just make sure no one is in the middle */
-   OSAL_MUTEX_ACQUIRE(&p_hwfn->dmae_info.mutex);
+   OSAL_SPIN_LOCK(&p_hwfn->dmae_info.lock);
+   p_hwfn->dmae_info.b_mem_ready = false;
+   OSAL_SPIN_UNLOCK(&p_hwfn->dmae_info.lock);
 
if (p_hwfn->dmae_info.p_completion_word != OSAL_NULL) {
p_phys = p_hwfn->dmae_info.completion_word_phys_addr;
@@ -630,8 +632,6 @@ void ecore_dmae_info_free(struct ecore_hwfn *p_hwfn)
   p_phys, sizeof(u32) * DMAE_MAX_RW_SIZE);
p_hwfn->dmae_info.p_intermediate_buffer = OSAL_NULL;
}
-
-   OSAL_MUTEX_RELEASE(&p_hwfn->dmae_info.mutex);
 }
 
 static enum _ecore_status_t ecore_dmae_operation_wait(struct ecore_hwfn 
*p_hwfn)
@@ -777,6 +777,14 @@ static enum _ecore_status_t 
ecore_dmae_operation_wait(struct ecore_hwfn *p_hwfn)
enum _ecore_status_t ecore_status = ECORE_SUCCESS;
u32 offset = 0;
 
+   if (!p_hwfn->dmae_info.b_mem_ready) {
+   DP_VERBOSE(p_hwfn, ECORE_MSG_HW,
+  "No buffers allocated. Avoid DMAE transaction [{src: 
addr 0x%lx, type %d}, {dst: addr 0x%lx, type %d}, size %d].\n",
+  src_addr, src_type, dst_addr, dst_type,
+  size_in_dwords);
+   return ECORE_NOMEM;
+   }
+
if (p_hwfn->p_dev->recov_in_prog) {
DP_VERBOSE(p_hwfn, ECORE_MSG_HW,
   "Recovery is in progress. Avoid DMAE transaction 
[{src: addr 0x%lx, type %d}, {dst: addr 0x%lx, type %d}, size %d].\n",
@@ -870,7 +878,7 @@ enum _ecore_status_t
OSAL_MEMSET(¶ms, 0, sizeof(struct ecore_dmae_params));
params.flags = flags;
 
-   OSAL_MUTEX_ACQUIRE(&p_hwfn->dmae_info.mutex);
+   OSAL_SPIN_LOCK(&p_hwfn->dmae_info.lock);
 
rc = ecore_dmae_execute_command(p_hwfn, p_ptt, source_addr,
grc_addr_in_dw,
@@ -878,7 +886,7 @@ enum _ecore_status_t
ECORE_DMAE_ADDRESS_GRC,
size_in_dwords, ¶ms);
 
-   OSAL_MUTEX_RELEASE(&p_hwfn->dmae_info.mutex);
+   OSAL_SPIN_UNLOCK(&p_hwfn->dmae_info.lock);
 
return rc;
 }
@@ -896,14 +904,14 @@ enum _ecore_status_t
OSAL_MEMSET(¶ms, 0, sizeof(struct ecore_dmae_params));
params.flags = flags;
 
-   OSAL_MUTEX_ACQUIRE(&p_hwfn->dmae_info.mutex);
+   OSAL_SPIN_LOCK(&p_hwfn->dmae_info.lock);
 
rc = ecore_dmae_execute_command(p_hwfn, p_ptt, grc_addr_in_dw,

[dpdk-dev] [PATCH 03/14] net/qede/base: add DMAE sanity check

2018-03-31 Thread Rasesh Mody
Add DMA engine sanity check during the engine initialization and before
PF inititialization

Signed-off-by: Rasesh Mody 
---
 drivers/net/qede/base/ecore_dev.c  |5 +++
 drivers/net/qede/base/ecore_hw.c   |   69 
 drivers/net/qede/base/ecore_hw.h   |4 ++
 drivers/net/qede/base/ecore_init_ops.c |   32 +--
 drivers/net/qede/base/ecore_rt_defs.h  |3 ++
 5 files changed, 100 insertions(+), 13 deletions(-)

diff --git a/drivers/net/qede/base/ecore_dev.c 
b/drivers/net/qede/base/ecore_dev.c
index b15af03..38492e6 100644
--- a/drivers/net/qede/base/ecore_dev.c
+++ b/drivers/net/qede/base/ecore_dev.c
@@ -2161,6 +2161,11 @@ static enum _ecore_status_t ecore_hw_init_port(struct 
ecore_hwfn *p_hwfn,
/* perform debug configuration when chip is out of reset */
OSAL_BEFORE_PF_START((void *)p_hwfn->p_dev, p_hwfn->my_id);
 
+   /* Sanity check before the PF init sequence that uses DMAE */
+   rc = ecore_dmae_sanity(p_hwfn, p_ptt, "pf_phase");
+   if (rc)
+   return rc;
+
/* PF Init sequence */
rc = ecore_init_run(p_hwfn, p_ptt, PHASE_PF, rel_pf_id, hw_mode);
if (rc)
diff --git a/drivers/net/qede/base/ecore_hw.c b/drivers/net/qede/base/ecore_hw.c
index 34e2e5f..98c7fbf 100644
--- a/drivers/net/qede/base/ecore_hw.c
+++ b/drivers/net/qede/base/ecore_hw.c
@@ -952,3 +952,72 @@ void ecore_hw_err_notify(struct ecore_hwfn *p_hwfn,
 
OSAL_HW_ERROR_OCCURRED(p_hwfn, err_type);
 }
+
+enum _ecore_status_t ecore_dmae_sanity(struct ecore_hwfn *p_hwfn,
+  struct ecore_ptt *p_ptt,
+  const char *phase)
+{
+   u32 size = OSAL_PAGE_SIZE / 2, val;
+   struct ecore_dmae_params params;
+   enum _ecore_status_t rc = ECORE_SUCCESS;
+   dma_addr_t p_phys;
+   void *p_virt;
+   u32 *p_tmp;
+
+   p_virt = OSAL_DMA_ALLOC_COHERENT(p_hwfn->p_dev, &p_phys, 2 * size);
+   if (!p_virt) {
+   DP_NOTICE(p_hwfn, false,
+ "DMAE sanity [%s]: failed to allocate memory\n",
+ phase);
+   return ECORE_NOMEM;
+   }
+
+   /* Fill the bottom half of the allocated memory with a known pattern */
+   for (p_tmp = (u32 *)p_virt;
+p_tmp < (u32 *)((u8 *)p_virt + size);
+p_tmp++) {
+   /* Save the address itself as the value */
+   val = (u32)(osal_uintptr_t)p_tmp;
+   *p_tmp = val;
+   }
+
+   /* Zero the top half of the allocated memory */
+   OSAL_MEM_ZERO((u8 *)p_virt + size, size);
+
+   DP_VERBOSE(p_hwfn, ECORE_MSG_SP,
+  "DMAE sanity [%s]: src_addr={phys 0x%lx, virt %p}, 
dst_addr={phys 0x%lx, virt %p}, size 0x%x\n",
+  phase, (u64)p_phys, p_virt, (u64)(p_phys + size),
+  (u8 *)p_virt + size, size);
+
+   OSAL_MEMSET(¶ms, 0, sizeof(params));
+   rc = ecore_dmae_host2host(p_hwfn, p_ptt, p_phys, p_phys + size,
+ size / 4 /* size_in_dwords */, ¶ms);
+   if (rc != ECORE_SUCCESS) {
+   DP_NOTICE(p_hwfn, false,
+ "DMAE sanity [%s]: ecore_dmae_host2host() failed. rc 
= %d.\n",
+ phase, rc);
+   goto out;
+   }
+
+   /* Verify that the top half of the allocated memory has the pattern */
+   for (p_tmp = (u32 *)((u8 *)p_virt + size);
+p_tmp < (u32 *)((u8 *)p_virt + (2 * size));
+p_tmp++) {
+   /* The corresponding address in the bottom half */
+   val = (u32)(osal_uintptr_t)p_tmp - size;
+
+   if (*p_tmp != val) {
+   DP_NOTICE(p_hwfn, false,
+ "DMAE sanity [%s]: addr={phys 0x%lx, virt 
%p}, read_val 0x%08x, expected_val 0x%08x\n",
+ phase,
+ (u64)p_phys + ((u8 *)p_tmp - (u8 *)p_virt),
+ p_tmp, *p_tmp, val);
+   rc = ECORE_UNKNOWN_ERROR;
+   goto out;
+   }
+   }
+
+out:
+   OSAL_DMA_FREE_COHERENT(p_hwfn->p_dev, p_virt, p_phys, 2 * size);
+   return rc;
+}
diff --git a/drivers/net/qede/base/ecore_hw.h b/drivers/net/qede/base/ecore_hw.h
index 0b9814f..b59a26a 100644
--- a/drivers/net/qede/base/ecore_hw.h
+++ b/drivers/net/qede/base/ecore_hw.h
@@ -255,4 +255,8 @@ enum _ecore_status_t ecore_init_fw_data(struct ecore_dev 
*p_dev,
 void ecore_hw_err_notify(struct ecore_hwfn *p_hwfn,
 enum ecore_hw_err_type err_type);
 
+enum _ecore_status_t ecore_dmae_sanity(struct ecore_hwfn *p_hwfn,
+  struct ecore_ptt *p_ptt,
+  const char *phase);
+
 #endif /* __ECORE_HW_H__ */
diff --git a/drivers/net/qede/base/ecore_init_ops.c 
b/drivers/net/qede/base/ecore_init

[dpdk-dev] [PATCH 04/14] net/qede/base: upgrade FW to 8.33.12.0

2018-03-31 Thread Rasesh Mody
This patch adds changes to support new firmware 8.33.12.0. The changes
consist of FW bug fixes and enhancements.

Signed-off-by: Rasesh Mody 
---
 drivers/net/qede/base/common_hsi.h|8 +-
 drivers/net/qede/base/ecore_cxt.c |   10 +-
 drivers/net/qede/base/ecore_cxt.h |4 +-
 drivers/net/qede/base/ecore_dev.c |   10 +-
 drivers/net/qede/base/ecore_hsi_common.h  |   19 +-
 drivers/net/qede/base/ecore_hsi_debug_tools.h |3 +-
 drivers/net/qede/base/ecore_hsi_eth.h |   23 +-
 drivers/net/qede/base/ecore_hsi_init_func.h   |3 +
 drivers/net/qede/base/ecore_init_fw_funcs.c   |  210 +++--
 drivers/net/qede/base/ecore_init_fw_funcs.h   |   33 +-
 drivers/net/qede/base/ecore_iro_values.h  |   64 +--
 drivers/net/qede/base/ecore_l2.c  |2 +-
 drivers/net/qede/base/ecore_rt_defs.h |  588 +
 drivers/net/qede/base/eth_common.h|3 +
 drivers/net/qede/base/reg_addr.h  |2 +
 drivers/net/qede/qede_main.c  |2 +-
 16 files changed, 585 insertions(+), 399 deletions(-)

diff --git a/drivers/net/qede/base/common_hsi.h 
b/drivers/net/qede/base/common_hsi.h
index 9a6059a..d37dc7c 100644
--- a/drivers/net/qede/base/common_hsi.h
+++ b/drivers/net/qede/base/common_hsi.h
@@ -96,10 +96,10 @@
 //
 
 
-#define FW_MAJOR_VERSION   8
-#define FW_MINOR_VERSION   30
-#define FW_REVISION_VERSION12
-#define FW_ENGINEERING_VERSION 0
+#define FW_MAJOR_VERSION8
+#define FW_MINOR_VERSION33
+#define FW_REVISION_VERSION 12
+#define FW_ENGINEERING_VERSION  0
 
 /***/
 /* COMMON HW CONSTANTS */
diff --git a/drivers/net/qede/base/ecore_cxt.c 
b/drivers/net/qede/base/ecore_cxt.c
index 50bd66d..ca7c55f 100644
--- a/drivers/net/qede/base/ecore_cxt.c
+++ b/drivers/net/qede/base/ecore_cxt.c
@@ -1427,7 +1427,8 @@ static void ecore_cdu_init_pf(struct ecore_hwfn *p_hwfn)
}
 }
 
-void ecore_qm_init_pf(struct ecore_hwfn *p_hwfn, struct ecore_ptt *p_ptt)
+void ecore_qm_init_pf(struct ecore_hwfn *p_hwfn, struct ecore_ptt *p_ptt,
+ bool is_pf_loading)
 {
struct ecore_qm_info *qm_info = &p_hwfn->qm_info;
struct ecore_mcp_link_state *p_link;
@@ -1438,8 +1439,9 @@ void ecore_qm_init_pf(struct ecore_hwfn *p_hwfn, struct 
ecore_ptt *p_ptt)
 
p_link = &ECORE_LEADING_HWFN(p_hwfn->p_dev)->mcp_info->link_output;
 
-   ecore_qm_pf_rt_init(p_hwfn, p_ptt, p_hwfn->port_id,
-   p_hwfn->rel_pf_id, qm_info->max_phys_tcs_per_port,
+   ecore_qm_pf_rt_init(p_hwfn, p_ptt, p_hwfn->rel_pf_id,
+   qm_info->max_phys_tcs_per_port,
+   is_pf_loading,
iids.cids, iids.vf_cids, iids.tids,
qm_info->start_pq,
qm_info->num_pqs - qm_info->num_vf_pqs,
@@ -1797,7 +1799,7 @@ void ecore_cxt_hw_init_common(struct ecore_hwfn *p_hwfn)
 
 void ecore_cxt_hw_init_pf(struct ecore_hwfn *p_hwfn, struct ecore_ptt *p_ptt)
 {
-   ecore_qm_init_pf(p_hwfn, p_ptt);
+   ecore_qm_init_pf(p_hwfn, p_ptt, true);
ecore_cm_init_pf(p_hwfn);
ecore_dq_init_pf(p_hwfn);
ecore_cdu_init_pf(p_hwfn);
diff --git a/drivers/net/qede/base/ecore_cxt.h 
b/drivers/net/qede/base/ecore_cxt.h
index 54761e4..1130a33 100644
--- a/drivers/net/qede/base/ecore_cxt.h
+++ b/drivers/net/qede/base/ecore_cxt.h
@@ -107,8 +107,10 @@ u32 ecore_cxt_get_proto_cid_start(struct ecore_hwfn 
*p_hwfn,
  *
  * @param p_hwfn
  * @param p_ptt
+ * @param is_pf_loading
  */
-void ecore_qm_init_pf(struct ecore_hwfn *p_hwfn, struct ecore_ptt *p_ptt);
+void ecore_qm_init_pf(struct ecore_hwfn *p_hwfn, struct ecore_ptt *p_ptt,
+ bool is_pf_loading);
 
  /**
  * @brief Reconfigures QM pf on the fly
diff --git a/drivers/net/qede/base/ecore_dev.c 
b/drivers/net/qede/base/ecore_dev.c
index 38492e6..a3269f4 100644
--- a/drivers/net/qede/base/ecore_dev.c
+++ b/drivers/net/qede/base/ecore_dev.c
@@ -721,6 +721,7 @@ static void ecore_init_qm_pq(struct ecore_hwfn *p_hwfn,
   "pq overflow! pq %d, max pq %d\n", pq_idx, max_pq);
 
/* init pq params */
+   qm_info->qm_pq_params[pq_idx].port_id = p_hwfn->port_id;
qm_info->qm_pq_params[pq_idx].vport_id = qm_info->start_vport +
 qm_info->num_vports;
qm_info->qm_pq_params[pq_idx].tc_id = tc;
@@ -1025,10 +1026,9 @@ static void ecore_dp_init_qm_params(struct ecore_hwfn 
*p_hwfn)
for (i = 0; i < qm_info->num_pqs; i++) {
pq = &qm_info->qm_pq_params[i];
DP_VERBOSE(p_hwfn, ECORE_MSG_HW,
-  "pq idx %d, vport_id %d, tc %d, wrr_grp %d,"
-  " rl_valid %d\n",
-  

[dpdk-dev] [PATCH 05/14] net/qede/base: symantic changes

2018-03-31 Thread Rasesh Mody
The changes included in this patch are for
 - formatting
 - comment rework/addtions
 - relocate FW info, version related code
 - convert:
__le16 to u16
__le32 to u32 etc.

Signed-off-by: Rasesh Mody 
---
 drivers/net/qede/base/ecore_hsi_common.h  |   89 +++-
 drivers/net/qede/base/ecore_hsi_debug_tools.h |  105 
 drivers/net/qede/base/ecore_hsi_eth.h |6 +-
 drivers/net/qede/base/ecore_hsi_init_func.h   |   33 
 drivers/net/qede/base/ecore_hsi_init_tool.h   |  107 +++--
 5 files changed, 171 insertions(+), 169 deletions(-)

diff --git a/drivers/net/qede/base/ecore_hsi_common.h 
b/drivers/net/qede/base/ecore_hsi_common.h
index 38ac507..60951a1 100644
--- a/drivers/net/qede/base/ecore_hsi_common.h
+++ b/drivers/net/qede/base/ecore_hsi_common.h
@@ -948,7 +948,9 @@ struct core_tx_bd_data {
 /* Do not allow additional VLAN manipulations on this packet (DCB) */
 #define CORE_TX_BD_DATA_FORCE_VLAN_MODE_MASK 0x1
 #define CORE_TX_BD_DATA_FORCE_VLAN_MODE_SHIFT0
-/* Insert VLAN into packet */
+/* Insert VLAN into packet. Cannot be set for LB packets
+ * (tx_dst == CORE_TX_DEST_LB)
+ */
 #define CORE_TX_BD_DATA_VLAN_INSERTION_MASK  0x1
 #define CORE_TX_BD_DATA_VLAN_INSERTION_SHIFT 1
 /* This is the first BD of the packet (for debug) */
@@ -1071,11 +1073,11 @@ struct core_tx_update_ramrod_data {
  * Enum flag for what type of dcb data to update
  */
 enum dcb_dscp_update_mode {
-/* use when no change should be done to dcb data */
+/* use when no change should be done to DCB data */
DONT_UPDATE_DCB_DSCP,
-   UPDATE_DCB /* use to update only l2 (vlan) priority */,
-   UPDATE_DSCP /* use to update only l3 dscp */,
-   UPDATE_DCB_DSCP /* update vlan pri and dscp */,
+   UPDATE_DCB /* use to update only L2 (vlan) priority */,
+   UPDATE_DSCP /* use to update only IP DSCP */,
+   UPDATE_DCB_DSCP /* update vlan pri and DSCP */,
MAX_DCB_DSCP_UPDATE_FLAG
 };
 
@@ -1293,10 +1295,12 @@ enum fw_flow_ctrl_mode {
  * GFT profile type.
  */
 enum gft_profile_type {
-   GFT_PROFILE_TYPE_4_TUPLE /* 4 tuple, IP type and L4 type match. */,
-/* L4 destination port, IP type and L4 type match. */
+/* tunnel type, inner 4 tuple, IP type and L4 type match. */
+   GFT_PROFILE_TYPE_4_TUPLE,
+/* tunnel type, inner L4 destination port, IP type and L4 type match. */
GFT_PROFILE_TYPE_L4_DST_PORT,
-   GFT_PROFILE_TYPE_IP_DST_ADDR /* IP destination port and IP type. */,
+/* tunnel type, inner IP destination address and IP type match. */
+   GFT_PROFILE_TYPE_IP_DST_ADDR,
 /* tunnel type, inner IP source address and IP type match. */
GFT_PROFILE_TYPE_IP_SRC_ADDR,
GFT_PROFILE_TYPE_TUNNEL_TYPE /* tunnel type and outer IP type match. */,
@@ -1416,8 +1420,9 @@ struct vlan_header {
  * outer tag configurations
  */
 struct outer_tag_config_struct {
-/* Enables the STAG Priority Change , Should be 1 for Bette Davis and UFP with
- * Host Control mode. Else - 0
+/* Enables updating S-tag priority from inner tag or DCB. Should be 1 for Bette
+ * Davis, UFP with Host Control mode, and UFP with DCB over base interface.
+ * else - 0.
  */
u8 enable_stag_pri_change;
 /* If inner_to_outer_pri_map is initialize then set pri_map_valid */
@@ -1512,14 +1517,14 @@ struct pf_start_ramrod_data {
 
 
 /*
- * Data for port update ramrod
+ * Per protocol DCB data
  */
 struct protocol_dcb_data {
-   u8 dcb_enable_flag /* dcbEnable flag value */;
-   u8 dscp_enable_flag /* If set use dscp value */;
-   u8 dcb_priority /* dcbPri flag value */;
-   u8 dcb_tc /* dcb TC value */;
-   u8 dscp_val /* dscp value to write if dscp_enable_flag is set */;
+   u8 dcb_enable_flag /* Enable DCB */;
+   u8 dscp_enable_flag /* Enable updating DSCP value */;
+   u8 dcb_priority /* DCB priority */;
+   u8 dcb_tc /* DCB TC */;
+   u8 dscp_val /* DSCP value to write if dscp_enable_flag is set */;
 /* When DCB is enabled - if this flag is set, dont add VLAN 0 tag to untagged
  * frames
  */
@@ -1583,8 +1588,9 @@ struct pf_update_ramrod_data {
 /* core iwarp related fields */
struct protocol_dcb_data iwarp_dcb_data;
__le16 mf_vlan /* new outer vlan id value */;
-/* enables the inner to outer TAG priority mapping. Should be 1 for Bette Davis
- * and UFP with Host Control mode, else - 0.
+/* enables updating S-tag priority from inner tag or DCB. Should be 1 for Bette
+ * Davis, UFP with Host Control mode, and UFP with DCB over base interface.
+ * else - 0
  */
u8 enable_stag_pri_change;
u8 reserved;
@@ -2139,6 +2145,53 @@ struct e4_ystorm_core_conn_ag_ctx {
 };
 
 
+struct fw_asserts_ram_section {
+/* The offset of the section in the RAM in RAM lines (64-bit units) */
+   __le16 section_ram_line_offset;
+/* The size of the section in RAM lines (64-bit units) */
+   __le16 section_ram_line_size;
+/* The offset of th

[dpdk-dev] [PATCH 07/14] net/qede/base: allow changing VF MAC address

2018-03-31 Thread Rasesh Mody
This patch allows VF to change its own MAC address regardless of MAC set
by PF

Signed-off-by: Rasesh Mody 
---
 drivers/net/qede/base/ecore_iov_api.h  |   11 ++
 drivers/net/qede/base/ecore_proto_if.h |3 +++
 drivers/net/qede/base/ecore_sriov.c|   36 +---
 3 files changed, 47 insertions(+), 3 deletions(-)

diff --git a/drivers/net/qede/base/ecore_iov_api.h 
b/drivers/net/qede/base/ecore_iov_api.h
index 218ef50..3ac219b 100644
--- a/drivers/net/qede/base/ecore_iov_api.h
+++ b/drivers/net/qede/base/ecore_iov_api.h
@@ -540,6 +540,17 @@ void ecore_iov_get_vf_reply_virt_mbx_params(struct 
ecore_hwfn *p_hwfn,
 u32 ecore_iov_pfvf_msg_length(void);
 
 /**
+ * @brief Returns MAC address if one is configured
+ *
+ * @parm p_hwfn
+ * @parm rel_vf_id
+ *
+ * @return OSAL_NULL if mac isn't set; Otherwise, returns MAC.
+ */
+u8 *ecore_iov_bulletin_get_mac(struct ecore_hwfn *p_hwfn,
+  u16 rel_vf_id);
+
+/**
  * @brief Returns forced MAC address if one is configured
  *
  * @parm p_hwfn
diff --git a/drivers/net/qede/base/ecore_proto_if.h 
b/drivers/net/qede/base/ecore_proto_if.h
index abca740..d0518df 100644
--- a/drivers/net/qede/base/ecore_proto_if.h
+++ b/drivers/net/qede/base/ecore_proto_if.h
@@ -31,6 +31,9 @@ struct ecore_eth_pf_params {
 * This will set the maximal number of configured steering-filters.
 */
u32 num_arfs_filters;
+
+   /* To allow VF to change its MAC despite of PF set forced MAC. */
+   boolallow_vf_mac_change;
 };
 
 /* Most of the parameters below are described in the FW iSCSI / TCP HSI */
diff --git a/drivers/net/qede/base/ecore_sriov.c 
b/drivers/net/qede/base/ecore_sriov.c
index b1e26d6..b7a52f8 100644
--- a/drivers/net/qede/base/ecore_sriov.c
+++ b/drivers/net/qede/base/ecore_sriov.c
@@ -1968,7 +1968,8 @@ static void ecore_iov_vf_mbx_acquire(struct ecore_hwfn
   *p_hwfn,
if (!p_vf->vport_instance)
return ECORE_INVAL;
 
-   if (events & (1 << MAC_ADDR_FORCED)) {
+   if ((events & (1 << MAC_ADDR_FORCED)) ||
+   p_hwfn->pf_params.eth_pf_params.allow_vf_mac_change) {
/* Since there's no way [currently] of removing the MAC,
 * we can always assume this means we need to force it.
 */
@@ -1989,7 +1990,11 @@ static void ecore_iov_vf_mbx_acquire(struct ecore_hwfn   
*p_hwfn,
return rc;
}
 
-   p_vf->configured_features |= 1 << MAC_ADDR_FORCED;
+   if (p_hwfn->pf_params.eth_pf_params.allow_vf_mac_change)
+   p_vf->configured_features |=
+   1 << VFPF_BULLETIN_MAC_ADDR;
+   else
+   p_vf->configured_features |= 1 << MAC_ADDR_FORCED;
}
 
if (events & (1 << VLAN_ADDR_FORCED)) {
@@ -4370,7 +4375,11 @@ void ecore_iov_bulletin_set_forced_mac(struct ecore_hwfn 
*p_hwfn,
return;
}
 
-   feature = 1 << MAC_ADDR_FORCED;
+   if (p_hwfn->pf_params.eth_pf_params.allow_vf_mac_change)
+   feature = 1 << VFPF_BULLETIN_MAC_ADDR;
+   else
+   feature = 1 << MAC_ADDR_FORCED;
+
OSAL_MEMCPY(vf_info->bulletin.p_virt->mac, mac, ETH_ALEN);
 
vf_info->bulletin.p_virt->valid_bitmap |= feature;
@@ -4411,9 +4420,13 @@ enum _ecore_status_t ecore_iov_bulletin_set_mac(struct 
ecore_hwfn *p_hwfn,
 
vf_info->bulletin.p_virt->valid_bitmap |= feature;
 
+   if (p_hwfn->pf_params.eth_pf_params.allow_vf_mac_change)
+   ecore_iov_configure_vport_forced(p_hwfn, vf_info, feature);
+
return ECORE_SUCCESS;
 }
 
+#ifndef LINUX_REMOVE
 enum _ecore_status_t
 ecore_iov_bulletin_set_forced_untagged_default(struct ecore_hwfn *p_hwfn,
   bool b_untagged_only, int vfid)
@@ -4470,6 +4483,7 @@ void ecore_iov_get_vfs_opaque_fid(struct ecore_hwfn 
*p_hwfn, int vfid,
 
*opaque_fid = vf_info->opaque_fid;
 }
+#endif
 
 void ecore_iov_bulletin_set_forced_vlan(struct ecore_hwfn *p_hwfn,
u16 pvid, int vfid)
@@ -4657,6 +4671,22 @@ u32 ecore_iov_pfvf_msg_length(void)
return sizeof(union pfvf_tlvs);
 }
 
+u8 *ecore_iov_bulletin_get_mac(struct ecore_hwfn *p_hwfn,
+ u16 rel_vf_id)
+{
+   struct ecore_vf_info *p_vf;
+
+   p_vf = ecore_iov_get_vf_info(p_hwfn, rel_vf_id, true);
+   if (!p_vf || !p_vf->bulletin.p_virt)
+   return OSAL_NULL;
+
+   if (!(p_vf->bulletin.p_virt->valid_bitmap &
+   (1 << VFPF_BULLETIN_MAC_ADDR)))
+   return OSAL_NULL;
+
+   return p_vf->bulletin.p_virt->mac;
+}
+
 u8 *ecore_iov_bulletin_get_forced_mac(struct ecore_hwfn *p_hwfn, u16 rel_vf_id)
 {
struct ecore_vf_info *p_vf;
-- 
1.7.10.3



[dpdk-dev] [PATCH 06/14] net/qede/base: add new chain API

2018-03-31 Thread Rasesh Mody
Add new API ecore_chain_set_cons() and fix page index setting in
ecore_chain_set_prod(). The new API is for future use.

Signed-off-by: Rasesh Mody 
---
 drivers/net/qede/base/ecore_chain.h |   49 ++-
 1 file changed, 48 insertions(+), 1 deletion(-)

diff --git a/drivers/net/qede/base/ecore_chain.h 
b/drivers/net/qede/base/ecore_chain.h
index d8f69ad..f8c932b 100644
--- a/drivers/net/qede/base/ecore_chain.h
+++ b/drivers/net/qede/base/ecore_chain.h
@@ -526,7 +526,7 @@ static OSAL_INLINE void ecore_chain_reset(struct 
ecore_chain *p_chain)
p_chain->p_prod_elem = p_chain->p_virt_addr;
 
if (p_chain->mode == ECORE_CHAIN_MODE_PBL) {
-   /* Use (page_cnt - 1) as a reset value for the prod/cons page's
+   /* Use "page_cnt-1" as a reset value for the prod/cons page's
 * indices, to avoid unnecessary page advancing on the first
 * call to ecore_chain_produce/consume. Instead, the indices
 * will be advanced to page_cnt and then will be wrapped to 0.
@@ -726,6 +726,21 @@ static OSAL_INLINE void *ecore_chain_get_last_elem(struct 
ecore_chain *p_chain)
 static OSAL_INLINE void ecore_chain_set_prod(struct ecore_chain *p_chain,
 u32 prod_idx, void *p_prod_elem)
 {
+   if (p_chain->mode == ECORE_CHAIN_MODE_PBL) {
+   /* Use "prod_idx-1" since ecore_chain_produce() advances the
+* page index before the producer index when getting to
+* "next_page_mask".
+*/
+   u32 elem_idx =
+   (prod_idx - 1 + p_chain->capacity) % p_chain->capacity;
+   u32 page_idx = elem_idx / p_chain->elem_per_page;
+
+   if (is_chain_u16(p_chain))
+   p_chain->pbl.c.u16.prod_page_idx = (u16)page_idx;
+   else
+   p_chain->pbl.c.u32.prod_page_idx = page_idx;
+   }
+
if (is_chain_u16(p_chain))
p_chain->u.chain16.prod_idx = (u16)prod_idx;
else
@@ -734,6 +749,38 @@ static OSAL_INLINE void ecore_chain_set_prod(struct 
ecore_chain *p_chain,
 }
 
 /**
+ * @brief ecore_chain_set_cons - sets the cons to the given value
+ *
+ * @param cons_idx
+ * @param p_cons_elem
+ */
+static OSAL_INLINE void ecore_chain_set_cons(struct ecore_chain *p_chain,
+u32 cons_idx, void *p_cons_elem)
+{
+   if (p_chain->mode == ECORE_CHAIN_MODE_PBL) {
+   /* Use "cons_idx-1" since ecore_chain_consume() advances the
+* page index before the consumer index when getting to
+* "next_page_mask".
+*/
+   u32 elem_idx =
+   (cons_idx - 1 + p_chain->capacity) % p_chain->capacity;
+   u32 page_idx = elem_idx / p_chain->elem_per_page;
+
+   if (is_chain_u16(p_chain))
+   p_chain->pbl.c.u16.cons_page_idx = (u16)page_idx;
+   else
+   p_chain->pbl.c.u32.cons_page_idx = page_idx;
+   }
+
+   if (is_chain_u16(p_chain))
+   p_chain->u.chain16.cons_idx = (u16)cons_idx;
+   else
+   p_chain->u.chain32.cons_idx = cons_idx;
+
+   p_chain->p_cons_elem = p_cons_elem;
+}
+
+/**
  * @brief ecore_chain_pbl_zero_mem - set chain memory to 0
  *
  * @param p_chain
-- 
1.7.10.3



[dpdk-dev] [PATCH 09/14] net/qede/base: refine error handling

2018-03-31 Thread Rasesh Mody
Adjust the verbosity of the log messages and add preventive checks for
errors.

Signed-off-by: Rasesh Mody 
---
 drivers/net/qede/base/ecore_cxt.c |   20 ++--
 drivers/net/qede/base/ecore_dcbx.c|2 +-
 drivers/net/qede/base/ecore_dev.c |  179 -
 drivers/net/qede/base/ecore_dev_api.h |2 +-
 drivers/net/qede/base/ecore_hw.c  |   20 ++--
 drivers/net/qede/base/ecore_int.c |   11 +-
 drivers/net/qede/base/ecore_l2.c  |5 +-
 drivers/net/qede/base/ecore_mcp.c |   21 ++--
 drivers/net/qede/base/ecore_spq.c |   20 ++--
 drivers/net/qede/base/ecore_sriov.c   |5 +-
 10 files changed, 173 insertions(+), 112 deletions(-)

diff --git a/drivers/net/qede/base/ecore_cxt.c 
b/drivers/net/qede/base/ecore_cxt.c
index ca7c55f..389008c 100644
--- a/drivers/net/qede/base/ecore_cxt.c
+++ b/drivers/net/qede/base/ecore_cxt.c
@@ -834,7 +834,7 @@ static enum _ecore_status_t ecore_cxt_src_t2_alloc(struct 
ecore_hwfn *p_hwfn)
 p_mngr->t2_num_pages *
 sizeof(struct ecore_dma_mem));
if (!p_mngr->t2) {
-   DP_NOTICE(p_hwfn, true, "Failed to allocate t2 table\n");
+   DP_NOTICE(p_hwfn, false, "Failed to allocate t2 table\n");
rc = ECORE_NOMEM;
goto t2_fail;
}
@@ -919,6 +919,9 @@ static void ecore_ilt_shadow_free(struct ecore_hwfn *p_hwfn)
struct ecore_cxt_mngr *p_mngr = p_hwfn->p_cxt_mngr;
u32 ilt_size, i;
 
+   if (p_mngr->ilt_shadow == OSAL_NULL)
+   return;
+
ilt_size = ecore_cxt_ilt_shadow_size(p_cli);
 
for (i = 0; p_mngr->ilt_shadow && i < ilt_size; i++) {
@@ -931,6 +934,7 @@ static void ecore_ilt_shadow_free(struct ecore_hwfn *p_hwfn)
p_dma->p_virt = OSAL_NULL;
}
OSAL_FREE(p_hwfn->p_dev, p_mngr->ilt_shadow);
+   p_mngr->ilt_shadow = OSAL_NULL;
 }
 
 static enum _ecore_status_t
@@ -1000,8 +1004,7 @@ static enum _ecore_status_t ecore_ilt_shadow_alloc(struct 
ecore_hwfn *p_hwfn)
 size * sizeof(struct ecore_dma_mem));
 
if (!p_mngr->ilt_shadow) {
-   DP_NOTICE(p_hwfn, true,
- "Failed to allocate ilt shadow table\n");
+   DP_NOTICE(p_hwfn, false, "Failed to allocate ilt shadow 
table\n");
rc = ECORE_NOMEM;
goto ilt_shadow_fail;
}
@@ -1044,12 +1047,14 @@ static void ecore_cid_map_free(struct ecore_hwfn 
*p_hwfn)
 
for (type = 0; type < MAX_CONN_TYPES; type++) {
OSAL_FREE(p_hwfn->p_dev, p_mngr->acquired[type].cid_map);
+   p_mngr->acquired[type].cid_map = OSAL_NULL;
p_mngr->acquired[type].max_count = 0;
p_mngr->acquired[type].start_cid = 0;
 
for (vf = 0; vf < COMMON_MAX_NUM_VFS; vf++) {
OSAL_FREE(p_hwfn->p_dev,
  p_mngr->acquired_vf[type][vf].cid_map);
+   p_mngr->acquired_vf[type][vf].cid_map = OSAL_NULL;
p_mngr->acquired_vf[type][vf].max_count = 0;
p_mngr->acquired_vf[type][vf].start_cid = 0;
}
@@ -1126,8 +1131,7 @@ enum _ecore_status_t ecore_cxt_mngr_alloc(struct 
ecore_hwfn *p_hwfn)
 
p_mngr = OSAL_ZALLOC(p_hwfn->p_dev, GFP_KERNEL, sizeof(*p_mngr));
if (!p_mngr) {
-   DP_NOTICE(p_hwfn, true,
- "Failed to allocate `struct ecore_cxt_mngr'\n");
+   DP_NOTICE(p_hwfn, false, "Failed to allocate `struct 
ecore_cxt_mngr'\n");
return ECORE_NOMEM;
}
 
@@ -1189,21 +1193,21 @@ enum _ecore_status_t ecore_cxt_tables_alloc(struct 
ecore_hwfn *p_hwfn)
/* Allocate the ILT shadow table */
rc = ecore_ilt_shadow_alloc(p_hwfn);
if (rc) {
-   DP_NOTICE(p_hwfn, true, "Failed to allocate ilt memory\n");
+   DP_NOTICE(p_hwfn, false, "Failed to allocate ilt memory\n");
goto tables_alloc_fail;
}
 
/* Allocate the T2  table */
rc = ecore_cxt_src_t2_alloc(p_hwfn);
if (rc) {
-   DP_NOTICE(p_hwfn, true, "Failed to allocate T2 memory\n");
+   DP_NOTICE(p_hwfn, false, "Failed to allocate T2 memory\n");
goto tables_alloc_fail;
}
 
/* Allocate and initialize the acquired cids bitmaps */
rc = ecore_cid_map_alloc(p_hwfn);
if (rc) {
-   DP_NOTICE(p_hwfn, true, "Failed to allocate cid maps\n");
+   DP_NOTICE(p_hwfn, false, "Failed to allocate cid maps\n");
goto tables_alloc_fail;
}
 
diff --git a/drivers/net/qede/base/ecore_dcbx.c 
b/drivers/net/qede/base/ecore_dcbx.c
index 21ddda9..fe9d5c0 100644
--- a/drivers/net/qede/base/ecore_dcbx.c
+++ b/drivers/net/qede/base/ecore_dcbx.c
@@ -910,7 +910,7 @@ enum _ecore_status_t ecore_dc

[dpdk-dev] [PATCH 10/14] net/qede/base: add stats counter for link state

2018-03-31 Thread Rasesh Mody
Add link_change_count counter to track number of link state transitions

Signed-off-by: Rasesh Mody 
---
 drivers/net/qede/base/ecore_dev_api.h |1 +
 drivers/net/qede/base/ecore_l2.c  |   10 +-
 2 files changed, 10 insertions(+), 1 deletion(-)

diff --git a/drivers/net/qede/base/ecore_dev_api.h 
b/drivers/net/qede/base/ecore_dev_api.h
index aee11c0..f619683 100644
--- a/drivers/net/qede/base/ecore_dev_api.h
+++ b/drivers/net/qede/base/ecore_dev_api.h
@@ -377,6 +377,7 @@ struct ecore_eth_stats_common {
u64 tx_mac_mc_packets;
u64 tx_mac_bc_packets;
u64 tx_mac_ctrl_frames;
+   u64 link_change_count;
 };
 
 struct ecore_eth_stats_bb {
diff --git a/drivers/net/qede/base/ecore_l2.c b/drivers/net/qede/base/ecore_l2.c
index bbcbbd0..0883fd3 100644
--- a/drivers/net/qede/base/ecore_l2.c
+++ b/drivers/net/qede/base/ecore_l2.c
@@ -1948,6 +1948,11 @@ static void __ecore_get_vport_port_stats(struct 
ecore_hwfn *p_hwfn,
p_ah->tx_1519_to_max_byte_packets =
port_stats.eth.u1.ah1.t1519_to_max;
}
+
+   p_common->link_change_count = ecore_rd(p_hwfn, p_ptt,
+  p_hwfn->mcp_info->port_addr +
+  OFFSETOF(struct public_port,
+   link_change_count));
 }
 
 void __ecore_get_vport_stats(struct ecore_hwfn *p_hwfn,
@@ -2064,11 +2069,14 @@ void ecore_reset_vport_stats(struct ecore_dev *p_dev)
 
/* PORT statistics are not necessarily reset, so we need to
 * read and create a baseline for future statistics.
+* Link change stat is maintained by MFW, return its value as is.
 */
if (!p_dev->reset_stats)
DP_INFO(p_dev, "Reset stats not allocated\n");
-   else
+   else {
_ecore_get_vport_stats(p_dev, p_dev->reset_stats);
+   p_dev->reset_stats->common.link_change_count = 0;
+   }
 }
 
 void ecore_arfs_mode_configure(struct ecore_hwfn *p_hwfn,
-- 
1.7.10.3



[dpdk-dev] [PATCH 08/14] net/qede/base: add MFW support for driver load timeout

2018-03-31 Thread Rasesh Mody
Add SPQ timeout base driver parameter support management FW timeout values
other than default and none. Have fallback mechanism for old MFWs.
Reduce the defult timeout to 1 sec.

Signed-off-by: Rasesh Mody 
---
 drivers/net/qede/base/ecore_dev.c |   66 +++--
 drivers/net/qede/base/ecore_dev_api.h |   14 +++
 drivers/net/qede/base/ecore_spq.c |   16 +++-
 drivers/net/qede/base/ecore_spq.h |   13 +++
 drivers/net/qede/base/mcp_public.h|2 +
 5 files changed, 97 insertions(+), 14 deletions(-)

diff --git a/drivers/net/qede/base/ecore_dev.c 
b/drivers/net/qede/base/ecore_dev.c
index a3269f4..1b01bba 100644
--- a/drivers/net/qede/base/ecore_dev.c
+++ b/drivers/net/qede/base/ecore_dev.c
@@ -2289,14 +2289,15 @@ static void ecore_reset_mb_shadow(struct ecore_hwfn 
*p_hwfn,
 }
 
 static void ecore_pglueb_clear_err(struct ecore_hwfn *p_hwfn,
-struct ecore_ptt *p_ptt)
+  struct ecore_ptt *p_ptt)
 {
ecore_wr(p_hwfn, p_ptt, PGLUE_B_REG_WAS_ERROR_PF_31_0_CLR,
 1 << p_hwfn->abs_pf_id);
 }
 
-static void
-ecore_fill_load_req_params(struct ecore_load_req_params *p_load_req,
+static enum _ecore_status_t
+ecore_fill_load_req_params(struct ecore_hwfn *p_hwfn,
+  struct ecore_load_req_params *p_load_req,
   struct ecore_drv_load_params *p_drv_load)
 {
/* Make sure that if ecore-client didn't provide inputs, all the
@@ -2308,15 +2309,51 @@ static void ecore_pglueb_clear_err(struct ecore_hwfn 
*p_hwfn,
 
OSAL_MEM_ZERO(p_load_req, sizeof(*p_load_req));
 
-   if (p_drv_load != OSAL_NULL) {
-   p_load_req->drv_role = p_drv_load->is_crash_kernel ?
-  ECORE_DRV_ROLE_KDUMP :
-  ECORE_DRV_ROLE_OS;
+   if (p_drv_load == OSAL_NULL)
+   goto out;
+
+   p_load_req->drv_role = p_drv_load->is_crash_kernel ?
+  ECORE_DRV_ROLE_KDUMP :
+  ECORE_DRV_ROLE_OS;
+   p_load_req->avoid_eng_reset = p_drv_load->avoid_eng_reset;
+   p_load_req->override_force_load = p_drv_load->override_force_load;
+
+   /* Old MFW versions don't support timeout values other than default and
+* none, so these values are replaced according to the fall-back action.
+*/
+
+   if (p_drv_load->mfw_timeout_val == ECORE_LOAD_REQ_LOCK_TO_DEFAULT ||
+   p_drv_load->mfw_timeout_val == ECORE_LOAD_REQ_LOCK_TO_NONE ||
+   (p_hwfn->mcp_info->capabilities &
+FW_MB_PARAM_FEATURE_SUPPORT_DRV_LOAD_TO)) {
p_load_req->timeout_val = p_drv_load->mfw_timeout_val;
-   p_load_req->avoid_eng_reset = p_drv_load->avoid_eng_reset;
-   p_load_req->override_force_load =
-   p_drv_load->override_force_load;
+   goto out;
}
+
+   switch (p_drv_load->mfw_timeout_fallback) {
+   case ECORE_TO_FALLBACK_TO_NONE:
+   p_load_req->timeout_val = ECORE_LOAD_REQ_LOCK_TO_NONE;
+   break;
+   case ECORE_TO_FALLBACK_TO_DEFAULT:
+   p_load_req->timeout_val = ECORE_LOAD_REQ_LOCK_TO_DEFAULT;
+   break;
+   case ECORE_TO_FALLBACK_FAIL_LOAD:
+   DP_NOTICE(p_hwfn, false,
+ "Received %d as a value for MFW timeout while the MFW 
supports only default [%d] or none [%d]. Abort.\n",
+ p_drv_load->mfw_timeout_val,
+ ECORE_LOAD_REQ_LOCK_TO_DEFAULT,
+ ECORE_LOAD_REQ_LOCK_TO_NONE);
+   return ECORE_ABORTED;
+   }
+
+   DP_INFO(p_hwfn,
+   "Modified the MFW timeout value from %d to %s [%d] due to lack 
of MFW support\n",
+   p_drv_load->mfw_timeout_val,
+   (p_load_req->timeout_val == ECORE_LOAD_REQ_LOCK_TO_DEFAULT) ?
+   "default" : "none",
+   p_load_req->timeout_val);
+out:
+   return ECORE_SUCCESS;
 }
 
 enum _ecore_status_t ecore_vf_start(struct ecore_hwfn *p_hwfn,
@@ -2372,8 +2409,13 @@ enum _ecore_status_t ecore_hw_init(struct ecore_dev 
*p_dev,
if (rc != ECORE_SUCCESS)
return rc;
 
-   ecore_fill_load_req_params(&load_req_params,
-  p_params->p_drv_load_params);
+   ecore_set_spq_block_timeout(p_hwfn, p_params->spq_timeout_ms);
+
+   rc = ecore_fill_load_req_params(p_hwfn, &load_req_params,
+   p_params->p_drv_load_params);
+   if (rc != ECORE_SUCCESS)
+   return rc;
+
rc = ecore_mcp_load_req(p_hwfn, p_hwfn->p_main_ptt,
&load_req_params);
if (rc != ECORE_SUCCESS) {
diff --git a/drivers/net/qede/base/ecore

[dpdk-dev] [PATCH 11/14] net/qede/base: add APIs for xcvr

2018-03-31 Thread Rasesh Mody
Add API to query transceiver info and to retrieve link speed.

Signed-off-by: Rasesh Mody 
---
 drivers/net/qede/base/ecore_mcp.c |  199 -
 drivers/net/qede/base/ecore_mcp_api.h |   46 
 drivers/net/qede/base/mcp_public.h|1 +
 3 files changed, 243 insertions(+), 3 deletions(-)

diff --git a/drivers/net/qede/base/ecore_mcp.c 
b/drivers/net/qede/base/ecore_mcp.c
index 0e425aa..c1bfdd1 100644
--- a/drivers/net/qede/base/ecore_mcp.c
+++ b/drivers/net/qede/base/ecore_mcp.c
@@ -9,6 +9,7 @@
 #include "bcm_osal.h"
 #include "ecore.h"
 #include "ecore_status.h"
+#include "nvm_cfg.h"
 #include "ecore_mcp.h"
 #include "mcp_public.h"
 #include "reg_addr.h"
@@ -602,7 +603,7 @@ void ecore_mcp_print_cpu_info(struct ecore_hwfn *p_hwfn,
 
/* MCP not initialized */
if (!ecore_mcp_is_init(p_hwfn)) {
-   DP_NOTICE(p_hwfn, true, "MFW is not initialized !\n");
+   DP_NOTICE(p_hwfn, true, "MFW is not initialized!\n");
return ECORE_BUSY;
}
 
@@ -2130,19 +2131,20 @@ enum _ecore_status_t ecore_mcp_get_media_type(struct 
ecore_hwfn *p_hwfn,
  struct ecore_ptt *p_ptt,
  u32 *p_media_type)
 {
+   enum _ecore_status_t rc = ECORE_SUCCESS;
 
/* TODO - Add support for VFs */
if (IS_VF(p_hwfn->p_dev))
return ECORE_INVAL;
 
if (!ecore_mcp_is_init(p_hwfn)) {
-   DP_NOTICE(p_hwfn, true, "MFW is not initialized !\n");
+   DP_NOTICE(p_hwfn, false, "MFW is not initialized!\n");
return ECORE_BUSY;
}
 
if (!p_ptt) {
*p_media_type = MEDIA_UNSPECIFIED;
-   return ECORE_INVAL;
+   rc = ECORE_INVAL;
} else {
*p_media_type = ecore_rd(p_hwfn, p_ptt,
 p_hwfn->mcp_info->port_addr +
@@ -2153,6 +2155,197 @@ enum _ecore_status_t ecore_mcp_get_media_type(struct 
ecore_hwfn *p_hwfn,
return ECORE_SUCCESS;
 }
 
+enum _ecore_status_t ecore_mcp_get_transceiver_data(struct ecore_hwfn *p_hwfn,
+   struct ecore_ptt *p_ptt,
+   u32 *p_tranceiver_type)
+{
+   enum _ecore_status_t rc = ECORE_SUCCESS;
+
+   /* TODO - Add support for VFs */
+   if (IS_VF(p_hwfn->p_dev))
+   return ECORE_INVAL;
+
+   if (!ecore_mcp_is_init(p_hwfn)) {
+   DP_NOTICE(p_hwfn, false, "MFW is not initialized!\n");
+   return ECORE_BUSY;
+   }
+   if (!p_ptt) {
+   *p_tranceiver_type = ETH_TRANSCEIVER_TYPE_NONE;
+   rc = ECORE_INVAL;
+   } else {
+   *p_tranceiver_type = ecore_rd(p_hwfn, p_ptt,
+   p_hwfn->mcp_info->port_addr +
+   offsetof(struct public_port,
+   transceiver_data));
+   }
+
+   return rc;
+}
+
+static int is_transceiver_ready(u32 transceiver_state, u32 transceiver_type)
+{
+   if ((transceiver_state & ETH_TRANSCEIVER_STATE_PRESENT) &&
+   ((transceiver_state & ETH_TRANSCEIVER_STATE_UPDATING) == 0x0) &&
+   (transceiver_type != ETH_TRANSCEIVER_TYPE_NONE))
+   return 1;
+
+   return 0;
+}
+
+enum _ecore_status_t ecore_mcp_trans_speed_mask(struct ecore_hwfn *p_hwfn,
+   struct ecore_ptt *p_ptt,
+   u32 *p_speed_mask)
+{
+   u32 transceiver_data, transceiver_type, transceiver_state;
+
+   ecore_mcp_get_transceiver_data(p_hwfn, p_ptt, &transceiver_data);
+
+   transceiver_state = GET_MFW_FIELD(transceiver_data,
+   ETH_TRANSCEIVER_STATE);
+
+   transceiver_type = GET_MFW_FIELD(transceiver_data,
+  ETH_TRANSCEIVER_TYPE);
+
+   if (is_transceiver_ready(transceiver_state, transceiver_type) == 0)
+   return ECORE_INVAL;
+
+   switch (transceiver_type) {
+   case ETH_TRANSCEIVER_TYPE_1G_LX:
+   case ETH_TRANSCEIVER_TYPE_1G_SX:
+   case ETH_TRANSCEIVER_TYPE_1G_PCC:
+   case ETH_TRANSCEIVER_TYPE_1G_ACC:
+   case ETH_TRANSCEIVER_TYPE_1000BASET:
+   *p_speed_mask = NVM_CFG1_PORT_DRV_SPEED_CAPABILITY_MASK_1G;
+   break;
+
+   case ETH_TRANSCEIVER_TYPE_10G_SR:
+   case ETH_TRANSCEIVER_TYPE_10G_LR:
+   case ETH_TRANSCEIVER_TYPE_10G_LRM:
+   case ETH_TRANSCEIVER_TYPE_10G_ER:
+   case ETH_TRANSCEIVER_TYPE_10G_PCC:
+   case ETH_TRANSCEIVER_TYPE_10G_ACC:
+   case ETH_TRANSCEIVER_TYPE_4x10G:
+   *p_speed_mask = NVM_CFG1_PORT_DRV_SPEED_CAPABILITY_MASK_10G;
+   break;
+
+   case ETH_TRANSCEIVER_TYPE_40G_LR4:
+   case ETH_TRANSCEIVER_TYPE_40G_SR4:
+   case ETH_TRANSCEIVER_TYPE_MULTI_RATE_10G_40G

[dpdk-dev] [PATCH 14/14] net/qede: update PMD version to 2.8.0.1

2018-03-31 Thread Rasesh Mody
Signed-off-by: Rasesh Mody 
---
 drivers/net/qede/qede_ethdev.h |2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/drivers/net/qede/qede_ethdev.h b/drivers/net/qede/qede_ethdev.h
index baae22d..4737c8f 100644
--- a/drivers/net/qede/qede_ethdev.h
+++ b/drivers/net/qede/qede_ethdev.h
@@ -45,7 +45,7 @@
 /* Driver versions */
 #define QEDE_PMD_VER_PREFIX"QEDE PMD"
 #define QEDE_PMD_VERSION_MAJOR 2
-#define QEDE_PMD_VERSION_MINOR 7
+#define QEDE_PMD_VERSION_MINOR 8
 #define QEDE_PMD_VERSION_REVISION   0
 #define QEDE_PMD_VERSION_PATCH 1
 
-- 
1.7.10.3



[dpdk-dev] [PATCH 12/14] net/qede/base: fix to support OVLAN mode

2018-03-31 Thread Rasesh Mody
This fix allows driver to program NIC configuration to support OVLAN
mode in multi-function scenario

Signed-off-by: Rasesh Mody 
---
 drivers/net/qede/base/ecore.h |6 ++
 drivers/net/qede/base/ecore_dcbx.c|5 +
 drivers/net/qede/base/ecore_dcbx_api.h|1 +
 drivers/net/qede/base/ecore_dev.c |   10 --
 drivers/net/qede/base/ecore_sp_commands.c |   29 -
 5 files changed, 40 insertions(+), 11 deletions(-)

diff --git a/drivers/net/qede/base/ecore.h b/drivers/net/qede/base/ecore.h
index 7c642af..c8e6311 100644
--- a/drivers/net/qede/base/ecore.h
+++ b/drivers/net/qede/base/ecore.h
@@ -536,6 +536,12 @@ enum ecore_mf_mode_bit {
ECORE_MF_UFP_SPECIFIC,
 
ECORE_MF_DISABLE_ARFS,
+
+   /* Use vlan for steering */
+   ECORE_MF_8021Q_TAGGING,
+
+   /* Use stag for steering */
+   ECORE_MF_8021AD_TAGGING,
 };
 
 enum ecore_ufp_mode {
diff --git a/drivers/net/qede/base/ecore_dcbx.c 
b/drivers/net/qede/base/ecore_dcbx.c
index fe9d5c0..93262ee 100644
--- a/drivers/net/qede/base/ecore_dcbx.c
+++ b/drivers/net/qede/base/ecore_dcbx.c
@@ -149,6 +149,10 @@ u8 ecore_dcbx_get_dscp_value(struct ecore_hwfn *p_hwfn, u8 
pri)
}
p_data->arr[type].update = UPDATE_DCB_DSCP;
 
+   /* Do not add valn tag 0 when DCB is enabled and port is in UFP mode */
+   if (OSAL_TEST_BIT(ECORE_MF_UFP_SPECIFIC, &p_hwfn->p_dev->mf_bits))
+   p_data->arr[type].dont_add_vlan0 = true;
+
/* QM reconf data */
if (p_hwfn->hw_info.personality == personality)
p_hwfn->hw_info.offload_tc = tc;
@@ -935,6 +939,7 @@ static void ecore_dcbx_update_protocol_data(struct 
protocol_dcb_data *p_data,
p_data->dcb_tc = p_src->arr[type].tc;
p_data->dscp_enable_flag = p_src->arr[type].dscp_enable;
p_data->dscp_val = p_src->arr[type].dscp_val;
+   p_data->dcb_dont_add_vlan0 = p_src->arr[type].dont_add_vlan0;
 }
 
 /* Set pf update ramrod command params */
diff --git a/drivers/net/qede/base/ecore_dcbx_api.h 
b/drivers/net/qede/base/ecore_dcbx_api.h
index 9ff4df4..4df99ae 100644
--- a/drivers/net/qede/base/ecore_dcbx_api.h
+++ b/drivers/net/qede/base/ecore_dcbx_api.h
@@ -29,6 +29,7 @@ struct ecore_dcbx_app_data {
u8 tc;  /* Traffic Class */
bool dscp_enable;   /* DSCP enabled */
u8 dscp_val;/* DSCP value */
+   bool dont_add_vlan0;/* Do not insert a vlan tag with id 0 */
 };
 
 #ifndef __EXTRACT__LINUX__
diff --git a/drivers/net/qede/base/ecore_dev.c 
b/drivers/net/qede/base/ecore_dev.c
index a85d26d..112f854 100644
--- a/drivers/net/qede/base/ecore_dev.c
+++ b/drivers/net/qede/base/ecore_dev.c
@@ -3588,9 +3588,14 @@ static enum _ecore_status_t ecore_hw_get_resc(struct 
ecore_hwfn *p_hwfn,
break;
case NVM_CFG1_GLOB_MF_MODE_UFP:
p_hwfn->p_dev->mf_bits = 1 << ECORE_MF_OVLAN_CLSS |
-1 << ECORE_MF_UFP_SPECIFIC;
+1 << ECORE_MF_UFP_SPECIFIC |
+1 << ECORE_MF_8021Q_TAGGING;
+   break;
+   case NVM_CFG1_GLOB_MF_MODE_BD:
+   p_hwfn->p_dev->mf_bits = 1 << ECORE_MF_OVLAN_CLSS |
+1 << ECORE_MF_LLH_PROTO_CLSS |
+1 << ECORE_MF_8021AD_TAGGING;
break;
-
case NVM_CFG1_GLOB_MF_MODE_NPAR1_0:
p_hwfn->p_dev->mf_bits = 1 << ECORE_MF_LLH_MAC_CLSS |
 1 << ECORE_MF_LLH_PROTO_CLSS |
@@ -3619,6 +3624,7 @@ static enum _ecore_status_t ecore_hw_get_resc(struct 
ecore_hwfn *p_hwfn,
 */
switch (mf_mode) {
case NVM_CFG1_GLOB_MF_MODE_MF_ALLOWED:
+   case NVM_CFG1_GLOB_MF_MODE_BD:
p_hwfn->p_dev->mf_mode = ECORE_MF_OVLAN;
break;
case NVM_CFG1_GLOB_MF_MODE_NPAR1_0:
diff --git a/drivers/net/qede/base/ecore_sp_commands.c 
b/drivers/net/qede/base/ecore_sp_commands.c
index 7598e7a..83705b8 100644
--- a/drivers/net/qede/base/ecore_sp_commands.c
+++ b/drivers/net/qede/base/ecore_sp_commands.c
@@ -295,6 +295,7 @@ static void ecore_set_hw_tunn_mode_port(struct ecore_hwfn 
*p_hwfn,
 }
 
 #define ETH_P_8021Q 0x8100
+#define ETH_P_8021AD 0x88A8 /* 802.1ad Service VLAN */
 
 enum _ecore_status_t ecore_sp_pf_start(struct ecore_hwfn *p_hwfn,
   struct ecore_ptt *p_ptt,
@@ -308,7 +309,7 @@ enum _ecore_status_t ecore_sp_pf_start(struct ecore_hwfn 
*p_hwfn,
struct ecore_sp_init_data init_data;
enum _ecore_status_t rc = ECORE_NOTIMPL;
u8 page_cnt;
-   int i;
+   u8 i;
 
/* update initial eq producer */
ecore_eq_prod_update(p_hwfn,
@@ -343,18 +344,27 @@ enum _ecore_status_t ecore_sp_pf_start(struct ecore_hwfn 
*p_hwfn,
 
p_ramrod->outer_tag_config.outer_tag.

[dpdk-dev] [PATCH 13/14] net/qede/base: add packet pacing support

2018-03-31 Thread Rasesh Mody
Add packet pacing support for PFs.
ecore client can request for enabling packet pacing at init time,
if requested then ecore is going to skip MCoS and SRIOV configurations.

Signed-off-by: Rasesh Mody 
---
 drivers/net/qede/base/ecore.h |   16 ++-
 drivers/net/qede/base/ecore_dev.c |   47 -
 drivers/net/qede/base/ecore_dev_api.h |3 +++
 drivers/net/qede/base/ecore_l2.c  |   36 ++---
 drivers/net/qede/qede_main.c  |1 +
 5 files changed, 91 insertions(+), 12 deletions(-)

diff --git a/drivers/net/qede/base/ecore.h b/drivers/net/qede/base/ecore.h
index c8e6311..b6541dc 100644
--- a/drivers/net/qede/base/ecore.h
+++ b/drivers/net/qede/base/ecore.h
@@ -41,6 +41,9 @@
((FW_MAJOR_VERSION << 24) | (FW_MINOR_VERSION << 16) |  \
 (FW_REVISION_VERSION << 8) | FW_ENGINEERING_VERSION)
 
+#define IS_ECORE_PACING(p_hwfn)\
+   (!!(p_hwfn->b_en_pacing))
+
 #define MAX_HWFNS_PER_DEVICE   2
 #define NAME_SIZE 128 /* @DPDK */
 #define ECORE_WFQ_UNIT 100
@@ -680,6 +683,13 @@ struct ecore_hwfn {
/* Mechanism for recovering from doorbell drop */
struct ecore_db_recovery_info   db_recovery_info;
 
+   /* Enable/disable pacing, if request to enable then
+* IOV and mcos configuration will be skipped.
+* this actually reflects the value requested in
+* struct ecore_hw_prepare_params by ecore client.
+*/
+   bool b_en_pacing;
+
/* @DPDK */
struct ecore_ptt*p_arfs_ptt;
 };
@@ -932,12 +942,16 @@ void ecore_set_fw_mac_addr(__le16 *fw_msb, __le16 
*fw_mid, __le16 *fw_lsb,
 #define PQ_FLAGS_ACK   (1 << 4)
 #define PQ_FLAGS_OFLD  (1 << 5)
 #define PQ_FLAGS_VFS   (1 << 6)
+#define PQ_FLAGS_LLT   (1 << 7)
 
 /* physical queue index for cm context intialization */
 u16 ecore_get_cm_pq_idx(struct ecore_hwfn *p_hwfn, u32 pq_flags);
 u16 ecore_get_cm_pq_idx_mcos(struct ecore_hwfn *p_hwfn, u8 tc);
 u16 ecore_get_cm_pq_idx_vf(struct ecore_hwfn *p_hwfn, u16 vf);
-u16 ecore_get_cm_pq_idx_rl(struct ecore_hwfn *p_hwfn, u8 qpid);
+u16 ecore_get_cm_pq_idx_rl(struct ecore_hwfn *p_hwfn, u16 rl);
+
+/* qm vport for rate limit configuration */
+u16 ecore_get_qm_vport_idx_rl(struct ecore_hwfn *p_hwfn, u16 rl);
 
 const char *ecore_hw_get_resc_name(enum ecore_resources res_id);
 
diff --git a/drivers/net/qede/base/ecore_dev.c 
b/drivers/net/qede/base/ecore_dev.c
index 112f854..b1e67e2 100644
--- a/drivers/net/qede/base/ecore_dev.c
+++ b/drivers/net/qede/base/ecore_dev.c
@@ -513,11 +513,14 @@ static u32 ecore_get_pq_flags(struct ecore_hwfn *p_hwfn)
/* feature flags */
if (IS_ECORE_SRIOV(p_hwfn->p_dev))
flags |= PQ_FLAGS_VFS;
+   if (IS_ECORE_PACING(p_hwfn))
+   flags |= PQ_FLAGS_RLS;
 
/* protocol flags */
switch (p_hwfn->hw_info.personality) {
case ECORE_PCI_ETH:
-   flags |= PQ_FLAGS_MCOS;
+   if (!IS_ECORE_PACING(p_hwfn))
+   flags |= PQ_FLAGS_MCOS;
break;
case ECORE_PCI_FCOE:
flags |= PQ_FLAGS_OFLD;
@@ -526,11 +529,14 @@ static u32 ecore_get_pq_flags(struct ecore_hwfn *p_hwfn)
flags |= PQ_FLAGS_ACK | PQ_FLAGS_OOO | PQ_FLAGS_OFLD;
break;
case ECORE_PCI_ETH_ROCE:
-   flags |= PQ_FLAGS_MCOS | PQ_FLAGS_OFLD;
+   flags |= PQ_FLAGS_OFLD | PQ_FLAGS_LLT;
+   if (!IS_ECORE_PACING(p_hwfn))
+   flags |= PQ_FLAGS_MCOS;
break;
case ECORE_PCI_ETH_IWARP:
-   flags |= PQ_FLAGS_MCOS | PQ_FLAGS_ACK | PQ_FLAGS_OOO |
-PQ_FLAGS_OFLD;
+   flags |= PQ_FLAGS_ACK | PQ_FLAGS_OOO | PQ_FLAGS_OFLD;
+   if (!IS_ECORE_PACING(p_hwfn))
+   flags |= PQ_FLAGS_MCOS;
break;
default:
DP_ERR(p_hwfn, "unknown personality %d\n",
@@ -837,7 +843,7 @@ u16 ecore_get_cm_pq_idx_vf(struct ecore_hwfn *p_hwfn, u16 
vf)
return ecore_get_cm_pq_idx(p_hwfn, PQ_FLAGS_VFS) + vf;
 }
 
-u16 ecore_get_cm_pq_idx_rl(struct ecore_hwfn *p_hwfn, u8 rl)
+u16 ecore_get_cm_pq_idx_rl(struct ecore_hwfn *p_hwfn, u16 rl)
 {
u16 max_rl = ecore_init_qm_get_num_pf_rls(p_hwfn);
 
@@ -847,6 +853,23 @@ u16 ecore_get_cm_pq_idx_rl(struct ecore_hwfn *p_hwfn, u8 
rl)
return ecore_get_cm_pq_idx(p_hwfn, PQ_FLAGS_RLS) + rl;
 }
 
+u16 ecore_get_qm_vport_idx_rl(struct ecore_hwfn *p_hwfn, u16 rl)
+{
+   u16 start_pq, pq, qm_pq_idx;
+
+   pq = ecore_get_cm_pq_idx_rl(p_hwfn, rl);
+   start_pq = p_hwfn->qm_info.start_pq;
+   qm_pq_idx = pq - start_pq - CM_TX_PQ_BASE;
+
+   if (qm_pq_idx > p_hwfn->qm_info.num_pqs) {
+   DP_ERR(p_hwfn,
+  "qm_pq_idx %d must be smaller than %d\n",
+   qm_pq_idx, p_hwfn->qm_info.num_pqs);
+   }
+
+   retur

[dpdk-dev] [PATCH] net/bnx2x: convert to new Rx offloads API

2018-03-31 Thread Rasesh Mody
From: Harish Patil 

Ethdev RX offloads API has changed since:
commit ce17eddefc20 ("ethdev: introduce Rx queue offloads API")

This patch makes use of DEV_RX_OFFLOAD_JUMBO_FRAME offload flag
to advertise jumbo frame support.

Signed-off-by: Harish Patil 
---
 drivers/net/bnx2x/bnx2x_ethdev.c |5 -
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/drivers/net/bnx2x/bnx2x_ethdev.c b/drivers/net/bnx2x/bnx2x_ethdev.c
index 483d5a1..fada4bd 100644
--- a/drivers/net/bnx2x/bnx2x_ethdev.c
+++ b/drivers/net/bnx2x/bnx2x_ethdev.c
@@ -140,11 +140,13 @@ struct rte_bnx2x_xstats_name_off {
 bnx2x_dev_configure(struct rte_eth_dev *dev)
 {
struct bnx2x_softc *sc = dev->data->dev_private;
+   struct rte_eth_rxmode *rxmode = &dev->data->dev_conf.rxmode;
+
int mp_ncpus = sysconf(_SC_NPROCESSORS_CONF);
 
PMD_INIT_FUNC_TRACE();
 
-   if (dev->data->dev_conf.rxmode.jumbo_frame)
+   if (rxmode & DEV_RX_OFFLOAD_JUMBO_FRAME)
sc->mtu = dev->data->dev_conf.rxmode.max_rx_pkt_len;
 
if (dev->data->nb_tx_queues > dev->data->nb_rx_queues) {
@@ -454,6 +456,7 @@ struct rte_bnx2x_xstats_name_off {
dev_info->max_rx_pktlen  = BNX2X_MAX_RX_PKT_LEN;
dev_info->max_mac_addrs  = BNX2X_MAX_MAC_ADDRS;
dev_info->speed_capa = ETH_LINK_SPEED_10G | ETH_LINK_SPEED_20G;
+   dev_info->rx_offload_capa = DEV_RX_OFFLOAD_JUMBO_FRAME;
 }
 
 static int
-- 
1.7.10.3



Re: [dpdk-dev] [PATCH v6 2/8] ethdev: add switch identifier parameter to port

2018-03-31 Thread Shahaf Shuler


--Shahaf


> -Original Message-
> From: Doherty, Declan [mailto:declan.dohe...@intel.com]
> Sent: Thursday, March 29, 2018 6:13 PM
> To: Shahaf Shuler ; dev@dpdk.org
> Cc: Alex Rosenbaum ; Ferruh Yigit
> ; Thomas Monjalon ; Qi
> Zhang ; Alejandro Lucero
> ; Andrew Rybchenko
> ; Mohammad Abdul Awal
> ; Remy Horton
> ; John McNamara ;
> Rony Efraim ; Jingjing Wu ;
> Wenzhuo Lu ; Vincent Jardin
> ; Yuanhan Liu ; Bruce
> Richardson ; Konstantin Ananyev
> ; Zhihong Wang
> 
> Subject: Re: [dpdk-dev][PATCH v6 2/8] ethdev: add switch identifier
> parameter to port
> 
> On 29/03/2018 11:12 AM, Shahaf Shuler wrote:
> > Thursday, March 29, 2018 12:14 PM, Doherty, Declan:
> >> On 29/03/2018 7:13 AM, Shahaf Shuler wrote:
> >>> Hi Declan,
> >>>
> >>> Thanks for the series! See some comments below
> >>>
> >>> Wednesday, March 28, 2018 4:54 PM, Declan Doherty:
>  Subject: [dpdk-dev][PATCH v6 2/8] ethdev: add switch identifier
>  parameter to port
> 
>  Introduces a new port attribute to ethdev port's which denotes the
>  switch domain a port belongs to. By default all port's switch
>  identifiers are the their port_id. Ports which share a common
>  switch domain are configured with the same switch id.
> 
>  Signed-off-by: Declan Doherty 
>  ---
> app/test-pmd/config.c  | 1 +
> lib/librte_ether/rte_ethdev.c  | 3 +++
> lib/librte_ether/rte_ethdev.h  | 1 +
> lib/librte_ether/rte_ethdev_core.h | 1 +
> 4 files changed, 6 insertions(+)
> 
>  diff --git a/app/test-pmd/config.c b/app/test-pmd/config.c index
>  4bb255c62..e12f8c515 100644
>  --- a/app/test-pmd/config.c
>  +++ b/app/test-pmd/config.c
>  @@ -517,6 +517,7 @@ port_infos_display(portid_t port_id)
>   printf("Min possible number of TXDs per queue: %hu\n",
>   dev_info.tx_desc_lim.nb_min);
>   printf("TXDs number alignment: %hu\n",
>  dev_info.tx_desc_lim.nb_align);
>  +printf("Switch Id: %u\n", dev_info.switch_id);
> }
> 
> void
>  diff --git a/lib/librte_ether/rte_ethdev.c
>  b/lib/librte_ether/rte_ethdev.c index 23857c91f..f32d18cad 100644
>  --- a/lib/librte_ether/rte_ethdev.c
>  +++ b/lib/librte_ether/rte_ethdev.c
>  @@ -290,6 +290,8 @@ rte_eth_dev_allocate(const char *name)
>   eth_dev = eth_dev_get(port_id);
>   snprintf(eth_dev->data->name, sizeof(eth_dev->data->name),
> >> "%s",
>  name);
>   eth_dev->data->port_id = port_id;
>  +eth_dev->data->switch_id = port_id;
>  +/**< Default switch_id is the port_id of the device */
> >>>
> >>> Why such default is needed? Why not let the PMD to set it always?
> >>
> >> I saw this a simple way to have a consistent default value (the
> >> port_id) for all PMDs, without the need to modify existing PMD which
> >> don't currently have any concept of a switch domain.
> >
> > The default value don't makes much sense though. By default it would
> > mean the application each port is on different switch domain. This is
> > obviously not true in case of multiple VFs
> 
> But it is the case today for all ports, that they are assumed to be in 
> separate
> switch domains or at least in unknowable switch domains by applications,
> with the exception of LAG groups, were it is implicit that they are in the 
> same
> domain. Even if two ports were attached to the same switch, or if you where
> using multiple VFs from the same switch there is currently no way of telling
> the application that this is the case. 

Right, but I thought your new parameter is the way :

Uint16_t switch_domain -
"Introduces a new port attribute to ethdev port's which denotes the
switch domain a port belongs to"


What would be the use case for having
> multiple VFs from the same port/switch domain in a single data path
> application. It doesn't seem likely to me that you would use hardware
> switching to move traffic between 2 VFs in the same data path application.

It is not likely. However the parameter you defined is not true only for the 
representor case, but for the generic case (unless you state otherwise in the 
documentation of it).

Maybe it can also use application like VFd to understand the connectivity 
between the different VFs.

My point is - unless this parameter is valid only for the reprsentor case, the 
default value should be the correct one. 
I think it is better to not limit this field to representor only. Extra info 
for application is never a bad thing. 

> 
> If you are using port representors, I assumed that you would set a valid
> switch domain id, possibly picking up the port id of the first port created on
> that switch domain, but it would be completely up to the PMD how this was
> done, I have just shown the simplest model in which the port_id of the PF is
> used for all subsequent representor ports in that switch domain, but if you
> want

Re: [dpdk-dev] [PATCH v6 4/8] ethdev: Add port representor device flag

2018-03-31 Thread Shahaf Shuler
Thursday, March 29, 2018 5:53 PM, Doherty, Declan:
> On 29/03/2018 7:13 AM, Shahaf Shuler wrote:
> > Wednesday, March 28, 2018 4:54 PM, Declan Doherty:
> >> Subject: [dpdk-dev][PATCH v6 4/8] ethdev: Add port representor device
> >> flag
> >>
> >> Add new device flag to specify that ethdev port is a port representor.
> >> Extend rte_eth_dev_info structure to expose device flags to user
> >> which enable applications to discover if a port is a representor port.
> >>
> >> Signed-off-by: Declan Doherty 
> >> ---
> >>   lib/librte_ether/rte_ethdev.c | 1 +
> >>   lib/librte_ether/rte_ethdev.h | 9 ++---
> >>   lib/librte_ether/rte_ethdev_representor.h | 3 +++
> >>   3 files changed, 10 insertions(+), 3 deletions(-)
> >>
> >> diff --git a/lib/librte_ether/rte_ethdev.c
> >> b/lib/librte_ether/rte_ethdev.c index c719f84a3..163246433 100644
> >> --- a/lib/librte_ether/rte_ethdev.c
> >> +++ b/lib/librte_ether/rte_ethdev.c
> >> @@ -2399,6 +2399,7 @@ rte_eth_dev_info_get(uint16_t port_id, struct
> >> rte_eth_dev_info *dev_info)
> >>dev_info->nb_rx_queues = dev->data->nb_rx_queues;
> >>dev_info->nb_tx_queues = dev->data->nb_tx_queues;
> >>dev_info->switch_id = dev->data->switch_id;
> >> +  dev_info->dev_flags = dev->data->dev_flags;
> >>   }
> >>
> >>   int
> >> diff --git a/lib/librte_ether/rte_ethdev.h
> >> b/lib/librte_ether/rte_ethdev.h index dced4fc41..226acc8b1 100644
> >> --- a/lib/librte_ether/rte_ethdev.h
> >> +++ b/lib/librte_ether/rte_ethdev.h
> >> @@ -996,6 +996,7 @@ struct rte_eth_dev_info {
> >>const char *driver_name; /**< Device Driver name. */
> >>unsigned int if_index; /**< Index to bound host interface, or 0 if
> >> none.
> >>Use if_indextoname() to translate into an interface name. */
> >> +  uint32_t dev_flags; /**< Device flags */
> >>uint32_t min_rx_bufsize; /**< Minimum size of RX buffer. */
> >>uint32_t max_rx_pktlen; /**< Maximum configurable length of RX
> >> pkt. */
> >>uint16_t max_rx_queues; /**< Maximum number of RX queues. */
> @@
> >> -1229,11 +1230,13 @@ struct rte_eth_dev_owner {  };
> >>
> >>   /** Device supports link state interrupt */
> >> -#define RTE_ETH_DEV_INTR_LSC 0x0002
> >> +#define RTE_ETH_DEV_INTR_LSC  0x0002
> >>   /** Device is a bonded slave */
> >> -#define RTE_ETH_DEV_BONDED_SLAVE 0x0004
> >> +#define RTE_ETH_DEV_BONDED_SLAVE  0x0004
> >>   /** Device supports device removal interrupt */
> >> -#define RTE_ETH_DEV_INTR_RMV 0x0008
> >> +#define RTE_ETH_DEV_INTR_RMV  0x0008
> >> +/** Device is port representor */
> >> +#define RTE_ETH_DEV_REPRESENTOR   0x0010
> >
> > Maybe it is a good time to make some order here.
> > I understand the decision to use flags instead of bit-field. It is better.
> >
> > However there is a mix here of device capabilities like :
> RTE_ETH_DEV_INTR_LSC   and RTE_ETH_DEV_INTR_RMV
> > And device attributes like : RTE_ETH_DEV_BONDED_SLAVE and
> RTE_ETH_DEV_REPRESENTOR.
> > I don't think they belong together under the genetic name of dev_flags.
> >
> > Moreover, I am not sure the fact device is bonded slave should be exposed
> to the application. It should be internal to ethdev and its port iterators.
> 
> That's a good point on the bonded slave flag, I'll look at fixing that for the
> next release. I don't think changing it should effect ABI but I'll need to 
> have a
> closer look.
> 
> Do you think that we should have a separate device attributes field, which
> the representor flag is contained in.
> 
> >
> > Finally I think representor port may need more info now (and in the
> future), for example the associated vf id.
> > For that, I think it is better it to be exposed as a dedicated struct on 
> > device
> info.
> 
> I think a switch port id should suffice for that, for SR-IOV devices it would
> map to the vf_id.

I think we need both switch_domain and vf_id. 
Because for representors, the application should know which VFs can be reached 
from this representor and which VF it represent. 

> 
> >
> >>
> >>   /**
> >>* @warning
> >> diff --git a/lib/librte_ether/rte_ethdev_representor.h
> >> b/lib/librte_ether/rte_ethdev_representor.h
> >> index cbc1f2855..f3726d0ba 100644
> >> --- a/lib/librte_ether/rte_ethdev_representor.h
> >> +++ b/lib/librte_ether/rte_ethdev_representor.h
> >> @@ -22,6 +22,9 @@ eth_dev_representor_port_init(struct rte_eth_dev
> >> *ethdev, void *init_params)
> >>/** representor inherits the switch id of it's base device */
> >>ethdev->data->switch_id = base_ethdev->data->switch_id;
> >>
> >> +  /** Set device flags to specify that device is a representor port */
> >> +  ethdev->data->dev_flags |= RTE_ETH_DEV_REPRESENTOR;
> >
> > Should be set in the PMD, not in ethdev layer
> 
> As in the previous patch this is just a generic port bus init function which
> meets the simplest use case of representor port with a single switch domain,
> a PMD doesn't need to use it but having it here saves duplicating th