xref: /linux/drivers/vfio/pci/mlx5/cmd.h (revision ab93e0dd72c37d378dd936f031ffb83ff2bd87ce)
1f1d98f34SYishai Hadas /* SPDX-License-Identifier: GPL-2.0 OR Linux-OpenIB */
2f1d98f34SYishai Hadas /*
3f1d98f34SYishai Hadas  * Copyright (c) 2021-2022, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
4f1d98f34SYishai Hadas  */
5f1d98f34SYishai Hadas 
6f1d98f34SYishai Hadas #ifndef MLX5_VFIO_CMD_H
7f1d98f34SYishai Hadas #define MLX5_VFIO_CMD_H
8f1d98f34SYishai Hadas 
9f1d98f34SYishai Hadas #include <linux/kernel.h>
1061a2f146SYishai Hadas #include <linux/vfio_pci_core.h>
11f1d98f34SYishai Hadas #include <linux/mlx5/driver.h>
12caf094b5SShay Drory #include <linux/mlx5/vport.h>
1379c3cf27SYishai Hadas #include <linux/mlx5/cq.h>
1479c3cf27SYishai Hadas #include <linux/mlx5/qp.h>
15f1d98f34SYishai Hadas 
/*
 * State of a migration file; held in mlx5_vf_migration_file.state.
 * Numbering starts at 1 and the remaining values follow sequentially.
 */
168b599d14SYishai Hadas enum mlx5_vf_migf_state {
178b599d14SYishai Hadas 	MLX5_MIGF_STATE_ERROR = 1,
18d6e18a4bSShay Drory 	MLX5_MIGF_STATE_PRE_COPY_ERROR,
1981156c27SYishai Hadas 	MLX5_MIGF_STATE_PRE_COPY,
209114100dSYishai Hadas 	MLX5_MIGF_STATE_SAVE_STOP_COPY_CHUNK,
21c6688783SYishai Hadas 	MLX5_MIGF_STATE_COMPLETE,
228b599d14SYishai Hadas };
238b599d14SYishai Hadas 
/*
 * Load-side state of a migration file; held in
 * mlx5_vf_migration_file.load_state.
 * NOTE(review): the enumerator order presumably mirrors the order in which
 * an incoming record is consumed (header, header data, image) - confirm
 * against the load path.
 */
2434e2f271SYishai Hadas enum mlx5_vf_load_state {
2534e2f271SYishai Hadas 	MLX5_VF_LOAD_STATE_READ_HEADER,
26f4f0c25eSYishai Hadas 	MLX5_VF_LOAD_STATE_PREP_HEADER_DATA,
27f4f0c25eSYishai Hadas 	MLX5_VF_LOAD_STATE_READ_HEADER_DATA,
2834e2f271SYishai Hadas 	MLX5_VF_LOAD_STATE_PREP_IMAGE,
2934e2f271SYishai Hadas 	MLX5_VF_LOAD_STATE_READ_IMAGE,
3034e2f271SYishai Hadas 	MLX5_VF_LOAD_STATE_LOAD_IMAGE,
3134e2f271SYishai Hadas };
3234e2f271SYishai Hadas 
/*
 * Record payload carrying one little-endian 64-bit size.
 * NOTE(review): presumably the data of a record tagged
 * MLX5_MIGF_HEADER_TAG_STOP_COPY_SIZE - confirm against the users.
 */
33b04e2e86SYishai Hadas struct mlx5_vf_migration_tag_stop_copy_data {
34b04e2e86SYishai Hadas 	__le64 stop_copy_size;
35b04e2e86SYishai Hadas };
36b04e2e86SYishai Hadas 
/* Values for the flags field of struct mlx5_vf_migration_header. */
37b04e2e86SYishai Hadas enum mlx5_vf_migf_header_flags {
38b04e2e86SYishai Hadas 	MLX5_MIGF_HEADER_FLAGS_TAG_MANDATORY = 0,
39b04e2e86SYishai Hadas 	MLX5_MIGF_HEADER_FLAGS_TAG_OPTIONAL = 1 << 0,
40b04e2e86SYishai Hadas };
41b04e2e86SYishai Hadas 
/* Values for the tag field of struct mlx5_vf_migration_header. */
42b04e2e86SYishai Hadas enum mlx5_vf_migf_header_tag {
43b04e2e86SYishai Hadas 	MLX5_MIGF_HEADER_TAG_FW_DATA = 0,
44b04e2e86SYishai Hadas 	MLX5_MIGF_HEADER_TAG_STOP_COPY_SIZE = 1 << 0,
45b04e2e86SYishai Hadas };
46b04e2e86SYishai Hadas 
/*
 * Record header: three little-endian scalar fields followed by a flexible
 * data[] array whose length is carried in record_size.
 */
470c9a38feSYishai Hadas struct mlx5_vf_migration_header {
48b04e2e86SYishai Hadas 	__le64 record_size;
490c9a38feSYishai Hadas 	/* For future use in case we may need to change the kernel protocol */
50b04e2e86SYishai Hadas 	__le32 flags; /* Use mlx5_vf_migf_header_flags */
51b04e2e86SYishai Hadas 	__le32 tag; /* Use mlx5_vf_migf_header_tag */
52b04e2e86SYishai Hadas 	__u8 data[]; /* Its size is given in the record_size */
530c9a38feSYishai Hadas };
540c9a38feSYishai Hadas 
/*
 * A data buffer tied to a migration file through the migf back-pointer.
 * page_list is indexed by page number and bounded by npages
 * (see mlx5vf_get_migration_page()).
 */
5591454f8bSYishai Hadas struct mlx5_vhca_data_buffer {
56*089803c4SLeon Romanovsky 	struct page **page_list;
57*089803c4SLeon Romanovsky 	struct dma_iova_state state;
	/* NOTE(review): start_pos/length look like a byte window - confirm */
5891454f8bSYishai Hadas 	loff_t start_pos;
5991454f8bSYishai Hadas 	u64 length;
60674ebb64SLeon Romanovsky 	u32 npages;
6191454f8bSYishai Hadas 	u32 mkey;
62ac6c973aSLeon Romanovsky 	u32 *mkey_in;
6391454f8bSYishai Hadas 	enum dma_data_direction dma_dir;
645798e4ddSYishai Hadas 	u8 stop_copy_chunk_num;
	/* NOTE(review): presumably links into a list of the migration file - confirm */
65c6688783SYishai Hadas 	struct list_head buf_elm;
6691454f8bSYishai Hadas 	struct mlx5_vf_migration_file *migf;
6791454f8bSYishai Hadas };
6891454f8bSYishai Hadas 
/*
 * Context for an asynchronous command: an mlx5 async work item, a regular
 * work item, the data and header buffers involved, a status and an output
 * pointer. One instance is embedded in struct mlx5_vf_migration_file.
 */
6985c205dbSYishai Hadas struct mlx5vf_async_data {
7085c205dbSYishai Hadas 	struct mlx5_async_work cb_work;
7185c205dbSYishai Hadas 	struct work_struct work;
72c6688783SYishai Hadas 	struct mlx5_vhca_data_buffer *buf;
730c9a38feSYishai Hadas 	struct mlx5_vhca_data_buffer *header_buf;
7485c205dbSYishai Hadas 	int status;
759114100dSYishai Hadas 	u8 stop_copy_chunk:1;
7685c205dbSYishai Hadas 	void *out;
7785c205dbSYishai Hadas };
7885c205dbSYishai Hadas 
/*
 * Per-chunk save work item. struct mlx5_vf_migration_file holds an array of
 * MAX_NUM_CHUNKS of these (save_data[]).
 */
7967135f29SYishai Hadas struct mlx5vf_save_work_data {
8067135f29SYishai Hadas 	struct mlx5_vf_migration_file *migf;
8167135f29SYishai Hadas 	size_t next_required_umem_size;
8267135f29SYishai Hadas 	struct work_struct work;
8367135f29SYishai Hadas 	u8 chunk_num;
8467135f29SYishai Hadas };
8567135f29SYishai Hadas 
/* Number of elements in the buf[], buf_header[] and save_data[] arrays below. */
865798e4ddSYishai Hadas #define MAX_NUM_CHUNKS 2
875798e4ddSYishai Hadas 
/*
 * Migration file object: the backing struct file, a mutex, the save/load
 * state, per-chunk buffers and work items, buffer lists with their spinlock,
 * and the embedded async command context.
 */
88f1d98f34SYishai Hadas struct mlx5_vf_migration_file {
89f1d98f34SYishai Hadas 	struct file *filp;
90f1d98f34SYishai Hadas 	struct mutex lock;
918b599d14SYishai Hadas 	enum mlx5_vf_migf_state state;
92f1d98f34SYishai Hadas 
9334e2f271SYishai Hadas 	enum mlx5_vf_load_state load_state;
949945a67eSYishai Hadas 	u32 pdn;
953319d287SYishai Hadas 	loff_t max_pos;
96f4f0c25eSYishai Hadas 	u64 record_size;
97f4f0c25eSYishai Hadas 	u32 record_tag;
98f4f0c25eSYishai Hadas 	u64 stop_copy_prep_size;
99b04e2e86SYishai Hadas 	u64 pre_copy_initial_bytes;
10067135f29SYishai Hadas 	size_t next_required_umem_size;
10167135f29SYishai Hadas 	u8 num_ready_chunks;
1025798e4ddSYishai Hadas 	/* Upon chunk mode preserve another set of buffers for stop_copy phase */
1035798e4ddSYishai Hadas 	struct mlx5_vhca_data_buffer *buf[MAX_NUM_CHUNKS];
1045798e4ddSYishai Hadas 	struct mlx5_vhca_data_buffer *buf_header[MAX_NUM_CHUNKS];
10567135f29SYishai Hadas 	struct mlx5vf_save_work_data save_data[MAX_NUM_CHUNKS];
	/* NOTE(review): list_lock presumably guards buf_list/avail_list - confirm */
106c6688783SYishai Hadas 	spinlock_t list_lock;
107c6688783SYishai Hadas 	struct list_head buf_list;
1083319d287SYishai Hadas 	struct list_head avail_list;
10985c205dbSYishai Hadas 	struct mlx5vf_pci_core_device *mvdev;
11085c205dbSYishai Hadas 	wait_queue_head_t poll_wait;
1110e7caa65SYishai Hadas 	struct completion save_comp;
11285c205dbSYishai Hadas 	struct mlx5_async_ctx async_ctx;
11385c205dbSYishai Hadas 	struct mlx5vf_async_data async_data;
114f1d98f34SYishai Hadas };
115f1d98f34SYishai Hadas 
/*
 * Completion queue buffer: an mlx5 fragmented buffer with its control
 * structure, plus the CQE size and entry count.
 */
11679c3cf27SYishai Hadas struct mlx5_vhca_cq_buf {
11779c3cf27SYishai Hadas 	struct mlx5_frag_buf_ctrl fbc;
11879c3cf27SYishai Hadas 	struct mlx5_frag_buf frag_buf;
11979c3cf27SYishai Hadas 	int cqe_size;
12079c3cf27SYishai Hadas 	int nent;
12179c3cf27SYishai Hadas };
12279c3cf27SYishai Hadas 
/*
 * Completion queue: its buffer, doorbell record, the mlx5 core CQ object
 * and a CQE count. Embedded in struct mlx5_vhca_page_tracker.
 */
12379c3cf27SYishai Hadas struct mlx5_vhca_cq {
12479c3cf27SYishai Hadas 	struct mlx5_vhca_cq_buf buf;
12579c3cf27SYishai Hadas 	struct mlx5_db db;
12679c3cf27SYishai Hadas 	struct mlx5_core_cq mcq;
12779c3cf27SYishai Hadas 	size_t ncqe;
12879c3cf27SYishai Hadas };
12979c3cf27SYishai Hadas 
/*
 * Receive buffer of a QP: a page array with its count, DMA IOVA state,
 * the mkey and its creation input, and the next receive-queue offset.
 */
13079c3cf27SYishai Hadas struct mlx5_vhca_recv_buf {
13179c3cf27SYishai Hadas 	u32 npages;
13279c3cf27SYishai Hadas 	struct page **page_list;
133*089803c4SLeon Romanovsky 	struct dma_iova_state state;
13479c3cf27SYishai Hadas 	u32 next_rq_offset;
135ac6c973aSLeon Romanovsky 	u32 *mkey_in;
13679c3cf27SYishai Hadas 	u32 mkey;
13779c3cf27SYishai Hadas };
13879c3cf27SYishai Hadas 
/*
 * Queue pair used by the page tracker (struct mlx5_vhca_page_tracker holds
 * a host_qp and a fw_qp of this type).
 */
13979c3cf27SYishai Hadas struct mlx5_vhca_qp {
14079c3cf27SYishai Hadas 	struct mlx5_frag_buf buf;
14179c3cf27SYishai Hadas 	struct mlx5_db db;
14279c3cf27SYishai Hadas 	struct mlx5_vhca_recv_buf recv_buf;
14379c3cf27SYishai Hadas 	u32 tracked_page_size;
14479c3cf27SYishai Hadas 	u32 max_msg_size;
14579c3cf27SYishai Hadas 	u32 qpn;
	/* Receive queue bookkeeping */
14679c3cf27SYishai Hadas 	struct {
		/* NOTE(review): pc/cc presumably producer/consumer counters - confirm */
14779c3cf27SYishai Hadas 		unsigned int pc;
14879c3cf27SYishai Hadas 		unsigned int cc;
14979c3cf27SYishai Hadas 		unsigned int wqe_cnt;
15079c3cf27SYishai Hadas 		__be32 *db;
15179c3cf27SYishai Hadas 		struct mlx5_frag_buf_ctrl fbc;
15279c3cf27SYishai Hadas 	} rq;
15379c3cf27SYishai Hadas };
15479c3cf27SYishai Hadas 
/*
 * Page tracker state: identifiers, two one-bit flags, the UAR page, the
 * completion queue, host and firmware QPs, an mlx5 notifier block and a
 * status. Embedded in struct mlx5vf_pci_core_device as 'tracker'.
 */
15579c3cf27SYishai Hadas struct mlx5_vhca_page_tracker {
156c1d050b0SYishai Hadas 	u32 id;
15779c3cf27SYishai Hadas 	u32 pdn;
158e2957387SYishai Hadas 	u8 is_err:1;
159f8864730SYishai Hadas 	u8 object_changed:1;
16079c3cf27SYishai Hadas 	struct mlx5_uars_page *uar;
16179c3cf27SYishai Hadas 	struct mlx5_vhca_cq cq;
16279c3cf27SYishai Hadas 	struct mlx5_vhca_qp *host_qp;
16379c3cf27SYishai Hadas 	struct mlx5_vhca_qp *fw_qp;
164e2957387SYishai Hadas 	struct mlx5_nb nb;
1651047797eSYishai Hadas 	int status;
16679c3cf27SYishai Hadas };
16779c3cf27SYishai Hadas 
/*
 * Per-device driver state. The vfio_pci_core_device is embedded as the
 * first member; the rest holds VF/VHCA identifiers, one-bit capability and
 * status flags, migration state with its locks, the current resuming and
 * saving migration files, the page tracker and the mlx5 core device.
 */
16861a2f146SYishai Hadas struct mlx5vf_pci_core_device {
16961a2f146SYishai Hadas 	struct vfio_pci_core_device core_device;
17061a2f146SYishai Hadas 	int vf_id;
17161a2f146SYishai Hadas 	u16 vhca_id;
17261a2f146SYishai Hadas 	u8 migrate_cap:1;
17361a2f146SYishai Hadas 	u8 deferred_reset:1;
17461a2f146SYishai Hadas 	u8 mdev_detach:1;
17579c3cf27SYishai Hadas 	u8 log_active:1;
176543640afSYishai Hadas 	u8 chunk_mode:1;
1771047797eSYishai Hadas 	struct completion tracker_comp;
17861a2f146SYishai Hadas 	/* protect migration state */
17961a2f146SYishai Hadas 	struct mutex state_mutex;
18061a2f146SYishai Hadas 	enum vfio_device_mig_state mig_state;
18161a2f146SYishai Hadas 	/* protect the reset_done flow */
18261a2f146SYishai Hadas 	spinlock_t reset_lock;
18361a2f146SYishai Hadas 	struct mlx5_vf_migration_file *resuming_migf;
18461a2f146SYishai Hadas 	struct mlx5_vf_migration_file *saving_migf;
18579c3cf27SYishai Hadas 	struct mlx5_vhca_page_tracker tracker;
18685c205dbSYishai Hadas 	struct workqueue_struct *cb_wq;
18761a2f146SYishai Hadas 	struct notifier_block nb;
18861a2f146SYishai Hadas 	struct mlx5_core_dev *mdev;
18961a2f146SYishai Hadas };
19061a2f146SYishai Hadas 
/*
 * Single-bit flags (bits 0..2).
 * NOTE(review): presumably OR-ed into the query_flags argument of
 * mlx5vf_cmd_query_vhca_migration_state() - confirm against the callers.
 */
1913319d287SYishai Hadas enum {
1923319d287SYishai Hadas 	MLX5VF_QUERY_INC = (1UL << 0),
193d6e18a4bSShay Drory 	MLX5VF_QUERY_FINAL = (1UL << 1),
1946de04224SYishai Hadas 	MLX5VF_QUERY_CLEANUP = (1UL << 2),
1953319d287SYishai Hadas };
1963319d287SYishai Hadas 
/*
 * Device command helpers and data-buffer management. Only declared here;
 * the definitions live outside this header.
 */
1978580ad14SYishai Hadas int mlx5vf_cmd_suspend_vhca(struct mlx5vf_pci_core_device *mvdev, u16 op_mod);
1988580ad14SYishai Hadas int mlx5vf_cmd_resume_vhca(struct mlx5vf_pci_core_device *mvdev, u16 op_mod);
/* Results are written through the state_size and total_size pointers. */
1998580ad14SYishai Hadas int mlx5vf_cmd_query_vhca_migration_state(struct mlx5vf_pci_core_device *mvdev,
200543640afSYishai Hadas 					  size_t *state_size, u64 *total_size,
201543640afSYishai Hadas 					  u8 query_flags);
2026e97eba8SYishai Hadas void mlx5vf_cmd_set_migratable(struct mlx5vf_pci_core_device *mvdev,
203f39856aaSYishai Hadas 			       const struct vfio_migration_ops *mig_ops,
204f39856aaSYishai Hadas 			       const struct vfio_log_ops *log_ops);
20561a2f146SYishai Hadas void mlx5vf_cmd_remove_migratable(struct mlx5vf_pci_core_device *mvdev);
2062b1c1906SYishai Hadas void mlx5vf_cmd_close_migratable(struct mlx5vf_pci_core_device *mvdev);
2078580ad14SYishai Hadas int mlx5vf_cmd_save_vhca_state(struct mlx5vf_pci_core_device *mvdev,
20891454f8bSYishai Hadas 			       struct mlx5_vf_migration_file *migf,
2093319d287SYishai Hadas 			       struct mlx5_vhca_data_buffer *buf, bool inc,
2103319d287SYishai Hadas 			       bool track);
2118580ad14SYishai Hadas int mlx5vf_cmd_load_vhca_state(struct mlx5vf_pci_core_device *mvdev,
21291454f8bSYishai Hadas 			       struct mlx5_vf_migration_file *migf,
21391454f8bSYishai Hadas 			       struct mlx5_vhca_data_buffer *buf);
2149945a67eSYishai Hadas int mlx5vf_cmd_alloc_pd(struct mlx5_vf_migration_file *migf);
2159945a67eSYishai Hadas void mlx5vf_cmd_dealloc_pd(struct mlx5_vf_migration_file *migf);
/*
 * NOTE(review): this name is spelled "mlx5fv", unlike the "mlx5vf" prefix
 * used by every other function declared here. Renaming would have to be
 * done together with the definition and all callers.
 */
2169945a67eSYishai Hadas void mlx5fv_cmd_clean_migf_resources(struct mlx5_vf_migration_file *migf);
/* alloc/free and get/put are declared as pairs; both makers take a page count. */
21791454f8bSYishai Hadas struct mlx5_vhca_data_buffer *
218674ebb64SLeon Romanovsky mlx5vf_alloc_data_buffer(struct mlx5_vf_migration_file *migf, u32 npages,
219674ebb64SLeon Romanovsky 			 enum dma_data_direction dma_dir);
22091454f8bSYishai Hadas void mlx5vf_free_data_buffer(struct mlx5_vhca_data_buffer *buf);
2213319d287SYishai Hadas struct mlx5_vhca_data_buffer *
222674ebb64SLeon Romanovsky mlx5vf_get_data_buffer(struct mlx5_vf_migration_file *migf, u32 npages,
223674ebb64SLeon Romanovsky 		       enum dma_data_direction dma_dir);
2243319d287SYishai Hadas void mlx5vf_put_data_buffer(struct mlx5_vhca_data_buffer *buf);
225*089803c4SLeon Romanovsky static inline struct page *
mlx5vf_get_migration_page(struct mlx5_vhca_data_buffer * buf,unsigned long offset)226*089803c4SLeon Romanovsky mlx5vf_get_migration_page(struct mlx5_vhca_data_buffer *buf,
227*089803c4SLeon Romanovsky 			  unsigned long offset)
228*089803c4SLeon Romanovsky {
229*089803c4SLeon Romanovsky 	int page_entry = offset / PAGE_SIZE;
230*089803c4SLeon Romanovsky 
231*089803c4SLeon Romanovsky 	if (page_entry >= buf->npages)
232*089803c4SLeon Romanovsky 		return NULL;
233*089803c4SLeon Romanovsky 
234*089803c4SLeon Romanovsky 	return buf->page_list[page_entry];
235*089803c4SLeon Romanovsky }
/*
 * State handling, migration-file work and page-tracker entry points. Only
 * declared here; the definitions live outside this header.
 */
23661a2f146SYishai Hadas void mlx5vf_state_mutex_unlock(struct mlx5vf_pci_core_device *mvdev);
/* last_save_state is a pointer; NOTE(review): presumably an output - confirm */
2376de04224SYishai Hadas void mlx5vf_disable_fds(struct mlx5vf_pci_core_device *mvdev,
2386de04224SYishai Hadas 			enum mlx5_vf_migf_state *last_save_state);
23985c205dbSYishai Hadas void mlx5vf_mig_file_cleanup_cb(struct work_struct *_work);
24067135f29SYishai Hadas void mlx5vf_mig_file_set_save_work(struct mlx5_vf_migration_file *migf,
24167135f29SYishai Hadas 				   u8 chunk_num, size_t next_required_umem_size);
24279c3cf27SYishai Hadas int mlx5vf_start_page_tracker(struct vfio_device *vdev,
24379c3cf27SYishai Hadas 		struct rb_root_cached *ranges, u32 nnodes, u64 *page_size);
24479c3cf27SYishai Hadas int mlx5vf_stop_page_tracker(struct vfio_device *vdev);
2451047797eSYishai Hadas int mlx5vf_tracker_read_and_clear(struct vfio_device *vdev, unsigned long iova,
2461047797eSYishai Hadas 			unsigned long length, struct iova_bitmap *dirty);
247f1d98f34SYishai Hadas #endif /* MLX5_VFIO_CMD_H */
248