1// SPDX-License-Identifier: GPL-2.0-or-later
2/*
3 * RDMA Network Block Driver
4 *
5 * Copyright (c) 2014 - 2018 ProfitBricks GmbH. All rights reserved.
6 * Copyright (c) 2018 - 2019 1&1 IONOS Cloud GmbH. All rights reserved.
7 * Copyright (c) 2019 - 2020 1&1 IONOS SE. All rights reserved.
8 */
9#undef pr_fmt
10#define pr_fmt(fmt) KBUILD_MODNAME " L" __stringify(__LINE__) ": " fmt
11
12#include <linux/module.h>
13#include <linux/blkdev.h>
14
15#include "rnbd-srv.h"
16#include "rnbd-srv-trace.h"
17
18MODULE_DESCRIPTION("RDMA Network Block Device Server");
19MODULE_LICENSE("GPL");
20
21static u16 port_nr = RTRS_PORT;
22
23module_param_named(port_nr, port_nr, ushort, 0444);
24MODULE_PARM_DESC(port_nr,
25		 "The port number the server is listening on (default: "
26		 __stringify(RTRS_PORT)")");
27
28#define DEFAULT_DEV_SEARCH_PATH "/"
29
30static char dev_search_path[PATH_MAX] = DEFAULT_DEV_SEARCH_PATH;
31
32static int dev_search_path_set(const char *val, const struct kernel_param *kp)
33{
34	const char *p = strrchr(val, '\n') ? : val + strlen(val);
35
36	if (strlen(val) >= sizeof(dev_search_path))
37		return -EINVAL;
38
39	snprintf(dev_search_path, sizeof(dev_search_path), "%.*s",
40		 (int)(p - val), val);
41
42	pr_info("dev_search_path changed to '%s'\n", dev_search_path);
43
44	return 0;
45}
46
47static struct kparam_string dev_search_path_kparam_str = {
48	.maxlen	= sizeof(dev_search_path),
49	.string	= dev_search_path
50};
51
52static const struct kernel_param_ops dev_search_path_ops = {
53	.set	= dev_search_path_set,
54	.get	= param_get_string,
55};
56
57module_param_cb(dev_search_path, &dev_search_path_ops,
58		&dev_search_path_kparam_str, 0444);
59MODULE_PARM_DESC(dev_search_path,
60		 "Sets the dev_search_path. When a device is mapped this path is prepended to the device path from the map device operation.  If %SESSNAME% is specified in a path, then device will be searched in a session namespace. (default: "
61		 DEFAULT_DEV_SEARCH_PATH ")");
62
/* All sessions created by create_sess(); sess_lock is held around updates. */
static DEFINE_MUTEX(sess_lock);
static LIST_HEAD(sess_list);

/* All exported rnbd_srv_dev objects; dev_lock is held around accesses. */
static DEFINE_SPINLOCK(dev_lock);
static LIST_HEAD(dev_list);
68
/*
 * Per-request context: allocated in process_rdma(), stored in
 * bio->bi_private and freed in rnbd_dev_bi_end_io().
 */
struct rnbd_io_private {
	/* RTRS operation handle, passed to rtrs_srv_resp_rdma() on completion */
	struct rtrs_srv_op		*id;
	/* session device whose reference is dropped on completion */
	struct rnbd_srv_sess_dev	*sess_dev;
};
73
74static void rnbd_sess_dev_release(struct kref *kref)
75{
76	struct rnbd_srv_sess_dev *sess_dev;
77
78	sess_dev = container_of(kref, struct rnbd_srv_sess_dev, kref);
79	complete(sess_dev->destroy_comp);
80}
81
82static inline void rnbd_put_sess_dev(struct rnbd_srv_sess_dev *sess_dev)
83{
84	kref_put(&sess_dev->kref, rnbd_sess_dev_release);
85}
86
87static struct rnbd_srv_sess_dev *
88rnbd_get_sess_dev(int dev_id, struct rnbd_srv_session *srv_sess)
89{
90	struct rnbd_srv_sess_dev *sess_dev;
91	int ret = 0;
92
93	rcu_read_lock();
94	sess_dev = xa_load(&srv_sess->index_idr, dev_id);
95	if (sess_dev)
96		ret = kref_get_unless_zero(&sess_dev->kref);
97	rcu_read_unlock();
98
99	if (!ret)
100		return ERR_PTR(-ENXIO);
101
102	return sess_dev;
103}
104
105static void rnbd_dev_bi_end_io(struct bio *bio)
106{
107	struct rnbd_io_private *rnbd_priv = bio->bi_private;
108	struct rnbd_srv_sess_dev *sess_dev = rnbd_priv->sess_dev;
109
110	rnbd_put_sess_dev(sess_dev);
111	rtrs_srv_resp_rdma(rnbd_priv->id, blk_status_to_errno(bio->bi_status));
112
113	kfree(rnbd_priv);
114	bio_put(bio);
115}
116
117static int process_rdma(struct rnbd_srv_session *srv_sess,
118			struct rtrs_srv_op *id, void *data, u32 datalen,
119			const void *usr, size_t usrlen)
120{
121	const struct rnbd_msg_io *msg = usr;
122	struct rnbd_io_private *priv;
123	struct rnbd_srv_sess_dev *sess_dev;
124	u32 dev_id;
125	int err;
126	struct bio *bio;
127	short prio;
128
129	trace_process_rdma(srv_sess, msg, id, datalen, usrlen);
130
131	priv = kmalloc(sizeof(*priv), GFP_KERNEL);
132	if (!priv)
133		return -ENOMEM;
134
135	dev_id = le32_to_cpu(msg->device_id);
136
137	sess_dev = rnbd_get_sess_dev(dev_id, srv_sess);
138	if (IS_ERR(sess_dev)) {
139		pr_err_ratelimited("Got I/O request on session %s for unknown device id %d: %pe\n",
140				   srv_sess->sessname, dev_id, sess_dev);
141		err = -ENOTCONN;
142		goto err;
143	}
144
145	priv->sess_dev = sess_dev;
146	priv->id = id;
147
148	bio = bio_alloc(file_bdev(sess_dev->bdev_file), 1,
149			rnbd_to_bio_flags(le32_to_cpu(msg->rw)), GFP_KERNEL);
150	if (bio_add_page(bio, virt_to_page(data), datalen,
151			offset_in_page(data)) != datalen) {
152		rnbd_srv_err(sess_dev, "Failed to map data to bio\n");
153		err = -EINVAL;
154		goto bio_put;
155	}
156
157	bio->bi_end_io = rnbd_dev_bi_end_io;
158	bio->bi_private = priv;
159	bio->bi_iter.bi_sector = le64_to_cpu(msg->sector);
160	bio->bi_iter.bi_size = le32_to_cpu(msg->bi_size);
161	prio = srv_sess->ver < RNBD_PROTO_VER_MAJOR ||
162	       usrlen < sizeof(*msg) ? 0 : le16_to_cpu(msg->prio);
163	bio_set_prio(bio, prio);
164
165	submit_bio(bio);
166
167	return 0;
168
169bio_put:
170	bio_put(bio);
171	rnbd_put_sess_dev(sess_dev);
172err:
173	kfree(priv);
174	return err;
175}
176
177static void destroy_device(struct kref *kref)
178{
179	struct rnbd_srv_dev *dev = container_of(kref, struct rnbd_srv_dev, kref);
180
181	WARN_ONCE(!list_empty(&dev->sess_dev_list),
182		  "Device %s is being destroyed but still in use!\n",
183		  dev->name);
184
185	spin_lock(&dev_lock);
186	list_del(&dev->list);
187	spin_unlock(&dev_lock);
188
189	mutex_destroy(&dev->lock);
190	if (dev->dev_kobj.state_in_sysfs)
191		/*
192		 * Destroy kobj only if it was really created.
193		 */
194		rnbd_srv_destroy_dev_sysfs(dev);
195	else
196		kfree(dev);
197}
198
199static void rnbd_put_srv_dev(struct rnbd_srv_dev *dev)
200{
201	kref_put(&dev->kref, destroy_device);
202}
203
204void rnbd_destroy_sess_dev(struct rnbd_srv_sess_dev *sess_dev, bool keep_id)
205{
206	DECLARE_COMPLETION_ONSTACK(dc);
207
208	if (keep_id)
209		/* free the resources for the id but don't  */
210		/* allow to re-use the id itself because it */
211		/* is still used by the client              */
212		xa_cmpxchg(&sess_dev->sess->index_idr, sess_dev->device_id,
213			   sess_dev, NULL, 0);
214	else
215		xa_erase(&sess_dev->sess->index_idr, sess_dev->device_id);
216	synchronize_rcu();
217
218	sess_dev->destroy_comp = &dc;
219	rnbd_put_sess_dev(sess_dev);
220	wait_for_completion(&dc); /* wait for inflights to drop to zero */
221
222	fput(sess_dev->bdev_file);
223	mutex_lock(&sess_dev->dev->lock);
224	list_del(&sess_dev->dev_list);
225	if (!sess_dev->readonly)
226		sess_dev->dev->open_write_cnt--;
227	mutex_unlock(&sess_dev->dev->lock);
228
229	rnbd_put_srv_dev(sess_dev->dev);
230
231	rnbd_srv_info(sess_dev, "Device closed\n");
232	kfree(sess_dev);
233}
234
235static void destroy_sess(struct rnbd_srv_session *srv_sess)
236{
237	struct rnbd_srv_sess_dev *sess_dev;
238	unsigned long index;
239
240	if (xa_empty(&srv_sess->index_idr))
241		goto out;
242
243	trace_destroy_sess(srv_sess);
244
245	mutex_lock(&srv_sess->lock);
246	xa_for_each(&srv_sess->index_idr, index, sess_dev)
247		rnbd_srv_destroy_dev_session_sysfs(sess_dev);
248	mutex_unlock(&srv_sess->lock);
249
250out:
251	xa_destroy(&srv_sess->index_idr);
252
253	pr_info("RTRS Session %s disconnected\n", srv_sess->sessname);
254
255	mutex_lock(&sess_lock);
256	list_del(&srv_sess->list);
257	mutex_unlock(&sess_lock);
258
259	mutex_destroy(&srv_sess->lock);
260	kfree(srv_sess);
261}
262
263static int create_sess(struct rtrs_srv_sess *rtrs)
264{
265	struct rnbd_srv_session *srv_sess;
266	char pathname[NAME_MAX];
267	int err;
268
269	err = rtrs_srv_get_path_name(rtrs, pathname, sizeof(pathname));
270	if (err) {
271		pr_err("rtrs_srv_get_path_name(%s): %d\n", pathname, err);
272
273		return err;
274	}
275	srv_sess = kzalloc(sizeof(*srv_sess), GFP_KERNEL);
276	if (!srv_sess)
277		return -ENOMEM;
278
279	srv_sess->queue_depth = rtrs_srv_get_queue_depth(rtrs);
280	xa_init_flags(&srv_sess->index_idr, XA_FLAGS_ALLOC);
281	mutex_init(&srv_sess->lock);
282	mutex_lock(&sess_lock);
283	list_add(&srv_sess->list, &sess_list);
284	mutex_unlock(&sess_lock);
285
286	srv_sess->rtrs = rtrs;
287	strscpy(srv_sess->sessname, pathname, sizeof(srv_sess->sessname));
288
289	rtrs_srv_set_sess_priv(rtrs, srv_sess);
290
291	trace_create_sess(srv_sess);
292
293	return 0;
294}
295
296static int rnbd_srv_link_ev(struct rtrs_srv_sess *rtrs,
297			     enum rtrs_srv_link_ev ev, void *priv)
298{
299	struct rnbd_srv_session *srv_sess = priv;
300
301	switch (ev) {
302	case RTRS_SRV_LINK_EV_CONNECTED:
303		return create_sess(rtrs);
304
305	case RTRS_SRV_LINK_EV_DISCONNECTED:
306		if (WARN_ON_ONCE(!srv_sess))
307			return -EINVAL;
308
309		destroy_sess(srv_sess);
310		return 0;
311
312	default:
313		pr_warn("Received unknown RTRS session event %d from session %s\n",
314			ev, srv_sess->sessname);
315		return -EINVAL;
316	}
317}
318
319void rnbd_srv_sess_dev_force_close(struct rnbd_srv_sess_dev *sess_dev,
320				   struct kobj_attribute *attr)
321{
322	struct rnbd_srv_session	*sess = sess_dev->sess;
323
324	/* It is already started to close by client's close message. */
325	if (!mutex_trylock(&sess->lock))
326		return;
327
328	sess_dev->keep_id = true;
329	/* first remove sysfs itself to avoid deadlock */
330	sysfs_remove_file_self(&sess_dev->kobj, &attr->attr);
331	rnbd_srv_destroy_dev_session_sysfs(sess_dev);
332	mutex_unlock(&sess->lock);
333}
334
335static void process_msg_close(struct rnbd_srv_session *srv_sess,
336			     void *data, size_t datalen, const void *usr,
337			     size_t usrlen)
338{
339	const struct rnbd_msg_close *close_msg = usr;
340	struct rnbd_srv_sess_dev *sess_dev;
341
342	trace_process_msg_close(srv_sess, close_msg);
343
344	sess_dev = rnbd_get_sess_dev(le32_to_cpu(close_msg->device_id),
345				      srv_sess);
346	if (IS_ERR(sess_dev))
347		return;
348
349	rnbd_put_sess_dev(sess_dev);
350	mutex_lock(&srv_sess->lock);
351	rnbd_srv_destroy_dev_session_sysfs(sess_dev);
352	mutex_unlock(&srv_sess->lock);
353}
354
355static int process_msg_open(struct rnbd_srv_session *srv_sess,
356			    const void *msg, size_t len,
357			    void *data, size_t datalen);
358
359static void process_msg_sess_info(struct rnbd_srv_session *srv_sess,
360				 const void *msg, size_t len,
361				 void *data, size_t datalen);
362
363static int rnbd_srv_rdma_ev(void *priv, struct rtrs_srv_op *id,
364			    void *data, size_t datalen,
365			    const void *usr, size_t usrlen)
366{
367	struct rnbd_srv_session *srv_sess = priv;
368	const struct rnbd_msg_hdr *hdr = usr;
369	int ret = 0;
370	u16 type;
371
372	if (WARN_ON_ONCE(!srv_sess))
373		return -ENODEV;
374
375	type = le16_to_cpu(hdr->type);
376
377	switch (type) {
378	case RNBD_MSG_IO:
379		return process_rdma(srv_sess, id, data, datalen, usr, usrlen);
380	case RNBD_MSG_CLOSE:
381		process_msg_close(srv_sess, data, datalen, usr, usrlen);
382		break;
383	case RNBD_MSG_OPEN:
384		ret = process_msg_open(srv_sess, usr, usrlen, data, datalen);
385		break;
386	case RNBD_MSG_SESS_INFO:
387		process_msg_sess_info(srv_sess, usr, usrlen, data, datalen);
388		break;
389	default:
390		pr_warn("Received unexpected message type %d from session %s\n",
391			type, srv_sess->sessname);
392		return -EINVAL;
393	}
394
395	/*
396	 * Since ret is passed to rtrs to handle the failure case, we
397	 * just return 0 at the end otherwise callers in rtrs would call
398	 * send_io_resp_imm again to print redundant err message.
399	 */
400	rtrs_srv_resp_rdma(id, ret);
401	return 0;
402}
403
404static struct rnbd_srv_sess_dev
405*rnbd_sess_dev_alloc(struct rnbd_srv_session *srv_sess)
406{
407	struct rnbd_srv_sess_dev *sess_dev;
408	int error;
409
410	sess_dev = kzalloc(sizeof(*sess_dev), GFP_KERNEL);
411	if (!sess_dev)
412		return ERR_PTR(-ENOMEM);
413
414	error = xa_alloc(&srv_sess->index_idr, &sess_dev->device_id, sess_dev,
415			 xa_limit_32b, GFP_NOWAIT);
416	if (error < 0) {
417		pr_warn("Allocating idr failed, err: %d\n", error);
418		kfree(sess_dev);
419		return ERR_PTR(error);
420	}
421
422	return sess_dev;
423}
424
425static struct rnbd_srv_dev *rnbd_srv_init_srv_dev(struct block_device *bdev)
426{
427	struct rnbd_srv_dev *dev;
428
429	dev = kzalloc(sizeof(*dev), GFP_KERNEL);
430	if (!dev)
431		return ERR_PTR(-ENOMEM);
432
433	snprintf(dev->name, sizeof(dev->name), "%pg", bdev);
434	kref_init(&dev->kref);
435	INIT_LIST_HEAD(&dev->sess_dev_list);
436	mutex_init(&dev->lock);
437
438	return dev;
439}
440
441static struct rnbd_srv_dev *
442rnbd_srv_find_or_add_srv_dev(struct rnbd_srv_dev *new_dev)
443{
444	struct rnbd_srv_dev *dev;
445
446	spin_lock(&dev_lock);
447	list_for_each_entry(dev, &dev_list, list) {
448		if (!strncmp(dev->name, new_dev->name, sizeof(dev->name))) {
449			if (!kref_get_unless_zero(&dev->kref))
450				/*
451				 * We lost the race, device is almost dead.
452				 *  Continue traversing to find a valid one.
453				 */
454				continue;
455			spin_unlock(&dev_lock);
456			return dev;
457		}
458	}
459	list_add(&new_dev->list, &dev_list);
460	spin_unlock(&dev_lock);
461
462	return new_dev;
463}
464
465static int rnbd_srv_check_update_open_perm(struct rnbd_srv_dev *srv_dev,
466					    struct rnbd_srv_session *srv_sess,
467					    enum rnbd_access_mode access_mode)
468{
469	int ret = 0;
470
471	mutex_lock(&srv_dev->lock);
472
473	switch (access_mode) {
474	case RNBD_ACCESS_RO:
475		break;
476	case RNBD_ACCESS_RW:
477		if (srv_dev->open_write_cnt == 0)  {
478			srv_dev->open_write_cnt++;
479		} else {
480			pr_err("Mapping device '%s' for session %s with RW permissions failed. Device already opened as 'RW' by %d client(s), access mode %s.\n",
481			       srv_dev->name, srv_sess->sessname,
482			       srv_dev->open_write_cnt,
483			       rnbd_access_modes[access_mode].str);
484			ret = -EPERM;
485		}
486		break;
487	case RNBD_ACCESS_MIGRATION:
488		if (srv_dev->open_write_cnt < 2) {
489			srv_dev->open_write_cnt++;
490		} else {
491			pr_err("Mapping device '%s' for session %s with migration permissions failed. Device already opened as 'RW' by %d client(s), access mode %s.\n",
492			       srv_dev->name, srv_sess->sessname,
493			       srv_dev->open_write_cnt,
494			       rnbd_access_modes[access_mode].str);
495			ret = -EPERM;
496		}
497		break;
498	default:
499		pr_err("Received mapping request for device '%s' on session %s with invalid access mode: %d\n",
500		       srv_dev->name, srv_sess->sessname, access_mode);
501		ret = -EINVAL;
502	}
503
504	mutex_unlock(&srv_dev->lock);
505
506	return ret;
507}
508
509static struct rnbd_srv_dev *
510rnbd_srv_get_or_create_srv_dev(struct block_device *bdev,
511				struct rnbd_srv_session *srv_sess,
512				enum rnbd_access_mode access_mode)
513{
514	int ret;
515	struct rnbd_srv_dev *new_dev, *dev;
516
517	new_dev = rnbd_srv_init_srv_dev(bdev);
518	if (IS_ERR(new_dev))
519		return new_dev;
520
521	dev = rnbd_srv_find_or_add_srv_dev(new_dev);
522	if (dev != new_dev)
523		kfree(new_dev);
524
525	ret = rnbd_srv_check_update_open_perm(dev, srv_sess, access_mode);
526	if (ret) {
527		rnbd_put_srv_dev(dev);
528		return ERR_PTR(ret);
529	}
530
531	return dev;
532}
533
534static void rnbd_srv_fill_msg_open_rsp(struct rnbd_msg_open_rsp *rsp,
535					struct rnbd_srv_sess_dev *sess_dev)
536{
537	struct block_device *bdev = file_bdev(sess_dev->bdev_file);
538
539	rsp->hdr.type = cpu_to_le16(RNBD_MSG_OPEN_RSP);
540	rsp->device_id = cpu_to_le32(sess_dev->device_id);
541	rsp->nsectors = cpu_to_le64(bdev_nr_sectors(bdev));
542	rsp->logical_block_size	= cpu_to_le16(bdev_logical_block_size(bdev));
543	rsp->physical_block_size = cpu_to_le16(bdev_physical_block_size(bdev));
544	rsp->max_segments = cpu_to_le16(bdev_max_segments(bdev));
545	rsp->max_hw_sectors =
546		cpu_to_le32(queue_max_hw_sectors(bdev_get_queue(bdev)));
547	rsp->max_write_zeroes_sectors =
548		cpu_to_le32(bdev_write_zeroes_sectors(bdev));
549	rsp->max_discard_sectors = cpu_to_le32(bdev_max_discard_sectors(bdev));
550	rsp->discard_granularity = cpu_to_le32(bdev_discard_granularity(bdev));
551	rsp->discard_alignment = cpu_to_le32(bdev_discard_alignment(bdev));
552	rsp->secure_discard = cpu_to_le16(bdev_max_secure_erase_sectors(bdev));
553	rsp->cache_policy = 0;
554	if (bdev_write_cache(bdev))
555		rsp->cache_policy |= RNBD_WRITEBACK;
556	if (bdev_fua(bdev))
557		rsp->cache_policy |= RNBD_FUA;
558}
559
560static struct rnbd_srv_sess_dev *
561rnbd_srv_create_set_sess_dev(struct rnbd_srv_session *srv_sess,
562			      const struct rnbd_msg_open *open_msg,
563			      struct file *bdev_file, bool readonly,
564			      struct rnbd_srv_dev *srv_dev)
565{
566	struct rnbd_srv_sess_dev *sdev = rnbd_sess_dev_alloc(srv_sess);
567
568	if (IS_ERR(sdev))
569		return sdev;
570
571	kref_init(&sdev->kref);
572
573	strscpy(sdev->pathname, open_msg->dev_name, sizeof(sdev->pathname));
574
575	sdev->bdev_file		= bdev_file;
576	sdev->sess		= srv_sess;
577	sdev->dev		= srv_dev;
578	sdev->readonly		= readonly;
579	sdev->access_mode	= open_msg->access_mode;
580
581	return sdev;
582}
583
584static char *rnbd_srv_get_full_path(struct rnbd_srv_session *srv_sess,
585				     const char *dev_name)
586{
587	char *full_path;
588	char *a, *b;
589	int len;
590
591	full_path = kmalloc(PATH_MAX, GFP_KERNEL);
592	if (!full_path)
593		return ERR_PTR(-ENOMEM);
594
595	/*
596	 * Replace %SESSNAME% with a real session name in order to
597	 * create device namespace.
598	 */
599	a = strnstr(dev_search_path, "%SESSNAME%", sizeof(dev_search_path));
600	if (a) {
601		len = a - dev_search_path;
602
603		len = snprintf(full_path, PATH_MAX, "%.*s/%s/%s", len,
604			       dev_search_path, srv_sess->sessname, dev_name);
605	} else {
606		len = snprintf(full_path, PATH_MAX, "%s/%s",
607			       dev_search_path, dev_name);
608	}
609	if (len >= PATH_MAX) {
610		pr_err("Too long path: %s, %s, %s\n",
611		       dev_search_path, srv_sess->sessname, dev_name);
612		kfree(full_path);
613		return ERR_PTR(-EINVAL);
614	}
615
616	/* eliminitate duplicated slashes */
617	a = strchr(full_path, '/');
618	b = a;
619	while (*b != '\0') {
620		if (*b == '/' && *a == '/') {
621			b++;
622		} else {
623			a++;
624			*a = *b;
625			b++;
626		}
627	}
628	a++;
629	*a = '\0';
630
631	return full_path;
632}
633
634static void process_msg_sess_info(struct rnbd_srv_session *srv_sess,
635				 const void *msg, size_t len,
636				 void *data, size_t datalen)
637{
638	const struct rnbd_msg_sess_info *sess_info_msg = msg;
639	struct rnbd_msg_sess_info_rsp *rsp = data;
640
641	srv_sess->ver = min_t(u8, sess_info_msg->ver, RNBD_PROTO_VER_MAJOR);
642
643	trace_process_msg_sess_info(srv_sess, sess_info_msg);
644
645	rsp->hdr.type = cpu_to_le16(RNBD_MSG_SESS_INFO_RSP);
646	rsp->ver = srv_sess->ver;
647}
648
649/**
650 * find_srv_sess_dev() - a dev is already opened by this name
651 * @srv_sess:	the session to search.
652 * @dev_name:	string containing the name of the device.
653 *
654 * Return struct rnbd_srv_sess_dev if srv_sess already opened the dev_name
655 * NULL if the session didn't open the device yet.
656 */
657static struct rnbd_srv_sess_dev *
658find_srv_sess_dev(struct rnbd_srv_session *srv_sess, const char *dev_name)
659{
660	struct rnbd_srv_sess_dev *sess_dev;
661	unsigned long index;
662
663	if (xa_empty(&srv_sess->index_idr))
664		return NULL;
665
666	xa_for_each(&srv_sess->index_idr, index, sess_dev)
667		if (!strcmp(sess_dev->pathname, dev_name))
668			return sess_dev;
669
670	return NULL;
671}
672
673static int process_msg_open(struct rnbd_srv_session *srv_sess,
674			    const void *msg, size_t len,
675			    void *data, size_t datalen)
676{
677	int ret;
678	struct rnbd_srv_dev *srv_dev;
679	struct rnbd_srv_sess_dev *srv_sess_dev;
680	const struct rnbd_msg_open *open_msg = msg;
681	struct file *bdev_file;
682	blk_mode_t open_flags = BLK_OPEN_READ;
683	char *full_path;
684	struct rnbd_msg_open_rsp *rsp = data;
685
686	trace_process_msg_open(srv_sess, open_msg);
687
688	if (open_msg->access_mode != RNBD_ACCESS_RO)
689		open_flags |= BLK_OPEN_WRITE;
690
691	mutex_lock(&srv_sess->lock);
692
693	srv_sess_dev = find_srv_sess_dev(srv_sess, open_msg->dev_name);
694	if (srv_sess_dev)
695		goto fill_response;
696
697	if ((strlen(dev_search_path) + strlen(open_msg->dev_name))
698	    >= PATH_MAX) {
699		pr_err("Opening device for session %s failed, device path too long. '%s/%s' is longer than PATH_MAX (%d)\n",
700		       srv_sess->sessname, dev_search_path, open_msg->dev_name,
701		       PATH_MAX);
702		ret = -EINVAL;
703		goto reject;
704	}
705	if (strstr(open_msg->dev_name, "..")) {
706		pr_err("Opening device for session %s failed, device path %s contains relative path ..\n",
707		       srv_sess->sessname, open_msg->dev_name);
708		ret = -EINVAL;
709		goto reject;
710	}
711	full_path = rnbd_srv_get_full_path(srv_sess, open_msg->dev_name);
712	if (IS_ERR(full_path)) {
713		ret = PTR_ERR(full_path);
714		pr_err("Opening device '%s' for client %s failed, failed to get device full path, err: %pe\n",
715		       open_msg->dev_name, srv_sess->sessname, full_path);
716		goto reject;
717	}
718
719	bdev_file = bdev_file_open_by_path(full_path, open_flags, NULL, NULL);
720	if (IS_ERR(bdev_file)) {
721		ret = PTR_ERR(bdev_file);
722		pr_err("Opening device '%s' on session %s failed, failed to open the block device, err: %pe\n",
723		       full_path, srv_sess->sessname, bdev_file);
724		goto free_path;
725	}
726
727	srv_dev = rnbd_srv_get_or_create_srv_dev(file_bdev(bdev_file), srv_sess,
728						  open_msg->access_mode);
729	if (IS_ERR(srv_dev)) {
730		pr_err("Opening device '%s' on session %s failed, creating srv_dev failed, err: %pe\n",
731		       full_path, srv_sess->sessname, srv_dev);
732		ret = PTR_ERR(srv_dev);
733		goto blkdev_put;
734	}
735
736	srv_sess_dev = rnbd_srv_create_set_sess_dev(srv_sess, open_msg,
737				bdev_file,
738				open_msg->access_mode == RNBD_ACCESS_RO,
739				srv_dev);
740	if (IS_ERR(srv_sess_dev)) {
741		pr_err("Opening device '%s' on session %s failed, creating sess_dev failed, err: %pe\n",
742		       full_path, srv_sess->sessname, srv_sess_dev);
743		ret = PTR_ERR(srv_sess_dev);
744		goto srv_dev_put;
745	}
746
747	/* Create the srv_dev sysfs files if they haven't been created yet. The
748	 * reason to delay the creation is not to create the sysfs files before
749	 * we are sure the device can be opened.
750	 */
751	mutex_lock(&srv_dev->lock);
752	if (!srv_dev->dev_kobj.state_in_sysfs) {
753		ret = rnbd_srv_create_dev_sysfs(srv_dev, file_bdev(bdev_file));
754		if (ret) {
755			mutex_unlock(&srv_dev->lock);
756			rnbd_srv_err(srv_sess_dev,
757				      "Opening device failed, failed to create device sysfs files, err: %d\n",
758				      ret);
759			goto free_srv_sess_dev;
760		}
761	}
762
763	ret = rnbd_srv_create_dev_session_sysfs(srv_sess_dev);
764	if (ret) {
765		mutex_unlock(&srv_dev->lock);
766		rnbd_srv_err(srv_sess_dev,
767			      "Opening device failed, failed to create dev client sysfs files, err: %d\n",
768			      ret);
769		goto free_srv_sess_dev;
770	}
771
772	list_add(&srv_sess_dev->dev_list, &srv_dev->sess_dev_list);
773	mutex_unlock(&srv_dev->lock);
774
775	rnbd_srv_info(srv_sess_dev, "Opened device '%s'\n", srv_dev->name);
776
777	kfree(full_path);
778
779fill_response:
780	rnbd_srv_fill_msg_open_rsp(rsp, srv_sess_dev);
781	mutex_unlock(&srv_sess->lock);
782	return 0;
783
784free_srv_sess_dev:
785	xa_erase(&srv_sess->index_idr, srv_sess_dev->device_id);
786	synchronize_rcu();
787	kfree(srv_sess_dev);
788srv_dev_put:
789	if (open_msg->access_mode != RNBD_ACCESS_RO) {
790		mutex_lock(&srv_dev->lock);
791		srv_dev->open_write_cnt--;
792		mutex_unlock(&srv_dev->lock);
793	}
794	rnbd_put_srv_dev(srv_dev);
795blkdev_put:
796	fput(bdev_file);
797free_path:
798	kfree(full_path);
799reject:
800	mutex_unlock(&srv_sess->lock);
801	return ret;
802}
803
804static struct rtrs_srv_ctx *rtrs_ctx;
805
806static struct rtrs_srv_ops rtrs_ops;
807static int __init rnbd_srv_init_module(void)
808{
809	int err = 0;
810
811	BUILD_BUG_ON(sizeof(struct rnbd_msg_hdr) != 4);
812	BUILD_BUG_ON(sizeof(struct rnbd_msg_sess_info) != 36);
813	BUILD_BUG_ON(sizeof(struct rnbd_msg_sess_info_rsp) != 36);
814	BUILD_BUG_ON(sizeof(struct rnbd_msg_open) != 264);
815	BUILD_BUG_ON(sizeof(struct rnbd_msg_close) != 8);
816	BUILD_BUG_ON(sizeof(struct rnbd_msg_open_rsp) != 56);
817	rtrs_ops = (struct rtrs_srv_ops) {
818		.rdma_ev = rnbd_srv_rdma_ev,
819		.link_ev = rnbd_srv_link_ev,
820	};
821	rtrs_ctx = rtrs_srv_open(&rtrs_ops, port_nr);
822	if (IS_ERR(rtrs_ctx)) {
823		pr_err("rtrs_srv_open(), err: %pe\n", rtrs_ctx);
824		return PTR_ERR(rtrs_ctx);
825	}
826
827	err = rnbd_srv_create_sysfs_files();
828	if (err) {
829		pr_err("rnbd_srv_create_sysfs_files(), err: %d\n", err);
830		rtrs_srv_close(rtrs_ctx);
831	}
832
833	return err;
834}
835
836static void __exit rnbd_srv_cleanup_module(void)
837{
838	rtrs_srv_close(rtrs_ctx);
839	WARN_ON(!list_empty(&sess_list));
840	rnbd_srv_destroy_sysfs_files();
841}
842
843module_init(rnbd_srv_init_module);
844module_exit(rnbd_srv_cleanup_module);
845