summaryrefslogblamecommitdiffstats
path: root/src/kernel/block.c
blob: 4eb52c55ff04c2ffe9b7732fa603811297d77ee6 (plain) (tree)
1
2
3
4
5
6
7
8






                            
                     


                  
                         
 
                                                                                                                                   
 






                                                   























                                                                              
 

                                          


                                    
                                                                        



















































































































































































                                                                                                                              
                 










                                        





                                                                           
























                                                           


















































































































































                                                                                                                             
/*
 * block.c
 *
 *  Created on: Jun 26, 2019
 *      Author: fred
 */

#include <net/sock.h>

#include "dnbd3.h"
#include "block.h"
#include "clientconfig.h"

/*
 * Create a kernel socket in the initial network namespace.
 * The dnbd3 host type selects the address family: HOST_IP4 maps to AF_INET,
 * every other value maps to AF_INET6.
 */
#define dnbd3_sock_create(af, type, proto, sock) \
	sock_create_kern(&init_net, \
			 ((af) == HOST_IP4) ? AF_INET : AF_INET6, \
			 type, proto, sock)

/*
 * Reset a struct msghdr for use with kernel_sendmsg()/kernel_recvmsg():
 * no address, no control data, and flags set to MSG_WAITALL | MSG_NOSIGNAL.
 * The argument is parenthesized so that any lvalue expression (for example
 * a dereferenced pointer) can be passed, not only a plain variable name.
 */
#define init_msghdr(h) do { \
		(h).msg_name = NULL; \
		(h).msg_namelen = 0; \
		(h).msg_control = NULL; \
		(h).msg_controllen = 0; \
		(h).msg_flags = MSG_WAITALL | MSG_NOSIGNAL; \
	} while (0)

/*
 * Block device "open" callback.
 * Only logs the minor number of the device being opened and reports success.
 */
static int dnbd3_open(struct block_device *bdev, fmode_t mode)
{
	/* TODO: check whether this callback can be removed */
	const dnbd3_device_t *device = bdev->bd_disk->private_data;

	printk(KERN_DEBUG "dnbd3: open device %i\n", device->minor);

	return 0;
}

/*
 * Block device "release" callback.
 * Only logs the minor number of the device being released.
 */
static void dnbd3_release(struct gendisk *disk, fmode_t mode)
{
	/* TODO: check whether this callback can be removed */
	const dnbd3_device_t *device = disk->private_data;

	printk(KERN_DEBUG "dnbd3: release device %i\n", device->minor);
}


/*
 * Placeholder for failing all outstanding requests of a device.
 * At present it only emits a debug message with the device's minor number.
 */
void dnbd3_blk_fail_all_requests(dnbd3_device_t *dev)
{
	printk(KERN_DEBUG "dnbd3: fail all requests device %i\n",
	       dev->minor);
}



/**
 * dnbd3_net_connect - connect a device to its currently selected server
 * @dev: device to connect; cur_server.host, imgname and rid must be set
 *
 * If the device has no pre-established socket (dev->better_sock), a new TCP
 * socket is created, connected to dev->cur_server.host, and a
 * CMD_SELECT_IMAGE handshake is performed.  The reply is validated
 * (protocol version, image name, revision id, size >= 4096) and only then
 * committed to the device (imgname, rid, reported_size, disk capacity).
 * If dev->better_sock is set, that socket is adopted instead and no
 * handshake is done here.
 *
 * dev->imgname is only replaced/reallocated once every check has passed, so
 * on failure the pointer the caller stored in dev->imgname is still the one
 * it owns.
 *
 * On any failure the device socket (if any) is released and
 * cur_server.host.type/port are reset to 0.  Note that this also applies to
 * the "already connected" case.
 *
 * Return: 0 on success, -1 on failure.
 */
int dnbd3_net_connect(dnbd3_device_t *dev)
{
	struct timeval timeout;

	printk(KERN_DEBUG "dnbd3: net connect device %i\n", dev->minor);

	if (dev->disconnecting) {
		printk(KERN_DEBUG "dnbd3: device still disconnecting\n");
		while (dev->disconnecting)
			schedule();
	}
	if (dev->request) {
		printk(KERN_DEBUG "dnbd3: device still in request\n");
		/*
		 * NOTE(review): this waits on dev->disconnecting although the
		 * branch tests dev->request; looks like a copy-paste slip, but
		 * it is unclear who clears dev->request - confirm before
		 * changing the loop condition.
		 */
		while (dev->disconnecting)
			schedule();
	}

	timeout.tv_sec = SOCKET_TIMEOUT_CLIENT_DATA;
	timeout.tv_usec = 0;

	// do some checks before connecting
	if (dev->cur_server.host.port == 0 || dev->cur_server.host.type == 0 || dev->imgname == NULL ) {
		printk(KERN_ERR "dnbd3: host, port or image name not set\n");
		goto error;
	}
	if (dev->sock) {
		printk(KERN_WARNING "dnbd3: already connected\n");
		goto error;
	}

	if (dev->cur_server.host.type != HOST_IP4 && dev->cur_server.host.type != HOST_IP6) {
		printk(KERN_ERR "dnbd3: unknown address type %d\n", (int)dev->cur_server.host.type);
		goto error;
	}

	if (dev->better_sock == NULL ) {
		//  no established connection yet from discovery thread, start new one
		dnbd3_request_t dnbd3_request;
		dnbd3_reply_t dnbd3_reply;
		struct msghdr msg;
		struct kvec iov[2];
		uint64_t reported_size;
		uint16_t rid;
		char *name;
		char *grown;
		int mlen;
		init_msghdr(msg);

		if (dnbd3_sock_create(dev->cur_server.host.type, SOCK_STREAM, IPPROTO_TCP, &dev->sock) < 0) {
			printk(KERN_ERR "dnbd3: could not create socket\n");
			goto error;
		}

		kernel_setsockopt(dev->sock, SOL_SOCKET, SO_SNDTIMEO, (char *)&timeout, sizeof(timeout));
		kernel_setsockopt(dev->sock, SOL_SOCKET, SO_RCVTIMEO, (char *)&timeout, sizeof(timeout));
		dev->sock->sk->sk_allocation = GFP_NOIO;
		if (dev->cur_server.host.type == HOST_IP4) {
			struct sockaddr_in sin;
			memset(&sin, 0, sizeof(sin));
			sin.sin_family = AF_INET;
			memcpy(&(sin.sin_addr), dev->cur_server.host.addr, 4);
			sin.sin_port = dev->cur_server.host.port;
			if (kernel_connect(dev->sock, (struct sockaddr *)&sin, sizeof(sin), 0) != 0) {
				printk(KERN_ERR "dnbd3: connection to host failed (ipv4)\n");
				goto error;
			}
		} else {
			struct sockaddr_in6 sin;
			memset(&sin, 0, sizeof(sin));
			sin.sin6_family = AF_INET6;
			memcpy(&(sin.sin6_addr), dev->cur_server.host.addr, 16);
			sin.sin6_port = dev->cur_server.host.port;
			if (kernel_connect(dev->sock, (struct sockaddr *)&sin, sizeof(sin), 0) != 0){
				printk(KERN_ERR "dnbd3: connection to host failed (ipv6)\n");
				goto error;
			}
		}
		// Request filesize: header in iov[0], serialized payload in iov[1]
		dnbd3_request.magic = dnbd3_packet_magic;
		dnbd3_request.cmd = CMD_SELECT_IMAGE;
		iov[0].iov_base = &dnbd3_request;
		iov[0].iov_len = sizeof(dnbd3_request);
		serializer_reset_write(&dev->payload_buffer);
		serializer_put_uint16(&dev->payload_buffer, PROTOCOL_VERSION);
		serializer_put_string(&dev->payload_buffer, dev->imgname);
		serializer_put_uint16(&dev->payload_buffer, dev->rid);
		serializer_put_uint8(&dev->payload_buffer, 0); // is_server = false
		iov[1].iov_base = &dev->payload_buffer;
		dnbd3_request.size = iov[1].iov_len = serializer_get_written_length(&dev->payload_buffer);
		fixup_request(dnbd3_request);
		mlen = sizeof(dnbd3_request) + iov[1].iov_len;
		if (kernel_sendmsg(dev->sock, &msg, iov, 2, mlen) != mlen) {
			printk(KERN_ERR "dnbd3: could not send CMD_SIZE_REQUEST\n");
			goto error;
		}
		// receive reply header
		iov[0].iov_base = &dnbd3_reply;
		iov[0].iov_len = sizeof(dnbd3_reply);
		if (kernel_recvmsg(dev->sock, &msg, iov, 1, sizeof(dnbd3_reply), msg.msg_flags) != sizeof(dnbd3_reply)) {
			printk(KERN_ERR "dnbd3: received corrupted reply header after CMD_SIZE_REQUEST\n");
			goto error;
		}

		// check reply header
		fixup_reply(dnbd3_reply);
		if (dnbd3_reply.cmd != CMD_SELECT_IMAGE ||
				dnbd3_reply.size < 3 ||
				dnbd3_reply.size > MAX_PAYLOAD ||
				dnbd3_reply.magic != dnbd3_packet_magic) {
			printk(KERN_ERR "dnbd3: received invalid reply to CMD_SIZE_REQUEST image does not exist on server\n");
			goto error;
		}

		// receive reply payload
		iov[0].iov_base = &dev->payload_buffer;
		iov[0].iov_len = dnbd3_reply.size;
		if (kernel_recvmsg(dev->sock, &msg, iov, 1, dnbd3_reply.size, msg.msg_flags) != dnbd3_reply.size) {
			printk(KERN_ERR "dnbd3: could not read CMD_SELECT_IMAGE payload on handshake\n");
			goto error;
		}

		// handle/check reply payload
		serializer_reset_read(&dev->payload_buffer, dnbd3_reply.size);
		dev->cur_server.protocol_version = serializer_get_uint16(&dev->payload_buffer);
		if (dev->cur_server.protocol_version < MIN_SUPPORTED_SERVER) {
			printk(KERN_ERR "dnbd3: server version is lower than min supported version\n");
			goto error;
		}

		name = serializer_get_string(&dev->payload_buffer);
		if (name == NULL) {
			// guard against the serializer reporting a malformed string as NULL
			printk(KERN_ERR "dnbd3: server sent no valid image name\n");
			goto error;
		}
		if (dev->rid != 0 && strcmp(name, dev->imgname) != 0) {
			printk(KERN_ERR "dnbd3: server offers image '%s', requested '%s'\n", name, dev->imgname);
			goto error;
		}

		/*
		 * Validate everything that can still fail BEFORE touching
		 * dev->imgname, so no error path runs after a reallocation.
		 * Assumes 'name' stays valid while further fields are read from
		 * payload_buffer - TODO confirm against the serializer.
		 */
		rid = serializer_get_uint16(&dev->payload_buffer);
		if (dev->rid != 0 && dev->rid != rid) {
			printk(KERN_ERR "dnbd3: server provides rid %d, requested was %d\n", (int)rid, (int)dev->rid);
			goto error;
		}

		reported_size = serializer_get_uint64(&dev->payload_buffer);
		if (reported_size < 4096) {
			printk(KERN_ERR "dnbd3: reported size by server is < 4096\n");
			goto error;
		}

		if (strlen(dev->imgname) < strlen(name)) {
			// go through a temporary so a failed krealloc keeps the old buffer reachable
			grown = krealloc(dev->imgname, strlen(name) + 1, GFP_ATOMIC );
			if (grown == NULL ) {
				printk(KERN_ERR "dnbd3: reallocating buffer for new image name failed\n");
				goto error;
			}
			dev->imgname = grown;
		}

		// store image information
		strcpy(dev->imgname, name);
		dev->rid = rid;
		dev->reported_size = reported_size;
		set_capacity(dev->disk, dev->reported_size >> 9); /* 512 Byte blocks */
		printk(KERN_DEBUG "dnbd3: connected to image %s, filesize %llu\n", dev->imgname, dev->reported_size);
		dev->update_available = 0;
	} else { // Switching server, connection is already established and size request was executed

		printk(KERN_DEBUG "dnbd3: changing server\n");
		dev->sock = dev->better_sock;
		dev->better_sock = NULL;
		kernel_setsockopt(dev->sock, SOL_SOCKET, SO_SNDTIMEO, (char *)&timeout, sizeof(timeout));
		kernel_setsockopt(dev->sock, SOL_SOCKET, SO_RCVTIMEO, (char *)&timeout, sizeof(timeout));
	}

	dev->panic = 0;
	dev->panic_count = 0;

	// Enqueue request to request_queue_send for a fresh list of alt servers
	//TODO refresh alt server list

	// add heartbeat timer
	//TODO needed anymore?
//	dev->heartbeat_count = 0;
//	timer_setup(&dev->hb_timer, dnbd3_net_heartbeat, 0);
//	dev->hb_timer.expires = jiffies + HZ;
//	add_timer(&dev->hb_timer);
	return 0;
error:
	if (dev->sock) {
		sock_release(dev->sock);
		dev->sock = NULL;
	}
	dev->cur_server.host.type = 0;
	dev->cur_server.host.port = 0;
	return -1;
}


/**
 * dnbd3_net_disconnect - tear down the device's server connection
 * @dev: device to disconnect
 *
 * Does nothing if a disconnect is already flagged as in progress.  Otherwise
 * it sets dev->disconnecting for the duration of the teardown, clears
 * dev->discover, shuts down and releases the socket (if there is one) and
 * resets cur_server.host.type/port to 0.
 *
 * Return: always 0.
 */
int dnbd3_net_disconnect(dnbd3_device_t *dev)
{
	printk(KERN_DEBUG "dnbd3: net disconnect device %i\n", dev->minor);

	if (!dev->disconnecting) {
		dev->disconnecting = 1;

		// heartbeat timer is currently disabled
//		del_timer(&dev->hb_timer);

		dev->discover = 0;

		// shut the connection down, then drop the socket
		if (dev->sock != NULL) {
			kernel_sock_shutdown(dev->sock, SHUT_RDWR);
			sock_release(dev->sock);
			dev->sock = NULL;
		}

		dev->cur_server.host.port = 0;
		dev->cur_server.host.type = 0;

		dev->disconnecting = 0;
	}

	return 0;
}

/**
 * dnbd3_ioctl - ioctl handler of the dnbd3 block device
 * @bdev: block device the ioctl was issued on
 * @mode: open mode (unused)
 * @cmd:  ioctl command (IOCTL_OPEN, IOCTL_CLOSE, IOCTL_SWITCH,
 *        IOCTL_ADD_SRV, IOCTL_REM_SRV or BLKFLSBUF)
 * @arg:  user-space pointer to a dnbd3_ioctl_t, or 0
 *
 * If @arg is non-zero the dnbd3_ioctl_t is copied in (its len field must
 * equal sizeof(dnbd3_ioctl_t)), followed by the optional image name it
 * points to.  The command is then dispatched:
 *  - IOCTL_OPEN:    store server/image settings and connect
 *  - IOCTL_CLOSE:   disconnect, set capacity to 0, free the image name
 *  - IOCTL_SWITCH:  not implemented, -EINVAL
 *  - IOCTL_ADD_SRV / IOCTL_REM_SRV: queue a server in dev->new_servers
 *  - BLKFLSBUF:     accepted, no action
 *
 * Return: 0 on success or a negative errno (-ENOMEM, -ENOEXEC, -ENOENT,
 * -EBUSY, -EINVAL, -EAGAIN, -EIO) on failure.
 */
static int dnbd3_ioctl(struct block_device *bdev, fmode_t mode, unsigned int cmd, unsigned long arg)
{
	int result = -100;
	dnbd3_device_t *dev = bdev->bd_disk->private_data;
	char *imgname = NULL;
	dnbd3_ioctl_t *msg = NULL;

	printk(KERN_DEBUG "dnbd3: ioctl device %i, cmd %i, arg %lu\n", dev->minor, cmd, arg);
	//unsigned long irqflags;

	// Yield while a disconnect is in progress instead of spinning on the
	// flag; same wait pattern as in dnbd3_net_connect().
	while (dev->disconnecting)
		schedule();

	if (arg != 0) {
		msg = kmalloc(sizeof(*msg), GFP_KERNEL);
		if (msg == NULL) return -ENOMEM;
		// peek at the first two bytes (the len field) to verify the struct size
		if (copy_from_user((char *)msg, (char *)arg, 2) != 0 || msg->len != sizeof(*msg)) {
			result = -ENOEXEC;
			goto cleanup_return;
		}
		if (copy_from_user((char *)msg, (char *)arg, sizeof(*msg)) != 0) {
			result = -ENOENT;
			goto cleanup_return;
		}
		if (msg->imgname != NULL && msg->imgnamelen > 0) {
			imgname = kmalloc(msg->imgnamelen + 1, GFP_KERNEL);
			if (imgname == NULL) {
				result = -ENOMEM;
				goto cleanup_return;
			}
			if (copy_from_user(imgname, msg->imgname, msg->imgnamelen) != 0) {
				result = -ENOENT;
				goto cleanup_return;
			}
			imgname[msg->imgnamelen] = '\0';

			printk(KERN_DEBUG "dnbd3: ioctl image name of len %i is %s\n", (int)msg->imgnamelen, imgname);
		}
	}

	switch (cmd) {
	case IOCTL_OPEN:
		printk(KERN_DEBUG "dnbd3: ioctl open\n");
		if (dev->imgname != NULL) {
			result = -EBUSY;
		} else if (imgname == NULL) {
			result = -EINVAL;
		} else if (msg == NULL) {
			result = -EINVAL;
		} else {
			if (sizeof(msg->host) != sizeof(dev->cur_server.host)) {
				printk(KERN_INFO "dnbd3: odd size bug#1 triggered in ioctl\n");
			}
			memcpy(&dev->cur_server.host, &msg->host, sizeof(msg->host));
			dev->cur_server.failures = 0;
			memcpy(&dev->initial_server, &dev->cur_server, sizeof(dev->initial_server));
			dev->imgname = imgname;
			dev->rid = msg->rid;
			dev->use_server_provided_alts = msg->use_server_provided_alts;
			// Forget all alt servers on explicit connect, set first alt server to initial server
			memset(dev->alt_servers, 0, sizeof(dev->alt_servers[0])*NUMBER_SERVERS);
			memcpy(dev->alt_servers, &dev->initial_server, sizeof(dev->alt_servers[0]));
//#if LINUX_VERSION_CODE >= KERNEL_VERSION(4, 11, 0)
//			if (blk_queue->backing_dev_info != NULL) {
//				blk_queue->backing_dev_info->ra_pages = (msg->read_ahead_kb * 1024) / PAGE_SIZE;
//			}
//#else
//			blk_queue->backing_dev_info.ra_pages = (msg->read_ahead_kb * 1024) / PAGE_SIZE;
//#endif
			if (dnbd3_net_connect(dev) == 0) {
				result = 0;
				imgname = NULL; // Ownership moved to dev, prevent kfree at the end
			} else {
				result = -ENOENT;
				// dnbd3_net_connect() may have reallocated dev->imgname;
				// take back whatever buffer the device holds now so the
				// cleanup below frees a live pointer exactly once.
				if (dev->imgname != NULL)
					imgname = dev->imgname;
				dev->imgname = NULL;
			}
		}
		break;

	case IOCTL_CLOSE:
		printk(KERN_DEBUG "dnbd3: ioctl close\n");
		dnbd3_blk_fail_all_requests(dev);
		result = dnbd3_net_disconnect(dev);
		dnbd3_blk_fail_all_requests(dev);
		set_capacity(dev->disk, 0);
		kfree(dev->imgname); // kfree(NULL) is a no-op
		dev->imgname = NULL;
		break;

	case IOCTL_SWITCH:
		printk(KERN_DEBUG "dnbd3: ioctl switch\n");
		result = -EINVAL;
		break;

	case IOCTL_ADD_SRV:
	case IOCTL_REM_SRV:
		printk(KERN_DEBUG "dnbd3: ioctl add/rem srv\n");
		if (dev->imgname == NULL) {
			result = -ENOENT;
		} else if (dev->new_servers_num >= NUMBER_SERVERS) {
			result = -EAGAIN;
		} else if (msg == NULL) {
			result = -EINVAL;
		} else {
			memcpy(&dev->new_servers[dev->new_servers_num].host, &msg->host, sizeof(msg->host));
			dev->new_servers[dev->new_servers_num].failures = (cmd == IOCTL_ADD_SRV ? 0 : 1); // 0 = ADD, 1 = REM
			++dev->new_servers_num;
			result = 0;
		}
		break;

	case BLKFLSBUF:
		printk(KERN_DEBUG "dnbd3: ioctl blkflsbuf\n");
		result = 0;
		break;

	default:
		printk(KERN_DEBUG "dnbd3: ioctl unhandled cmd\n");
		result = -EIO;
		break;
	}

cleanup_return:
	kfree(msg);
	kfree(imgname);
	return result;

}



/*
 * Block device operations of the dnbd3 device.
 * The same handler serves both the native and the compat ioctl entry point.
 */
struct block_device_operations dnbd3_fops = {
	.owner        = THIS_MODULE,
	.open         = dnbd3_open,
	.release      = dnbd3_release,
	.ioctl        = dnbd3_ioctl,
	.compat_ioctl = dnbd3_ioctl,
};