mirror of
git://git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git
synced 2025-08-05 16:54:27 +00:00

Size of ring buffer, as defined in uio_hv_generic driver, is no longer
fixed to 16 KB. This creates a problem in fcopy, since this size was
hardcoded. With the change in place to make ring sysfs node actually
reflect the size of underlying ring buffer, it is safe to get the size
of ring sysfs file and use it for ring buffer size in fcopy daemon.
Fix the issue of disparity in ring buffer size, by making it dynamic
in fcopy uio daemon.
Cc: stable@vger.kernel.org
Fixes: 0315fef2af
("uio_hv_generic: Align ring size to system page")
Signed-off-by: Naman Jain <namjain@linux.microsoft.com>
Reviewed-by: Saurabh Sengar <ssengar@linux.microsoft.com>
Reviewed-by: Long Li <longli@microsoft.com>
Link: https://lore.kernel.org/r/20250711060846.9168-1-namjain@linux.microsoft.com
Signed-off-by: Wei Liu <wei.liu@kernel.org>
Message-ID: <20250711060846.9168-1-namjain@linux.microsoft.com>
559 lines
13 KiB
C
559 lines
13 KiB
C
// SPDX-License-Identifier: GPL-2.0-only
|
|
/*
|
|
* An implementation of host to guest copy functionality for Linux.
|
|
*
|
|
* Copyright (C) 2023, Microsoft, Inc.
|
|
*
|
|
* Author : K. Y. Srinivasan <kys@microsoft.com>
|
|
* Author : Saurabh Sengar <ssengar@microsoft.com>
|
|
*
|
|
*/
|
|
|
|
#include <dirent.h>
|
|
#include <errno.h>
|
|
#include <fcntl.h>
|
|
#include <getopt.h>
|
|
#include <locale.h>
|
|
#include <stdbool.h>
|
|
#include <stddef.h>
|
|
#include <stdint.h>
|
|
#include <stdio.h>
|
|
#include <stdlib.h>
|
|
#include <string.h>
|
|
#include <syslog.h>
|
|
#include <unistd.h>
|
|
#include <wchar.h>
|
|
#include <sys/stat.h>
|
|
#include <linux/hyperv.h>
|
|
#include <linux/limits.h>
|
|
#include "vmbus_bufring.h"
|
|
|
|
#define ICMSGTYPE_NEGOTIATE 0
|
|
#define ICMSGTYPE_FCOPY 7
|
|
|
|
#define WIN8_SRV_MAJOR 1
|
|
#define WIN8_SRV_MINOR 1
|
|
#define WIN8_SRV_VERSION (WIN8_SRV_MAJOR << 16 | WIN8_SRV_MINOR)
|
|
|
|
#define FCOPY_DEVICE_PATH(subdir) \
|
|
"/sys/bus/vmbus/devices/eb765408-105f-49b6-b4aa-c123b64d17d4/" #subdir
|
|
#define FCOPY_UIO_PATH FCOPY_DEVICE_PATH(uio)
|
|
#define FCOPY_CHANNELS_PATH FCOPY_DEVICE_PATH(channels)
|
|
|
|
#define FCOPY_VER_COUNT 1
|
|
static const int fcopy_versions[] = {
|
|
WIN8_SRV_VERSION
|
|
};
|
|
|
|
#define FW_VER_COUNT 1
|
|
static const int fw_versions[] = {
|
|
UTIL_FW_VERSION
|
|
};
|
|
|
|
static uint32_t get_ring_buffer_size(void)
|
|
{
|
|
char ring_path[PATH_MAX];
|
|
DIR *dir;
|
|
struct dirent *entry;
|
|
struct stat st;
|
|
uint32_t ring_size = 0;
|
|
int retry_count = 0;
|
|
|
|
/* Find the channel directory */
|
|
dir = opendir(FCOPY_CHANNELS_PATH);
|
|
if (!dir) {
|
|
usleep(100 * 1000); /* Avoid race with kernel, wait 100ms and retry once */
|
|
dir = opendir(FCOPY_CHANNELS_PATH);
|
|
if (!dir) {
|
|
syslog(LOG_ERR, "Failed to open channels directory: %s", strerror(errno));
|
|
return 0;
|
|
}
|
|
}
|
|
|
|
retry_once:
|
|
while ((entry = readdir(dir)) != NULL) {
|
|
if (entry->d_type == DT_DIR && strcmp(entry->d_name, ".") != 0 &&
|
|
strcmp(entry->d_name, "..") != 0) {
|
|
snprintf(ring_path, sizeof(ring_path), "%s/%s/ring",
|
|
FCOPY_CHANNELS_PATH, entry->d_name);
|
|
|
|
if (stat(ring_path, &st) == 0) {
|
|
/*
|
|
* stat returns size of Tx, Rx rings combined,
|
|
* so take half of it for individual ring size.
|
|
*/
|
|
ring_size = (uint32_t)st.st_size / 2;
|
|
syslog(LOG_INFO, "Ring buffer size from %s: %u bytes",
|
|
ring_path, ring_size);
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
|
|
if (!ring_size && retry_count == 0) {
|
|
retry_count = 1;
|
|
rewinddir(dir);
|
|
usleep(100 * 1000); /* Wait 100ms and retry once */
|
|
goto retry_once;
|
|
}
|
|
|
|
closedir(dir);
|
|
|
|
if (!ring_size)
|
|
syslog(LOG_ERR, "Could not determine ring size");
|
|
|
|
return ring_size;
|
|
}
|
|
|
|
static unsigned char *desc;
|
|
|
|
static int target_fd;
|
|
static char target_fname[PATH_MAX];
|
|
static unsigned long long filesize;
|
|
|
|
static int hv_fcopy_create_file(char *file_name, char *path_name, __u32 flags)
|
|
{
|
|
int error = HV_E_FAIL;
|
|
char *q, *p;
|
|
|
|
filesize = 0;
|
|
p = path_name;
|
|
if (snprintf(target_fname, sizeof(target_fname), "%s/%s",
|
|
path_name, file_name) >= sizeof(target_fname)) {
|
|
syslog(LOG_ERR, "target file name is too long: %s/%s", path_name, file_name);
|
|
goto done;
|
|
}
|
|
|
|
/*
|
|
* Check to see if the path is already in place; if not,
|
|
* create if required.
|
|
*/
|
|
while ((q = strchr(p, '/')) != NULL) {
|
|
if (q == p) {
|
|
p++;
|
|
continue;
|
|
}
|
|
*q = '\0';
|
|
if (access(path_name, F_OK)) {
|
|
if (flags & CREATE_PATH) {
|
|
if (mkdir(path_name, 0755)) {
|
|
syslog(LOG_ERR, "Failed to create %s",
|
|
path_name);
|
|
goto done;
|
|
}
|
|
} else {
|
|
syslog(LOG_ERR, "Invalid path: %s", path_name);
|
|
goto done;
|
|
}
|
|
}
|
|
p = q + 1;
|
|
*q = '/';
|
|
}
|
|
|
|
if (!access(target_fname, F_OK)) {
|
|
syslog(LOG_INFO, "File: %s exists", target_fname);
|
|
if (!(flags & OVER_WRITE)) {
|
|
error = HV_ERROR_ALREADY_EXISTS;
|
|
goto done;
|
|
}
|
|
}
|
|
|
|
target_fd = open(target_fname,
|
|
O_RDWR | O_CREAT | O_TRUNC | O_CLOEXEC, 0744);
|
|
if (target_fd == -1) {
|
|
syslog(LOG_INFO, "Open Failed: %s", strerror(errno));
|
|
goto done;
|
|
}
|
|
|
|
error = 0;
|
|
done:
|
|
if (error)
|
|
target_fname[0] = '\0';
|
|
return error;
|
|
}
|
|
|
|
/* copy the data into the file */
|
|
static int hv_copy_data(struct hv_do_fcopy *cpmsg)
|
|
{
|
|
ssize_t len;
|
|
int ret = 0;
|
|
|
|
len = pwrite(target_fd, cpmsg->data, cpmsg->size, cpmsg->offset);
|
|
|
|
filesize += cpmsg->size;
|
|
if (len != cpmsg->size) {
|
|
switch (errno) {
|
|
case ENOSPC:
|
|
ret = HV_ERROR_DISK_FULL;
|
|
break;
|
|
default:
|
|
ret = HV_E_FAIL;
|
|
break;
|
|
}
|
|
syslog(LOG_ERR, "pwrite failed to write %llu bytes: %ld (%s)",
|
|
filesize, (long)len, strerror(errno));
|
|
}
|
|
|
|
return ret;
|
|
}
|
|
|
|
static int hv_copy_finished(void)
|
|
{
|
|
close(target_fd);
|
|
target_fname[0] = '\0';
|
|
|
|
return 0;
|
|
}
|
|
|
|
static void print_usage(char *argv[])
|
|
{
|
|
fprintf(stderr, "Usage: %s [options]\n"
|
|
"Options are:\n"
|
|
" -n, --no-daemon stay in foreground, don't daemonize\n"
|
|
" -h, --help print this help\n", argv[0]);
|
|
}
|
|
|
|
static bool vmbus_prep_negotiate_resp(struct icmsg_hdr *icmsghdrp, unsigned char *buf,
|
|
unsigned int buflen, const int *fw_version, int fw_vercnt,
|
|
const int *srv_version, int srv_vercnt,
|
|
int *nego_fw_version, int *nego_srv_version)
|
|
{
|
|
int icframe_major, icframe_minor;
|
|
int icmsg_major, icmsg_minor;
|
|
int fw_major, fw_minor;
|
|
int srv_major, srv_minor;
|
|
int i, j;
|
|
bool found_match = false;
|
|
struct icmsg_negotiate *negop;
|
|
|
|
/* Check that there's enough space for icframe_vercnt, icmsg_vercnt */
|
|
if (buflen < ICMSG_HDR + offsetof(struct icmsg_negotiate, reserved)) {
|
|
syslog(LOG_ERR, "Invalid icmsg negotiate");
|
|
return false;
|
|
}
|
|
|
|
icmsghdrp->icmsgsize = 0x10;
|
|
negop = (struct icmsg_negotiate *)&buf[ICMSG_HDR];
|
|
|
|
icframe_major = negop->icframe_vercnt;
|
|
icframe_minor = 0;
|
|
|
|
icmsg_major = negop->icmsg_vercnt;
|
|
icmsg_minor = 0;
|
|
|
|
/* Validate negop packet */
|
|
if (icframe_major > IC_VERSION_NEGOTIATION_MAX_VER_COUNT ||
|
|
icmsg_major > IC_VERSION_NEGOTIATION_MAX_VER_COUNT ||
|
|
ICMSG_NEGOTIATE_PKT_SIZE(icframe_major, icmsg_major) > buflen) {
|
|
syslog(LOG_ERR, "Invalid icmsg negotiate - icframe_major: %u, icmsg_major: %u\n",
|
|
icframe_major, icmsg_major);
|
|
goto fw_error;
|
|
}
|
|
|
|
/*
|
|
* Select the framework version number we will
|
|
* support.
|
|
*/
|
|
|
|
for (i = 0; i < fw_vercnt; i++) {
|
|
fw_major = (fw_version[i] >> 16);
|
|
fw_minor = (fw_version[i] & 0xFFFF);
|
|
|
|
for (j = 0; j < negop->icframe_vercnt; j++) {
|
|
if (negop->icversion_data[j].major == fw_major &&
|
|
negop->icversion_data[j].minor == fw_minor) {
|
|
icframe_major = negop->icversion_data[j].major;
|
|
icframe_minor = negop->icversion_data[j].minor;
|
|
found_match = true;
|
|
break;
|
|
}
|
|
}
|
|
|
|
if (found_match)
|
|
break;
|
|
}
|
|
|
|
if (!found_match)
|
|
goto fw_error;
|
|
|
|
found_match = false;
|
|
|
|
for (i = 0; i < srv_vercnt; i++) {
|
|
srv_major = (srv_version[i] >> 16);
|
|
srv_minor = (srv_version[i] & 0xFFFF);
|
|
|
|
for (j = negop->icframe_vercnt;
|
|
(j < negop->icframe_vercnt + negop->icmsg_vercnt);
|
|
j++) {
|
|
if (negop->icversion_data[j].major == srv_major &&
|
|
negop->icversion_data[j].minor == srv_minor) {
|
|
icmsg_major = negop->icversion_data[j].major;
|
|
icmsg_minor = negop->icversion_data[j].minor;
|
|
found_match = true;
|
|
break;
|
|
}
|
|
}
|
|
|
|
if (found_match)
|
|
break;
|
|
}
|
|
|
|
/*
|
|
* Respond with the framework and service
|
|
* version numbers we can support.
|
|
*/
|
|
fw_error:
|
|
if (!found_match) {
|
|
negop->icframe_vercnt = 0;
|
|
negop->icmsg_vercnt = 0;
|
|
} else {
|
|
negop->icframe_vercnt = 1;
|
|
negop->icmsg_vercnt = 1;
|
|
}
|
|
|
|
if (nego_fw_version)
|
|
*nego_fw_version = (icframe_major << 16) | icframe_minor;
|
|
|
|
if (nego_srv_version)
|
|
*nego_srv_version = (icmsg_major << 16) | icmsg_minor;
|
|
|
|
negop->icversion_data[0].major = icframe_major;
|
|
negop->icversion_data[0].minor = icframe_minor;
|
|
negop->icversion_data[1].major = icmsg_major;
|
|
negop->icversion_data[1].minor = icmsg_minor;
|
|
|
|
return found_match;
|
|
}
|
|
|
|
static void wcstoutf8(char *dest, const __u16 *src, size_t dest_size)
|
|
{
|
|
size_t len = 0;
|
|
|
|
while (len < dest_size && *src) {
|
|
if (src[len] < 0x80)
|
|
dest[len++] = (char)(*src++);
|
|
else
|
|
dest[len++] = 'X';
|
|
}
|
|
|
|
dest[len] = '\0';
|
|
}
|
|
|
|
static int hv_fcopy_start(struct hv_start_fcopy *smsg_in)
|
|
{
|
|
/*
|
|
* file_name and path_name should have same length with appropriate
|
|
* member of hv_start_fcopy.
|
|
*/
|
|
char file_name[W_MAX_PATH], path_name[W_MAX_PATH];
|
|
|
|
setlocale(LC_ALL, "en_US.utf8");
|
|
wcstoutf8(file_name, smsg_in->file_name, W_MAX_PATH - 1);
|
|
wcstoutf8(path_name, smsg_in->path_name, W_MAX_PATH - 1);
|
|
|
|
return hv_fcopy_create_file(file_name, path_name, smsg_in->copy_flags);
|
|
}
|
|
|
|
static int hv_fcopy_send_data(struct hv_fcopy_hdr *fcopy_msg, int recvlen)
|
|
{
|
|
int operation = fcopy_msg->operation;
|
|
|
|
/*
|
|
* The strings sent from the host are encoded in
|
|
* utf16; convert it to utf8 strings.
|
|
* The host assures us that the utf16 strings will not exceed
|
|
* the max lengths specified. We will however, reserve room
|
|
* for the string terminating character - in the utf16s_utf8s()
|
|
* function we limit the size of the buffer where the converted
|
|
* string is placed to W_MAX_PATH -1 to guarantee
|
|
* that the strings can be properly terminated!
|
|
*/
|
|
|
|
switch (operation) {
|
|
case START_FILE_COPY:
|
|
return hv_fcopy_start((struct hv_start_fcopy *)fcopy_msg);
|
|
case WRITE_TO_FILE:
|
|
return hv_copy_data((struct hv_do_fcopy *)fcopy_msg);
|
|
case COMPLETE_FCOPY:
|
|
return hv_copy_finished();
|
|
}
|
|
|
|
return HV_E_FAIL;
|
|
}
|
|
|
|
/* process the packet recv from host */
|
|
static int fcopy_pkt_process(struct vmbus_br *txbr)
|
|
{
|
|
int ret, offset, pktlen;
|
|
int fcopy_srv_version;
|
|
const struct vmbus_chanpkt_hdr *pkt;
|
|
struct hv_fcopy_hdr *fcopy_msg;
|
|
struct icmsg_hdr *icmsghdr;
|
|
|
|
pkt = (const struct vmbus_chanpkt_hdr *)desc;
|
|
offset = pkt->hlen << 3;
|
|
pktlen = (pkt->tlen << 3) - offset;
|
|
icmsghdr = (struct icmsg_hdr *)&desc[offset + sizeof(struct vmbuspipe_hdr)];
|
|
icmsghdr->status = HV_E_FAIL;
|
|
|
|
if (icmsghdr->icmsgtype == ICMSGTYPE_NEGOTIATE) {
|
|
if (vmbus_prep_negotiate_resp(icmsghdr, desc + offset, pktlen, fw_versions,
|
|
FW_VER_COUNT, fcopy_versions, FCOPY_VER_COUNT,
|
|
NULL, &fcopy_srv_version)) {
|
|
syslog(LOG_INFO, "FCopy IC version %d.%d",
|
|
fcopy_srv_version >> 16, fcopy_srv_version & 0xFFFF);
|
|
icmsghdr->status = 0;
|
|
}
|
|
} else if (icmsghdr->icmsgtype == ICMSGTYPE_FCOPY) {
|
|
/* Ensure recvlen is big enough to contain hv_fcopy_hdr */
|
|
if (pktlen < ICMSG_HDR + sizeof(struct hv_fcopy_hdr)) {
|
|
syslog(LOG_ERR, "Invalid Fcopy hdr. Packet length too small: %u",
|
|
pktlen);
|
|
return -ENOBUFS;
|
|
}
|
|
|
|
fcopy_msg = (struct hv_fcopy_hdr *)&desc[offset + ICMSG_HDR];
|
|
icmsghdr->status = hv_fcopy_send_data(fcopy_msg, pktlen);
|
|
}
|
|
|
|
icmsghdr->icflags = ICMSGHDRFLAG_TRANSACTION | ICMSGHDRFLAG_RESPONSE;
|
|
ret = rte_vmbus_chan_send(txbr, 0x6, desc + offset, pktlen, 0);
|
|
if (ret) {
|
|
syslog(LOG_ERR, "Write to ringbuffer failed err: %d", ret);
|
|
return ret;
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
static void fcopy_get_first_folder(char *path, char *chan_no)
|
|
{
|
|
DIR *dir = opendir(path);
|
|
struct dirent *entry;
|
|
|
|
if (!dir) {
|
|
syslog(LOG_ERR, "Failed to open directory (errno=%s).\n", strerror(errno));
|
|
return;
|
|
}
|
|
|
|
while ((entry = readdir(dir)) != NULL) {
|
|
if (entry->d_type == DT_DIR && strcmp(entry->d_name, ".") != 0 &&
|
|
strcmp(entry->d_name, "..") != 0) {
|
|
strcpy(chan_no, entry->d_name);
|
|
break;
|
|
}
|
|
}
|
|
|
|
closedir(dir);
|
|
}
|
|
|
|
int main(int argc, char *argv[])
|
|
{
|
|
int fcopy_fd = -1, tmp = 1;
|
|
int daemonize = 1, long_index = 0, opt, ret = -EINVAL;
|
|
struct vmbus_br txbr, rxbr;
|
|
void *ring;
|
|
uint32_t ring_size, len;
|
|
char uio_name[NAME_MAX] = {0};
|
|
char uio_dev_path[PATH_MAX] = {0};
|
|
|
|
static struct option long_options[] = {
|
|
{"help", no_argument, 0, 'h' },
|
|
{"no-daemon", no_argument, 0, 'n' },
|
|
{0, 0, 0, 0 }
|
|
};
|
|
|
|
while ((opt = getopt_long(argc, argv, "hn", long_options,
|
|
&long_index)) != -1) {
|
|
switch (opt) {
|
|
case 'n':
|
|
daemonize = 0;
|
|
break;
|
|
case 'h':
|
|
default:
|
|
print_usage(argv);
|
|
goto exit;
|
|
}
|
|
}
|
|
|
|
if (daemonize && daemon(1, 0)) {
|
|
syslog(LOG_ERR, "daemon() failed; error: %s", strerror(errno));
|
|
goto exit;
|
|
}
|
|
|
|
openlog("HV_UIO_FCOPY", 0, LOG_USER);
|
|
syslog(LOG_INFO, "starting; pid is:%d", getpid());
|
|
|
|
ring_size = get_ring_buffer_size();
|
|
if (!ring_size) {
|
|
ret = -ENODEV;
|
|
goto exit;
|
|
}
|
|
|
|
desc = malloc(ring_size * sizeof(unsigned char));
|
|
if (!desc) {
|
|
syslog(LOG_ERR, "malloc failed for desc buffer");
|
|
ret = -ENOMEM;
|
|
goto exit;
|
|
}
|
|
|
|
fcopy_get_first_folder(FCOPY_UIO_PATH, uio_name);
|
|
snprintf(uio_dev_path, sizeof(uio_dev_path), "/dev/%s", uio_name);
|
|
fcopy_fd = open(uio_dev_path, O_RDWR);
|
|
|
|
if (fcopy_fd < 0) {
|
|
syslog(LOG_ERR, "open %s failed; error: %d %s",
|
|
uio_dev_path, errno, strerror(errno));
|
|
ret = fcopy_fd;
|
|
goto free_desc;
|
|
}
|
|
|
|
ring = vmbus_uio_map(&fcopy_fd, ring_size);
|
|
if (!ring) {
|
|
ret = errno;
|
|
syslog(LOG_ERR, "mmap ringbuffer failed; error: %d %s", ret, strerror(ret));
|
|
goto close;
|
|
}
|
|
vmbus_br_setup(&txbr, ring, ring_size);
|
|
vmbus_br_setup(&rxbr, (char *)ring + ring_size, ring_size);
|
|
|
|
rxbr.vbr->imask = 0;
|
|
|
|
while (1) {
|
|
/*
|
|
* In this loop we process fcopy messages after the
|
|
* handshake is complete.
|
|
*/
|
|
ret = pread(fcopy_fd, &tmp, sizeof(int), 0);
|
|
if (ret < 0) {
|
|
if (errno == EINTR || errno == EAGAIN)
|
|
continue;
|
|
syslog(LOG_ERR, "pread failed: %s", strerror(errno));
|
|
goto close;
|
|
}
|
|
|
|
len = ring_size;
|
|
ret = rte_vmbus_chan_recv_raw(&rxbr, desc, &len);
|
|
if (unlikely(ret <= 0)) {
|
|
/* This indicates a failure to communicate (or worse) */
|
|
syslog(LOG_ERR, "VMBus channel recv error: %d", ret);
|
|
} else {
|
|
ret = fcopy_pkt_process(&txbr);
|
|
if (ret < 0)
|
|
goto close;
|
|
|
|
/* Signal host */
|
|
if ((write(fcopy_fd, &tmp, sizeof(int))) != sizeof(int)) {
|
|
ret = errno;
|
|
syslog(LOG_ERR, "Signal to host failed: %s\n", strerror(ret));
|
|
goto close;
|
|
}
|
|
}
|
|
}
|
|
close:
|
|
close(fcopy_fd);
|
|
free_desc:
|
|
free(desc);
|
|
exit:
|
|
return ret;
|
|
}
|