Tracify migration/rdma.c

Turn all the D/DD/DDDPRINTFs into trace events
Turn most of the fprintf(stderr, into error_report

Signed-off-by: Dr. David Alan Gilbert <dgilbert@redhat.com>
Signed-off-by: Amit Shah <amit.shah@redhat.com>
Signed-off-by: Juan Quintela <quintela@redhat.com>
This commit is contained in:
Dr. David Alan Gilbert 2015-02-02 19:53:33 +00:00 committed by Juan Quintela
parent b17425701d
commit 733252deb8
2 changed files with 206 additions and 189 deletions

View File

@ -26,34 +26,7 @@
#include <arpa/inet.h> #include <arpa/inet.h>
#include <string.h> #include <string.h>
#include <rdma/rdma_cma.h> #include <rdma/rdma_cma.h>
#include "trace.h"
//#define DEBUG_RDMA
//#define DEBUG_RDMA_VERBOSE
//#define DEBUG_RDMA_REALLY_VERBOSE
#ifdef DEBUG_RDMA
#define DPRINTF(fmt, ...) \
do { printf("rdma: " fmt, ## __VA_ARGS__); } while (0)
#else
#define DPRINTF(fmt, ...) \
do { } while (0)
#endif
#ifdef DEBUG_RDMA_VERBOSE
#define DDPRINTF(fmt, ...) \
do { printf("rdma: " fmt, ## __VA_ARGS__); } while (0)
#else
#define DDPRINTF(fmt, ...) \
do { } while (0)
#endif
#ifdef DEBUG_RDMA_REALLY_VERBOSE
#define DDDPRINTF(fmt, ...) \
do { printf("rdma: " fmt, ## __VA_ARGS__); } while (0)
#else
#define DDDPRINTF(fmt, ...) \
do { } while (0)
#endif
/* /*
* Print and error on both the Monitor and the Log file. * Print and error on both the Monitor and the Log file.
@ -104,8 +77,8 @@ static uint32_t known_capabilities = RDMA_CAPABILITY_PIN_ALL;
do { \ do { \
if (rdma->error_state) { \ if (rdma->error_state) { \
if (!rdma->error_reported) { \ if (!rdma->error_reported) { \
fprintf(stderr, "RDMA is in an error state waiting migration" \ error_report("RDMA is in an error state waiting migration" \
" to abort!\n"); \ " to abort!"); \
rdma->error_reported = 1; \ rdma->error_reported = 1; \
} \ } \
return rdma->error_state; \ return rdma->error_state; \
@ -578,12 +551,13 @@ static int __qemu_rdma_add_block(RDMAContext *rdma, void *host_addr,
g_hash_table_insert(rdma->blockmap, (void *) block_offset, block); g_hash_table_insert(rdma->blockmap, (void *) block_offset, block);
DDPRINTF("Added Block: %d, addr: %" PRIu64 ", offset: %" PRIu64 trace___qemu_rdma_add_block(local->nb_blocks,
" length: %" PRIu64 " end: %" PRIu64 " bits %" PRIu64 " chunks %d\n", (uint64_t) block->local_host_addr, block->offset,
local->nb_blocks, (uint64_t) block->local_host_addr, block->offset, block->length,
block->length, (uint64_t) (block->local_host_addr + block->length), (uint64_t) (block->local_host_addr + block->length),
BITS_TO_LONGS(block->nb_chunks) * BITS_TO_LONGS(block->nb_chunks) *
sizeof(unsigned long) * 8, block->nb_chunks); sizeof(unsigned long) * 8,
block->nb_chunks);
local->nb_blocks++; local->nb_blocks++;
@ -614,7 +588,7 @@ static int qemu_rdma_init_ram_blocks(RDMAContext *rdma)
rdma->blockmap = g_hash_table_new(g_direct_hash, g_direct_equal); rdma->blockmap = g_hash_table_new(g_direct_hash, g_direct_equal);
memset(local, 0, sizeof *local); memset(local, 0, sizeof *local);
qemu_ram_foreach_block(qemu_rdma_init_one_block, rdma); qemu_ram_foreach_block(qemu_rdma_init_one_block, rdma);
DPRINTF("Allocated %d local ram block structures\n", local->nb_blocks); trace_qemu_rdma_init_ram_blocks(local->nb_blocks);
rdma->block = (RDMARemoteBlock *) g_malloc0(sizeof(RDMARemoteBlock) * rdma->block = (RDMARemoteBlock *) g_malloc0(sizeof(RDMARemoteBlock) *
rdma->local_ram_blocks.nb_blocks); rdma->local_ram_blocks.nb_blocks);
local->init = true; local->init = true;
@ -683,12 +657,12 @@ static int __qemu_rdma_delete_block(RDMAContext *rdma, ram_addr_t block_offset)
local->block = NULL; local->block = NULL;
} }
DDPRINTF("Deleted Block: %d, addr: %" PRIu64 ", offset: %" PRIu64 trace___qemu_rdma_delete_block(local->nb_blocks,
" length: %" PRIu64 " end: %" PRIu64 " bits %" PRIu64 " chunks %d\n", (uint64_t)block->local_host_addr,
local->nb_blocks, (uint64_t) block->local_host_addr, block->offset, block->offset, block->length,
block->length, (uint64_t) (block->local_host_addr + block->length), (uint64_t)(block->local_host_addr + block->length),
BITS_TO_LONGS(block->nb_chunks) * BITS_TO_LONGS(block->nb_chunks) *
sizeof(unsigned long) * 8, block->nb_chunks); sizeof(unsigned long) * 8, block->nb_chunks);
g_free(old); g_free(old);
@ -713,7 +687,7 @@ static void qemu_rdma_dump_id(const char *who, struct ibv_context *verbs)
struct ibv_port_attr port; struct ibv_port_attr port;
if (ibv_query_port(verbs, 1, &port)) { if (ibv_query_port(verbs, 1, &port)) {
fprintf(stderr, "FAILED TO QUERY PORT INFORMATION!\n"); error_report("Failed to query port information");
return; return;
} }
@ -744,7 +718,7 @@ static void qemu_rdma_dump_gid(const char *who, struct rdma_cm_id *id)
char dgid[33]; char dgid[33];
inet_ntop(AF_INET6, &id->route.addr.addr.ibaddr.sgid, sgid, sizeof sgid); inet_ntop(AF_INET6, &id->route.addr.addr.ibaddr.sgid, sgid, sizeof sgid);
inet_ntop(AF_INET6, &id->route.addr.addr.ibaddr.dgid, dgid, sizeof dgid); inet_ntop(AF_INET6, &id->route.addr.addr.ibaddr.dgid, dgid, sizeof dgid);
DPRINTF("%s Source GID: %s, Dest GID: %s\n", who, sgid, dgid); trace_qemu_rdma_dump_gid(who, sgid, dgid);
} }
/* /*
@ -918,7 +892,7 @@ static int qemu_rdma_resolve_host(RDMAContext *rdma, Error **errp)
for (e = res; e != NULL; e = e->ai_next) { for (e = res; e != NULL; e = e->ai_next) {
inet_ntop(e->ai_family, inet_ntop(e->ai_family,
&((struct sockaddr_in *) e->ai_dst_addr)->sin_addr, ip, sizeof ip); &((struct sockaddr_in *) e->ai_dst_addr)->sin_addr, ip, sizeof ip);
DPRINTF("Trying %s => %s\n", rdma->host, ip); trace_qemu_rdma_resolve_host_trying(rdma->host, ip);
ret = rdma_resolve_addr(rdma->cm_id, NULL, e->ai_dst_addr, ret = rdma_resolve_addr(rdma->cm_id, NULL, e->ai_dst_addr,
RDMA_RESOLVE_TIMEOUT_MS); RDMA_RESOLVE_TIMEOUT_MS);
@ -997,14 +971,14 @@ static int qemu_rdma_alloc_pd_cq(RDMAContext *rdma)
/* allocate pd */ /* allocate pd */
rdma->pd = ibv_alloc_pd(rdma->verbs); rdma->pd = ibv_alloc_pd(rdma->verbs);
if (!rdma->pd) { if (!rdma->pd) {
fprintf(stderr, "failed to allocate protection domain\n"); error_report("failed to allocate protection domain");
return -1; return -1;
} }
/* create completion channel */ /* create completion channel */
rdma->comp_channel = ibv_create_comp_channel(rdma->verbs); rdma->comp_channel = ibv_create_comp_channel(rdma->verbs);
if (!rdma->comp_channel) { if (!rdma->comp_channel) {
fprintf(stderr, "failed to allocate completion channel\n"); error_report("failed to allocate completion channel");
goto err_alloc_pd_cq; goto err_alloc_pd_cq;
} }
@ -1015,7 +989,7 @@ static int qemu_rdma_alloc_pd_cq(RDMAContext *rdma)
rdma->cq = ibv_create_cq(rdma->verbs, (RDMA_SIGNALED_SEND_MAX * 3), rdma->cq = ibv_create_cq(rdma->verbs, (RDMA_SIGNALED_SEND_MAX * 3),
NULL, rdma->comp_channel, 0); NULL, rdma->comp_channel, 0);
if (!rdma->cq) { if (!rdma->cq) {
fprintf(stderr, "failed to allocate completion queue\n"); error_report("failed to allocate completion queue");
goto err_alloc_pd_cq; goto err_alloc_pd_cq;
} }
@ -1160,8 +1134,7 @@ static int qemu_rdma_register_and_get_keys(RDMAContext *rdma,
if (!block->pmr[chunk]) { if (!block->pmr[chunk]) {
uint64_t len = chunk_end - chunk_start; uint64_t len = chunk_end - chunk_start;
DDPRINTF("Registering %" PRIu64 " bytes @ %p\n", trace_qemu_rdma_register_and_get_keys(len, chunk_start);
len, chunk_start);
block->pmr[chunk] = ibv_reg_mr(rdma->pd, block->pmr[chunk] = ibv_reg_mr(rdma->pd,
chunk_start, len, chunk_start, len,
@ -1204,7 +1177,7 @@ static int qemu_rdma_reg_control(RDMAContext *rdma, int idx)
rdma->total_registrations++; rdma->total_registrations++;
return 0; return 0;
} }
fprintf(stderr, "qemu_rdma_reg_control failed!\n"); error_report("qemu_rdma_reg_control failed");
return -1; return -1;
} }
@ -1270,8 +1243,8 @@ static int qemu_rdma_unregister_waiting(RDMAContext *rdma)
.repeat = 1, .repeat = 1,
}; };
DDPRINTF("Processing unregister for chunk: %" PRIu64 trace_qemu_rdma_unregister_waiting_proc(chunk,
" at position %d\n", chunk, rdma->unregister_current); rdma->unregister_current);
rdma->unregistrations[rdma->unregister_current] = 0; rdma->unregistrations[rdma->unregister_current] = 0;
rdma->unregister_current++; rdma->unregister_current++;
@ -1291,11 +1264,11 @@ static int qemu_rdma_unregister_waiting(RDMAContext *rdma)
clear_bit(chunk, block->unregister_bitmap); clear_bit(chunk, block->unregister_bitmap);
if (test_bit(chunk, block->transit_bitmap)) { if (test_bit(chunk, block->transit_bitmap)) {
DDPRINTF("Cannot unregister inflight chunk: %" PRIu64 "\n", chunk); trace_qemu_rdma_unregister_waiting_inflight(chunk);
continue; continue;
} }
DDPRINTF("Sending unregister for chunk: %" PRIu64 "\n", chunk); trace_qemu_rdma_unregister_waiting_send(chunk);
ret = ibv_dereg_mr(block->pmr[chunk]); ret = ibv_dereg_mr(block->pmr[chunk]);
block->pmr[chunk] = NULL; block->pmr[chunk] = NULL;
@ -1315,7 +1288,7 @@ static int qemu_rdma_unregister_waiting(RDMAContext *rdma)
return ret; return ret;
} }
DDPRINTF("Unregister for chunk: %" PRIu64 " complete.\n", chunk); trace_qemu_rdma_unregister_waiting_complete(chunk);
} }
return 0; return 0;
@ -1340,13 +1313,13 @@ static void qemu_rdma_signal_unregister(RDMAContext *rdma, uint64_t index,
uint64_t chunk, uint64_t wr_id) uint64_t chunk, uint64_t wr_id)
{ {
if (rdma->unregistrations[rdma->unregister_next] != 0) { if (rdma->unregistrations[rdma->unregister_next] != 0) {
fprintf(stderr, "rdma migration: queue is full!\n"); error_report("rdma migration: queue is full");
} else { } else {
RDMALocalBlock *block = &(rdma->local_ram_blocks.block[index]); RDMALocalBlock *block = &(rdma->local_ram_blocks.block[index]);
if (!test_and_set_bit(chunk, block->unregister_bitmap)) { if (!test_and_set_bit(chunk, block->unregister_bitmap)) {
DDPRINTF("Appending unregister chunk %" PRIu64 trace_qemu_rdma_signal_unregister_append(chunk,
" at position %d\n", chunk, rdma->unregister_next); rdma->unregister_next);
rdma->unregistrations[rdma->unregister_next++] = rdma->unregistrations[rdma->unregister_next++] =
qemu_rdma_make_wrid(wr_id, index, chunk); qemu_rdma_make_wrid(wr_id, index, chunk);
@ -1355,8 +1328,7 @@ static void qemu_rdma_signal_unregister(RDMAContext *rdma, uint64_t index,
rdma->unregister_next = 0; rdma->unregister_next = 0;
} }
} else { } else {
DDPRINTF("Unregister chunk %" PRIu64 " already in queue.\n", trace_qemu_rdma_signal_unregister_already(chunk);
chunk);
} }
} }
} }
@ -1381,7 +1353,7 @@ static uint64_t qemu_rdma_poll(RDMAContext *rdma, uint64_t *wr_id_out,
} }
if (ret < 0) { if (ret < 0) {
fprintf(stderr, "ibv_poll_cq return %d!\n", ret); error_report("ibv_poll_cq return %d", ret);
return ret; return ret;
} }
@ -1397,8 +1369,7 @@ static uint64_t qemu_rdma_poll(RDMAContext *rdma, uint64_t *wr_id_out,
if (rdma->control_ready_expected && if (rdma->control_ready_expected &&
(wr_id >= RDMA_WRID_RECV_CONTROL)) { (wr_id >= RDMA_WRID_RECV_CONTROL)) {
DDDPRINTF("completion %s #%" PRId64 " received (%" PRId64 ")" trace_qemu_rdma_poll_recv(wrid_desc[RDMA_WRID_RECV_CONTROL],
" left %d\n", wrid_desc[RDMA_WRID_RECV_CONTROL],
wr_id - RDMA_WRID_RECV_CONTROL, wr_id, rdma->nb_sent); wr_id - RDMA_WRID_RECV_CONTROL, wr_id, rdma->nb_sent);
rdma->control_ready_expected = 0; rdma->control_ready_expected = 0;
} }
@ -1410,9 +1381,8 @@ static uint64_t qemu_rdma_poll(RDMAContext *rdma, uint64_t *wr_id_out,
(wc.wr_id & RDMA_WRID_BLOCK_MASK) >> RDMA_WRID_BLOCK_SHIFT; (wc.wr_id & RDMA_WRID_BLOCK_MASK) >> RDMA_WRID_BLOCK_SHIFT;
RDMALocalBlock *block = &(rdma->local_ram_blocks.block[index]); RDMALocalBlock *block = &(rdma->local_ram_blocks.block[index]);
DDDPRINTF("completions %s (%" PRId64 ") left %d, " trace_qemu_rdma_poll_write(print_wrid(wr_id), wr_id, rdma->nb_sent,
"block %" PRIu64 ", chunk: %" PRIu64 " %p %p\n", index, chunk,
print_wrid(wr_id), wr_id, rdma->nb_sent, index, chunk,
block->local_host_addr, (void *)block->remote_host_addr); block->local_host_addr, (void *)block->remote_host_addr);
clear_bit(chunk, block->transit_bitmap); clear_bit(chunk, block->transit_bitmap);
@ -1433,8 +1403,7 @@ static uint64_t qemu_rdma_poll(RDMAContext *rdma, uint64_t *wr_id_out,
#endif #endif
} }
} else { } else {
DDDPRINTF("other completion %s (%" PRId64 ") received left %d\n", trace_qemu_rdma_poll_other(print_wrid(wr_id), wr_id, rdma->nb_sent);
print_wrid(wr_id), wr_id, rdma->nb_sent);
} }
*wr_id_out = wc.wr_id; *wr_id_out = wc.wr_id;
@ -1482,9 +1451,8 @@ static int qemu_rdma_block_for_wrid(RDMAContext *rdma, int wrid_requested,
break; break;
} }
if (wr_id != wrid_requested) { if (wr_id != wrid_requested) {
DDDPRINTF("A Wanted wrid %s (%d) but got %s (%" PRIu64 ")\n", trace_qemu_rdma_block_for_wrid_miss(print_wrid(wrid_requested),
print_wrid(wrid_requested), wrid_requested, print_wrid(wr_id), wr_id);
wrid_requested, print_wrid(wr_id), wr_id);
} }
} }
@ -1524,9 +1492,8 @@ static int qemu_rdma_block_for_wrid(RDMAContext *rdma, int wrid_requested,
break; break;
} }
if (wr_id != wrid_requested) { if (wr_id != wrid_requested) {
DDDPRINTF("B Wanted wrid %s (%d) but got %s (%" PRIu64 ")\n", trace_qemu_rdma_block_for_wrid_miss(print_wrid(wrid_requested),
print_wrid(wrid_requested), wrid_requested, wrid_requested, print_wrid(wr_id), wr_id);
print_wrid(wr_id), wr_id);
} }
} }
@ -1571,7 +1538,7 @@ static int qemu_rdma_post_send_control(RDMAContext *rdma, uint8_t *buf,
.num_sge = 1, .num_sge = 1,
}; };
DDDPRINTF("CONTROL: sending %s..\n", control_desc[head->type]); trace_qemu_rdma_post_send_control(control_desc[head->type]);
/* /*
* We don't actually need to do a memcpy() in here if we used * We don't actually need to do a memcpy() in here if we used
@ -1593,13 +1560,13 @@ static int qemu_rdma_post_send_control(RDMAContext *rdma, uint8_t *buf,
ret = ibv_post_send(rdma->qp, &send_wr, &bad_wr); ret = ibv_post_send(rdma->qp, &send_wr, &bad_wr);
if (ret > 0) { if (ret > 0) {
fprintf(stderr, "Failed to use post IB SEND for control!\n"); error_report("Failed to use post IB SEND for control");
return -ret; return -ret;
} }
ret = qemu_rdma_block_for_wrid(rdma, RDMA_WRID_SEND_CONTROL, NULL); ret = qemu_rdma_block_for_wrid(rdma, RDMA_WRID_SEND_CONTROL, NULL);
if (ret < 0) { if (ret < 0) {
fprintf(stderr, "rdma migration: send polling control error!\n"); error_report("rdma migration: send polling control error");
} }
return ret; return ret;
@ -1643,32 +1610,31 @@ static int qemu_rdma_exchange_get_response(RDMAContext *rdma,
&byte_len); &byte_len);
if (ret < 0) { if (ret < 0) {
fprintf(stderr, "rdma migration: recv polling control error!\n"); error_report("rdma migration: recv polling control error!");
return ret; return ret;
} }
network_to_control((void *) rdma->wr_data[idx].control); network_to_control((void *) rdma->wr_data[idx].control);
memcpy(head, rdma->wr_data[idx].control, sizeof(RDMAControlHeader)); memcpy(head, rdma->wr_data[idx].control, sizeof(RDMAControlHeader));
DDDPRINTF("CONTROL: %s receiving...\n", control_desc[expecting]); trace_qemu_rdma_exchange_get_response_start(control_desc[expecting]);
if (expecting == RDMA_CONTROL_NONE) { if (expecting == RDMA_CONTROL_NONE) {
DDDPRINTF("Surprise: got %s (%d)\n", trace_qemu_rdma_exchange_get_response_none(control_desc[head->type],
control_desc[head->type], head->type); head->type);
} else if (head->type != expecting || head->type == RDMA_CONTROL_ERROR) { } else if (head->type != expecting || head->type == RDMA_CONTROL_ERROR) {
fprintf(stderr, "Was expecting a %s (%d) control message" error_report("Was expecting a %s (%d) control message"
", but got: %s (%d), length: %d\n", ", but got: %s (%d), length: %d",
control_desc[expecting], expecting, control_desc[expecting], expecting,
control_desc[head->type], head->type, head->len); control_desc[head->type], head->type, head->len);
return -EIO; return -EIO;
} }
if (head->len > RDMA_CONTROL_MAX_BUFFER - sizeof(*head)) { if (head->len > RDMA_CONTROL_MAX_BUFFER - sizeof(*head)) {
fprintf(stderr, "too long length: %d\n", head->len); error_report("too long length: %d\n", head->len);
return -EINVAL; return -EINVAL;
} }
if (sizeof(*head) + head->len != byte_len) { if (sizeof(*head) + head->len != byte_len) {
fprintf(stderr, "Malformed length: %d byte_len %d\n", error_report("Malformed length: %d byte_len %d", head->len, byte_len);
head->len, byte_len);
return -EINVAL; return -EINVAL;
} }
@ -1730,7 +1696,7 @@ static int qemu_rdma_exchange_send(RDMAContext *rdma, RDMAControlHeader *head,
if (resp) { if (resp) {
ret = qemu_rdma_post_recv_control(rdma, RDMA_WRID_DATA); ret = qemu_rdma_post_recv_control(rdma, RDMA_WRID_DATA);
if (ret) { if (ret) {
fprintf(stderr, "rdma migration: error posting" error_report("rdma migration: error posting"
" extra control recv for anticipated result!"); " extra control recv for anticipated result!");
return ret; return ret;
} }
@ -1741,7 +1707,7 @@ static int qemu_rdma_exchange_send(RDMAContext *rdma, RDMAControlHeader *head,
*/ */
ret = qemu_rdma_post_recv_control(rdma, RDMA_WRID_READY); ret = qemu_rdma_post_recv_control(rdma, RDMA_WRID_READY);
if (ret) { if (ret) {
fprintf(stderr, "rdma migration: error posting first control recv!"); error_report("rdma migration: error posting first control recv!");
return ret; return ret;
} }
@ -1751,7 +1717,7 @@ static int qemu_rdma_exchange_send(RDMAContext *rdma, RDMAControlHeader *head,
ret = qemu_rdma_post_send_control(rdma, data, head); ret = qemu_rdma_post_send_control(rdma, data, head);
if (ret < 0) { if (ret < 0) {
fprintf(stderr, "Failed to send control buffer!\n"); error_report("Failed to send control buffer!");
return ret; return ret;
} }
@ -1760,14 +1726,14 @@ static int qemu_rdma_exchange_send(RDMAContext *rdma, RDMAControlHeader *head,
*/ */
if (resp) { if (resp) {
if (callback) { if (callback) {
DDPRINTF("Issuing callback before receiving response...\n"); trace_qemu_rdma_exchange_send_issue_callback();
ret = callback(rdma); ret = callback(rdma);
if (ret < 0) { if (ret < 0) {
return ret; return ret;
} }
} }
DDPRINTF("Waiting for response %s\n", control_desc[resp->type]); trace_qemu_rdma_exchange_send_waiting(control_desc[resp->type]);
ret = qemu_rdma_exchange_get_response(rdma, resp, ret = qemu_rdma_exchange_get_response(rdma, resp,
resp->type, RDMA_WRID_DATA); resp->type, RDMA_WRID_DATA);
@ -1779,7 +1745,7 @@ static int qemu_rdma_exchange_send(RDMAContext *rdma, RDMAControlHeader *head,
if (resp_idx) { if (resp_idx) {
*resp_idx = RDMA_WRID_DATA; *resp_idx = RDMA_WRID_DATA;
} }
DDPRINTF("Response %s received.\n", control_desc[resp->type]); trace_qemu_rdma_exchange_send_received(control_desc[resp->type]);
} }
rdma->control_ready_expected = 1; rdma->control_ready_expected = 1;
@ -1807,7 +1773,7 @@ static int qemu_rdma_exchange_recv(RDMAContext *rdma, RDMAControlHeader *head,
ret = qemu_rdma_post_send_control(rdma, NULL, &ready); ret = qemu_rdma_post_send_control(rdma, NULL, &ready);
if (ret < 0) { if (ret < 0) {
fprintf(stderr, "Failed to send control buffer!\n"); error_report("Failed to send control buffer!");
return ret; return ret;
} }
@ -1828,7 +1794,7 @@ static int qemu_rdma_exchange_recv(RDMAContext *rdma, RDMAControlHeader *head,
*/ */
ret = qemu_rdma_post_recv_control(rdma, RDMA_WRID_READY); ret = qemu_rdma_post_recv_control(rdma, RDMA_WRID_READY);
if (ret) { if (ret) {
fprintf(stderr, "rdma migration: error posting second control recv!"); error_report("rdma migration: error posting second control recv!");
return ret; return ret;
} }
@ -1882,8 +1848,9 @@ retry:
} }
} }
DDPRINTF("Writing %" PRIu64 " chunks, (%" PRIu64 " MB)\n", trace_qemu_rdma_write_one_top(chunks + 1,
chunks + 1, (chunks + 1) * (1UL << RDMA_REG_CHUNK_SHIFT) / 1024 / 1024); (chunks + 1) *
(1UL << RDMA_REG_CHUNK_SHIFT) / 1024 / 1024);
chunk_end = ram_chunk_end(block, chunk + chunks); chunk_end = ram_chunk_end(block, chunk + chunks);
@ -1895,17 +1862,15 @@ retry:
while (test_bit(chunk, block->transit_bitmap)) { while (test_bit(chunk, block->transit_bitmap)) {
(void)count; (void)count;
DDPRINTF("(%d) Not clobbering: block: %d chunk %" PRIu64 trace_qemu_rdma_write_one_block(count++, current_index, chunk,
" current %" PRIu64 " len %" PRIu64 " %d %d\n",
count++, current_index, chunk,
sge.addr, length, rdma->nb_sent, block->nb_chunks); sge.addr, length, rdma->nb_sent, block->nb_chunks);
ret = qemu_rdma_block_for_wrid(rdma, RDMA_WRID_RDMA_WRITE, NULL); ret = qemu_rdma_block_for_wrid(rdma, RDMA_WRID_RDMA_WRITE, NULL);
if (ret < 0) { if (ret < 0) {
fprintf(stderr, "Failed to Wait for previous write to complete " error_report("Failed to Wait for previous write to complete "
"block %d chunk %" PRIu64 "block %d chunk %" PRIu64
" current %" PRIu64 " len %" PRIu64 " %d\n", " current %" PRIu64 " len %" PRIu64 " %d",
current_index, chunk, sge.addr, length, rdma->nb_sent); current_index, chunk, sge.addr, length, rdma->nb_sent);
return ret; return ret;
} }
@ -1932,10 +1897,8 @@ retry:
head.len = sizeof(comp); head.len = sizeof(comp);
head.type = RDMA_CONTROL_COMPRESS; head.type = RDMA_CONTROL_COMPRESS;
DDPRINTF("Entire chunk is zero, sending compress: %" trace_qemu_rdma_write_one_zero(chunk, sge.length,
PRIu64 " for %d " current_index, current_addr);
"bytes, index: %d, offset: %" PRId64 "...\n",
chunk, sge.length, current_index, current_addr);
compress_to_network(&comp); compress_to_network(&comp);
ret = qemu_rdma_exchange_send(rdma, &head, ret = qemu_rdma_exchange_send(rdma, &head,
@ -1961,9 +1924,8 @@ retry:
} }
reg.chunks = chunks; reg.chunks = chunks;
DDPRINTF("Sending registration request chunk %" PRIu64 " for %d " trace_qemu_rdma_write_one_sendreg(chunk, sge.length, current_index,
"bytes, index: %d, offset: %" PRId64 "...\n", current_addr);
chunk, sge.length, current_index, current_addr);
register_to_network(&reg); register_to_network(&reg);
ret = qemu_rdma_exchange_send(rdma, &head, (uint8_t *) &reg, ret = qemu_rdma_exchange_send(rdma, &head, (uint8_t *) &reg,
@ -1977,7 +1939,7 @@ retry:
(uint8_t *) sge.addr, (uint8_t *) sge.addr,
&sge.lkey, NULL, chunk, &sge.lkey, NULL, chunk,
chunk_start, chunk_end)) { chunk_start, chunk_end)) {
fprintf(stderr, "cannot get lkey!\n"); error_report("cannot get lkey");
return -EINVAL; return -EINVAL;
} }
@ -1986,9 +1948,8 @@ retry:
network_to_result(reg_result); network_to_result(reg_result);
DDPRINTF("Received registration result:" trace_qemu_rdma_write_one_recvregres(block->remote_keys[chunk],
" my key: %x their key %x, chunk %" PRIu64 "\n", reg_result->rkey, chunk);
block->remote_keys[chunk], reg_result->rkey, chunk);
block->remote_keys[chunk] = reg_result->rkey; block->remote_keys[chunk] = reg_result->rkey;
block->remote_host_addr = reg_result->host_addr; block->remote_host_addr = reg_result->host_addr;
@ -1998,7 +1959,7 @@ retry:
(uint8_t *)sge.addr, (uint8_t *)sge.addr,
&sge.lkey, NULL, chunk, &sge.lkey, NULL, chunk,
chunk_start, chunk_end)) { chunk_start, chunk_end)) {
fprintf(stderr, "cannot get lkey!\n"); error_report("cannot get lkey!");
return -EINVAL; return -EINVAL;
} }
} }
@ -2010,7 +1971,7 @@ retry:
if (qemu_rdma_register_and_get_keys(rdma, block, (uint8_t *)sge.addr, if (qemu_rdma_register_and_get_keys(rdma, block, (uint8_t *)sge.addr,
&sge.lkey, NULL, chunk, &sge.lkey, NULL, chunk,
chunk_start, chunk_end)) { chunk_start, chunk_end)) {
fprintf(stderr, "cannot get lkey!\n"); error_report("cannot get lkey!");
return -EINVAL; return -EINVAL;
} }
} }
@ -2031,10 +1992,8 @@ retry:
send_wr.wr.rdma.remote_addr = block->remote_host_addr + send_wr.wr.rdma.remote_addr = block->remote_host_addr +
(current_addr - block->offset); (current_addr - block->offset);
DDDPRINTF("Posting chunk: %" PRIu64 ", addr: %lx" trace_qemu_rdma_write_one_post(chunk, sge.addr, send_wr.wr.rdma.remote_addr,
" remote: %lx, bytes %" PRIu32 "\n", sge.length);
chunk, sge.addr, send_wr.wr.rdma.remote_addr,
sge.length);
/* /*
* ibv_post_send() does not return negative error numbers, * ibv_post_send() does not return negative error numbers,
@ -2043,11 +2002,11 @@ retry:
ret = ibv_post_send(rdma->qp, &send_wr, &bad_wr); ret = ibv_post_send(rdma->qp, &send_wr, &bad_wr);
if (ret == ENOMEM) { if (ret == ENOMEM) {
DDPRINTF("send queue is full. wait a little....\n"); trace_qemu_rdma_write_one_queue_full();
ret = qemu_rdma_block_for_wrid(rdma, RDMA_WRID_RDMA_WRITE, NULL); ret = qemu_rdma_block_for_wrid(rdma, RDMA_WRID_RDMA_WRITE, NULL);
if (ret < 0) { if (ret < 0) {
fprintf(stderr, "rdma migration: failed to make " error_report("rdma migration: failed to make "
"room in full send queue! %d\n", ret); "room in full send queue! %d", ret);
return ret; return ret;
} }
@ -2088,7 +2047,7 @@ static int qemu_rdma_write_flush(QEMUFile *f, RDMAContext *rdma)
if (ret == 0) { if (ret == 0) {
rdma->nb_sent++; rdma->nb_sent++;
DDDPRINTF("sent total: %d\n", rdma->nb_sent); trace_qemu_rdma_write_flush(rdma->nb_sent);
} }
rdma->current_length = 0; rdma->current_length = 0;
@ -2173,7 +2132,7 @@ static int qemu_rdma_write(QEMUFile *f, RDMAContext *rdma,
ret = qemu_rdma_search_ram_block(rdma, block_offset, ret = qemu_rdma_search_ram_block(rdma, block_offset,
offset, len, &index, &chunk); offset, len, &index, &chunk);
if (ret) { if (ret) {
fprintf(stderr, "ram block search failed\n"); error_report("ram block search failed");
return ret; return ret;
} }
rdma->current_index = index; rdma->current_index = index;
@ -2202,19 +2161,19 @@ static void qemu_rdma_cleanup(RDMAContext *rdma)
.type = RDMA_CONTROL_ERROR, .type = RDMA_CONTROL_ERROR,
.repeat = 1, .repeat = 1,
}; };
fprintf(stderr, "Early error. Sending error.\n"); error_report("Early error. Sending error.");
qemu_rdma_post_send_control(rdma, NULL, &head); qemu_rdma_post_send_control(rdma, NULL, &head);
} }
ret = rdma_disconnect(rdma->cm_id); ret = rdma_disconnect(rdma->cm_id);
if (!ret) { if (!ret) {
DDPRINTF("waiting for disconnect\n"); trace_qemu_rdma_cleanup_waiting_for_disconnect();
ret = rdma_get_cm_event(rdma->channel, &cm_event); ret = rdma_get_cm_event(rdma->channel, &cm_event);
if (!ret) { if (!ret) {
rdma_ack_cm_event(cm_event); rdma_ack_cm_event(cm_event);
} }
} }
DDPRINTF("Disconnected.\n"); trace_qemu_rdma_cleanup_disconnect();
rdma->connected = false; rdma->connected = false;
} }
@ -2341,7 +2300,7 @@ static int qemu_rdma_connect(RDMAContext *rdma, Error **errp)
* on the source first requested the capability. * on the source first requested the capability.
*/ */
if (rdma->pin_all) { if (rdma->pin_all) {
DPRINTF("Server pin-all memory requested.\n"); trace_qemu_rdma_connect_pin_all_requested();
cap.flags |= RDMA_CAPABILITY_PIN_ALL; cap.flags |= RDMA_CAPABILITY_PIN_ALL;
} }
@ -2389,7 +2348,7 @@ static int qemu_rdma_connect(RDMAContext *rdma, Error **errp)
rdma->pin_all = false; rdma->pin_all = false;
} }
DPRINTF("Pin all memory: %s\n", rdma->pin_all ? "enabled" : "disabled"); trace_qemu_rdma_connect_pin_all_outcome(rdma->pin_all);
rdma_ack_cm_event(cm_event); rdma_ack_cm_event(cm_event);
@ -2456,7 +2415,7 @@ static int qemu_rdma_dest_init(RDMAContext *rdma, Error **errp)
for (e = res; e != NULL; e = e->ai_next) { for (e = res; e != NULL; e = e->ai_next) {
inet_ntop(e->ai_family, inet_ntop(e->ai_family,
&((struct sockaddr_in *) e->ai_dst_addr)->sin_addr, ip, sizeof ip); &((struct sockaddr_in *) e->ai_dst_addr)->sin_addr, ip, sizeof ip);
DPRINTF("Trying %s => %s\n", rdma->host, ip); trace_qemu_rdma_dest_init_trying(rdma->host, ip);
ret = rdma_bind_addr(listen_id, e->ai_dst_addr); ret = rdma_bind_addr(listen_id, e->ai_dst_addr);
if (!ret) { if (!ret) {
if (e->ai_family == AF_INET6) { if (e->ai_family == AF_INET6) {
@ -2575,8 +2534,7 @@ static size_t qemu_rdma_fill(RDMAContext *rdma, uint8_t *buf,
size_t len = 0; size_t len = 0;
if (rdma->wr_data[idx].control_len) { if (rdma->wr_data[idx].control_len) {
DDDPRINTF("RDMA %" PRId64 " of %d bytes already in buffer\n", trace_qemu_rdma_fill(rdma->wr_data[idx].control_len, size);
rdma->wr_data[idx].control_len, size);
len = MIN(size, rdma->wr_data[idx].control_len); len = MIN(size, rdma->wr_data[idx].control_len);
memcpy(buf, rdma->wr_data[idx].control_curr, len); memcpy(buf, rdma->wr_data[idx].control_curr, len);
@ -2643,7 +2601,7 @@ static int qemu_rdma_drain_cq(QEMUFile *f, RDMAContext *rdma)
while (rdma->nb_sent) { while (rdma->nb_sent) {
ret = qemu_rdma_block_for_wrid(rdma, RDMA_WRID_RDMA_WRITE, NULL); ret = qemu_rdma_block_for_wrid(rdma, RDMA_WRID_RDMA_WRITE, NULL);
if (ret < 0) { if (ret < 0) {
fprintf(stderr, "rdma migration: complete polling error!\n"); error_report("rdma migration: complete polling error!");
return -EIO; return -EIO;
} }
} }
@ -2655,7 +2613,7 @@ static int qemu_rdma_drain_cq(QEMUFile *f, RDMAContext *rdma)
static int qemu_rdma_close(void *opaque) static int qemu_rdma_close(void *opaque)
{ {
DPRINTF("Shutting down connection.\n"); trace_qemu_rdma_close();
QEMUFileRDMA *r = opaque; QEMUFileRDMA *r = opaque;
if (r->rdma) { if (r->rdma) {
qemu_rdma_cleanup(r->rdma); qemu_rdma_cleanup(r->rdma);
@ -2719,7 +2677,7 @@ static size_t qemu_rdma_save_page(QEMUFile *f, void *opaque,
*/ */
ret = qemu_rdma_write(f, rdma, block_offset, offset, size); ret = qemu_rdma_write(f, rdma, block_offset, offset, size);
if (ret < 0) { if (ret < 0) {
fprintf(stderr, "rdma migration: write error! %d\n", ret); error_report("rdma migration: write error! %d", ret);
goto err; goto err;
} }
@ -2752,7 +2710,7 @@ static size_t qemu_rdma_save_page(QEMUFile *f, void *opaque,
offset, size, &index, &chunk); offset, size, &index, &chunk);
if (ret) { if (ret) {
fprintf(stderr, "ram block search failed\n"); error_report("ram block search failed");
goto err; goto err;
} }
@ -2779,7 +2737,7 @@ static size_t qemu_rdma_save_page(QEMUFile *f, void *opaque,
uint64_t wr_id, wr_id_in; uint64_t wr_id, wr_id_in;
int ret = qemu_rdma_poll(rdma, &wr_id_in, NULL); int ret = qemu_rdma_poll(rdma, &wr_id_in, NULL);
if (ret < 0) { if (ret < 0) {
fprintf(stderr, "rdma migration: polling error! %d\n", ret); error_report("rdma migration: polling error! %d", ret);
goto err; goto err;
} }
@ -2824,7 +2782,7 @@ static int qemu_rdma_accept(RDMAContext *rdma)
network_to_caps(&cap); network_to_caps(&cap);
if (cap.version < 1 || cap.version > RDMA_CONTROL_VERSION_CURRENT) { if (cap.version < 1 || cap.version > RDMA_CONTROL_VERSION_CURRENT) {
fprintf(stderr, "Unknown source RDMA version: %d, bailing...\n", error_report("Unknown source RDMA version: %d, bailing...",
cap.version); cap.version);
rdma_ack_cm_event(cm_event); rdma_ack_cm_event(cm_event);
goto err_rdma_dest_wait; goto err_rdma_dest_wait;
@ -2848,17 +2806,17 @@ static int qemu_rdma_accept(RDMAContext *rdma)
rdma_ack_cm_event(cm_event); rdma_ack_cm_event(cm_event);
DPRINTF("Memory pin all: %s\n", rdma->pin_all ? "enabled" : "disabled"); trace_qemu_rdma_accept_pin_state(rdma->pin_all);
caps_to_network(&cap); caps_to_network(&cap);
DPRINTF("verbs context after listen: %p\n", verbs); trace_qemu_rdma_accept_pin_verbsc(verbs);
if (!rdma->verbs) { if (!rdma->verbs) {
rdma->verbs = verbs; rdma->verbs = verbs;
} else if (rdma->verbs != verbs) { } else if (rdma->verbs != verbs) {
fprintf(stderr, "ibv context not matching %p, %p!\n", error_report("ibv context not matching %p, %p!", rdma->verbs,
rdma->verbs, verbs); verbs);
goto err_rdma_dest_wait; goto err_rdma_dest_wait;
} }
@ -2866,26 +2824,26 @@ static int qemu_rdma_accept(RDMAContext *rdma)
ret = qemu_rdma_alloc_pd_cq(rdma); ret = qemu_rdma_alloc_pd_cq(rdma);
if (ret) { if (ret) {
fprintf(stderr, "rdma migration: error allocating pd and cq!\n"); error_report("rdma migration: error allocating pd and cq!");
goto err_rdma_dest_wait; goto err_rdma_dest_wait;
} }
ret = qemu_rdma_alloc_qp(rdma); ret = qemu_rdma_alloc_qp(rdma);
if (ret) { if (ret) {
fprintf(stderr, "rdma migration: error allocating qp!\n"); error_report("rdma migration: error allocating qp!");
goto err_rdma_dest_wait; goto err_rdma_dest_wait;
} }
ret = qemu_rdma_init_ram_blocks(rdma); ret = qemu_rdma_init_ram_blocks(rdma);
if (ret) { if (ret) {
fprintf(stderr, "rdma migration: error initializing ram blocks!\n"); error_report("rdma migration: error initializing ram blocks!");
goto err_rdma_dest_wait; goto err_rdma_dest_wait;
} }
for (idx = 0; idx < RDMA_WRID_MAX; idx++) { for (idx = 0; idx < RDMA_WRID_MAX; idx++) {
ret = qemu_rdma_reg_control(rdma, idx); ret = qemu_rdma_reg_control(rdma, idx);
if (ret) { if (ret) {
fprintf(stderr, "rdma: error registering %d control!\n", idx); error_report("rdma: error registering %d control", idx);
goto err_rdma_dest_wait; goto err_rdma_dest_wait;
} }
} }
@ -2894,18 +2852,18 @@ static int qemu_rdma_accept(RDMAContext *rdma)
ret = rdma_accept(rdma->cm_id, &conn_param); ret = rdma_accept(rdma->cm_id, &conn_param);
if (ret) { if (ret) {
fprintf(stderr, "rdma_accept returns %d!\n", ret); error_report("rdma_accept returns %d", ret);
goto err_rdma_dest_wait; goto err_rdma_dest_wait;
} }
ret = rdma_get_cm_event(rdma->channel, &cm_event); ret = rdma_get_cm_event(rdma->channel, &cm_event);
if (ret) { if (ret) {
fprintf(stderr, "rdma_accept get_cm_event failed %d!\n", ret); error_report("rdma_accept get_cm_event failed %d", ret);
goto err_rdma_dest_wait; goto err_rdma_dest_wait;
} }
if (cm_event->event != RDMA_CM_EVENT_ESTABLISHED) { if (cm_event->event != RDMA_CM_EVENT_ESTABLISHED) {
fprintf(stderr, "rdma_accept not event established!\n"); error_report("rdma_accept not event established");
rdma_ack_cm_event(cm_event); rdma_ack_cm_event(cm_event);
goto err_rdma_dest_wait; goto err_rdma_dest_wait;
} }
@ -2915,7 +2873,7 @@ static int qemu_rdma_accept(RDMAContext *rdma)
ret = qemu_rdma_post_recv_control(rdma, RDMA_WRID_READY); ret = qemu_rdma_post_recv_control(rdma, RDMA_WRID_READY);
if (ret) { if (ret) {
fprintf(stderr, "rdma migration: error posting second control recv!\n"); error_report("rdma migration: error posting second control recv");
goto err_rdma_dest_wait; goto err_rdma_dest_wait;
} }
@ -2969,7 +2927,7 @@ static int qemu_rdma_registration_handle(QEMUFile *f, void *opaque,
CHECK_ERROR_STATE(); CHECK_ERROR_STATE();
do { do {
DDDPRINTF("Waiting for next request %" PRIu64 "...\n", flags); trace_qemu_rdma_registration_handle_wait(flags);
ret = qemu_rdma_exchange_recv(rdma, &head, RDMA_CONTROL_NONE); ret = qemu_rdma_exchange_recv(rdma, &head, RDMA_CONTROL_NONE);
@ -2978,8 +2936,8 @@ static int qemu_rdma_registration_handle(QEMUFile *f, void *opaque,
} }
if (head.repeat > RDMA_CONTROL_MAX_COMMANDS_PER_MESSAGE) { if (head.repeat > RDMA_CONTROL_MAX_COMMANDS_PER_MESSAGE) {
fprintf(stderr, "rdma: Too many requests in this message (%d)." error_report("rdma: Too many requests in this message (%d)."
"Bailing.\n", head.repeat); "Bailing.", head.repeat);
ret = -EIO; ret = -EIO;
break; break;
} }
@ -2989,9 +2947,9 @@ static int qemu_rdma_registration_handle(QEMUFile *f, void *opaque,
comp = (RDMACompress *) rdma->wr_data[idx].control_curr; comp = (RDMACompress *) rdma->wr_data[idx].control_curr;
network_to_compress(comp); network_to_compress(comp);
DDPRINTF("Zapping zero chunk: %" PRId64 trace_qemu_rdma_registration_handle_compress(comp->length,
" bytes, index %d, offset %" PRId64 "\n", comp->block_idx,
comp->length, comp->block_idx, comp->offset); comp->offset);
block = &(rdma->local_ram_blocks.block[comp->block_idx]); block = &(rdma->local_ram_blocks.block[comp->block_idx]);
host_addr = block->local_host_addr + host_addr = block->local_host_addr +
@ -3001,17 +2959,17 @@ static int qemu_rdma_registration_handle(QEMUFile *f, void *opaque,
break; break;
case RDMA_CONTROL_REGISTER_FINISHED: case RDMA_CONTROL_REGISTER_FINISHED:
DDDPRINTF("Current registrations complete.\n"); trace_qemu_rdma_registration_handle_finished();
goto out; goto out;
case RDMA_CONTROL_RAM_BLOCKS_REQUEST: case RDMA_CONTROL_RAM_BLOCKS_REQUEST:
DPRINTF("Initial setup info requested.\n"); trace_qemu_rdma_registration_handle_ram_blocks();
if (rdma->pin_all) { if (rdma->pin_all) {
ret = qemu_rdma_reg_whole_ram_blocks(rdma); ret = qemu_rdma_reg_whole_ram_blocks(rdma);
if (ret) { if (ret) {
fprintf(stderr, "rdma migration: error dest " error_report("rdma migration: error dest "
"registering ram blocks!\n"); "registering ram blocks");
goto out; goto out;
} }
} }
@ -3044,13 +3002,13 @@ static int qemu_rdma_registration_handle(QEMUFile *f, void *opaque,
(uint8_t *) rdma->block, &blocks); (uint8_t *) rdma->block, &blocks);
if (ret < 0) { if (ret < 0) {
fprintf(stderr, "rdma migration: error sending remote info!\n"); error_report("rdma migration: error sending remote info");
goto out; goto out;
} }
break; break;
case RDMA_CONTROL_REGISTER_REQUEST: case RDMA_CONTROL_REGISTER_REQUEST:
DDPRINTF("There are %d registration requests\n", head.repeat); trace_qemu_rdma_registration_handle_register(head.repeat);
reg_resp.repeat = head.repeat; reg_resp.repeat = head.repeat;
registers = (RDMARegister *) rdma->wr_data[idx].control_curr; registers = (RDMARegister *) rdma->wr_data[idx].control_curr;
@ -3064,8 +3022,7 @@ static int qemu_rdma_registration_handle(QEMUFile *f, void *opaque,
reg_result = &results[count]; reg_result = &results[count];
DDPRINTF("Registration request (%d): index %d, current_addr %" trace_qemu_rdma_registration_handle_register_loop(count,
PRIu64 " chunks: %" PRIu64 "\n", count,
reg->current_index, reg->key.current_addr, reg->chunks); reg->current_index, reg->key.current_addr, reg->chunks);
block = &(rdma->local_ram_blocks.block[reg->current_index]); block = &(rdma->local_ram_blocks.block[reg->current_index]);
@ -3084,15 +3041,15 @@ static int qemu_rdma_registration_handle(QEMUFile *f, void *opaque,
if (qemu_rdma_register_and_get_keys(rdma, block, if (qemu_rdma_register_and_get_keys(rdma, block,
(uint8_t *)host_addr, NULL, &reg_result->rkey, (uint8_t *)host_addr, NULL, &reg_result->rkey,
chunk, chunk_start, chunk_end)) { chunk, chunk_start, chunk_end)) {
fprintf(stderr, "cannot get rkey!\n"); error_report("cannot get rkey");
ret = -EINVAL; ret = -EINVAL;
goto out; goto out;
} }
reg_result->host_addr = (uint64_t) block->local_host_addr; reg_result->host_addr = (uint64_t) block->local_host_addr;
DDPRINTF("Registered rkey for this request: %x\n", trace_qemu_rdma_registration_handle_register_rkey(
reg_result->rkey); reg_result->rkey);
result_to_network(reg_result); result_to_network(reg_result);
} }
@ -3101,12 +3058,12 @@ static int qemu_rdma_registration_handle(QEMUFile *f, void *opaque,
(uint8_t *) results, &reg_resp); (uint8_t *) results, &reg_resp);
if (ret < 0) { if (ret < 0) {
fprintf(stderr, "Failed to send control buffer!\n"); error_report("Failed to send control buffer");
goto out; goto out;
} }
break; break;
case RDMA_CONTROL_UNREGISTER_REQUEST: case RDMA_CONTROL_UNREGISTER_REQUEST:
DDPRINTF("There are %d unregistration requests\n", head.repeat); trace_qemu_rdma_registration_handle_unregister(head.repeat);
unreg_resp.repeat = head.repeat; unreg_resp.repeat = head.repeat;
registers = (RDMARegister *) rdma->wr_data[idx].control_curr; registers = (RDMARegister *) rdma->wr_data[idx].control_curr;
@ -3114,9 +3071,8 @@ static int qemu_rdma_registration_handle(QEMUFile *f, void *opaque,
reg = &registers[count]; reg = &registers[count];
network_to_register(reg); network_to_register(reg);
DDPRINTF("Unregistration request (%d): " trace_qemu_rdma_registration_handle_unregister_loop(count,
" index %d, chunk %" PRIu64 "\n", reg->current_index, reg->key.chunk);
count, reg->current_index, reg->key.chunk);
block = &(rdma->local_ram_blocks.block[reg->current_index]); block = &(rdma->local_ram_blocks.block[reg->current_index]);
@ -3131,24 +3087,23 @@ static int qemu_rdma_registration_handle(QEMUFile *f, void *opaque,
rdma->total_registrations--; rdma->total_registrations--;
DDPRINTF("Unregistered chunk %" PRIu64 " successfully.\n", trace_qemu_rdma_registration_handle_unregister_success(
reg->key.chunk); reg->key.chunk);
} }
ret = qemu_rdma_post_send_control(rdma, NULL, &unreg_resp); ret = qemu_rdma_post_send_control(rdma, NULL, &unreg_resp);
if (ret < 0) { if (ret < 0) {
fprintf(stderr, "Failed to send control buffer!\n"); error_report("Failed to send control buffer");
goto out; goto out;
} }
break; break;
case RDMA_CONTROL_REGISTER_RESULT: case RDMA_CONTROL_REGISTER_RESULT:
fprintf(stderr, "Invalid RESULT message at dest.\n"); error_report("Invalid RESULT message at dest.");
ret = -EIO; ret = -EIO;
goto out; goto out;
default: default:
fprintf(stderr, "Unknown control message %s\n", error_report("Unknown control message %s", control_desc[head.type]);
control_desc[head.type]);
ret = -EIO; ret = -EIO;
goto out; goto out;
} }
@ -3168,7 +3123,7 @@ static int qemu_rdma_registration_start(QEMUFile *f, void *opaque,
CHECK_ERROR_STATE(); CHECK_ERROR_STATE();
DDDPRINTF("start section: %" PRIu64 "\n", flags); trace_qemu_rdma_registration_start(flags);
qemu_put_be64(f, RAM_SAVE_FLAG_HOOK); qemu_put_be64(f, RAM_SAVE_FLAG_HOOK);
qemu_fflush(f); qemu_fflush(f);
@ -3203,7 +3158,7 @@ static int qemu_rdma_registration_stop(QEMUFile *f, void *opaque,
int reg_result_idx, i, j, nb_remote_blocks; int reg_result_idx, i, j, nb_remote_blocks;
head.type = RDMA_CONTROL_RAM_BLOCKS_REQUEST; head.type = RDMA_CONTROL_RAM_BLOCKS_REQUEST;
DPRINTF("Sending registration setup for ram blocks...\n"); trace_qemu_rdma_registration_stop_ram();
/* /*
* Make sure that we parallelize the pinning on both sides. * Make sure that we parallelize the pinning on both sides.
@ -3275,7 +3230,7 @@ static int qemu_rdma_registration_stop(QEMUFile *f, void *opaque,
} }
} }
DDDPRINTF("Sending registration finish %" PRIu64 "...\n", flags); trace_qemu_rdma_registration_stop(flags);
head.type = RDMA_CONTROL_REGISTER_FINISHED; head.type = RDMA_CONTROL_REGISTER_FINISHED;
ret = qemu_rdma_exchange_send(rdma, &head, NULL, NULL, NULL, NULL); ret = qemu_rdma_exchange_send(rdma, &head, NULL, NULL, NULL, NULL);
@ -3339,7 +3294,7 @@ static void rdma_accept_incoming_migration(void *opaque)
QEMUFile *f; QEMUFile *f;
Error *local_err = NULL, **errp = &local_err; Error *local_err = NULL, **errp = &local_err;
DPRINTF("Accepting rdma connection...\n"); trace_qemu_dma_accept_incoming_migration();
ret = qemu_rdma_accept(rdma); ret = qemu_rdma_accept(rdma);
if (ret) { if (ret) {
@ -3347,7 +3302,7 @@ static void rdma_accept_incoming_migration(void *opaque)
return; return;
} }
DPRINTF("Accepted migration\n"); trace_qemu_dma_accept_incoming_migration_accepted();
f = qemu_fopen_rdma(rdma, "rb"); f = qemu_fopen_rdma(rdma, "rb");
if (f == NULL) { if (f == NULL) {
@ -3366,7 +3321,7 @@ void rdma_start_incoming_migration(const char *host_port, Error **errp)
RDMAContext *rdma; RDMAContext *rdma;
Error *local_err = NULL; Error *local_err = NULL;
DPRINTF("Starting RDMA-based incoming migration\n"); trace_rdma_start_incoming_migration();
rdma = qemu_rdma_data_init(host_port, &local_err); rdma = qemu_rdma_data_init(host_port, &local_err);
if (rdma == NULL) { if (rdma == NULL) {
@ -3379,7 +3334,7 @@ void rdma_start_incoming_migration(const char *host_port, Error **errp)
goto err; goto err;
} }
DPRINTF("qemu_rdma_dest_init success\n"); trace_rdma_start_incoming_migration_after_dest_init();
ret = rdma_listen(rdma->listen_id, 5); ret = rdma_listen(rdma->listen_id, 5);
@ -3388,7 +3343,7 @@ void rdma_start_incoming_migration(const char *host_port, Error **errp)
goto err; goto err;
} }
DPRINTF("rdma_listen success\n"); trace_rdma_start_incoming_migration_after_rdma_listen();
qemu_set_fd_handler2(rdma->channel->fd, NULL, qemu_set_fd_handler2(rdma->channel->fd, NULL,
rdma_accept_incoming_migration, NULL, rdma_accept_incoming_migration, NULL,
@ -3419,14 +3374,14 @@ void rdma_start_outgoing_migration(void *opaque,
goto err; goto err;
} }
DPRINTF("qemu_rdma_source_init success\n"); trace_rdma_start_outgoing_migration_after_rdma_source_init();
ret = qemu_rdma_connect(rdma, &local_err); ret = qemu_rdma_connect(rdma, &local_err);
if (ret) { if (ret) {
goto err; goto err;
} }
DPRINTF("qemu_rdma_source_connect success\n"); trace_rdma_start_outgoing_migration_after_rdma_connect();
s->file = qemu_fopen_rdma(rdma, "wb"); s->file = qemu_fopen_rdma(rdma, "wb");
migrate_fd_connect(s); migrate_fd_connect(s);

View File

@ -1335,6 +1335,68 @@ migrate_fd_cancel(void) ""
migrate_pending(uint64_t size, uint64_t max) "pending size %" PRIu64 " max %" PRIu64 migrate_pending(uint64_t size, uint64_t max) "pending size %" PRIu64 " max %" PRIu64
migrate_transferred(uint64_t tranferred, uint64_t time_spent, double bandwidth, uint64_t size) "transferred %" PRIu64 " time_spent %" PRIu64 " bandwidth %g max_size %" PRId64 migrate_transferred(uint64_t tranferred, uint64_t time_spent, double bandwidth, uint64_t size) "transferred %" PRIu64 " time_spent %" PRIu64 " bandwidth %g max_size %" PRId64
# migration/rdma.c
__qemu_rdma_add_block(int block, uint64_t addr, uint64_t offset, uint64_t len, uint64_t end, uint64_t bits, int chunks) "Added Block: %d, addr: %" PRIu64 ", offset: %" PRIu64 " length: %" PRIu64 " end: %" PRIu64 " bits %" PRIu64 " chunks %d"
__qemu_rdma_delete_block(int block, uint64_t addr, uint64_t offset, uint64_t len, uint64_t end, uint64_t bits, int chunks) "Deleted Block: %d, addr: %" PRIu64 ", offset: %" PRIu64 " length: %" PRIu64 " end: %" PRIu64 " bits %" PRIu64 " chunks %d"
qemu_dma_accept_incoming_migration(void) ""
qemu_dma_accept_incoming_migration_accepted(void) ""
qemu_rdma_accept_pin_state(bool pin) "%d"
qemu_rdma_accept_pin_verbsc(void *verbs) "Verbs context after listen: %p"
qemu_rdma_block_for_wrid_miss(const char *wcompstr, int wcomp, const char *gcompstr, uint64_t req) "A Wanted wrid %s (%d) but got %s (%" PRIu64 ")"
qemu_rdma_block_for_wrid_miss_b(const char *wcompstr, int wcomp, const char *gcompstr, uint64_t req) "B Wanted wrid %s (%d) but got %s (%" PRIu64 ")"
qemu_rdma_cleanup_disconnect(void) ""
qemu_rdma_cleanup_waiting_for_disconnect(void) ""
qemu_rdma_close(void) ""
qemu_rdma_connect_pin_all_requested(void) ""
qemu_rdma_connect_pin_all_outcome(bool pin) "%d"
qemu_rdma_dest_init_trying(const char *host, const char *ip) "%s => %s"
qemu_rdma_dump_gid(const char *who, const char *src, const char *dst) "%s Source GID: %s, Dest GID: %s"
qemu_rdma_exchange_get_response_start(const char *desc) "CONTROL: %s receiving..."
qemu_rdma_exchange_get_response_none(const char *desc, int type) "Surprise: got %s (%d)"
qemu_rdma_exchange_send_issue_callback(void) ""
qemu_rdma_exchange_send_waiting(const char *desc) "Waiting for response %s"
qemu_rdma_exchange_send_received(const char *desc) "Response %s received."
qemu_rdma_fill(int64_t control_len, int size) "RDMA %" PRId64 " of %d bytes already in buffer"
qemu_rdma_init_ram_blocks(int blocks) "Allocated %d local ram block structures"
qemu_rdma_poll_recv(const char *compstr, int64_t comp, int64_t id, int sent) "completion %s #%" PRId64 " received (%" PRId64 ") left %d"
qemu_rdma_poll_write(const char *compstr, int64_t comp, int left, uint64_t block, uint64_t chunk, void *local, void *remote) "completions %s (%" PRId64 ") left %d, block %" PRIu64 ", chunk: %" PRIu64 " %p %p"
qemu_rdma_poll_other(const char *compstr, int64_t comp, int left) "other completion %s (%" PRId64 ") received left %d"
qemu_rdma_post_send_control(const char *desc) "CONTROL: sending %s.."
qemu_rdma_register_and_get_keys(uint64_t len, void *start) "Registering %" PRIu64 " bytes @ %p"
qemu_rdma_registration_handle_compress(int64_t length, int index, int64_t offset) "Zapping zero chunk: %" PRId64 " bytes, index %d, offset %" PRId64
qemu_rdma_registration_handle_finished(void) ""
qemu_rdma_registration_handle_ram_blocks(void) ""
qemu_rdma_registration_handle_register(int requests) "%d requests"
qemu_rdma_registration_handle_register_loop(int req, int index, uint64_t addr, uint64_t chunks) "Registration request (%d): index %d, current_addr %" PRIu64 " chunks: %" PRIu64
qemu_rdma_registration_handle_register_rkey(int rkey) "%x"
qemu_rdma_registration_handle_unregister(int requests) "%d requests"
qemu_rdma_registration_handle_unregister_loop(int count, int index, uint64_t chunk) "Unregistration request (%d): index %d, chunk %" PRIu64
qemu_rdma_registration_handle_unregister_success(uint64_t chunk) "%" PRIu64
qemu_rdma_registration_handle_wait(uint64_t flags) "Waiting for next request %" PRIu64
qemu_rdma_registration_start(uint64_t flags) "%" PRIu64
qemu_rdma_registration_stop(uint64_t flags) "%" PRIu64
qemu_rdma_registration_stop_ram(void) ""
qemu_rdma_resolve_host_trying(const char *host, const char *ip) "Trying %s => %s"
qemu_rdma_signal_unregister_append(uint64_t chunk, int pos) "Appending unregister chunk %" PRIu64 " at position %d"
qemu_rdma_signal_unregister_already(uint64_t chunk) "Unregister chunk %" PRIu64 " already in queue"
qemu_rdma_unregister_waiting_inflight(uint64_t chunk) "Cannot unregister inflight chunk: %" PRIu64
qemu_rdma_unregister_waiting_proc(uint64_t chunk, int pos) "Processing unregister for chunk: %" PRIu64 " at position %d"
qemu_rdma_unregister_waiting_send(uint64_t chunk) "Sending unregister for chunk: %" PRIu64
qemu_rdma_unregister_waiting_complete(uint64_t chunk) "Unregister for chunk: %" PRIu64 " complete."
qemu_rdma_write_flush(int sent) "sent total: %d"
qemu_rdma_write_one_block(int count, int block, uint64_t chunk, uint64_t current, uint64_t len, int nb_sent, int nb_chunks) "(%d) Not clobbering: block: %d chunk %" PRIu64 " current %" PRIu64 " len %" PRIu64 " %d %d"
qemu_rdma_write_one_post(uint64_t chunk, long addr, long remote, uint32_t len) "Posting chunk: %" PRIu64 ", addr: %lx remote: %lx, bytes %" PRIu32
qemu_rdma_write_one_queue_full(void) ""
qemu_rdma_write_one_recvregres(int mykey, int theirkey, uint64_t chunk) "Received registration result: my key: %x their key %x, chunk %" PRIu64
qemu_rdma_write_one_sendreg(uint64_t chunk, int len, int index, int64_t offset) "Sending registration request chunk %" PRIu64 " for %d bytes, index: %d, offset: %" PRId64
qemu_rdma_write_one_top(uint64_t chunks, uint64_t size) "Writing %" PRIu64 " chunks, (%" PRIu64 " MB)"
qemu_rdma_write_one_zero(uint64_t chunk, int len, int index, int64_t offset) "Entire chunk is zero, sending compress: %" PRIu64 " for %d bytes, index: %d, offset: %" PRId64
rdma_start_incoming_migration(void) ""
rdma_start_incoming_migration_after_dest_init(void) ""
rdma_start_incoming_migration_after_rdma_listen(void) ""
rdma_start_outgoing_migration_after_rdma_connect(void) ""
rdma_start_outgoing_migration_after_rdma_source_init(void) ""
# kvm-all.c # kvm-all.c
kvm_ioctl(int type, void *arg) "type 0x%x, arg %p" kvm_ioctl(int type, void *arg) "type 0x%x, arg %p"
kvm_vm_ioctl(int type, void *arg) "type 0x%x, arg %p" kvm_vm_ioctl(int type, void *arg) "type 0x%x, arg %p"