Zhang Chen | 59509ec | 2016-09-27 10:22:27 +0800 | [diff] [blame] | 1 | /* |
| 2 | * COarse-grain LOck-stepping Virtual Machines for Non-stop Service (COLO) |
| 3 | * (a.k.a. Fault Tolerance or Continuous Replication) |
| 4 | * |
| 5 | * Copyright (c) 2016 HUAWEI TECHNOLOGIES CO., LTD. |
| 6 | * Copyright (c) 2016 FUJITSU LIMITED |
| 7 | * Copyright (c) 2016 Intel Corporation |
| 8 | * |
| 9 | * Author: Zhang Chen <zhangchen.fnst@cn.fujitsu.com> |
| 10 | * |
| 11 | * This work is licensed under the terms of the GNU GPL, version 2 or |
| 12 | * later. See the COPYING file in the top-level directory. |
| 13 | */ |
| 14 | |
| 15 | #include "qemu/osdep.h" |
| 16 | #include "trace.h" |
Michael S. Tsirkin | f27f01d | 2018-05-03 22:50:56 +0300 | [diff] [blame] | 17 | #include "colo.h" |
Marc-André Lureau | e05ae1d | 2018-11-14 16:36:40 +0400 | [diff] [blame] | 18 | #include "util.h" |
Zhang Chen | 59509ec | 2016-09-27 10:22:27 +0800 | [diff] [blame] | 19 | |
Zhang Chen | b6540d4 | 2016-09-27 10:22:29 +0800 | [diff] [blame] | 20 | uint32_t connection_key_hash(const void *opaque) |
| 21 | { |
| 22 | const ConnectionKey *key = opaque; |
| 23 | uint32_t a, b, c; |
| 24 | |
| 25 | /* Jenkins hash */ |
| 26 | a = b = c = JHASH_INITVAL + sizeof(*key); |
| 27 | a += key->src.s_addr; |
| 28 | b += key->dst.s_addr; |
| 29 | c += (key->src_port | key->dst_port << 16); |
| 30 | __jhash_mix(a, b, c); |
| 31 | |
| 32 | a += key->ip_proto; |
| 33 | __jhash_final(a, b, c); |
| 34 | |
| 35 | return c; |
| 36 | } |
| 37 | |
| 38 | int connection_key_equal(const void *key1, const void *key2) |
| 39 | { |
| 40 | return memcmp(key1, key2, sizeof(ConnectionKey)) == 0; |
| 41 | } |
| 42 | |
Zhang Chen | 59509ec | 2016-09-27 10:22:27 +0800 | [diff] [blame] | 43 | int parse_packet_early(Packet *pkt) |
| 44 | { |
| 45 | int network_length; |
| 46 | static const uint8_t vlan[] = {0x81, 0x00}; |
Zhang Chen | 3772cf0 | 2022-08-22 16:14:36 +0800 | [diff] [blame] | 47 | uint8_t *data = pkt->data; |
Zhang Chen | 59509ec | 2016-09-27 10:22:27 +0800 | [diff] [blame] | 48 | uint16_t l3_proto; |
Zhang Chen | 8bdab83 | 2022-04-01 11:47:02 +0800 | [diff] [blame] | 49 | ssize_t l2hdr_len; |
| 50 | |
Zhang Chen | 3772cf0 | 2022-08-22 16:14:36 +0800 | [diff] [blame] | 51 | assert(data); |
Zhang Chen | 59509ec | 2016-09-27 10:22:27 +0800 | [diff] [blame] | 52 | |
Zhang Chen | 3772cf0 | 2022-08-22 16:14:36 +0800 | [diff] [blame] | 53 | /* Check the received vnet_hdr_len then add the offset */ |
| 54 | if ((pkt->vnet_hdr_len > sizeof(struct virtio_net_hdr_v1_hash)) || |
| 55 | (pkt->size < sizeof(struct eth_header) + sizeof(struct vlan_header) + |
| 56 | pkt->vnet_hdr_len)) { |
| 57 | /* |
| 58 | * The received remote packet maybe misconfiguration here, |
| 59 | * Please enable/disable filter module's the vnet_hdr flag at |
| 60 | * the same time. |
| 61 | */ |
| 62 | trace_colo_proxy_main_vnet_info("This received packet load wrong ", |
| 63 | pkt->vnet_hdr_len, pkt->size); |
Zhang Chen | 59509ec | 2016-09-27 10:22:27 +0800 | [diff] [blame] | 64 | return 1; |
| 65 | } |
Zhang Chen | 3772cf0 | 2022-08-22 16:14:36 +0800 | [diff] [blame] | 66 | data += pkt->vnet_hdr_len; |
| 67 | |
| 68 | l2hdr_len = eth_get_l2_hdr_length(data); |
Zhang Chen | 59509ec | 2016-09-27 10:22:27 +0800 | [diff] [blame] | 69 | |
| 70 | /* |
| 71 | * TODO: support vlan. |
| 72 | */ |
| 73 | if (!memcmp(&data[12], vlan, sizeof(vlan))) { |
| 74 | trace_colo_proxy_main("COLO-proxy don't support vlan"); |
| 75 | return 1; |
| 76 | } |
| 77 | |
| 78 | pkt->network_header = data + l2hdr_len; |
| 79 | |
| 80 | const struct iovec l2vec = { |
| 81 | .iov_base = (void *) data, |
| 82 | .iov_len = l2hdr_len |
| 83 | }; |
| 84 | l3_proto = eth_get_l3_proto(&l2vec, 1, l2hdr_len); |
| 85 | |
| 86 | if (l3_proto != ETH_P_IP) { |
| 87 | return 1; |
| 88 | } |
| 89 | |
| 90 | network_length = pkt->ip->ip_hl * 4; |
Zhang Chen | 5cc444d | 2017-07-04 14:53:53 +0800 | [diff] [blame] | 91 | if (pkt->size < l2hdr_len + network_length + pkt->vnet_hdr_len) { |
Zhang Chen | 59509ec | 2016-09-27 10:22:27 +0800 | [diff] [blame] | 92 | trace_colo_proxy_main("pkt->size < network_header + network_length"); |
| 93 | return 1; |
| 94 | } |
| 95 | pkt->transport_header = pkt->network_header + network_length; |
| 96 | |
| 97 | return 0; |
| 98 | } |
| 99 | |
Rao, Lei | 64153ca | 2021-11-03 10:21:12 +0800 | [diff] [blame] | 100 | void extract_ip_and_port(uint32_t tmp_ports, ConnectionKey *key, |
| 101 | Packet *pkt, bool reverse) |
Mao Zhongyi | 8fa5ad6 | 2017-10-13 14:32:09 +0800 | [diff] [blame] | 102 | { |
Rao, Lei | 64153ca | 2021-11-03 10:21:12 +0800 | [diff] [blame] | 103 | if (reverse) { |
| 104 | key->src = pkt->ip->ip_dst; |
| 105 | key->dst = pkt->ip->ip_src; |
| 106 | key->src_port = ntohs(tmp_ports & 0xffff); |
| 107 | key->dst_port = ntohs(tmp_ports >> 16); |
| 108 | } else { |
Mao Zhongyi | 8fa5ad6 | 2017-10-13 14:32:09 +0800 | [diff] [blame] | 109 | key->src = pkt->ip->ip_src; |
| 110 | key->dst = pkt->ip->ip_dst; |
| 111 | key->src_port = ntohs(tmp_ports >> 16); |
| 112 | key->dst_port = ntohs(tmp_ports & 0xffff); |
Rao, Lei | 64153ca | 2021-11-03 10:21:12 +0800 | [diff] [blame] | 113 | } |
Mao Zhongyi | 8fa5ad6 | 2017-10-13 14:32:09 +0800 | [diff] [blame] | 114 | } |
| 115 | |
Rao, Lei | 64153ca | 2021-11-03 10:21:12 +0800 | [diff] [blame] | 116 | void fill_connection_key(Packet *pkt, ConnectionKey *key, bool reverse) |
Zhang Chen | b6540d4 | 2016-09-27 10:22:29 +0800 | [diff] [blame] | 117 | { |
Rao, Lei | 64153ca | 2021-11-03 10:21:12 +0800 | [diff] [blame] | 118 | uint32_t tmp_ports = 0; |
Zhang Chen | b6540d4 | 2016-09-27 10:22:29 +0800 | [diff] [blame] | 119 | |
Zhang Chen | b6540d4 | 2016-09-27 10:22:29 +0800 | [diff] [blame] | 120 | key->ip_proto = pkt->ip->ip_p; |
| 121 | |
| 122 | switch (key->ip_proto) { |
| 123 | case IPPROTO_TCP: |
| 124 | case IPPROTO_UDP: |
| 125 | case IPPROTO_DCCP: |
| 126 | case IPPROTO_ESP: |
| 127 | case IPPROTO_SCTP: |
| 128 | case IPPROTO_UDPLITE: |
| 129 | tmp_ports = *(uint32_t *)(pkt->transport_header); |
Zhang Chen | b6540d4 | 2016-09-27 10:22:29 +0800 | [diff] [blame] | 130 | break; |
| 131 | case IPPROTO_AH: |
| 132 | tmp_ports = *(uint32_t *)(pkt->transport_header + 4); |
Zhang Chen | b6540d4 | 2016-09-27 10:22:29 +0800 | [diff] [blame] | 133 | break; |
| 134 | default: |
| 135 | break; |
| 136 | } |
Zhang Chen | b6540d4 | 2016-09-27 10:22:29 +0800 | [diff] [blame] | 137 | |
Rao, Lei | 64153ca | 2021-11-03 10:21:12 +0800 | [diff] [blame] | 138 | extract_ip_and_port(tmp_ports, key, pkt, reverse); |
Zhang Chen | afe4612 | 2016-09-27 10:22:33 +0800 | [diff] [blame] | 139 | } |
| 140 | |
Zhang Chen | b6540d4 | 2016-09-27 10:22:29 +0800 | [diff] [blame] | 141 | Connection *connection_new(ConnectionKey *key) |
| 142 | { |
Li Zhijian | 862ee1e | 2020-10-16 13:52:03 +0800 | [diff] [blame] | 143 | Connection *conn = g_slice_new0(Connection); |
Zhang Chen | b6540d4 | 2016-09-27 10:22:29 +0800 | [diff] [blame] | 144 | |
| 145 | conn->ip_proto = key->ip_proto; |
| 146 | conn->processing = false; |
Zhang Chen | 6214231 | 2018-09-14 01:47:53 +0000 | [diff] [blame] | 147 | conn->tcp_state = TCPS_CLOSED; |
Zhang Chen | b6540d4 | 2016-09-27 10:22:29 +0800 | [diff] [blame] | 148 | g_queue_init(&conn->primary_list); |
| 149 | g_queue_init(&conn->secondary_list); |
| 150 | |
| 151 | return conn; |
| 152 | } |
| 153 | |
| 154 | void connection_destroy(void *opaque) |
| 155 | { |
| 156 | Connection *conn = opaque; |
| 157 | |
| 158 | g_queue_foreach(&conn->primary_list, packet_destroy, NULL); |
zhanghailiang | 0e79668 | 2017-02-28 11:54:18 +0800 | [diff] [blame] | 159 | g_queue_clear(&conn->primary_list); |
Zhang Chen | b6540d4 | 2016-09-27 10:22:29 +0800 | [diff] [blame] | 160 | g_queue_foreach(&conn->secondary_list, packet_destroy, NULL); |
zhanghailiang | 0e79668 | 2017-02-28 11:54:18 +0800 | [diff] [blame] | 161 | g_queue_clear(&conn->secondary_list); |
Zhang Chen | b6540d4 | 2016-09-27 10:22:29 +0800 | [diff] [blame] | 162 | g_slice_free(Connection, conn); |
| 163 | } |
| 164 | |
Zhang Chen | ada1a33 | 2017-07-04 14:53:50 +0800 | [diff] [blame] | 165 | Packet *packet_new(const void *data, int size, int vnet_hdr_len) |
Zhang Chen | 59509ec | 2016-09-27 10:22:27 +0800 | [diff] [blame] | 166 | { |
Rao, Lei | 9b49271 | 2021-06-08 16:23:29 +0800 | [diff] [blame] | 167 | Packet *pkt = g_slice_new0(Packet); |
Zhang Chen | 59509ec | 2016-09-27 10:22:27 +0800 | [diff] [blame] | 168 | |
| 169 | pkt->data = g_memdup(data, size); |
| 170 | pkt->size = size; |
Zhang Chen | 0682e15 | 2016-09-27 10:22:30 +0800 | [diff] [blame] | 171 | pkt->creation_ms = qemu_clock_get_ms(QEMU_CLOCK_HOST); |
Zhang Chen | ada1a33 | 2017-07-04 14:53:50 +0800 | [diff] [blame] | 172 | pkt->vnet_hdr_len = vnet_hdr_len; |
Rao, Lei | 9b49271 | 2021-06-08 16:23:29 +0800 | [diff] [blame] | 173 | |
| 174 | return pkt; |
| 175 | } |
| 176 | |
| 177 | /* |
| 178 | * packet_new_nocopy will not copy data, so the caller can't release |
| 179 | * the data. And it will be released in packet_destroy. |
| 180 | */ |
| 181 | Packet *packet_new_nocopy(void *data, int size, int vnet_hdr_len) |
| 182 | { |
| 183 | Packet *pkt = g_slice_new0(Packet); |
| 184 | |
| 185 | pkt->data = data; |
| 186 | pkt->size = size; |
| 187 | pkt->creation_ms = qemu_clock_get_ms(QEMU_CLOCK_HOST); |
| 188 | pkt->vnet_hdr_len = vnet_hdr_len; |
Zhang Chen | 59509ec | 2016-09-27 10:22:27 +0800 | [diff] [blame] | 189 | |
| 190 | return pkt; |
| 191 | } |
| 192 | |
| 193 | void packet_destroy(void *opaque, void *user_data) |
| 194 | { |
| 195 | Packet *pkt = opaque; |
| 196 | |
| 197 | g_free(pkt->data); |
| 198 | g_slice_free(Packet, pkt); |
| 199 | } |
| 200 | |
Lukas Straub | 9c55fe9 | 2020-05-22 15:53:53 +0800 | [diff] [blame] | 201 | void packet_destroy_partial(void *opaque, void *user_data) |
| 202 | { |
| 203 | Packet *pkt = opaque; |
| 204 | |
| 205 | g_slice_free(Packet, pkt); |
| 206 | } |
| 207 | |
Zhang Chen | 59509ec | 2016-09-27 10:22:27 +0800 | [diff] [blame] | 208 | /* |
| 209 | * Clear hashtable, stop this hash growing really huge |
| 210 | */ |
| 211 | void connection_hashtable_reset(GHashTable *connection_track_table) |
| 212 | { |
| 213 | g_hash_table_remove_all(connection_track_table); |
| 214 | } |
Zhang Chen | b6540d4 | 2016-09-27 10:22:29 +0800 | [diff] [blame] | 215 | |
| 216 | /* if not found, create a new connection and add to hash table */ |
| 217 | Connection *connection_get(GHashTable *connection_track_table, |
| 218 | ConnectionKey *key, |
| 219 | GQueue *conn_list) |
| 220 | { |
| 221 | Connection *conn = g_hash_table_lookup(connection_track_table, key); |
| 222 | |
| 223 | if (conn == NULL) { |
| 224 | ConnectionKey *new_key = g_memdup(key, sizeof(*key)); |
| 225 | |
| 226 | conn = connection_new(key); |
| 227 | |
| 228 | if (g_hash_table_size(connection_track_table) > HASHTABLE_MAX_SIZE) { |
| 229 | trace_colo_proxy_main("colo proxy connection hashtable full," |
| 230 | " clear it"); |
| 231 | connection_hashtable_reset(connection_track_table); |
| 232 | /* |
| 233 | * clear the conn_list |
| 234 | */ |
Zhang Chen | 94c36c4 | 2022-04-01 11:47:01 +0800 | [diff] [blame] | 235 | while (conn_list && !g_queue_is_empty(conn_list)) { |
Zhang Chen | b6540d4 | 2016-09-27 10:22:29 +0800 | [diff] [blame] | 236 | connection_destroy(g_queue_pop_head(conn_list)); |
| 237 | } |
| 238 | } |
| 239 | |
| 240 | g_hash_table_insert(connection_track_table, new_key, conn); |
| 241 | } |
| 242 | |
| 243 | return conn; |
| 244 | } |
Zhang Chen | 24525e9 | 2018-09-03 12:38:57 +0800 | [diff] [blame] | 245 | |
| 246 | bool connection_has_tracked(GHashTable *connection_track_table, |
| 247 | ConnectionKey *key) |
| 248 | { |
| 249 | Connection *conn = g_hash_table_lookup(connection_track_table, key); |
| 250 | |
| 251 | return conn ? true : false; |
| 252 | } |