meson: convert qapi-specific to meson
[qemu.git] / hw / net / e1000.c
1 /*
2 * QEMU e1000 emulation
3 *
4 * Software developer's manual:
5 * http://download.intel.com/design/network/manuals/8254x_GBe_SDM.pdf
6 *
7 * Nir Peleg, Tutis Systems Ltd. for Qumranet Inc.
8 * Copyright (c) 2008 Qumranet
9 * Based on work done by:
10 * Copyright (c) 2007 Dan Aloni
11 * Copyright (c) 2004 Antony T Curtis
12 *
13 * This library is free software; you can redistribute it and/or
14 * modify it under the terms of the GNU Lesser General Public
15 * License as published by the Free Software Foundation; either
16 * version 2 of the License, or (at your option) any later version.
17 *
18 * This library is distributed in the hope that it will be useful,
19 * but WITHOUT ANY WARRANTY; without even the implied warranty of
20 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
21 * Lesser General Public License for more details.
22 *
23 * You should have received a copy of the GNU Lesser General Public
24 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
25 */
26
27
28 #include "qemu/osdep.h"
29 #include "hw/pci/pci.h"
30 #include "hw/qdev-properties.h"
31 #include "migration/vmstate.h"
32 #include "net/net.h"
33 #include "net/checksum.h"
34 #include "sysemu/sysemu.h"
35 #include "sysemu/dma.h"
36 #include "qemu/iov.h"
37 #include "qemu/module.h"
38 #include "qemu/range.h"
39
40 #include "e1000x_common.h"
41 #include "trace.h"
42
/* Ethernet broadcast destination address (all ones). */
static const uint8_t bcast[] = {
    0xff, 0xff, 0xff, 0xff, 0xff, 0xff
};

/* Uncomment to compile in the DBGOUT() tracing defined below. */
/* #define E1000_DEBUG */

#ifdef E1000_DEBUG
/* Debug categories; each enumerator is a bit position used by DBGBIT(). */
enum {
    DEBUG_GENERAL,
    DEBUG_IO,
    DEBUG_MMIO,
    DEBUG_INTERRUPT,
    DEBUG_RX,
    DEBUG_TX,
    DEBUG_MDIC,
    DEBUG_EEPROM,
    DEBUG_UNKNOWN,
    DEBUG_TXSUM,
    DEBUG_TXERR,
    DEBUG_RXERR,
    DEBUG_RXFILTER,
    DEBUG_PHY,
    DEBUG_NOTYET,
};
#define DBGBIT(x)    (1<<DEBUG_##x)

/* Categories that are printed; TXERR and GENERAL are on by default. */
static int debugflags = DBGBIT(TXERR) | DBGBIT(GENERAL);

/* Print to stderr, prefixed with "e1000: ", if category `what` is enabled. */
#define DBGOUT(what, fmt, ...) do { \
        if (debugflags & DBGBIT(what)) { \
            fprintf(stderr, "e1000: " fmt, ## __VA_ARGS__); \
        } \
    } while (0)
#else
/* Debugging compiled out: DBGOUT() expands to an empty statement. */
#define DBGOUT(what, fmt, ...) do {} while (0)
#endif

#define IOPORT_SIZE       0x40
#define PNPMMIO_SIZE      0x20000
/* Min. octets in an ethernet frame sans FCS */
#define MIN_BUF_SIZE      60

#define MAXIMUM_ETHERNET_HDR_LEN (14+4)
70
71 /*
72 * HW models:
73 * E1000_DEV_ID_82540EM works with Windows, Linux, and OS X <= 10.8
74 * E1000_DEV_ID_82544GC_COPPER appears to work; not well tested
75 * E1000_DEV_ID_82545EM_COPPER works with Linux and OS X >= 10.6
76 * Others never tested
77 */
78
79 typedef struct E1000State_st {
80 /*< private >*/
81 PCIDevice parent_obj;
82 /*< public >*/
83
84 NICState *nic;
85 NICConf conf;
86 MemoryRegion mmio;
87 MemoryRegion io;
88
89 uint32_t mac_reg[0x8000];
90 uint16_t phy_reg[0x20];
91 uint16_t eeprom_data[64];
92
93 uint32_t rxbuf_size;
94 uint32_t rxbuf_min_shift;
95 struct e1000_tx {
96 unsigned char header[256];
97 unsigned char vlan_header[4];
98 /* Fields vlan and data must not be reordered or separated. */
99 unsigned char vlan[4];
100 unsigned char data[0x10000];
101 uint16_t size;
102 unsigned char vlan_needed;
103 unsigned char sum_needed;
104 bool cptse;
105 e1000x_txd_props props;
106 e1000x_txd_props tso_props;
107 uint16_t tso_frames;
108 } tx;
109
110 struct {
111 uint32_t val_in; /* shifted in from guest driver */
112 uint16_t bitnum_in;
113 uint16_t bitnum_out;
114 uint16_t reading;
115 uint32_t old_eecd;
116 } eecd_state;
117
118 QEMUTimer *autoneg_timer;
119
120 QEMUTimer *mit_timer; /* Mitigation timer. */
121 bool mit_timer_on; /* Mitigation timer is running. */
122 bool mit_irq_level; /* Tracks interrupt pin level. */
123 uint32_t mit_ide; /* Tracks E1000_TXD_CMD_IDE bit. */
124
125 QEMUTimer *flush_queue_timer;
126
127 /* Compatibility flags for migration to/from qemu 1.3.0 and older */
128 #define E1000_FLAG_AUTONEG_BIT 0
129 #define E1000_FLAG_MIT_BIT 1
130 #define E1000_FLAG_MAC_BIT 2
131 #define E1000_FLAG_TSO_BIT 3
132 #define E1000_FLAG_AUTONEG (1 << E1000_FLAG_AUTONEG_BIT)
133 #define E1000_FLAG_MIT (1 << E1000_FLAG_MIT_BIT)
134 #define E1000_FLAG_MAC (1 << E1000_FLAG_MAC_BIT)
135 #define E1000_FLAG_TSO (1 << E1000_FLAG_TSO_BIT)
136 uint32_t compat_flags;
137 bool received_tx_tso;
138 bool use_tso_for_migration;
139 e1000x_txd_props mig_props;
140 } E1000State;
141
142 #define chkflag(x) (s->compat_flags & E1000_FLAG_##x)
143
144 typedef struct E1000BaseClass {
145 PCIDeviceClass parent_class;
146 uint16_t phy_id2;
147 } E1000BaseClass;
148
149 #define TYPE_E1000_BASE "e1000-base"
150
151 #define E1000(obj) \
152 OBJECT_CHECK(E1000State, (obj), TYPE_E1000_BASE)
153
154 #define E1000_DEVICE_CLASS(klass) \
155 OBJECT_CLASS_CHECK(E1000BaseClass, (klass), TYPE_E1000_BASE)
156 #define E1000_DEVICE_GET_CLASS(obj) \
157 OBJECT_GET_CLASS(E1000BaseClass, (obj), TYPE_E1000_BASE)
158
159 static void
160 e1000_link_up(E1000State *s)
161 {
162 e1000x_update_regs_on_link_up(s->mac_reg, s->phy_reg);
163
164 /* E1000_STATUS_LU is tested by e1000_can_receive() */
165 qemu_flush_queued_packets(qemu_get_queue(s->nic));
166 }
167
168 static void
169 e1000_autoneg_done(E1000State *s)
170 {
171 e1000x_update_regs_on_autoneg_done(s->mac_reg, s->phy_reg);
172
173 /* E1000_STATUS_LU is tested by e1000_can_receive() */
174 qemu_flush_queued_packets(qemu_get_queue(s->nic));
175 }
176
177 static bool
178 have_autoneg(E1000State *s)
179 {
180 return chkflag(AUTONEG) && (s->phy_reg[PHY_CTRL] & MII_CR_AUTO_NEG_EN);
181 }
182
183 static void
184 set_phy_ctrl(E1000State *s, int index, uint16_t val)
185 {
186 /* bits 0-5 reserved; MII_CR_[RESTART_AUTO_NEG,RESET] are self clearing */
187 s->phy_reg[PHY_CTRL] = val & ~(0x3f |
188 MII_CR_RESET |
189 MII_CR_RESTART_AUTO_NEG);
190
191 /*
192 * QEMU 1.3 does not support link auto-negotiation emulation, so if we
193 * migrate during auto negotiation, after migration the link will be
194 * down.
195 */
196 if (have_autoneg(s) && (val & MII_CR_RESTART_AUTO_NEG)) {
197 e1000x_restart_autoneg(s->mac_reg, s->phy_reg, s->autoneg_timer);
198 }
199 }
200
201 static void (*phyreg_writeops[])(E1000State *, int, uint16_t) = {
202 [PHY_CTRL] = set_phy_ctrl,
203 };
204
205 enum { NPHYWRITEOPS = ARRAY_SIZE(phyreg_writeops) };
206
207 enum { PHY_R = 1, PHY_W = 2, PHY_RW = PHY_R | PHY_W };
208 static const char phy_regcap[0x20] = {
209 [PHY_STATUS] = PHY_R, [M88E1000_EXT_PHY_SPEC_CTRL] = PHY_RW,
210 [PHY_ID1] = PHY_R, [M88E1000_PHY_SPEC_CTRL] = PHY_RW,
211 [PHY_CTRL] = PHY_RW, [PHY_1000T_CTRL] = PHY_RW,
212 [PHY_LP_ABILITY] = PHY_R, [PHY_1000T_STATUS] = PHY_R,
213 [PHY_AUTONEG_ADV] = PHY_RW, [M88E1000_RX_ERR_CNTR] = PHY_R,
214 [PHY_ID2] = PHY_R, [M88E1000_PHY_SPEC_STATUS] = PHY_R,
215 [PHY_AUTONEG_EXP] = PHY_R,
216 };
217
218 /* PHY_ID2 documented in 8254x_GBe_SDM.pdf, pp. 250 */
219 static const uint16_t phy_reg_init[] = {
220 [PHY_CTRL] = MII_CR_SPEED_SELECT_MSB |
221 MII_CR_FULL_DUPLEX |
222 MII_CR_AUTO_NEG_EN,
223
224 [PHY_STATUS] = MII_SR_EXTENDED_CAPS |
225 MII_SR_LINK_STATUS | /* link initially up */
226 MII_SR_AUTONEG_CAPS |
227 /* MII_SR_AUTONEG_COMPLETE: initially NOT completed */
228 MII_SR_PREAMBLE_SUPPRESS |
229 MII_SR_EXTENDED_STATUS |
230 MII_SR_10T_HD_CAPS |
231 MII_SR_10T_FD_CAPS |
232 MII_SR_100X_HD_CAPS |
233 MII_SR_100X_FD_CAPS,
234
235 [PHY_ID1] = 0x141,
236 /* [PHY_ID2] configured per DevId, from e1000_reset() */
237 [PHY_AUTONEG_ADV] = 0xde1,
238 [PHY_LP_ABILITY] = 0x1e0,
239 [PHY_1000T_CTRL] = 0x0e00,
240 [PHY_1000T_STATUS] = 0x3c00,
241 [M88E1000_PHY_SPEC_CTRL] = 0x360,
242 [M88E1000_PHY_SPEC_STATUS] = 0xac00,
243 [M88E1000_EXT_PHY_SPEC_CTRL] = 0x0d60,
244 };
245
246 static const uint32_t mac_reg_init[] = {
247 [PBA] = 0x00100030,
248 [LEDCTL] = 0x602,
249 [CTRL] = E1000_CTRL_SWDPIN2 | E1000_CTRL_SWDPIN0 |
250 E1000_CTRL_SPD_1000 | E1000_CTRL_SLU,
251 [STATUS] = 0x80000000 | E1000_STATUS_GIO_MASTER_ENABLE |
252 E1000_STATUS_ASDV | E1000_STATUS_MTXCKOK |
253 E1000_STATUS_SPEED_1000 | E1000_STATUS_FD |
254 E1000_STATUS_LU,
255 [MANC] = E1000_MANC_EN_MNG2HOST | E1000_MANC_RCV_TCO_EN |
256 E1000_MANC_ARP_EN | E1000_MANC_0298_EN |
257 E1000_MANC_RMCP_EN,
258 };
259
/*
 * Lower *curr to value when value is a smaller non-zero delay.
 *
 * Zero means "not set" for both arguments: a zero value is ignored, and a
 * zero *curr is replaced by any non-zero value.
 */
static inline void
mit_update_delay(uint32_t *curr, uint32_t value)
{
    if (value == 0) {
        return;                 /* nothing requested */
    }
    if (*curr != 0 && *curr <= value) {
        return;                 /* existing delay is already the smaller one */
    }
    *curr = value;
}
268
269 static void
270 set_interrupt_cause(E1000State *s, int index, uint32_t val)
271 {
272 PCIDevice *d = PCI_DEVICE(s);
273 uint32_t pending_ints;
274 uint32_t mit_delay;
275
276 s->mac_reg[ICR] = val;
277
278 /*
279 * Make sure ICR and ICS registers have the same value.
280 * The spec says that the ICS register is write-only. However in practice,
281 * on real hardware ICS is readable, and for reads it has the same value as
282 * ICR (except that ICS does not have the clear on read behaviour of ICR).
283 *
284 * The VxWorks PRO/1000 driver uses this behaviour.
285 */
286 s->mac_reg[ICS] = val;
287
288 pending_ints = (s->mac_reg[IMS] & s->mac_reg[ICR]);
289 if (!s->mit_irq_level && pending_ints) {
290 /*
291 * Here we detect a potential raising edge. We postpone raising the
292 * interrupt line if we are inside the mitigation delay window
293 * (s->mit_timer_on == 1).
294 * We provide a partial implementation of interrupt mitigation,
295 * emulating only RADV, TADV and ITR (lower 16 bits, 1024ns units for
296 * RADV and TADV, 256ns units for ITR). RDTR is only used to enable
297 * RADV; relative timers based on TIDV and RDTR are not implemented.
298 */
299 if (s->mit_timer_on) {
300 return;
301 }
302 if (chkflag(MIT)) {
303 /* Compute the next mitigation delay according to pending
304 * interrupts and the current values of RADV (provided
305 * RDTR!=0), TADV and ITR.
306 * Then rearm the timer.
307 */
308 mit_delay = 0;
309 if (s->mit_ide &&
310 (pending_ints & (E1000_ICR_TXQE | E1000_ICR_TXDW))) {
311 mit_update_delay(&mit_delay, s->mac_reg[TADV] * 4);
312 }
313 if (s->mac_reg[RDTR] && (pending_ints & E1000_ICS_RXT0)) {
314 mit_update_delay(&mit_delay, s->mac_reg[RADV] * 4);
315 }
316 mit_update_delay(&mit_delay, s->mac_reg[ITR]);
317
318 /*
319 * According to e1000 SPEC, the Ethernet controller guarantees
320 * a maximum observable interrupt rate of 7813 interrupts/sec.
321 * Thus if mit_delay < 500 then the delay should be set to the
322 * minimum delay possible which is 500.
323 */
324 mit_delay = (mit_delay < 500) ? 500 : mit_delay;
325
326 s->mit_timer_on = 1;
327 timer_mod(s->mit_timer, qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) +
328 mit_delay * 256);
329 s->mit_ide = 0;
330 }
331 }
332
333 s->mit_irq_level = (pending_ints != 0);
334 pci_set_irq(d, s->mit_irq_level);
335 }
336
337 static void
338 e1000_mit_timer(void *opaque)
339 {
340 E1000State *s = opaque;
341
342 s->mit_timer_on = 0;
343 /* Call set_interrupt_cause to update the irq level (if necessary). */
344 set_interrupt_cause(s, 0, s->mac_reg[ICR]);
345 }
346
347 static void
348 set_ics(E1000State *s, int index, uint32_t val)
349 {
350 DBGOUT(INTERRUPT, "set_ics %x, ICR %x, IMR %x\n", val, s->mac_reg[ICR],
351 s->mac_reg[IMS]);
352 set_interrupt_cause(s, 0, val | s->mac_reg[ICR]);
353 }
354
355 static void
356 e1000_autoneg_timer(void *opaque)
357 {
358 E1000State *s = opaque;
359 if (!qemu_get_queue(s->nic)->link_down) {
360 e1000_autoneg_done(s);
361 set_ics(s, 0, E1000_ICS_LSC); /* signal link status change to guest */
362 }
363 }
364
365 static void e1000_reset(void *opaque)
366 {
367 E1000State *d = opaque;
368 E1000BaseClass *edc = E1000_DEVICE_GET_CLASS(d);
369 uint8_t *macaddr = d->conf.macaddr.a;
370
371 timer_del(d->autoneg_timer);
372 timer_del(d->mit_timer);
373 timer_del(d->flush_queue_timer);
374 d->mit_timer_on = 0;
375 d->mit_irq_level = 0;
376 d->mit_ide = 0;
377 memset(d->phy_reg, 0, sizeof d->phy_reg);
378 memmove(d->phy_reg, phy_reg_init, sizeof phy_reg_init);
379 d->phy_reg[PHY_ID2] = edc->phy_id2;
380 memset(d->mac_reg, 0, sizeof d->mac_reg);
381 memmove(d->mac_reg, mac_reg_init, sizeof mac_reg_init);
382 d->rxbuf_min_shift = 1;
383 memset(&d->tx, 0, sizeof d->tx);
384
385 if (qemu_get_queue(d->nic)->link_down) {
386 e1000x_update_regs_on_link_down(d->mac_reg, d->phy_reg);
387 }
388
389 e1000x_reset_mac_addr(d->nic, d->mac_reg, macaddr);
390 }
391
392 static void
393 set_ctrl(E1000State *s, int index, uint32_t val)
394 {
395 /* RST is self clearing */
396 s->mac_reg[CTRL] = val & ~E1000_CTRL_RST;
397 }
398
399 static void
400 e1000_flush_queue_timer(void *opaque)
401 {
402 E1000State *s = opaque;
403
404 qemu_flush_queued_packets(qemu_get_queue(s->nic));
405 }
406
407 static void
408 set_rx_control(E1000State *s, int index, uint32_t val)
409 {
410 s->mac_reg[RCTL] = val;
411 s->rxbuf_size = e1000x_rxbufsize(val);
412 s->rxbuf_min_shift = ((val / E1000_RCTL_RDMTS_QUAT) & 3) + 1;
413 DBGOUT(RX, "RCTL: %d, mac_reg[RCTL] = 0x%x\n", s->mac_reg[RDT],
414 s->mac_reg[RCTL]);
415 timer_mod(s->flush_queue_timer,
416 qemu_clock_get_ms(QEMU_CLOCK_VIRTUAL) + 1000);
417 }
418
419 static void
420 set_mdic(E1000State *s, int index, uint32_t val)
421 {
422 uint32_t data = val & E1000_MDIC_DATA_MASK;
423 uint32_t addr = ((val & E1000_MDIC_REG_MASK) >> E1000_MDIC_REG_SHIFT);
424
425 if ((val & E1000_MDIC_PHY_MASK) >> E1000_MDIC_PHY_SHIFT != 1) // phy #
426 val = s->mac_reg[MDIC] | E1000_MDIC_ERROR;
427 else if (val & E1000_MDIC_OP_READ) {
428 DBGOUT(MDIC, "MDIC read reg 0x%x\n", addr);
429 if (!(phy_regcap[addr] & PHY_R)) {
430 DBGOUT(MDIC, "MDIC read reg %x unhandled\n", addr);
431 val |= E1000_MDIC_ERROR;
432 } else
433 val = (val ^ data) | s->phy_reg[addr];
434 } else if (val & E1000_MDIC_OP_WRITE) {
435 DBGOUT(MDIC, "MDIC write reg 0x%x, value 0x%x\n", addr, data);
436 if (!(phy_regcap[addr] & PHY_W)) {
437 DBGOUT(MDIC, "MDIC write reg %x unhandled\n", addr);
438 val |= E1000_MDIC_ERROR;
439 } else {
440 if (addr < NPHYWRITEOPS && phyreg_writeops[addr]) {
441 phyreg_writeops[addr](s, index, data);
442 } else {
443 s->phy_reg[addr] = data;
444 }
445 }
446 }
447 s->mac_reg[MDIC] = val | E1000_MDIC_READY;
448
449 if (val & E1000_MDIC_INT_EN) {
450 set_ics(s, 0, E1000_ICR_MDAC);
451 }
452 }
453
454 static uint32_t
455 get_eecd(E1000State *s, int index)
456 {
457 uint32_t ret = E1000_EECD_PRES|E1000_EECD_GNT | s->eecd_state.old_eecd;
458
459 DBGOUT(EEPROM, "reading eeprom bit %d (reading %d)\n",
460 s->eecd_state.bitnum_out, s->eecd_state.reading);
461 if (!s->eecd_state.reading ||
462 ((s->eeprom_data[(s->eecd_state.bitnum_out >> 4) & 0x3f] >>
463 ((s->eecd_state.bitnum_out & 0xf) ^ 0xf))) & 1)
464 ret |= E1000_EECD_DO;
465 return ret;
466 }
467
468 static void
469 set_eecd(E1000State *s, int index, uint32_t val)
470 {
471 uint32_t oldval = s->eecd_state.old_eecd;
472
473 s->eecd_state.old_eecd = val & (E1000_EECD_SK | E1000_EECD_CS |
474 E1000_EECD_DI|E1000_EECD_FWE_MASK|E1000_EECD_REQ);
475 if (!(E1000_EECD_CS & val)) { /* CS inactive; nothing to do */
476 return;
477 }
478 if (E1000_EECD_CS & (val ^ oldval)) { /* CS rise edge; reset state */
479 s->eecd_state.val_in = 0;
480 s->eecd_state.bitnum_in = 0;
481 s->eecd_state.bitnum_out = 0;
482 s->eecd_state.reading = 0;
483 }
484 if (!(E1000_EECD_SK & (val ^ oldval))) { /* no clock edge */
485 return;
486 }
487 if (!(E1000_EECD_SK & val)) { /* falling edge */
488 s->eecd_state.bitnum_out++;
489 return;
490 }
491 s->eecd_state.val_in <<= 1;
492 if (val & E1000_EECD_DI)
493 s->eecd_state.val_in |= 1;
494 if (++s->eecd_state.bitnum_in == 9 && !s->eecd_state.reading) {
495 s->eecd_state.bitnum_out = ((s->eecd_state.val_in & 0x3f)<<4)-1;
496 s->eecd_state.reading = (((s->eecd_state.val_in >> 6) & 7) ==
497 EEPROM_READ_OPCODE_MICROWIRE);
498 }
499 DBGOUT(EEPROM, "eeprom bitnum in %d out %d, reading %d\n",
500 s->eecd_state.bitnum_in, s->eecd_state.bitnum_out,
501 s->eecd_state.reading);
502 }
503
504 static uint32_t
505 flash_eerd_read(E1000State *s, int x)
506 {
507 unsigned int index, r = s->mac_reg[EERD] & ~E1000_EEPROM_RW_REG_START;
508
509 if ((s->mac_reg[EERD] & E1000_EEPROM_RW_REG_START) == 0)
510 return (s->mac_reg[EERD]);
511
512 if ((index = r >> E1000_EEPROM_RW_ADDR_SHIFT) > EEPROM_CHECKSUM_REG)
513 return (E1000_EEPROM_RW_REG_DONE | r);
514
515 return ((s->eeprom_data[index] << E1000_EEPROM_RW_REG_DATA) |
516 E1000_EEPROM_RW_REG_DONE | r);
517 }
518
/*
 * Compute a checksum over part of a packet and store it big-endian in the
 * packet.
 *
 * @data: packet buffer
 * @n:    packet length
 * @sloc: offset at which the 16-bit checksum is stored
 * @css:  offset at which checksumming starts
 * @cse:  offset of the last byte to checksum; 0 (or a value >= n) means
 *        "through the end of the packet"
 *
 * Nothing is written unless sloc is below the last checksummed offset.
 */
static void
putsum(uint8_t *data, uint32_t n, uint32_t sloc, uint32_t css, uint32_t cse)
{
    uint32_t sum;
    uint32_t end = n;

    if (cse != 0 && cse < n) {
        end = cse + 1;
    }

    if (sloc >= end - 1) {
        return;
    }

    sum = net_checksum_add(end - css, data + css);
    stw_be_p(data + sloc, net_checksum_finish_nozero(sum));
}
531
532 static inline void
533 inc_tx_bcast_or_mcast_count(E1000State *s, const unsigned char *arr)
534 {
535 if (!memcmp(arr, bcast, sizeof bcast)) {
536 e1000x_inc_reg_if_not_full(s->mac_reg, BPTC);
537 } else if (arr[0] & 1) {
538 e1000x_inc_reg_if_not_full(s->mac_reg, MPTC);
539 }
540 }
541
542 static void
543 e1000_send_packet(E1000State *s, const uint8_t *buf, int size)
544 {
545 static const int PTCregs[6] = { PTC64, PTC127, PTC255, PTC511,
546 PTC1023, PTC1522 };
547
548 NetClientState *nc = qemu_get_queue(s->nic);
549 if (s->phy_reg[PHY_CTRL] & MII_CR_LOOPBACK) {
550 nc->info->receive(nc, buf, size);
551 } else {
552 qemu_send_packet(nc, buf, size);
553 }
554 inc_tx_bcast_or_mcast_count(s, buf);
555 e1000x_increase_size_stats(s->mac_reg, PTCregs, size);
556 }
557
558 static void
559 xmit_seg(E1000State *s)
560 {
561 uint16_t len;
562 unsigned int frames = s->tx.tso_frames, css, sofar;
563 struct e1000_tx *tp = &s->tx;
564 struct e1000x_txd_props *props = tp->cptse ? &tp->tso_props : &tp->props;
565
566 if (tp->cptse) {
567 css = props->ipcss;
568 DBGOUT(TXSUM, "frames %d size %d ipcss %d\n",
569 frames, tp->size, css);
570 if (props->ip) { /* IPv4 */
571 stw_be_p(tp->data+css+2, tp->size - css);
572 stw_be_p(tp->data+css+4,
573 lduw_be_p(tp->data + css + 4) + frames);
574 } else { /* IPv6 */
575 stw_be_p(tp->data+css+4, tp->size - css);
576 }
577 css = props->tucss;
578 len = tp->size - css;
579 DBGOUT(TXSUM, "tcp %d tucss %d len %d\n", props->tcp, css, len);
580 if (props->tcp) {
581 sofar = frames * props->mss;
582 stl_be_p(tp->data+css+4, ldl_be_p(tp->data+css+4)+sofar); /* seq */
583 if (props->paylen - sofar > props->mss) {
584 tp->data[css + 13] &= ~9; /* PSH, FIN */
585 } else if (frames) {
586 e1000x_inc_reg_if_not_full(s->mac_reg, TSCTC);
587 }
588 } else { /* UDP */
589 stw_be_p(tp->data+css+4, len);
590 }
591 if (tp->sum_needed & E1000_TXD_POPTS_TXSM) {
592 unsigned int phsum;
593 // add pseudo-header length before checksum calculation
594 void *sp = tp->data + props->tucso;
595
596 phsum = lduw_be_p(sp) + len;
597 phsum = (phsum >> 16) + (phsum & 0xffff);
598 stw_be_p(sp, phsum);
599 }
600 tp->tso_frames++;
601 }
602
603 if (tp->sum_needed & E1000_TXD_POPTS_TXSM) {
604 putsum(tp->data, tp->size, props->tucso, props->tucss, props->tucse);
605 }
606 if (tp->sum_needed & E1000_TXD_POPTS_IXSM) {
607 putsum(tp->data, tp->size, props->ipcso, props->ipcss, props->ipcse);
608 }
609 if (tp->vlan_needed) {
610 memmove(tp->vlan, tp->data, 4);
611 memmove(tp->data, tp->data + 4, 8);
612 memcpy(tp->data + 8, tp->vlan_header, 4);
613 e1000_send_packet(s, tp->vlan, tp->size + 4);
614 } else {
615 e1000_send_packet(s, tp->data, tp->size);
616 }
617
618 e1000x_inc_reg_if_not_full(s->mac_reg, TPT);
619 e1000x_grow_8reg_if_not_full(s->mac_reg, TOTL, s->tx.size);
620 s->mac_reg[GPTC] = s->mac_reg[TPT];
621 s->mac_reg[GOTCL] = s->mac_reg[TOTL];
622 s->mac_reg[GOTCH] = s->mac_reg[TOTH];
623 }
624
625 static void
626 process_tx_desc(E1000State *s, struct e1000_tx_desc *dp)
627 {
628 PCIDevice *d = PCI_DEVICE(s);
629 uint32_t txd_lower = le32_to_cpu(dp->lower.data);
630 uint32_t dtype = txd_lower & (E1000_TXD_CMD_DEXT | E1000_TXD_DTYP_D);
631 unsigned int split_size = txd_lower & 0xffff, bytes, sz;
632 unsigned int msh = 0xfffff;
633 uint64_t addr;
634 struct e1000_context_desc *xp = (struct e1000_context_desc *)dp;
635 struct e1000_tx *tp = &s->tx;
636
637 s->mit_ide |= (txd_lower & E1000_TXD_CMD_IDE);
638 if (dtype == E1000_TXD_CMD_DEXT) { /* context descriptor */
639 if (le32_to_cpu(xp->cmd_and_length) & E1000_TXD_CMD_TSE) {
640 e1000x_read_tx_ctx_descr(xp, &tp->tso_props);
641 s->use_tso_for_migration = 1;
642 tp->tso_frames = 0;
643 } else {
644 e1000x_read_tx_ctx_descr(xp, &tp->props);
645 s->use_tso_for_migration = 0;
646 }
647 return;
648 } else if (dtype == (E1000_TXD_CMD_DEXT | E1000_TXD_DTYP_D)) {
649 // data descriptor
650 if (tp->size == 0) {
651 tp->sum_needed = le32_to_cpu(dp->upper.data) >> 8;
652 }
653 tp->cptse = (txd_lower & E1000_TXD_CMD_TSE) ? 1 : 0;
654 } else {
655 // legacy descriptor
656 tp->cptse = 0;
657 }
658
659 if (e1000x_vlan_enabled(s->mac_reg) &&
660 e1000x_is_vlan_txd(txd_lower) &&
661 (tp->cptse || txd_lower & E1000_TXD_CMD_EOP)) {
662 tp->vlan_needed = 1;
663 stw_be_p(tp->vlan_header,
664 le16_to_cpu(s->mac_reg[VET]));
665 stw_be_p(tp->vlan_header + 2,
666 le16_to_cpu(dp->upper.fields.special));
667 }
668
669 addr = le64_to_cpu(dp->buffer_addr);
670 if (tp->cptse) {
671 msh = tp->tso_props.hdr_len + tp->tso_props.mss;
672 do {
673 bytes = split_size;
674 if (tp->size + bytes > msh)
675 bytes = msh - tp->size;
676
677 bytes = MIN(sizeof(tp->data) - tp->size, bytes);
678 pci_dma_read(d, addr, tp->data + tp->size, bytes);
679 sz = tp->size + bytes;
680 if (sz >= tp->tso_props.hdr_len
681 && tp->size < tp->tso_props.hdr_len) {
682 memmove(tp->header, tp->data, tp->tso_props.hdr_len);
683 }
684 tp->size = sz;
685 addr += bytes;
686 if (sz == msh) {
687 xmit_seg(s);
688 memmove(tp->data, tp->header, tp->tso_props.hdr_len);
689 tp->size = tp->tso_props.hdr_len;
690 }
691 split_size -= bytes;
692 } while (bytes && split_size);
693 } else {
694 split_size = MIN(sizeof(tp->data) - tp->size, split_size);
695 pci_dma_read(d, addr, tp->data + tp->size, split_size);
696 tp->size += split_size;
697 }
698
699 if (!(txd_lower & E1000_TXD_CMD_EOP))
700 return;
701 if (!(tp->cptse && tp->size < tp->tso_props.hdr_len)) {
702 xmit_seg(s);
703 }
704 tp->tso_frames = 0;
705 tp->sum_needed = 0;
706 tp->vlan_needed = 0;
707 tp->size = 0;
708 tp->cptse = 0;
709 }
710
711 static uint32_t
712 txdesc_writeback(E1000State *s, dma_addr_t base, struct e1000_tx_desc *dp)
713 {
714 PCIDevice *d = PCI_DEVICE(s);
715 uint32_t txd_upper, txd_lower = le32_to_cpu(dp->lower.data);
716
717 if (!(txd_lower & (E1000_TXD_CMD_RS|E1000_TXD_CMD_RPS)))
718 return 0;
719 txd_upper = (le32_to_cpu(dp->upper.data) | E1000_TXD_STAT_DD) &
720 ~(E1000_TXD_STAT_EC | E1000_TXD_STAT_LC | E1000_TXD_STAT_TU);
721 dp->upper.data = cpu_to_le32(txd_upper);
722 pci_dma_write(d, base + ((char *)&dp->upper - (char *)dp),
723 &dp->upper, sizeof(dp->upper));
724 return E1000_ICR_TXDW;
725 }
726
727 static uint64_t tx_desc_base(E1000State *s)
728 {
729 uint64_t bah = s->mac_reg[TDBAH];
730 uint64_t bal = s->mac_reg[TDBAL] & ~0xf;
731
732 return (bah << 32) + bal;
733 }
734
735 static void
736 start_xmit(E1000State *s)
737 {
738 PCIDevice *d = PCI_DEVICE(s);
739 dma_addr_t base;
740 struct e1000_tx_desc desc;
741 uint32_t tdh_start = s->mac_reg[TDH], cause = E1000_ICS_TXQE;
742
743 if (!(s->mac_reg[TCTL] & E1000_TCTL_EN)) {
744 DBGOUT(TX, "tx disabled\n");
745 return;
746 }
747
748 while (s->mac_reg[TDH] != s->mac_reg[TDT]) {
749 base = tx_desc_base(s) +
750 sizeof(struct e1000_tx_desc) * s->mac_reg[TDH];
751 pci_dma_read(d, base, &desc, sizeof(desc));
752
753 DBGOUT(TX, "index %d: %p : %x %x\n", s->mac_reg[TDH],
754 (void *)(intptr_t)desc.buffer_addr, desc.lower.data,
755 desc.upper.data);
756
757 process_tx_desc(s, &desc);
758 cause |= txdesc_writeback(s, base, &desc);
759
760 if (++s->mac_reg[TDH] * sizeof(desc) >= s->mac_reg[TDLEN])
761 s->mac_reg[TDH] = 0;
762 /*
763 * the following could happen only if guest sw assigns
764 * bogus values to TDT/TDLEN.
765 * there's nothing too intelligent we could do about this.
766 */
767 if (s->mac_reg[TDH] == tdh_start ||
768 tdh_start >= s->mac_reg[TDLEN] / sizeof(desc)) {
769 DBGOUT(TXERR, "TDH wraparound @%x, TDT %x, TDLEN %x\n",
770 tdh_start, s->mac_reg[TDT], s->mac_reg[TDLEN]);
771 break;
772 }
773 }
774 set_ics(s, 0, cause);
775 }
776
777 static int
778 receive_filter(E1000State *s, const uint8_t *buf, int size)
779 {
780 uint32_t rctl = s->mac_reg[RCTL];
781 int isbcast = !memcmp(buf, bcast, sizeof bcast), ismcast = (buf[0] & 1);
782
783 if (e1000x_is_vlan_packet(buf, le16_to_cpu(s->mac_reg[VET])) &&
784 e1000x_vlan_rx_filter_enabled(s->mac_reg)) {
785 uint16_t vid = lduw_be_p(buf + 14);
786 uint32_t vfta = ldl_le_p((uint32_t*)(s->mac_reg + VFTA) +
787 ((vid >> 5) & 0x7f));
788 if ((vfta & (1 << (vid & 0x1f))) == 0)
789 return 0;
790 }
791
792 if (!isbcast && !ismcast && (rctl & E1000_RCTL_UPE)) { /* promiscuous ucast */
793 return 1;
794 }
795
796 if (ismcast && (rctl & E1000_RCTL_MPE)) { /* promiscuous mcast */
797 e1000x_inc_reg_if_not_full(s->mac_reg, MPRC);
798 return 1;
799 }
800
801 if (isbcast && (rctl & E1000_RCTL_BAM)) { /* broadcast enabled */
802 e1000x_inc_reg_if_not_full(s->mac_reg, BPRC);
803 return 1;
804 }
805
806 return e1000x_rx_group_filter(s->mac_reg, buf);
807 }
808
809 static void
810 e1000_set_link_status(NetClientState *nc)
811 {
812 E1000State *s = qemu_get_nic_opaque(nc);
813 uint32_t old_status = s->mac_reg[STATUS];
814
815 if (nc->link_down) {
816 e1000x_update_regs_on_link_down(s->mac_reg, s->phy_reg);
817 } else {
818 if (have_autoneg(s) &&
819 !(s->phy_reg[PHY_STATUS] & MII_SR_AUTONEG_COMPLETE)) {
820 e1000x_restart_autoneg(s->mac_reg, s->phy_reg, s->autoneg_timer);
821 } else {
822 e1000_link_up(s);
823 }
824 }
825
826 if (s->mac_reg[STATUS] != old_status)
827 set_ics(s, 0, E1000_ICR_LSC);
828 }
829
830 static bool e1000_has_rxbufs(E1000State *s, size_t total_size)
831 {
832 int bufs;
833 /* Fast-path short packets */
834 if (total_size <= s->rxbuf_size) {
835 return s->mac_reg[RDH] != s->mac_reg[RDT];
836 }
837 if (s->mac_reg[RDH] < s->mac_reg[RDT]) {
838 bufs = s->mac_reg[RDT] - s->mac_reg[RDH];
839 } else if (s->mac_reg[RDH] > s->mac_reg[RDT]) {
840 bufs = s->mac_reg[RDLEN] / sizeof(struct e1000_rx_desc) +
841 s->mac_reg[RDT] - s->mac_reg[RDH];
842 } else {
843 return false;
844 }
845 return total_size <= bufs * s->rxbuf_size;
846 }
847
848 static bool
849 e1000_can_receive(NetClientState *nc)
850 {
851 E1000State *s = qemu_get_nic_opaque(nc);
852
853 return e1000x_rx_ready(&s->parent_obj, s->mac_reg) &&
854 e1000_has_rxbufs(s, 1) && !timer_pending(s->flush_queue_timer);
855 }
856
857 static uint64_t rx_desc_base(E1000State *s)
858 {
859 uint64_t bah = s->mac_reg[RDBAH];
860 uint64_t bal = s->mac_reg[RDBAL] & ~0xf;
861
862 return (bah << 32) + bal;
863 }
864
865 static void
866 e1000_receiver_overrun(E1000State *s, size_t size)
867 {
868 trace_e1000_receiver_overrun(size, s->mac_reg[RDH], s->mac_reg[RDT]);
869 e1000x_inc_reg_if_not_full(s->mac_reg, RNBC);
870 e1000x_inc_reg_if_not_full(s->mac_reg, MPC);
871 set_ics(s, 0, E1000_ICS_RXO);
872 }
873
874 static ssize_t
875 e1000_receive_iov(NetClientState *nc, const struct iovec *iov, int iovcnt)
876 {
877 E1000State *s = qemu_get_nic_opaque(nc);
878 PCIDevice *d = PCI_DEVICE(s);
879 struct e1000_rx_desc desc;
880 dma_addr_t base;
881 unsigned int n, rdt;
882 uint32_t rdh_start;
883 uint16_t vlan_special = 0;
884 uint8_t vlan_status = 0;
885 uint8_t min_buf[MIN_BUF_SIZE];
886 struct iovec min_iov;
887 uint8_t *filter_buf = iov->iov_base;
888 size_t size = iov_size(iov, iovcnt);
889 size_t iov_ofs = 0;
890 size_t desc_offset;
891 size_t desc_size;
892 size_t total_size;
893
894 if (!e1000x_hw_rx_enabled(s->mac_reg)) {
895 return -1;
896 }
897
898 if (timer_pending(s->flush_queue_timer)) {
899 return 0;
900 }
901
902 /* Pad to minimum Ethernet frame length */
903 if (size < sizeof(min_buf)) {
904 iov_to_buf(iov, iovcnt, 0, min_buf, size);
905 memset(&min_buf[size], 0, sizeof(min_buf) - size);
906 min_iov.iov_base = filter_buf = min_buf;
907 min_iov.iov_len = size = sizeof(min_buf);
908 iovcnt = 1;
909 iov = &min_iov;
910 } else if (iov->iov_len < MAXIMUM_ETHERNET_HDR_LEN) {
911 /* This is very unlikely, but may happen. */
912 iov_to_buf(iov, iovcnt, 0, min_buf, MAXIMUM_ETHERNET_HDR_LEN);
913 filter_buf = min_buf;
914 }
915
916 /* Discard oversized packets if !LPE and !SBP. */
917 if (e1000x_is_oversized(s->mac_reg, size)) {
918 return size;
919 }
920
921 if (!receive_filter(s, filter_buf, size)) {
922 return size;
923 }
924
925 if (e1000x_vlan_enabled(s->mac_reg) &&
926 e1000x_is_vlan_packet(filter_buf, le16_to_cpu(s->mac_reg[VET]))) {
927 vlan_special = cpu_to_le16(lduw_be_p(filter_buf + 14));
928 iov_ofs = 4;
929 if (filter_buf == iov->iov_base) {
930 memmove(filter_buf + 4, filter_buf, 12);
931 } else {
932 iov_from_buf(iov, iovcnt, 4, filter_buf, 12);
933 while (iov->iov_len <= iov_ofs) {
934 iov_ofs -= iov->iov_len;
935 iov++;
936 }
937 }
938 vlan_status = E1000_RXD_STAT_VP;
939 size -= 4;
940 }
941
942 rdh_start = s->mac_reg[RDH];
943 desc_offset = 0;
944 total_size = size + e1000x_fcs_len(s->mac_reg);
945 if (!e1000_has_rxbufs(s, total_size)) {
946 e1000_receiver_overrun(s, total_size);
947 return -1;
948 }
949 do {
950 desc_size = total_size - desc_offset;
951 if (desc_size > s->rxbuf_size) {
952 desc_size = s->rxbuf_size;
953 }
954 base = rx_desc_base(s) + sizeof(desc) * s->mac_reg[RDH];
955 pci_dma_read(d, base, &desc, sizeof(desc));
956 desc.special = vlan_special;
957 desc.status |= (vlan_status | E1000_RXD_STAT_DD);
958 if (desc.buffer_addr) {
959 if (desc_offset < size) {
960 size_t iov_copy;
961 hwaddr ba = le64_to_cpu(desc.buffer_addr);
962 size_t copy_size = size - desc_offset;
963 if (copy_size > s->rxbuf_size) {
964 copy_size = s->rxbuf_size;
965 }
966 do {
967 iov_copy = MIN(copy_size, iov->iov_len - iov_ofs);
968 pci_dma_write(d, ba, iov->iov_base + iov_ofs, iov_copy);
969 copy_size -= iov_copy;
970 ba += iov_copy;
971 iov_ofs += iov_copy;
972 if (iov_ofs == iov->iov_len) {
973 iov++;
974 iov_ofs = 0;
975 }
976 } while (copy_size);
977 }
978 desc_offset += desc_size;
979 desc.length = cpu_to_le16(desc_size);
980 if (desc_offset >= total_size) {
981 desc.status |= E1000_RXD_STAT_EOP | E1000_RXD_STAT_IXSM;
982 } else {
983 /* Guest zeroing out status is not a hardware requirement.
984 Clear EOP in case guest didn't do it. */
985 desc.status &= ~E1000_RXD_STAT_EOP;
986 }
987 } else { // as per intel docs; skip descriptors with null buf addr
988 DBGOUT(RX, "Null RX descriptor!!\n");
989 }
990 pci_dma_write(d, base, &desc, sizeof(desc));
991
992 if (++s->mac_reg[RDH] * sizeof(desc) >= s->mac_reg[RDLEN])
993 s->mac_reg[RDH] = 0;
994 /* see comment in start_xmit; same here */
995 if (s->mac_reg[RDH] == rdh_start ||
996 rdh_start >= s->mac_reg[RDLEN] / sizeof(desc)) {
997 DBGOUT(RXERR, "RDH wraparound @%x, RDT %x, RDLEN %x\n",
998 rdh_start, s->mac_reg[RDT], s->mac_reg[RDLEN]);
999 e1000_receiver_overrun(s, total_size);
1000 return -1;
1001 }
1002 } while (desc_offset < total_size);
1003
1004 e1000x_update_rx_total_stats(s->mac_reg, size, total_size);
1005
1006 n = E1000_ICS_RXT0;
1007 if ((rdt = s->mac_reg[RDT]) < s->mac_reg[RDH])
1008 rdt += s->mac_reg[RDLEN] / sizeof(desc);
1009 if (((rdt - s->mac_reg[RDH]) * sizeof(desc)) <= s->mac_reg[RDLEN] >>
1010 s->rxbuf_min_shift)
1011 n |= E1000_ICS_RXDMT0;
1012
1013 set_ics(s, 0, n);
1014
1015 return size;
1016 }
1017
1018 static ssize_t
1019 e1000_receive(NetClientState *nc, const uint8_t *buf, size_t size)
1020 {
1021 const struct iovec iov = {
1022 .iov_base = (uint8_t *)buf,
1023 .iov_len = size
1024 };
1025
1026 return e1000_receive_iov(nc, &iov, 1);
1027 }
1028
1029 static uint32_t
1030 mac_readreg(E1000State *s, int index)
1031 {
1032 return s->mac_reg[index];
1033 }
1034
1035 static uint32_t
1036 mac_low4_read(E1000State *s, int index)
1037 {
1038 return s->mac_reg[index] & 0xf;
1039 }
1040
1041 static uint32_t
1042 mac_low11_read(E1000State *s, int index)
1043 {
1044 return s->mac_reg[index] & 0x7ff;
1045 }
1046
1047 static uint32_t
1048 mac_low13_read(E1000State *s, int index)
1049 {
1050 return s->mac_reg[index] & 0x1fff;
1051 }
1052
1053 static uint32_t
1054 mac_low16_read(E1000State *s, int index)
1055 {
1056 return s->mac_reg[index] & 0xffff;
1057 }
1058
1059 static uint32_t
1060 mac_icr_read(E1000State *s, int index)
1061 {
1062 uint32_t ret = s->mac_reg[ICR];
1063
1064 DBGOUT(INTERRUPT, "ICR read: %x\n", ret);
1065 set_interrupt_cause(s, 0, 0);
1066 return ret;
1067 }
1068
1069 static uint32_t
1070 mac_read_clr4(E1000State *s, int index)
1071 {
1072 uint32_t ret = s->mac_reg[index];
1073
1074 s->mac_reg[index] = 0;
1075 return ret;
1076 }
1077
1078 static uint32_t
1079 mac_read_clr8(E1000State *s, int index)
1080 {
1081 uint32_t ret = s->mac_reg[index];
1082
1083 s->mac_reg[index] = 0;
1084 s->mac_reg[index-1] = 0;
1085 return ret;
1086 }
1087
1088 static void
1089 mac_writereg(E1000State *s, int index, uint32_t val)
1090 {
1091 uint32_t macaddr[2];
1092
1093 s->mac_reg[index] = val;
1094
1095 if (index == RA + 1) {
1096 macaddr[0] = cpu_to_le32(s->mac_reg[RA]);
1097 macaddr[1] = cpu_to_le32(s->mac_reg[RA + 1]);
1098 qemu_format_nic_info_str(qemu_get_queue(s->nic), (uint8_t *)macaddr);
1099 }
1100 }
1101
1102 static void
1103 set_rdt(E1000State *s, int index, uint32_t val)
1104 {
1105 s->mac_reg[index] = val & 0xffff;
1106 if (e1000_has_rxbufs(s, 1)) {
1107 qemu_flush_queued_packets(qemu_get_queue(s->nic));
1108 }
1109 }
1110
1111 static void
1112 set_16bit(E1000State *s, int index, uint32_t val)
1113 {
1114 s->mac_reg[index] = val & 0xffff;
1115 }
1116
1117 static void
1118 set_dlen(E1000State *s, int index, uint32_t val)
1119 {
1120 s->mac_reg[index] = val & 0xfff80;
1121 }
1122
1123 static void
1124 set_tctl(E1000State *s, int index, uint32_t val)
1125 {
1126 s->mac_reg[index] = val;
1127 s->mac_reg[TDT] &= 0xffff;
1128 start_xmit(s);
1129 }
1130
1131 static void
1132 set_icr(E1000State *s, int index, uint32_t val)
1133 {
1134 DBGOUT(INTERRUPT, "set_icr %x\n", val);
1135 set_interrupt_cause(s, 0, s->mac_reg[ICR] & ~val);
1136 }
1137
1138 static void
1139 set_imc(E1000State *s, int index, uint32_t val)
1140 {
1141 s->mac_reg[IMS] &= ~val;
1142 set_ics(s, 0, 0);
1143 }
1144
1145 static void
1146 set_ims(E1000State *s, int index, uint32_t val)
1147 {
1148 s->mac_reg[IMS] |= val;
1149 set_ics(s, 0, 0);
1150 }
1151
1152 #define getreg(x) [x] = mac_readreg
1153 typedef uint32_t (*readops)(E1000State *, int);
1154 static const readops macreg_readops[] = {
1155 getreg(PBA), getreg(RCTL), getreg(TDH), getreg(TXDCTL),
1156 getreg(WUFC), getreg(TDT), getreg(CTRL), getreg(LEDCTL),
1157 getreg(MANC), getreg(MDIC), getreg(SWSM), getreg(STATUS),
1158 getreg(TORL), getreg(TOTL), getreg(IMS), getreg(TCTL),
1159 getreg(RDH), getreg(RDT), getreg(VET), getreg(ICS),
1160 getreg(TDBAL), getreg(TDBAH), getreg(RDBAH), getreg(RDBAL),
1161 getreg(TDLEN), getreg(RDLEN), getreg(RDTR), getreg(RADV),
1162 getreg(TADV), getreg(ITR), getreg(FCRUC), getreg(IPAV),
1163 getreg(WUC), getreg(WUS), getreg(SCC), getreg(ECOL),
1164 getreg(MCC), getreg(LATECOL), getreg(COLC), getreg(DC),
1165 getreg(TNCRS), getreg(SEQEC), getreg(CEXTERR), getreg(RLEC),
1166 getreg(XONRXC), getreg(XONTXC), getreg(XOFFRXC), getreg(XOFFTXC),
1167 getreg(RFC), getreg(RJC), getreg(RNBC), getreg(TSCTFC),
1168 getreg(MGTPRC), getreg(MGTPDC), getreg(MGTPTC), getreg(GORCL),
1169 getreg(GOTCL),
1170
1171 [TOTH] = mac_read_clr8, [TORH] = mac_read_clr8,
1172 [GOTCH] = mac_read_clr8, [GORCH] = mac_read_clr8,
1173 [PRC64] = mac_read_clr4, [PRC127] = mac_read_clr4,
1174 [PRC255] = mac_read_clr4, [PRC511] = mac_read_clr4,
1175 [PRC1023] = mac_read_clr4, [PRC1522] = mac_read_clr4,
1176 [PTC64] = mac_read_clr4, [PTC127] = mac_read_clr4,
1177 [PTC255] = mac_read_clr4, [PTC511] = mac_read_clr4,
1178 [PTC1023] = mac_read_clr4, [PTC1522] = mac_read_clr4,
1179 [GPRC] = mac_read_clr4, [GPTC] = mac_read_clr4,
1180 [TPT] = mac_read_clr4, [TPR] = mac_read_clr4,
1181 [RUC] = mac_read_clr4, [ROC] = mac_read_clr4,
1182 [BPRC] = mac_read_clr4, [MPRC] = mac_read_clr4,
1183 [TSCTC] = mac_read_clr4, [BPTC] = mac_read_clr4,
1184 [MPTC] = mac_read_clr4,
1185 [ICR] = mac_icr_read, [EECD] = get_eecd,
1186 [EERD] = flash_eerd_read,
1187 [RDFH] = mac_low13_read, [RDFT] = mac_low13_read,
1188 [RDFHS] = mac_low13_read, [RDFTS] = mac_low13_read,
1189 [RDFPC] = mac_low13_read,
1190 [TDFH] = mac_low11_read, [TDFT] = mac_low11_read,
1191 [TDFHS] = mac_low13_read, [TDFTS] = mac_low13_read,
1192 [TDFPC] = mac_low13_read,
1193 [AIT] = mac_low16_read,
1194
1195 [CRCERRS ... MPC] = &mac_readreg,
1196 [IP6AT ... IP6AT+3] = &mac_readreg, [IP4AT ... IP4AT+6] = &mac_readreg,
1197 [FFLT ... FFLT+6] = &mac_low11_read,
1198 [RA ... RA+31] = &mac_readreg,
1199 [WUPM ... WUPM+31] = &mac_readreg,
1200 [MTA ... MTA+127] = &mac_readreg,
1201 [VFTA ... VFTA+127] = &mac_readreg,
1202 [FFMT ... FFMT+254] = &mac_low4_read,
1203 [FFVT ... FFVT+254] = &mac_readreg,
1204 [PBM ... PBM+16383] = &mac_readreg,
1205 };
1206 enum { NREADOPS = ARRAY_SIZE(macreg_readops) };
1207
1208 #define putreg(x) [x] = mac_writereg
1209 typedef void (*writeops)(E1000State *, int, uint32_t);
1210 static const writeops macreg_writeops[] = {
1211 putreg(PBA), putreg(EERD), putreg(SWSM), putreg(WUFC),
1212 putreg(TDBAL), putreg(TDBAH), putreg(TXDCTL), putreg(RDBAH),
1213 putreg(RDBAL), putreg(LEDCTL), putreg(VET), putreg(FCRUC),
1214 putreg(TDFH), putreg(TDFT), putreg(TDFHS), putreg(TDFTS),
1215 putreg(TDFPC), putreg(RDFH), putreg(RDFT), putreg(RDFHS),
1216 putreg(RDFTS), putreg(RDFPC), putreg(IPAV), putreg(WUC),
1217 putreg(WUS), putreg(AIT),
1218
1219 [TDLEN] = set_dlen, [RDLEN] = set_dlen, [TCTL] = set_tctl,
1220 [TDT] = set_tctl, [MDIC] = set_mdic, [ICS] = set_ics,
1221 [TDH] = set_16bit, [RDH] = set_16bit, [RDT] = set_rdt,
1222 [IMC] = set_imc, [IMS] = set_ims, [ICR] = set_icr,
1223 [EECD] = set_eecd, [RCTL] = set_rx_control, [CTRL] = set_ctrl,
1224 [RDTR] = set_16bit, [RADV] = set_16bit, [TADV] = set_16bit,
1225 [ITR] = set_16bit,
1226
1227 [IP6AT ... IP6AT+3] = &mac_writereg, [IP4AT ... IP4AT+6] = &mac_writereg,
1228 [FFLT ... FFLT+6] = &mac_writereg,
1229 [RA ... RA+31] = &mac_writereg,
1230 [WUPM ... WUPM+31] = &mac_writereg,
1231 [MTA ... MTA+127] = &mac_writereg,
1232 [VFTA ... VFTA+127] = &mac_writereg,
1233 [FFMT ... FFMT+254] = &mac_writereg, [FFVT ... FFVT+254] = &mac_writereg,
1234 [PBM ... PBM+16383] = &mac_writereg,
1235 };
1236
1237 enum { NWRITEOPS = ARRAY_SIZE(macreg_writeops) };
1238
1239 enum { MAC_ACCESS_PARTIAL = 1, MAC_ACCESS_FLAG_NEEDED = 2 };
1240
1241 #define markflag(x) ((E1000_FLAG_##x << 2) | MAC_ACCESS_FLAG_NEEDED)
1242 /* In the array below the meaning of the bits is: [f|f|f|f|f|f|n|p]
1243 * f - flag bits (up to 6 possible flags)
1244 * n - flag needed
1245 * p - partially implenented */
1246 static const uint8_t mac_reg_access[0x8000] = {
1247 [RDTR] = markflag(MIT), [TADV] = markflag(MIT),
1248 [RADV] = markflag(MIT), [ITR] = markflag(MIT),
1249
1250 [IPAV] = markflag(MAC), [WUC] = markflag(MAC),
1251 [IP6AT] = markflag(MAC), [IP4AT] = markflag(MAC),
1252 [FFVT] = markflag(MAC), [WUPM] = markflag(MAC),
1253 [ECOL] = markflag(MAC), [MCC] = markflag(MAC),
1254 [DC] = markflag(MAC), [TNCRS] = markflag(MAC),
1255 [RLEC] = markflag(MAC), [XONRXC] = markflag(MAC),
1256 [XOFFTXC] = markflag(MAC), [RFC] = markflag(MAC),
1257 [TSCTFC] = markflag(MAC), [MGTPRC] = markflag(MAC),
1258 [WUS] = markflag(MAC), [AIT] = markflag(MAC),
1259 [FFLT] = markflag(MAC), [FFMT] = markflag(MAC),
1260 [SCC] = markflag(MAC), [FCRUC] = markflag(MAC),
1261 [LATECOL] = markflag(MAC), [COLC] = markflag(MAC),
1262 [SEQEC] = markflag(MAC), [CEXTERR] = markflag(MAC),
1263 [XONTXC] = markflag(MAC), [XOFFRXC] = markflag(MAC),
1264 [RJC] = markflag(MAC), [RNBC] = markflag(MAC),
1265 [MGTPDC] = markflag(MAC), [MGTPTC] = markflag(MAC),
1266 [RUC] = markflag(MAC), [ROC] = markflag(MAC),
1267 [GORCL] = markflag(MAC), [GORCH] = markflag(MAC),
1268 [GOTCL] = markflag(MAC), [GOTCH] = markflag(MAC),
1269 [BPRC] = markflag(MAC), [MPRC] = markflag(MAC),
1270 [TSCTC] = markflag(MAC), [PRC64] = markflag(MAC),
1271 [PRC127] = markflag(MAC), [PRC255] = markflag(MAC),
1272 [PRC511] = markflag(MAC), [PRC1023] = markflag(MAC),
1273 [PRC1522] = markflag(MAC), [PTC64] = markflag(MAC),
1274 [PTC127] = markflag(MAC), [PTC255] = markflag(MAC),
1275 [PTC511] = markflag(MAC), [PTC1023] = markflag(MAC),
1276 [PTC1522] = markflag(MAC), [MPTC] = markflag(MAC),
1277 [BPTC] = markflag(MAC),
1278
1279 [TDFH] = markflag(MAC) | MAC_ACCESS_PARTIAL,
1280 [TDFT] = markflag(MAC) | MAC_ACCESS_PARTIAL,
1281 [TDFHS] = markflag(MAC) | MAC_ACCESS_PARTIAL,
1282 [TDFTS] = markflag(MAC) | MAC_ACCESS_PARTIAL,
1283 [TDFPC] = markflag(MAC) | MAC_ACCESS_PARTIAL,
1284 [RDFH] = markflag(MAC) | MAC_ACCESS_PARTIAL,
1285 [RDFT] = markflag(MAC) | MAC_ACCESS_PARTIAL,
1286 [RDFHS] = markflag(MAC) | MAC_ACCESS_PARTIAL,
1287 [RDFTS] = markflag(MAC) | MAC_ACCESS_PARTIAL,
1288 [RDFPC] = markflag(MAC) | MAC_ACCESS_PARTIAL,
1289 [PBM] = markflag(MAC) | MAC_ACCESS_PARTIAL,
1290 };
1291
1292 static void
1293 e1000_mmio_write(void *opaque, hwaddr addr, uint64_t val,
1294 unsigned size)
1295 {
1296 E1000State *s = opaque;
1297 unsigned int index = (addr & 0x1ffff) >> 2;
1298
1299 if (index < NWRITEOPS && macreg_writeops[index]) {
1300 if (!(mac_reg_access[index] & MAC_ACCESS_FLAG_NEEDED)
1301 || (s->compat_flags & (mac_reg_access[index] >> 2))) {
1302 if (mac_reg_access[index] & MAC_ACCESS_PARTIAL) {
1303 DBGOUT(GENERAL, "Writing to register at offset: 0x%08x. "
1304 "It is not fully implemented.\n", index<<2);
1305 }
1306 macreg_writeops[index](s, index, val);
1307 } else { /* "flag needed" bit is set, but the flag is not active */
1308 DBGOUT(MMIO, "MMIO write attempt to disabled reg. addr=0x%08x\n",
1309 index<<2);
1310 }
1311 } else if (index < NREADOPS && macreg_readops[index]) {
1312 DBGOUT(MMIO, "e1000_mmio_writel RO %x: 0x%04"PRIx64"\n",
1313 index<<2, val);
1314 } else {
1315 DBGOUT(UNKNOWN, "MMIO unknown write addr=0x%08x,val=0x%08"PRIx64"\n",
1316 index<<2, val);
1317 }
1318 }
1319
1320 static uint64_t
1321 e1000_mmio_read(void *opaque, hwaddr addr, unsigned size)
1322 {
1323 E1000State *s = opaque;
1324 unsigned int index = (addr & 0x1ffff) >> 2;
1325
1326 if (index < NREADOPS && macreg_readops[index]) {
1327 if (!(mac_reg_access[index] & MAC_ACCESS_FLAG_NEEDED)
1328 || (s->compat_flags & (mac_reg_access[index] >> 2))) {
1329 if (mac_reg_access[index] & MAC_ACCESS_PARTIAL) {
1330 DBGOUT(GENERAL, "Reading register at offset: 0x%08x. "
1331 "It is not fully implemented.\n", index<<2);
1332 }
1333 return macreg_readops[index](s, index);
1334 } else { /* "flag needed" bit is set, but the flag is not active */
1335 DBGOUT(MMIO, "MMIO read attempt of disabled reg. addr=0x%08x\n",
1336 index<<2);
1337 }
1338 } else {
1339 DBGOUT(UNKNOWN, "MMIO unknown read addr=0x%08x\n", index<<2);
1340 }
1341 return 0;
1342 }
1343
1344 static const MemoryRegionOps e1000_mmio_ops = {
1345 .read = e1000_mmio_read,
1346 .write = e1000_mmio_write,
1347 .endianness = DEVICE_LITTLE_ENDIAN,
1348 .impl = {
1349 .min_access_size = 4,
1350 .max_access_size = 4,
1351 },
1352 };
1353
1354 static uint64_t e1000_io_read(void *opaque, hwaddr addr,
1355 unsigned size)
1356 {
1357 E1000State *s = opaque;
1358
1359 (void)s;
1360 return 0;
1361 }
1362
1363 static void e1000_io_write(void *opaque, hwaddr addr,
1364 uint64_t val, unsigned size)
1365 {
1366 E1000State *s = opaque;
1367
1368 (void)s;
1369 }
1370
1371 static const MemoryRegionOps e1000_io_ops = {
1372 .read = e1000_io_read,
1373 .write = e1000_io_write,
1374 .endianness = DEVICE_LITTLE_ENDIAN,
1375 };
1376
/* VMState field test: true only when the incoming stream is version 1. */
static bool is_version_1(void *opaque, int version_id)
{
    if (version_id != 1) {
        return false;
    }
    return true;
}
1381
1382 static int e1000_pre_save(void *opaque)
1383 {
1384 E1000State *s = opaque;
1385 NetClientState *nc = qemu_get_queue(s->nic);
1386
1387 /*
1388 * If link is down and auto-negotiation is supported and ongoing,
1389 * complete auto-negotiation immediately. This allows us to look
1390 * at MII_SR_AUTONEG_COMPLETE to infer link status on load.
1391 */
1392 if (nc->link_down && have_autoneg(s)) {
1393 s->phy_reg[PHY_STATUS] |= MII_SR_AUTONEG_COMPLETE;
1394 }
1395
1396 /* Decide which set of props to migrate in the main structure */
1397 if (chkflag(TSO) || !s->use_tso_for_migration) {
1398 /* Either we're migrating with the extra subsection, in which
1399 * case the mig_props is always 'props' OR
1400 * we've not got the subsection, but 'props' was the last
1401 * updated.
1402 */
1403 s->mig_props = s->tx.props;
1404 } else {
1405 /* We're not using the subsection, and 'tso_props' was
1406 * the last updated.
1407 */
1408 s->mig_props = s->tx.tso_props;
1409 }
1410 return 0;
1411 }
1412
1413 static int e1000_post_load(void *opaque, int version_id)
1414 {
1415 E1000State *s = opaque;
1416 NetClientState *nc = qemu_get_queue(s->nic);
1417
1418 if (!chkflag(MIT)) {
1419 s->mac_reg[ITR] = s->mac_reg[RDTR] = s->mac_reg[RADV] =
1420 s->mac_reg[TADV] = 0;
1421 s->mit_irq_level = false;
1422 }
1423 s->mit_ide = 0;
1424 s->mit_timer_on = true;
1425 timer_mod(s->mit_timer, qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + 1);
1426
1427 /* nc.link_down can't be migrated, so infer link_down according
1428 * to link status bit in mac_reg[STATUS].
1429 * Alternatively, restart link negotiation if it was in progress. */
1430 nc->link_down = (s->mac_reg[STATUS] & E1000_STATUS_LU) == 0;
1431
1432 if (have_autoneg(s) &&
1433 !(s->phy_reg[PHY_STATUS] & MII_SR_AUTONEG_COMPLETE)) {
1434 nc->link_down = false;
1435 timer_mod(s->autoneg_timer,
1436 qemu_clock_get_ms(QEMU_CLOCK_VIRTUAL) + 500);
1437 }
1438
1439 s->tx.props = s->mig_props;
1440 if (!s->received_tx_tso) {
1441 /* We received only one set of offload data (tx.props)
1442 * and haven't got tx.tso_props. The best we can do
1443 * is dupe the data.
1444 */
1445 s->tx.tso_props = s->mig_props;
1446 }
1447 return 0;
1448 }
1449
1450 static int e1000_tx_tso_post_load(void *opaque, int version_id)
1451 {
1452 E1000State *s = opaque;
1453 s->received_tx_tso = true;
1454 return 0;
1455 }
1456
1457 static bool e1000_mit_state_needed(void *opaque)
1458 {
1459 E1000State *s = opaque;
1460
1461 return chkflag(MIT);
1462 }
1463
1464 static bool e1000_full_mac_needed(void *opaque)
1465 {
1466 E1000State *s = opaque;
1467
1468 return chkflag(MAC);
1469 }
1470
1471 static bool e1000_tso_state_needed(void *opaque)
1472 {
1473 E1000State *s = opaque;
1474
1475 return chkflag(TSO);
1476 }
1477
1478 static const VMStateDescription vmstate_e1000_mit_state = {
1479 .name = "e1000/mit_state",
1480 .version_id = 1,
1481 .minimum_version_id = 1,
1482 .needed = e1000_mit_state_needed,
1483 .fields = (VMStateField[]) {
1484 VMSTATE_UINT32(mac_reg[RDTR], E1000State),
1485 VMSTATE_UINT32(mac_reg[RADV], E1000State),
1486 VMSTATE_UINT32(mac_reg[TADV], E1000State),
1487 VMSTATE_UINT32(mac_reg[ITR], E1000State),
1488 VMSTATE_BOOL(mit_irq_level, E1000State),
1489 VMSTATE_END_OF_LIST()
1490 }
1491 };
1492
1493 static const VMStateDescription vmstate_e1000_full_mac_state = {
1494 .name = "e1000/full_mac_state",
1495 .version_id = 1,
1496 .minimum_version_id = 1,
1497 .needed = e1000_full_mac_needed,
1498 .fields = (VMStateField[]) {
1499 VMSTATE_UINT32_ARRAY(mac_reg, E1000State, 0x8000),
1500 VMSTATE_END_OF_LIST()
1501 }
1502 };
1503
1504 static const VMStateDescription vmstate_e1000_tx_tso_state = {
1505 .name = "e1000/tx_tso_state",
1506 .version_id = 1,
1507 .minimum_version_id = 1,
1508 .needed = e1000_tso_state_needed,
1509 .post_load = e1000_tx_tso_post_load,
1510 .fields = (VMStateField[]) {
1511 VMSTATE_UINT8(tx.tso_props.ipcss, E1000State),
1512 VMSTATE_UINT8(tx.tso_props.ipcso, E1000State),
1513 VMSTATE_UINT16(tx.tso_props.ipcse, E1000State),
1514 VMSTATE_UINT8(tx.tso_props.tucss, E1000State),
1515 VMSTATE_UINT8(tx.tso_props.tucso, E1000State),
1516 VMSTATE_UINT16(tx.tso_props.tucse, E1000State),
1517 VMSTATE_UINT32(tx.tso_props.paylen, E1000State),
1518 VMSTATE_UINT8(tx.tso_props.hdr_len, E1000State),
1519 VMSTATE_UINT16(tx.tso_props.mss, E1000State),
1520 VMSTATE_INT8(tx.tso_props.ip, E1000State),
1521 VMSTATE_INT8(tx.tso_props.tcp, E1000State),
1522 VMSTATE_END_OF_LIST()
1523 }
1524 };
1525
1526 static const VMStateDescription vmstate_e1000 = {
1527 .name = "e1000",
1528 .version_id = 2,
1529 .minimum_version_id = 1,
1530 .pre_save = e1000_pre_save,
1531 .post_load = e1000_post_load,
1532 .fields = (VMStateField[]) {
1533 VMSTATE_PCI_DEVICE(parent_obj, E1000State),
1534 VMSTATE_UNUSED_TEST(is_version_1, 4), /* was instance id */
1535 VMSTATE_UNUSED(4), /* Was mmio_base. */
1536 VMSTATE_UINT32(rxbuf_size, E1000State),
1537 VMSTATE_UINT32(rxbuf_min_shift, E1000State),
1538 VMSTATE_UINT32(eecd_state.val_in, E1000State),
1539 VMSTATE_UINT16(eecd_state.bitnum_in, E1000State),
1540 VMSTATE_UINT16(eecd_state.bitnum_out, E1000State),
1541 VMSTATE_UINT16(eecd_state.reading, E1000State),
1542 VMSTATE_UINT32(eecd_state.old_eecd, E1000State),
1543 VMSTATE_UINT8(mig_props.ipcss, E1000State),
1544 VMSTATE_UINT8(mig_props.ipcso, E1000State),
1545 VMSTATE_UINT16(mig_props.ipcse, E1000State),
1546 VMSTATE_UINT8(mig_props.tucss, E1000State),
1547 VMSTATE_UINT8(mig_props.tucso, E1000State),
1548 VMSTATE_UINT16(mig_props.tucse, E1000State),
1549 VMSTATE_UINT32(mig_props.paylen, E1000State),
1550 VMSTATE_UINT8(mig_props.hdr_len, E1000State),
1551 VMSTATE_UINT16(mig_props.mss, E1000State),
1552 VMSTATE_UINT16(tx.size, E1000State),
1553 VMSTATE_UINT16(tx.tso_frames, E1000State),
1554 VMSTATE_UINT8(tx.sum_needed, E1000State),
1555 VMSTATE_INT8(mig_props.ip, E1000State),
1556 VMSTATE_INT8(mig_props.tcp, E1000State),
1557 VMSTATE_BUFFER(tx.header, E1000State),
1558 VMSTATE_BUFFER(tx.data, E1000State),
1559 VMSTATE_UINT16_ARRAY(eeprom_data, E1000State, 64),
1560 VMSTATE_UINT16_ARRAY(phy_reg, E1000State, 0x20),
1561 VMSTATE_UINT32(mac_reg[CTRL], E1000State),
1562 VMSTATE_UINT32(mac_reg[EECD], E1000State),
1563 VMSTATE_UINT32(mac_reg[EERD], E1000State),
1564 VMSTATE_UINT32(mac_reg[GPRC], E1000State),
1565 VMSTATE_UINT32(mac_reg[GPTC], E1000State),
1566 VMSTATE_UINT32(mac_reg[ICR], E1000State),
1567 VMSTATE_UINT32(mac_reg[ICS], E1000State),
1568 VMSTATE_UINT32(mac_reg[IMC], E1000State),
1569 VMSTATE_UINT32(mac_reg[IMS], E1000State),
1570 VMSTATE_UINT32(mac_reg[LEDCTL], E1000State),
1571 VMSTATE_UINT32(mac_reg[MANC], E1000State),
1572 VMSTATE_UINT32(mac_reg[MDIC], E1000State),
1573 VMSTATE_UINT32(mac_reg[MPC], E1000State),
1574 VMSTATE_UINT32(mac_reg[PBA], E1000State),
1575 VMSTATE_UINT32(mac_reg[RCTL], E1000State),
1576 VMSTATE_UINT32(mac_reg[RDBAH], E1000State),
1577 VMSTATE_UINT32(mac_reg[RDBAL], E1000State),
1578 VMSTATE_UINT32(mac_reg[RDH], E1000State),
1579 VMSTATE_UINT32(mac_reg[RDLEN], E1000State),
1580 VMSTATE_UINT32(mac_reg[RDT], E1000State),
1581 VMSTATE_UINT32(mac_reg[STATUS], E1000State),
1582 VMSTATE_UINT32(mac_reg[SWSM], E1000State),
1583 VMSTATE_UINT32(mac_reg[TCTL], E1000State),
1584 VMSTATE_UINT32(mac_reg[TDBAH], E1000State),
1585 VMSTATE_UINT32(mac_reg[TDBAL], E1000State),
1586 VMSTATE_UINT32(mac_reg[TDH], E1000State),
1587 VMSTATE_UINT32(mac_reg[TDLEN], E1000State),
1588 VMSTATE_UINT32(mac_reg[TDT], E1000State),
1589 VMSTATE_UINT32(mac_reg[TORH], E1000State),
1590 VMSTATE_UINT32(mac_reg[TORL], E1000State),
1591 VMSTATE_UINT32(mac_reg[TOTH], E1000State),
1592 VMSTATE_UINT32(mac_reg[TOTL], E1000State),
1593 VMSTATE_UINT32(mac_reg[TPR], E1000State),
1594 VMSTATE_UINT32(mac_reg[TPT], E1000State),
1595 VMSTATE_UINT32(mac_reg[TXDCTL], E1000State),
1596 VMSTATE_UINT32(mac_reg[WUFC], E1000State),
1597 VMSTATE_UINT32(mac_reg[VET], E1000State),
1598 VMSTATE_UINT32_SUB_ARRAY(mac_reg, E1000State, RA, 32),
1599 VMSTATE_UINT32_SUB_ARRAY(mac_reg, E1000State, MTA, 128),
1600 VMSTATE_UINT32_SUB_ARRAY(mac_reg, E1000State, VFTA, 128),
1601 VMSTATE_END_OF_LIST()
1602 },
1603 .subsections = (const VMStateDescription*[]) {
1604 &vmstate_e1000_mit_state,
1605 &vmstate_e1000_full_mac_state,
1606 &vmstate_e1000_tx_tso_state,
1607 NULL
1608 }
1609 };
1610
/*
 * EEPROM contents documented in Tables 5-2 and 5-3, pp. 98-102.
 * Note: A valid DevId will be inserted during pci_e1000_realize().
 *
 * The trailing comment on each row gives the word offset of its first
 * entry.
 */
static const uint16_t e1000_eeprom_template[64] = {
    0x0000, 0x0000, 0x0000, 0x0000, 0xffff, 0x0000, 0x0000, 0x0000, /* 0x00 */
    0x3000, 0x1000, 0x6403,
    0x0000 /*DevId*/, 0x8086,
    0x0000 /*DevId*/, 0x8086, 0x3040,                               /* 0x08 */
    0x0008, 0x2000, 0x7e14, 0x0048, 0x1000, 0x00d8, 0x0000, 0x2700, /* 0x10 */
    0x6cc9, 0x3150, 0x0722, 0x040b, 0x0984, 0x0000, 0xc000, 0x0706, /* 0x18 */
    0x1008, 0x0000, 0x0f04, 0x7fff, 0x4d01, 0xffff, 0xffff, 0xffff, /* 0x20 */
    0xffff, 0xffff, 0xffff, 0xffff, 0xffff, 0xffff, 0xffff, 0xffff, /* 0x28 */
    0x0100, 0x4000, 0x121c, 0xffff, 0xffff, 0xffff, 0xffff, 0xffff, /* 0x30 */
    0xffff, 0xffff, 0xffff, 0xffff, 0xffff, 0xffff, 0xffff, 0x0000, /* 0x38 */
};
1625
1626 /* PCI interface */
1627
1628 static void
1629 e1000_mmio_setup(E1000State *d)
1630 {
1631 int i;
1632 const uint32_t excluded_regs[] = {
1633 E1000_MDIC, E1000_ICR, E1000_ICS, E1000_IMS,
1634 E1000_IMC, E1000_TCTL, E1000_TDT, PNPMMIO_SIZE
1635 };
1636
1637 memory_region_init_io(&d->mmio, OBJECT(d), &e1000_mmio_ops, d,
1638 "e1000-mmio", PNPMMIO_SIZE);
1639 memory_region_add_coalescing(&d->mmio, 0, excluded_regs[0]);
1640 for (i = 0; excluded_regs[i] != PNPMMIO_SIZE; i++)
1641 memory_region_add_coalescing(&d->mmio, excluded_regs[i] + 4,
1642 excluded_regs[i+1] - excluded_regs[i] - 4);
1643 memory_region_init_io(&d->io, OBJECT(d), &e1000_io_ops, d, "e1000-io", IOPORT_SIZE);
1644 }
1645
1646 static void
1647 pci_e1000_uninit(PCIDevice *dev)
1648 {
1649 E1000State *d = E1000(dev);
1650
1651 timer_del(d->autoneg_timer);
1652 timer_free(d->autoneg_timer);
1653 timer_del(d->mit_timer);
1654 timer_free(d->mit_timer);
1655 timer_del(d->flush_queue_timer);
1656 timer_free(d->flush_queue_timer);
1657 qemu_del_nic(d->nic);
1658 }
1659
1660 static NetClientInfo net_e1000_info = {
1661 .type = NET_CLIENT_DRIVER_NIC,
1662 .size = sizeof(NICState),
1663 .can_receive = e1000_can_receive,
1664 .receive = e1000_receive,
1665 .receive_iov = e1000_receive_iov,
1666 .link_status_changed = e1000_set_link_status,
1667 };
1668
1669 static void e1000_write_config(PCIDevice *pci_dev, uint32_t address,
1670 uint32_t val, int len)
1671 {
1672 E1000State *s = E1000(pci_dev);
1673
1674 pci_default_write_config(pci_dev, address, val, len);
1675
1676 if (range_covers_byte(address, len, PCI_COMMAND) &&
1677 (pci_dev->config[PCI_COMMAND] & PCI_COMMAND_MASTER)) {
1678 qemu_flush_queued_packets(qemu_get_queue(s->nic));
1679 }
1680 }
1681
1682 static void pci_e1000_realize(PCIDevice *pci_dev, Error **errp)
1683 {
1684 DeviceState *dev = DEVICE(pci_dev);
1685 E1000State *d = E1000(pci_dev);
1686 uint8_t *pci_conf;
1687 uint8_t *macaddr;
1688
1689 pci_dev->config_write = e1000_write_config;
1690
1691 pci_conf = pci_dev->config;
1692
1693 /* TODO: RST# value should be 0, PCI spec 6.2.4 */
1694 pci_conf[PCI_CACHE_LINE_SIZE] = 0x10;
1695
1696 pci_conf[PCI_INTERRUPT_PIN] = 1; /* interrupt pin A */
1697
1698 e1000_mmio_setup(d);
1699
1700 pci_register_bar(pci_dev, 0, PCI_BASE_ADDRESS_SPACE_MEMORY, &d->mmio);
1701
1702 pci_register_bar(pci_dev, 1, PCI_BASE_ADDRESS_SPACE_IO, &d->io);
1703
1704 qemu_macaddr_default_if_unset(&d->conf.macaddr);
1705 macaddr = d->conf.macaddr.a;
1706
1707 e1000x_core_prepare_eeprom(d->eeprom_data,
1708 e1000_eeprom_template,
1709 sizeof(e1000_eeprom_template),
1710 PCI_DEVICE_GET_CLASS(pci_dev)->device_id,
1711 macaddr);
1712
1713 d->nic = qemu_new_nic(&net_e1000_info, &d->conf,
1714 object_get_typename(OBJECT(d)), dev->id, d);
1715
1716 qemu_format_nic_info_str(qemu_get_queue(d->nic), macaddr);
1717
1718 d->autoneg_timer = timer_new_ms(QEMU_CLOCK_VIRTUAL, e1000_autoneg_timer, d);
1719 d->mit_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL, e1000_mit_timer, d);
1720 d->flush_queue_timer = timer_new_ms(QEMU_CLOCK_VIRTUAL,
1721 e1000_flush_queue_timer, d);
1722 }
1723
1724 static void qdev_e1000_reset(DeviceState *dev)
1725 {
1726 E1000State *d = E1000(dev);
1727 e1000_reset(d);
1728 }
1729
1730 static Property e1000_properties[] = {
1731 DEFINE_NIC_PROPERTIES(E1000State, conf),
1732 DEFINE_PROP_BIT("autonegotiation", E1000State,
1733 compat_flags, E1000_FLAG_AUTONEG_BIT, true),
1734 DEFINE_PROP_BIT("mitigation", E1000State,
1735 compat_flags, E1000_FLAG_MIT_BIT, true),
1736 DEFINE_PROP_BIT("extra_mac_registers", E1000State,
1737 compat_flags, E1000_FLAG_MAC_BIT, true),
1738 DEFINE_PROP_BIT("migrate_tso_props", E1000State,
1739 compat_flags, E1000_FLAG_TSO_BIT, true),
1740 DEFINE_PROP_END_OF_LIST(),
1741 };
1742
/* Per-model parameters handed to e1000_class_init() as class data. */
typedef struct E1000Info E1000Info;

struct E1000Info {
    const char *name;       /* QOM type name of the model */
    uint16_t device_id;     /* copied to the PCI class device_id */
    uint8_t revision;       /* copied to the PCI class revision */
    uint16_t phy_id2;       /* copied to the E1000 base class phy_id2 */
};
1749
1750 static void e1000_class_init(ObjectClass *klass, void *data)
1751 {
1752 DeviceClass *dc = DEVICE_CLASS(klass);
1753 PCIDeviceClass *k = PCI_DEVICE_CLASS(klass);
1754 E1000BaseClass *e = E1000_DEVICE_CLASS(klass);
1755 const E1000Info *info = data;
1756
1757 k->realize = pci_e1000_realize;
1758 k->exit = pci_e1000_uninit;
1759 k->romfile = "efi-e1000.rom";
1760 k->vendor_id = PCI_VENDOR_ID_INTEL;
1761 k->device_id = info->device_id;
1762 k->revision = info->revision;
1763 e->phy_id2 = info->phy_id2;
1764 k->class_id = PCI_CLASS_NETWORK_ETHERNET;
1765 set_bit(DEVICE_CATEGORY_NETWORK, dc->categories);
1766 dc->desc = "Intel Gigabit Ethernet";
1767 dc->reset = qdev_e1000_reset;
1768 dc->vmsd = &vmstate_e1000;
1769 device_class_set_props(dc, e1000_properties);
1770 }
1771
1772 static void e1000_instance_init(Object *obj)
1773 {
1774 E1000State *n = E1000(obj);
1775 device_add_bootindex_property(obj, &n->conf.bootindex,
1776 "bootindex", "/ethernet-phy@0",
1777 DEVICE(n));
1778 }
1779
1780 static const TypeInfo e1000_base_info = {
1781 .name = TYPE_E1000_BASE,
1782 .parent = TYPE_PCI_DEVICE,
1783 .instance_size = sizeof(E1000State),
1784 .instance_init = e1000_instance_init,
1785 .class_size = sizeof(E1000BaseClass),
1786 .abstract = true,
1787 .interfaces = (InterfaceInfo[]) {
1788 { INTERFACE_CONVENTIONAL_PCI_DEVICE },
1789 { },
1790 },
1791 };
1792
1793 static const E1000Info e1000_devices[] = {
1794 {
1795 .name = "e1000",
1796 .device_id = E1000_DEV_ID_82540EM,
1797 .revision = 0x03,
1798 .phy_id2 = E1000_PHY_ID2_8254xx_DEFAULT,
1799 },
1800 {
1801 .name = "e1000-82544gc",
1802 .device_id = E1000_DEV_ID_82544GC_COPPER,
1803 .revision = 0x03,
1804 .phy_id2 = E1000_PHY_ID2_82544x,
1805 },
1806 {
1807 .name = "e1000-82545em",
1808 .device_id = E1000_DEV_ID_82545EM_COPPER,
1809 .revision = 0x03,
1810 .phy_id2 = E1000_PHY_ID2_8254xx_DEFAULT,
1811 },
1812 };
1813
1814 static void e1000_register_types(void)
1815 {
1816 int i;
1817
1818 type_register_static(&e1000_base_info);
1819 for (i = 0; i < ARRAY_SIZE(e1000_devices); i++) {
1820 const E1000Info *info = &e1000_devices[i];
1821 TypeInfo type_info = {};
1822
1823 type_info.name = info->name;
1824 type_info.parent = TYPE_E1000_BASE;
1825 type_info.class_data = (void *)info;
1826 type_info.class_init = e1000_class_init;
1827
1828 type_register(&type_info);
1829 }
1830 }
1831
1832 type_init(e1000_register_types)