2 * Copyright (c) 2013 Zhixiang Yu <zcore@freebsd.org>
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions
8 * 1. Redistributions of source code must retain the above copyright
9 * notice, this list of conditions and the following disclaimer.
10 * 2. Redistributions in binary form must reproduce the above copyright
11 * notice, this list of conditions and the following disclaimer in the
12 * documentation and/or other materials provided with the distribution.
14 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND
15 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
16 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
17 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
18 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
19 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
20 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
21 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
22 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
23 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29 #include <sys/cdefs.h>
30 __FBSDID("$FreeBSD$");
32 #include <sys/param.h>
33 #include <sys/linker_set.h>
36 #include <sys/ioctl.h>
39 #include <sys/endian.h>
51 #include <pthread_np.h>
59 #define MAX_PORTS 6 /* Intel ICH8 AHCI supports 6 ports */
61 #define PxSIG_ATA 0x00000101 /* ATA drive */
62 #define PxSIG_ATAPI 0xeb140101 /* ATAPI drive */
65 FIS_TYPE_REGH2D = 0x27, /* Register FIS - host to device */
66 FIS_TYPE_REGD2H = 0x34, /* Register FIS - device to host */
67 FIS_TYPE_DMAACT = 0x39, /* DMA activate FIS - device to host */
68 FIS_TYPE_DMASETUP = 0x41, /* DMA setup FIS - bidirectional */
69 FIS_TYPE_DATA = 0x46, /* Data FIS - bidirectional */
70 FIS_TYPE_BIST = 0x58, /* BIST activate FIS - bidirectional */
71 FIS_TYPE_PIOSETUP = 0x5F, /* PIO setup FIS - device to host */
72 FIS_TYPE_SETDEVBITS = 0xA1, /* Set dev bits FIS - device to host */
78 #define TEST_UNIT_READY 0x00
79 #define REQUEST_SENSE 0x03
81 #define START_STOP_UNIT 0x1B
82 #define PREVENT_ALLOW 0x1E
83 #define READ_CAPACITY 0x25
85 #define POSITION_TO_ELEMENT 0x2B
87 #define GET_EVENT_STATUS_NOTIFICATION 0x4A
88 #define MODE_SENSE_10 0x5A
93 * SCSI mode page codes
95 #define MODEPAGE_RW_ERROR_RECOVERY 0x01
96 #define MODEPAGE_CD_CAPABILITIES 0x2A
101 #define ATA_SF_ENAB_SATA_SF 0x10
102 #define ATA_SATA_SF_AN 0x05
103 #define ATA_SF_DIS_SATA_SF 0x90
110 #define DPRINTF(format, arg...) do{fprintf(dbg, format, ##arg);fflush(dbg);}while(0)
112 #define DPRINTF(format, arg...)
114 #define WPRINTF(format, arg...) printf(format, ##arg)
117 struct blockif_req io_req;
118 struct ahci_port *io_pr;
119 STAILQ_ENTRY(ahci_ioreq) io_flist;
120 TAILQ_ENTRY(ahci_ioreq) io_blist;
129 struct blockif_ctxt *bctx;
130 struct pci_ahci_softc *pr_sc;
162 struct ahci_ioreq *ioreq;
164 STAILQ_HEAD(ahci_fhead, ahci_ioreq) iofhd;
165 TAILQ_HEAD(ahci_bhead, ahci_ioreq) iobhd;
/*
 * AHCI command header.  Only the reserved[4] member is visible in this
 * listing; other code in this file accesses flags, prdtl, prdbc and ctba
 * through pointers of this type.
 */
168 struct ahci_cmd_hdr {
173 uint32_t reserved[4];
/*
 * One physical region descriptor table entry.  Users in this file take the
 * guest address of the region from dba and compute its byte count as
 * (dbc & DBCMASK) + 1.
 */
176 struct ahci_prdt_entry {
179 #define DBCMASK 0x3fffff
/*
 * Per-controller state.  Members visible in this listing: the owning PCI
 * device instance (asc_pi) and an array of MAX_PORTS port structures.
 */
183 struct pci_ahci_softc {
184 struct pci_devinst *asc_pi;
199 struct ahci_port port[MAX_PORTS];
/* Fetch the VM context from the PCI device instance behind a softc. */
201 #define ahci_ctx(sc) ((sc)->asc_pi->pi_vmctx)
/*
 * Encode lba into buf[] (presumably minute/second/frame, going by the name).
 * The visible statements store (lba / 75) / 60 in buf[0] and
 * (lba / 75) % 60 in buf[1], using whatever value lba holds at that point.
 * NOTE(review): the rest of the body is not visible in this listing.
 */
203 static inline void lba_to_msf(uint8_t *buf, int lba)
206 buf[0] = (lba / 75) / 60;
207 buf[1] = (lba / 75) % 60;
212 * generate HBA intr depending on whether or not ports within
213 * the controller have an interrupt pending.
/*
 * Update the interrupt state of the controller sc.
 * Visible logic: when sc->is is non-zero and AHCI_GHC_IE is set in sc->ghc,
 * an MSI is generated if pci_msi_enabled(pi); otherwise the pin interrupt is
 * asserted provided sc->lintr is not already set.  In the remaining branch,
 * taken when sc->lintr is set, the pin interrupt is deasserted.
 * NOTE(review): the loop over sc->ports presumably folds per-port state
 * into sc->is; its body is not visible here - confirm.
 */
216 ahci_generate_intr(struct pci_ahci_softc *sc)
218 struct pci_devinst *pi;
223 for (i = 0; i < sc->ports; i++) {
224 struct ahci_port *pr;
230 DPRINTF("%s %x\n", __func__, sc->is);
232 if (sc->is && (sc->ghc & AHCI_GHC_IE)) {
233 if (pci_msi_enabled(pi)) {
235 * Generate an MSI interrupt on every edge
237 pci_generate_msi(pi, 0);
238 } else if (!sc->lintr) {
240 * Only generate a pin-based interrupt if one wasn't
244 pci_lintr_assert(pi);
246 } else if (sc->lintr) {
248 * No interrupts: deassert pin-based signal if it had
251 pci_lintr_deassert(pi);
/*
 * Copy the FIS in fis into the received-FIS area of port p and then call
 * ahci_generate_intr() on the owning controller.
 *
 * p   - port whose rfis buffer receives the FIS
 * ft  - FIS type; REGD2H, SETDEVBITS and PIOSETUP have dedicated cases
 * fis - source bytes, copied with memcpy() to p->rfis + offset
 *
 * Any other type is reported through WPRINTF as unsupported.
 * NOTE(review): the offset/len/irq values chosen per type are on lines not
 * visible in this listing.
 */
257 ahci_write_fis(struct ahci_port *p, enum sata_fis_type ft, uint8_t *fis)
259 int offset, len, irq;
/* Guard: no received-FIS buffer mapped, or FIS receive not enabled. */
261 if (p->rfis == NULL || !(p->cmd & AHCI_P_CMD_FRE))
265 case FIS_TYPE_REGD2H:
270 case FIS_TYPE_SETDEVBITS:
275 case FIS_TYPE_PIOSETUP:
281 WPRINTF("unsupported fis type %d\n", ft);
284 memcpy(p->rfis + offset, fis, len);
287 ahci_generate_intr(p->pr_sc);
/*
 * Post a PIO setup FIS for port p: the local fis buffer is zeroed, its first
 * byte is set to FIS_TYPE_PIOSETUP, and it is handed to ahci_write_fis().
 */
292 ahci_write_fis_piosetup(struct ahci_port *p)
296 memset(fis, 0, sizeof(fis));
297 fis[0] = FIS_TYPE_PIOSETUP;
298 ahci_write_fis(p, FIS_TYPE_PIOSETUP, fis);
/*
 * Post a Set Device Bits FIS for the given slot.
 *
 * p    - port to post the FIS on
 * slot - command slot; its bit (1 << slot) is stored in the 32-bit word at
 *        fis + 4
 * tfd  - task file data; bits 15:8 are extracted into error
 *
 * If ATA_S_ERROR is set in fis[2], AHCI_P_IX_TFE is raised in p->is before
 * the FIS is passed to ahci_write_fis().
 * NOTE(review): the store through (uint32_t *)(fis + 4) relies on fis being
 * suitably aligned; the declaration of fis is not visible here - confirm.
 */
302 ahci_write_fis_sdb(struct ahci_port *p, int slot, uint32_t tfd)
307 error = (tfd >> 8) & 0xff;
308 memset(fis, 0, sizeof(fis));
311 *(uint32_t *)(fis + 4) = (1 << slot);
312 if (fis[2] & ATA_S_ERROR)
313 p->is |= AHCI_P_IX_TFE;
315 ahci_write_fis(p, FIS_TYPE_SETDEVBITS, fis);
/*
 * Post a device-to-host register FIS completing the command in slot.
 *
 * p    - port to post the FIS on
 * slot - command slot; its bit is cleared from p->ci
 * cfis - command FIS of the request (its use is on lines not visible here)
 * tfd  - task file data; bits 15:8 are extracted into error
 *
 * If ATA_S_ERROR is set in fis[2], AHCI_P_IX_TFE is raised in p->is.  The
 * FIS is then passed to ahci_write_fis() as FIS_TYPE_REGD2H.
 */
319 ahci_write_fis_d2h(struct ahci_port *p, int slot, uint8_t *cfis, uint32_t tfd)
324 error = (tfd >> 8) & 0xff;
325 memset(fis, 0, sizeof(fis));
326 fis[0] = FIS_TYPE_REGD2H;
340 if (fis[2] & ATA_S_ERROR)
341 p->is |= AHCI_P_IX_TFE;
343 p->ci &= ~(1 << slot);
345 ahci_write_fis(p, FIS_TYPE_REGD2H, fis);
/*
 * Post the device-to-host register FIS used after a port reset (called from
 * ahci_port_reset()).  The buffer is zeroed and tagged FIS_TYPE_REGD2H; the
 * remaining field assignments are on lines not visible in this listing.
 */
349 ahci_write_reset_fis_d2h(struct ahci_port *p)
353 memset(fis, 0, sizeof(fis));
354 fis[0] = FIS_TYPE_REGD2H;
362 ahci_write_fis(p, FIS_TYPE_REGD2H, fis);
/*
 * Finish stopping port p once it is idle: when AHCI_P_CMD_ST is clear in
 * p->cmd and p->pending is zero, AHCI_P_CMD_CR and the CCS field are cleared
 * from p->cmd.  Further clears described by the existing comment below are
 * on lines not visible in this listing.
 */
366 ahci_check_stopped(struct ahci_port *p)
369 * If we are no longer processing the command list and nothing
370 * is in-flight, clear the running bit, the current command
371 * slot, the command issue and active bits.
373 if (!(p->cmd & AHCI_P_CMD_ST)) {
374 if (p->pending == 0) {
375 p->cmd &= ~(AHCI_P_CMD_CR | AHCI_P_CMD_CCS_MASK);
/*
 * Stop port p by cancelling outstanding block I/O.
 * The caller must hold the controller mutex (asserted below).  Each request
 * on the busy list is offered to blockif_cancel(); for the entries processed
 * further, the bit of the slot is cleared from p->sact or p->ci and from
 * p->pending, and the request moves from the busy list to the free list.
 * ahci_check_stopped() runs at the end.
 * NOTE(review): handling of a failed blockif_cancel() is on lines not
 * visible here.
 * NOTE(review): entries are removed with TAILQ_REMOVE inside a plain
 * TAILQ_FOREACH; confirm this is safe or switch to TAILQ_FOREACH_SAFE.
 */
383 ahci_port_stop(struct ahci_port *p)
385 struct ahci_ioreq *aior;
391 assert(pthread_mutex_isowned_np(&p->pr_sc->mtx));
393 TAILQ_FOREACH(aior, &p->iobhd, io_blist) {
395 * Try to cancel the outstanding blockif request.
397 error = blockif_cancel(p->bctx, &aior->io_req);
/* FPDMA QUEUED opcodes are tested here; presumably selects sact vs ci. */
403 if (cfis[2] == ATA_WRITE_FPDMA_QUEUED ||
404 cfis[2] == ATA_READ_FPDMA_QUEUED)
408 p->sact &= ~(1 << slot);
410 p->ci &= ~(1 << slot);
413 * This command is now done.
415 p->pending &= ~(1 << slot);
418 * Delete the blockif request from the busy list
420 TAILQ_REMOVE(&p->iobhd, aior, io_blist);
423 * Move the blockif request back to the free list
425 STAILQ_INSERT_TAIL(&p->iofhd, aior, io_flist);
428 ahci_check_stopped(p);
/*
 * Reset port pr to its power-on state.
 * Visible effects: transfer mode becomes ATA_UDMA6 and mult_sectors 128.
 * One path reports no device (ssts = ATA_SS_DET_NO_DEVICE, sig all ones);
 * another reports an online PHY, builds tfd and finally posts the reset
 * D2H FIS via ahci_write_reset_fis_d2h().
 * NOTE(review): the conditions choosing between these paths, and the
 * conditions around ATA_S_READY and PxSIG_ATAPI, are not visible here.
 */
432 ahci_port_reset(struct ahci_port *pr)
437 pr->xfermode = ATA_UDMA6;
438 pr->mult_sectors = 128;
441 pr->ssts = ATA_SS_DET_NO_DEVICE;
442 pr->sig = 0xFFFFFFFF;
446 pr->ssts = ATA_SS_DET_PHY_ONLINE | ATA_SS_SPD_GEN2 |
448 pr->tfd = (1 << 8) | ATA_S_DSC | ATA_S_DMA;
451 pr->tfd |= ATA_S_READY;
453 pr->sig = PxSIG_ATAPI;
454 ahci_write_reset_fis_d2h(pr);
/*
 * Reset the whole controller sc: ghc is set to AHCI_GHC_AE, the pin
 * interrupt is deasserted (the guarding condition, if any, is not visible
 * here), and ahci_port_reset() is invoked for every port index below
 * sc->ports.
 */
458 ahci_reset(struct pci_ahci_softc *sc)
462 sc->ghc = AHCI_GHC_AE;
466 pci_lintr_deassert(sc->asc_pi);
470 for (i = 0; i < sc->ports; i++) {
473 ahci_port_reset(&sc->port[i]);
/*
 * Copy characters from src into a len-byte field at dest, swapping the two
 * bytes of every 16-bit pair (index i is written at i ^ 1).
 * NOTE(review): padding once src is exhausted is handled on lines not
 * visible in this listing.
 */
478 ata_string(uint8_t *dest, const char *src, int len)
482 for (i = 0; i < len; i++) {
484 dest[i ^ 1] = *src++;
/*
 * Fill a len-byte field at dest from src, one iteration per byte.
 * NOTE(review): the loop body is not visible in this listing.
 */
491 atapi_string(uint8_t *dest, const char *src, int len)
495 for (i = 0; i < len; i++) {
/*
 * Start (or continue) a DMA read/write for the command in slot.
 *
 * p    - port the command was issued on
 * slot - command slot index
 * cfis - command FIS; the PRDT is located at cfis + 0x80
 * done - bytes already transferred, added to the request offset
 * (a further parameter, used below as seek, is declared on a line that is
 *  not visible; it is subtracted from hdr->prdtl to get the entries left)
 *
 * The LBA and sector count are decoded according to the opcode in cfis[2],
 * scaled by the sector size, and a request taken from the free list is
 * filled with up to BLOCKIF_IOV_MAX iovec entries built from the PRDT
 * before being submitted through blockif_read() or blockif_write().
 */
504 ahci_handle_dma(struct ahci_port *p, int slot, uint8_t *cfis, uint32_t done,
507 struct ahci_ioreq *aior;
508 struct blockif_req *breq;
509 struct pci_ahci_softc *sc;
510 struct ahci_prdt_entry *prdt;
511 struct ahci_cmd_hdr *hdr;
514 int i, err, iovcnt, ncq, readop;
517 prdt = (struct ahci_prdt_entry *)(cfis + 0x80);
518 hdr = (struct ahci_cmd_hdr *)(p->cmd_lst + slot * AHCI_CL_SIZE);
/* Write opcodes; presumably clears readop on the hidden line. */
523 if (cfis[2] == ATA_WRITE_DMA || cfis[2] == ATA_WRITE_DMA48 ||
524 cfis[2] == ATA_WRITE_FPDMA_QUEUED)
/* Queued (FPDMA) form: count comes from cfis[11] and cfis[3]. */
527 if (cfis[2] == ATA_WRITE_FPDMA_QUEUED ||
528 cfis[2] == ATA_READ_FPDMA_QUEUED) {
529 lba = ((uint64_t)cfis[10] << 40) |
530 ((uint64_t)cfis[9] << 32) |
531 ((uint64_t)cfis[8] << 24) |
532 ((uint64_t)cfis[6] << 16) |
533 ((uint64_t)cfis[5] << 8) |
535 len = cfis[11] << 8 | cfis[3];
/* 48-bit DMA form: count comes from cfis[13] and cfis[12]. */
539 } else if (cfis[2] == ATA_READ_DMA48 || cfis[2] == ATA_WRITE_DMA48) {
540 lba = ((uint64_t)cfis[10] << 40) |
541 ((uint64_t)cfis[9] << 32) |
542 ((uint64_t)cfis[8] << 24) |
543 ((uint64_t)cfis[6] << 16) |
544 ((uint64_t)cfis[5] << 8) |
546 len = cfis[13] << 8 | cfis[12];
/* Remaining case: 28-bit LBA with the top nibble taken from cfis[7]. */
550 lba = ((cfis[7] & 0xf) << 24) | (cfis[6] << 16) |
551 (cfis[5] << 8) | cfis[4];
/* Convert sector units to bytes. */
556 lba *= blockif_sectsz(p->bctx);
557 len *= blockif_sectsz(p->bctx);
560 * Pull request off free list
562 aior = STAILQ_FIRST(&p->iofhd);
563 assert(aior != NULL);
564 STAILQ_REMOVE_HEAD(&p->iofhd, io_flist);
569 breq = &aior->io_req;
570 breq->br_offset = lba + done;
/* Clamp to BLOCKIF_IOV_MAX; the excess entry count is kept in aior->prdtl. */
571 iovcnt = hdr->prdtl - seek;
572 if (iovcnt > BLOCKIF_IOV_MAX) {
573 aior->prdtl = iovcnt - BLOCKIF_IOV_MAX;
574 iovcnt = BLOCKIF_IOV_MAX;
577 breq->br_iovcnt = iovcnt;
580 * Mark this command in-flight.
582 p->pending |= 1 << slot;
585 * Stuff request onto busy list
587 TAILQ_INSERT_HEAD(&p->iobhd, aior, io_blist);
590 * Build up the iovec based on the prdt
592 for (i = 0; i < iovcnt; i++) {
595 dbcsz = (prdt->dbc & DBCMASK) + 1;
596 breq->br_iov[i].iov_base = paddr_guest2host(ahci_ctx(sc),
598 breq->br_iov[i].iov_len = dbcsz;
603 err = blockif_read(p->bctx, breq);
605 err = blockif_write(p->bctx, breq);
/* NOTE(review): the condition guarding this clear is not visible here. */
609 p->ci &= ~(1 << slot);
/*
 * Issue a cache flush for the command in slot: a request is taken from the
 * free list, the slot is marked pending, the request is placed on the busy
 * list and submitted with blockif_flush().
 * NOTE(review): initialisation of the request fields and handling of err
 * are on lines not visible in this listing.
 */
613 ahci_handle_flush(struct ahci_port *p, int slot, uint8_t *cfis)
615 struct ahci_ioreq *aior;
616 struct blockif_req *breq;
620 * Pull request off free list
622 aior = STAILQ_FIRST(&p->iofhd);
623 assert(aior != NULL);
624 STAILQ_REMOVE_HEAD(&p->iofhd, io_flist);
630 breq = &aior->io_req;
633 * Mark this command in-flight.
635 p->pending |= 1 << slot;
638 * Stuff request onto busy list
640 TAILQ_INSERT_HEAD(&p->iobhd, aior, io_blist);
642 err = blockif_flush(p->bctx, breq);
/*
 * Copy a host buffer into guest memory described by the PRDT of a command.
 * The table starts at cfis + 0x80 and has hdr->prdtl entries.  For each
 * entry, while bytes remain, min(len, entry size) bytes are copied with
 * memcpy() to the host mapping of prdt->dba.  Afterwards hdr->prdbc is set
 * to size - len.
 * NOTE(review): the trailing parameters (used below as from and size) and
 * the per-iteration updates of len, from and prdt are on lines not visible
 * in this listing.
 */
647 write_prdt(struct ahci_port *p, int slot, uint8_t *cfis,
650 struct ahci_cmd_hdr *hdr;
651 struct ahci_prdt_entry *prdt;
655 hdr = (struct ahci_cmd_hdr *)(p->cmd_lst + slot * AHCI_CL_SIZE);
658 prdt = (struct ahci_prdt_entry *)(cfis + 0x80);
659 for (i = 0; i < hdr->prdtl && len; i++) {
664 dbcsz = (prdt->dbc & DBCMASK) + 1;
665 ptr = paddr_guest2host(ahci_ctx(p->pr_sc), prdt->dba, dbcsz);
666 sublen = len < dbcsz ? len : dbcsz;
667 memcpy(ptr, from, sublen);
672 hdr->prdbc = size - len;
/*
 * Handle the ATA identify command for a disk port.
 * If the port is an ATAPI device or the command has no PRDT entries, the
 * task file is set to an aborted error and AHCI_P_IX_TFE is raised.
 * Otherwise an identify buffer is filled from the block backend geometry
 * and sizes, a PIO setup FIS is posted, the buffer is copied to the guest
 * with write_prdt(), and the command is completed (tfd, AHCI_P_IX_DP,
 * ci bit cleared).  ahci_generate_intr() is called at the end.
 */
676 handle_identify(struct ahci_port *p, int slot, uint8_t *cfis)
678 struct ahci_cmd_hdr *hdr;
680 hdr = (struct ahci_cmd_hdr *)(p->cmd_lst + slot * AHCI_CL_SIZE);
681 if (p->atapi || hdr->prdtl == 0) {
682 p->tfd = (ATA_E_ABORT << 8) | ATA_S_READY | ATA_S_ERROR;
683 p->is |= AHCI_P_IX_TFE;
687 int sectsz, psectsz, psectoff;
/* Query the backend: logical sector size, sector count, CHS, physical sector. */
691 sectsz = blockif_sectsz(p->bctx);
692 sectors = blockif_size(p->bctx) / sectsz;
693 blockif_chs(p->bctx, &cyl, &heads, &sech);
694 blockif_psectsz(p->bctx, &psectsz, &psectoff);
695 memset(buf, 0, sizeof(buf));
700 /* TODO emulate different serial? */
/* Fixed identification strings, byte-swapped by ata_string(). */
701 ata_string((uint8_t *)(buf+10), "123456", 20);
702 ata_string((uint8_t *)(buf+23), "001", 8);
703 ata_string((uint8_t *)(buf+27), "BHYVE SATA DISK", 40);
704 buf[47] = (0x8000 | 128);
706 buf[49] = (1 << 8 | 1 << 9 | 1 << 11);
708 buf[53] = (1 << 1 | 1 << 2);
710 buf[59] = (0x100 | p->mult_sectors);
712 buf[61] = (sectors >> 16);
/* Flag the currently selected multiword DMA mode, if one is selected. */
714 if (p->xfermode & ATA_WDMA0)
715 buf[63] |= (1 << ((p->xfermode & 7) + 8));
722 buf[76] = (1 << 8 | 1 << 2);
725 buf[82] = (1 << 5 | 1 << 14);
726 buf[83] = (1 << 10 | 1 << 12 | 1 << 13 | 1 << 14);
728 buf[85] = (1 << 5 | 1 << 14);
729 buf[86] = (1 << 10 | 1 << 12 | 1 << 13);
/* Flag the currently selected ultra DMA mode, if one is selected. */
732 if (p->xfermode & ATA_UDMA0)
733 buf[88] |= (1 << ((p->xfermode & 7) + 8));
734 buf[93] = (1 | 1 <<14);
/* Upper parts of the sector count; the low part is on a hidden line. */
736 buf[101] = (sectors >> 16);
737 buf[102] = (sectors >> 32);
738 buf[103] = (sectors >> 48);
/* Physical sector larger than logical: record the ratio (log2) and offset. */
741 if (psectsz > sectsz) {
743 buf[106] |= ffsl(psectsz / sectsz) - 1;
744 buf[209] |= (psectoff / sectsz);
/* Logical sector size expressed in 16-bit words, split over two entries. */
748 buf[117] = sectsz / 2;
749 buf[118] = ((sectsz / 2) >> 16);
751 ahci_write_fis_piosetup(p);
752 write_prdt(p, slot, cfis, (void *)buf, sizeof(buf));
753 p->tfd = ATA_S_DSC | ATA_S_READY;
754 p->is |= AHCI_P_IX_DP;
755 p->ci &= ~(1 << slot);
757 ahci_generate_intr(p->pr_sc);
/*
 * Handle the ATAPI identify command.
 * One path aborts the command (error task file, AHCI_P_IX_TFE); the other
 * builds an identify buffer with fixed strings and capability words, posts
 * a PIO setup FIS, copies the buffer to the guest with write_prdt() and
 * completes the command (tfd, AHCI_P_IX_DHR, ci bit cleared).
 * ahci_generate_intr() is called at the end.
 * NOTE(review): the condition selecting the abort path is not visible in
 * this listing (presumably a non-ATAPI port).
 */
761 handle_atapi_identify(struct ahci_port *p, int slot, uint8_t *cfis)
764 p->tfd = (ATA_E_ABORT << 8) | ATA_S_READY | ATA_S_ERROR;
765 p->is |= AHCI_P_IX_TFE;
769 memset(buf, 0, sizeof(buf));
770 buf[0] = (2 << 14 | 5 << 8 | 1 << 7 | 2 << 5);
771 /* TODO emulate different serial? */
772 ata_string((uint8_t *)(buf+10), "123456", 20);
773 ata_string((uint8_t *)(buf+23), "001", 8);
774 ata_string((uint8_t *)(buf+27), "BHYVE SATA DVD ROM", 40);
775 buf[49] = (1 << 9 | 1 << 8);
776 buf[50] = (1 << 14 | 1);
777 buf[53] = (1 << 2 | 1 << 1);
785 buf[76] = (1 << 2 | 1 << 1);
787 buf[80] = (0x1f << 4);
793 buf[88] = (1 << 14 | 0x7f);
794 ahci_write_fis_piosetup(p);
795 write_prdt(p, slot, cfis, (void *)buf, sizeof(buf));
796 p->tfd = ATA_S_DSC | ATA_S_READY;
797 p->is |= AHCI_P_IX_DHR;
798 p->ci &= ~(1 << slot);
800 ahci_generate_intr(p->pr_sc);
/*
 * Answer the packet INQUIRY command: fixed strings are placed at offsets 8,
 * 16 and 32 of buf, len bytes are copied to the guest with write_prdt(),
 * and a successful D2H FIS is posted.
 * NOTE(review): the declaration of buf and the computation of len are on
 * lines not visible in this listing.
 */
804 atapi_inquiry(struct ahci_port *p, int slot, uint8_t *cfis)
820 atapi_string(buf + 8, "BHYVE", 8);
821 atapi_string(buf + 16, "BHYVE DVD-ROM", 16);
822 atapi_string(buf + 32, "001", 4);
/* Replace the low three bits of cfis[4] with the CMD and IN flags. */
827 cfis[4] = (cfis[4] & ~7) | ATA_I_CMD | ATA_I_IN;
828 write_prdt(p, slot, cfis, buf, len);
829 ahci_write_fis_d2h(p, slot, cfis, ATA_S_READY | ATA_S_DSC);
/*
 * Answer the packet READ CAPACITY command.  The backend size is divided
 * into 2048-byte sectors; the reply holds the last sector index
 * (sectors - 1) followed by the block size 2048, both big-endian 32-bit.
 * The reply is copied to the guest and a successful D2H FIS is posted.
 */
833 atapi_read_capacity(struct ahci_port *p, int slot, uint8_t *cfis)
838 sectors = blockif_size(p->bctx) / 2048;
839 be32enc(buf, sectors - 1);
840 be32enc(buf + 4, 2048);
841 cfis[4] = (cfis[4] & ~7) | ATA_I_CMD | ATA_I_IN;
842 write_prdt(p, slot, cfis, buf, sizeof(buf));
843 ahci_write_fis_d2h(p, slot, cfis, ATA_S_READY | ATA_S_DSC);
/*
 * Answer the packet READ TOC command.
 * The allocation length is the big-endian 16-bit value at acmd + 7 and the
 * format is the top two bits of acmd[9].  Three reply variants are visible
 * (buffers of 20 bytes, an unspecified size, and 50 bytes); each is copied
 * to the guest with write_prdt() and completed with a successful D2H FIS.
 * Rejected requests set sense key ATA_SENSE_ILLEGAL_REQUEST and complete
 * with an error task file.
 * NOTE(review): the dispatch on format and most of the reply construction
 * are on lines not visible in this listing.
 */
847 atapi_read_toc(struct ahci_port *p, int slot, uint8_t *cfis)
855 len = be16dec(acmd + 7);
856 format = acmd[9] >> 6;
862 uint8_t start_track, buf[20], *bp;
/* Bit 1 of acmd[1] selects MSF rather than LBA addresses in the reply. */
864 msf = (acmd[1] >> 1) & 1;
865 start_track = acmd[6];
/* Only tracks 0, 1 and 0xaa are accepted as a starting track. */
866 if (start_track > 1 && start_track != 0xaa) {
868 p->sense_key = ATA_SENSE_ILLEGAL_REQUEST;
870 tfd = (p->sense_key << 12) | ATA_S_READY | ATA_S_ERROR;
871 cfis[4] = (cfis[4] & ~7) | ATA_I_CMD | ATA_I_IN;
872 ahci_write_fis_d2h(p, slot, cfis, tfd);
878 if (start_track <= 1) {
898 sectors = blockif_size(p->bctx) / blockif_sectsz(p->bctx);
902 lba_to_msf(bp, sectors);
905 be32enc(bp, sectors);
/* Leading 16-bit length field excludes its own two bytes. */
909 be16enc(buf, size - 2);
912 write_prdt(p, slot, cfis, buf, len);
913 cfis[4] = (cfis[4] & ~7) | ATA_I_CMD | ATA_I_IN;
914 ahci_write_fis_d2h(p, slot, cfis, ATA_S_READY | ATA_S_DSC);
921 memset(buf, 0, sizeof(buf));
925 if (len > sizeof(buf))
927 write_prdt(p, slot, cfis, buf, len);
928 cfis[4] = (cfis[4] & ~7) | ATA_I_CMD | ATA_I_IN;
929 ahci_write_fis_d2h(p, slot, cfis, ATA_S_READY | ATA_S_DSC);
936 uint8_t start_track, *bp, buf[50];
938 msf = (acmd[1] >> 1) & 1;
939 start_track = acmd[6];
975 sectors = blockif_size(p->bctx) / blockif_sectsz(p->bctx);
979 lba_to_msf(bp, sectors);
982 be32enc(bp, sectors);
1005 be16enc(buf, size - 2);
1008 write_prdt(p, slot, cfis, buf, len);
1009 cfis[4] = (cfis[4] & ~7) | ATA_I_CMD | ATA_I_IN;
1010 ahci_write_fis_d2h(p, slot, cfis, ATA_S_READY | ATA_S_DSC);
1017 p->sense_key = ATA_SENSE_ILLEGAL_REQUEST;
1019 tfd = (p->sense_key << 12) | ATA_S_READY | ATA_S_ERROR;
1020 cfis[4] = (cfis[4] & ~7) | ATA_I_CMD | ATA_I_IN;
1021 ahci_write_fis_d2h(p, slot, cfis, tfd);
/*
 * Start (or continue) a packet READ for the command in slot.
 *
 * p    - port the command was issued on
 * slot - command slot index
 * cfis - command FIS; the PRDT is located at cfis + 0x80
 * done - bytes already transferred, added to the request offset
 * seek - PRDT entries already consumed, subtracted from hdr->prdtl
 *
 * The LBA is the big-endian 32-bit value at acmd + 2.  The length is the
 * 16-bit value at acmd + 7 for READ_10 and otherwise the 32-bit value at
 * acmd + 6.  A request from the free list is filled with up to
 * BLOCKIF_IOV_MAX iovec entries from the PRDT and submitted with
 * blockif_read().
 */
1028 atapi_read(struct ahci_port *p, int slot, uint8_t *cfis,
1029 uint32_t done, int seek)
1031 struct ahci_ioreq *aior;
1032 struct ahci_cmd_hdr *hdr;
1033 struct ahci_prdt_entry *prdt;
1034 struct blockif_req *breq;
1035 struct pci_ahci_softc *sc;
1043 hdr = (struct ahci_cmd_hdr *)(p->cmd_lst + slot * AHCI_CL_SIZE);
1044 prdt = (struct ahci_prdt_entry *)(cfis + 0x80);
1047 lba = be32dec(acmd + 2);
1048 if (acmd[0] == READ_10)
1049 len = be16dec(acmd + 7);
1051 len = be32dec(acmd + 6);
/*
 * Immediate successful completion.
 * NOTE(review): the guarding condition is not visible here (presumably a
 * zero-length read) - confirm.
 */
1053 cfis[4] = (cfis[4] & ~7) | ATA_I_CMD | ATA_I_IN;
1054 ahci_write_fis_d2h(p, slot, cfis, ATA_S_READY | ATA_S_DSC);
1060 * Pull request off free list
1062 aior = STAILQ_FIRST(&p->iofhd);
1063 assert(aior != NULL);
1064 STAILQ_REMOVE_HEAD(&p->iofhd, io_flist);
1069 breq = &aior->io_req;
1070 breq->br_offset = lba + done;
/* Clamp to BLOCKIF_IOV_MAX; the excess entry count is kept in aior->prdtl. */
1071 iovcnt = hdr->prdtl - seek;
1072 if (iovcnt > BLOCKIF_IOV_MAX) {
1073 aior->prdtl = iovcnt - BLOCKIF_IOV_MAX;
1074 iovcnt = BLOCKIF_IOV_MAX;
1077 breq->br_iovcnt = iovcnt;
1080 * Mark this command in-flight.
1082 p->pending |= 1 << slot;
1085 * Stuff request onto busy list
1087 TAILQ_INSERT_HEAD(&p->iobhd, aior, io_blist);
1090 * Build up the iovec based on the prdt
1092 for (i = 0; i < iovcnt; i++) {
1095 dbcsz = (prdt->dbc & DBCMASK) + 1;
1096 breq->br_iov[i].iov_base = paddr_guest2host(ahci_ctx(sc),
1098 breq->br_iov[i].iov_len = dbcsz;
/* Running total of bytes queued so far for this command. */
1099 aior->done += dbcsz;
1102 err = blockif_read(p->bctx, breq);
/*
 * Answer the packet REQUEST SENSE command: the first len bytes of buf are
 * zeroed, byte 0 is set to 0x70 with bit 7 set, byte 2 carries the saved
 * sense key of the port, and the reply is copied to the guest before a
 * successful D2H FIS is posted.
 * NOTE(review): where len comes from and how it is clamped to sizeof(buf)
 * are on lines not visible in this listing.
 */
1107 atapi_request_sense(struct ahci_port *p, int slot, uint8_t *cfis)
1115 if (len > sizeof(buf))
1117 memset(buf, 0, len);
1118 buf[0] = 0x70 | (1 << 7);
1119 buf[2] = p->sense_key;
1122 write_prdt(p, slot, cfis, buf, len);
1123 cfis[4] = (cfis[4] & ~7) | ATA_I_CMD | ATA_I_IN;
1124 ahci_write_fis_d2h(p, slot, cfis, ATA_S_READY | ATA_S_DSC);
/*
 * Answer the packet START STOP UNIT command.  The low two bits of acmd[4]
 * select the action: one group of values completes successfully, while the
 * branch marked as eject reports ATA_SENSE_ILLEGAL_REQUEST with an error
 * task file.  A D2H FIS carrying the chosen tfd is posted in either case.
 * NOTE(review): the case labels of the switch are not visible here.
 */
1128 atapi_start_stop_unit(struct ahci_port *p, int slot, uint8_t *cfis)
/* The packet command bytes live at offset 0x40 of the command FIS. */
1130 uint8_t *acmd = cfis + 0x40;
1133 switch (acmd[4] & 3) {
1137 cfis[4] = (cfis[4] & ~7) | ATA_I_CMD | ATA_I_IN;
1138 tfd = ATA_S_READY | ATA_S_DSC;
1141 /* TODO eject media */
1142 cfis[4] = (cfis[4] & ~7) | ATA_I_CMD | ATA_I_IN;
1143 p->sense_key = ATA_SENSE_ILLEGAL_REQUEST;
1145 tfd = (p->sense_key << 12) | ATA_S_READY | ATA_S_ERROR;
1148 ahci_write_fis_d2h(p, slot, cfis, tfd);
/*
 * Answer the packet MODE SENSE (10) command.
 * The allocation length is the big-endian 16-bit value at acmd + 7 and the
 * page code is the low six bits of acmd[2].  Replies are built for
 * MODEPAGE_RW_ERROR_RECOVERY (length field 16 - 2) and
 * MODEPAGE_CD_CAPABILITIES (length field 30 - 2); both are copied to the
 * guest with write_prdt().  Two further paths report
 * ATA_SENSE_ILLEGAL_REQUEST.  A D2H FIS carrying tfd is posted at the end.
 * NOTE(review): the outer dispatch and the clamping of len are on lines not
 * visible in this listing.
 */
1152 atapi_mode_sense(struct ahci_port *p, int slot, uint8_t *cfis)
1160 len = be16dec(acmd + 7);
1162 code = acmd[2] & 0x3f;
1167 case MODEPAGE_RW_ERROR_RECOVERY:
1171 if (len > sizeof(buf))
1174 memset(buf, 0, sizeof(buf));
1175 be16enc(buf, 16 - 2);
1180 write_prdt(p, slot, cfis, buf, len);
1181 tfd = ATA_S_READY | ATA_S_DSC;
1184 case MODEPAGE_CD_CAPABILITIES:
1188 if (len > sizeof(buf))
1191 memset(buf, 0, sizeof(buf));
1192 be16enc(buf, 30 - 2);
1198 be16enc(&buf[18], 2);
1199 be16enc(&buf[20], 512);
1200 write_prdt(p, slot, cfis, buf, len);
1201 tfd = ATA_S_READY | ATA_S_DSC;
1210 p->sense_key = ATA_SENSE_ILLEGAL_REQUEST;
1212 tfd = (p->sense_key << 12) | ATA_S_READY | ATA_S_ERROR;
1217 p->sense_key = ATA_SENSE_ILLEGAL_REQUEST;
1219 tfd = (p->sense_key << 12) | ATA_S_READY | ATA_S_ERROR;
1222 cfis[4] = (cfis[4] & ~7) | ATA_I_CMD | ATA_I_IN;
1223 ahci_write_fis_d2h(p, slot, cfis, tfd);
/*
 * Answer the packet GET EVENT STATUS NOTIFICATION command.
 * Requests with bit 0 of acmd[1] clear are rejected with
 * ATA_SENSE_ILLEGAL_REQUEST.  Otherwise a zeroed reply whose 16-bit length
 * field is 8 - 2 is copied to the guest (len taken from acmd + 7) and the
 * command succeeds.  A D2H FIS carrying tfd is posted in both cases.
 */
1227 atapi_get_event_status_notification(struct ahci_port *p, int slot,
1235 /* we don't support asynchronous operation */
1236 if (!(acmd[1] & 1)) {
1237 p->sense_key = ATA_SENSE_ILLEGAL_REQUEST;
1239 tfd = (p->sense_key << 12) | ATA_S_READY | ATA_S_ERROR;
1244 len = be16dec(acmd + 7);
1245 if (len > sizeof(buf))
1248 memset(buf, 0, sizeof(buf));
1249 be16enc(buf, 8 - 2);
1253 write_prdt(p, slot, cfis, buf, len);
1254 tfd = ATA_S_READY | ATA_S_DSC;
1256 cfis[4] = (cfis[4] & ~7) | ATA_I_CMD | ATA_I_IN;
1257 ahci_write_fis_d2h(p, slot, cfis, tfd);
/*
 * Dispatch a packet (ATAPI) command to its handler.
 * The 16 command bytes are dumped through DPRINTF, then the command is
 * routed: TEST_UNIT_READY and one other group complete immediately with
 * success, several opcodes go to the atapi_* helpers in this file, and the
 * final branch reports ATA_SENSE_ILLEGAL_REQUEST with an error task file.
 * NOTE(review): most case labels are on lines not visible in this listing.
 */
1261 handle_packet_cmd(struct ahci_port *p, int slot, uint8_t *cfis)
1271 for (i = 0; i < 16; i++)
1272 DPRINTF("%02x ", acmd[i]);
1278 case TEST_UNIT_READY:
1279 cfis[4] = (cfis[4] & ~7) | ATA_I_CMD | ATA_I_IN;
1280 ahci_write_fis_d2h(p, slot, cfis, ATA_S_READY | ATA_S_DSC);
1283 atapi_inquiry(p, slot, cfis);
1286 atapi_read_capacity(p, slot, cfis);
1290 cfis[4] = (cfis[4] & ~7) | ATA_I_CMD | ATA_I_IN;
1291 ahci_write_fis_d2h(p, slot, cfis, ATA_S_READY | ATA_S_DSC);
1294 atapi_read_toc(p, slot, cfis);
/* New read: nothing transferred yet and no PRDT entries consumed. */
1298 atapi_read(p, slot, cfis, 0, 0);
1301 atapi_request_sense(p, slot, cfis);
1303 case START_STOP_UNIT:
1304 atapi_start_stop_unit(p, slot, cfis);
1307 atapi_mode_sense(p, slot, cfis);
1309 case GET_EVENT_STATUS_NOTIFICATION:
1310 atapi_get_event_status_notification(p, slot, cfis);
1313 cfis[4] = (cfis[4] & ~7) | ATA_I_CMD | ATA_I_IN;
1314 p->sense_key = ATA_SENSE_ILLEGAL_REQUEST;
1316 ahci_write_fis_d2h(p, slot, cfis, (p->sense_key << 12) |
1317 ATA_S_READY | ATA_S_ERROR);
/*
 * Dispatch an ATA command FIS to its handler.
 * Visible routing: identify commands go to handle_identify() or
 * handle_atapi_identify(); SETFEATURES is handled inline; a multi-sector
 * setting in cfis[12] is validated and stored; DMA and FPDMA opcodes go to
 * ahci_handle_dma(); flush opcodes go to ahci_handle_flush(); standby and
 * idle opcodes complete immediately; packet commands go to
 * handle_packet_cmd(); anything else is logged and aborted with
 * AHCI_P_IX_TFE.
 * NOTE(review): the switch statements and several case labels are on lines
 * not visible in this listing.
 */
1323 ahci_handle_cmd(struct ahci_port *p, int slot, uint8_t *cfis)
1327 case ATA_ATA_IDENTIFY:
1328 handle_identify(p, slot, cfis);
1330 case ATA_SETFEATURES:
1333 case ATA_SF_ENAB_SATA_SF:
1335 case ATA_SATA_SF_AN:
1336 p->tfd = ATA_S_DSC | ATA_S_READY;
1339 p->tfd = ATA_S_ERROR | ATA_S_READY;
1340 p->tfd |= (ATA_ERROR_ABORT << 8);
/* Cache control features are accepted without further action here. */
1344 case ATA_SF_ENAB_WCACHE:
1345 case ATA_SF_DIS_WCACHE:
1346 case ATA_SF_ENAB_RCACHE:
1347 case ATA_SF_DIS_RCACHE:
1348 p->tfd = ATA_S_DSC | ATA_S_READY;
1350 case ATA_SF_SETXFER:
/* Upper five bits of cfis[12] select the mode class, low three the level. */
1352 switch (cfis[12] & 0xf8) {
1358 p->xfermode = (cfis[12] & 0x7);
1361 p->tfd = ATA_S_DSC | ATA_S_READY;
1365 p->tfd = ATA_S_ERROR | ATA_S_READY;
1366 p->tfd |= (ATA_ERROR_ABORT << 8);
1369 ahci_write_fis_d2h(p, slot, cfis, p->tfd);
/* Reject a non-zero count that exceeds 128 or is not a power of two. */
1373 if (cfis[12] != 0 &&
1374 (cfis[12] > 128 || (cfis[12] & (cfis[12] - 1)))) {
1375 p->tfd = ATA_S_ERROR | ATA_S_READY;
1376 p->tfd |= (ATA_ERROR_ABORT << 8);
1378 p->mult_sectors = cfis[12];
1379 p->tfd = ATA_S_DSC | ATA_S_READY;
1381 p->is |= AHCI_P_IX_DP;
1382 p->ci &= ~(1 << slot);
1383 ahci_generate_intr(p->pr_sc);
1387 case ATA_READ_DMA48:
1388 case ATA_WRITE_DMA48:
1389 case ATA_READ_FPDMA_QUEUED:
1390 case ATA_WRITE_FPDMA_QUEUED:
/* New transfer: nothing done yet and no PRDT entries consumed. */
1391 ahci_handle_dma(p, slot, cfis, 0, 0);
1393 case ATA_FLUSHCACHE:
1394 case ATA_FLUSHCACHE48:
1395 ahci_handle_flush(p, slot, cfis);
1397 case ATA_STANDBY_CMD:
1400 case ATA_STANDBY_IMMEDIATE:
1401 case ATA_IDLE_IMMEDIATE:
1403 ahci_write_fis_d2h(p, slot, cfis, ATA_S_READY | ATA_S_DSC);
1405 case ATA_ATAPI_IDENTIFY:
1406 handle_atapi_identify(p, slot, cfis);
1408 case ATA_PACKET_CMD:
/* NOTE(review): the condition choosing abort vs dispatch is not visible. */
1410 p->tfd = (ATA_E_ABORT << 8) | ATA_S_READY | ATA_S_ERROR;
1411 p->is |= AHCI_P_IX_TFE;
1412 ahci_generate_intr(p->pr_sc);
1414 handle_packet_cmd(p, slot, cfis);
1417 WPRINTF("Unsupported cmd:%02x\n", cfis[2]);
1418 p->tfd = (ATA_E_ABORT << 8) | ATA_S_READY | ATA_S_ERROR;
1419 p->is |= AHCI_P_IX_TFE;
1420 ahci_generate_intr(p->pr_sc);
/*
 * Process the command sitting in one slot of the command list of port p.
 * The command header gives the command FIS length (low five bits of flags,
 * times four) and the guest address of the command table, which is mapped
 * for 0x80 bytes plus the PRDT.  The FIS and PRDT are dumped via DPRINTF.
 * A FIS that is not FIS_TYPE_REGH2D is logged.  When bit 7 of cfis[1] is
 * set the FIS is a command and goes to ahci_handle_cmd(); otherwise bit 2
 * of cfis[15] and p->reset are examined and the slot is cleared from p->ci.
 * NOTE(review): the actions taken in the reset branches are on lines not
 * visible in this listing.
 */
1426 ahci_handle_slot(struct ahci_port *p, int slot)
1428 struct ahci_cmd_hdr *hdr;
1429 struct ahci_prdt_entry *prdt;
1430 struct pci_ahci_softc *sc;
1435 hdr = (struct ahci_cmd_hdr *)(p->cmd_lst + slot * AHCI_CL_SIZE);
1436 cfl = (hdr->flags & 0x1f) * 4;
1437 cfis = paddr_guest2host(ahci_ctx(sc), hdr->ctba,
1438 0x80 + hdr->prdtl * sizeof(struct ahci_prdt_entry));
1439 prdt = (struct ahci_prdt_entry *)(cfis + 0x80);
1443 for (i = 0; i < cfl; i++) {
1446 DPRINTF("%02x ", cfis[i]);
1450 for (i = 0; i < hdr->prdtl; i++) {
1451 DPRINTF("%d@%08"PRIx64"\n", prdt->dbc & 0x3fffff, prdt->dba);
1456 if (cfis[0] != FIS_TYPE_REGH2D) {
1457 WPRINTF("Not a H2D FIS:%02x\n", cfis[0]);
1461 if (cfis[1] & 0x80) {
1462 ahci_handle_cmd(p, slot, cfis);
1464 if (cfis[15] & (1 << 2))
1466 else if (p->reset) {
1470 p->ci &= ~(1 << slot);
/*
 * Issue every newly submitted command on port p.
 * The scan covers slots 0..31 while p->ci is non-zero.  A slot is issued
 * when its bit is set in p->ci and clear in p->pending; before calling
 * ahci_handle_slot() the current command slot field of p->cmd is updated
 * to the slot index.
 * NOTE(review): the check on AHCI_P_CMD_ST presumably returns early when
 * the port is not started; the guarded statement is not visible here.
 */
1475 ahci_handle_port(struct ahci_port *p)
1479 if (!(p->cmd & AHCI_P_CMD_ST))
1483 * Search for any new commands to issue ignoring those that
1484 * are already in-flight.
1486 for (i = 0; (i < 32) && p->ci; i++) {
1487 if ((p->ci & (1 << i)) && !(p->pending & (1 << i))) {
1488 p->cmd &= ~AHCI_P_CMD_CCS_MASK;
1489 p->cmd |= i << AHCI_P_CMD_CCS_SHIFT;
1490 ahci_handle_slot(p, i);
1496 * blockif callback routine - this runs in the context of the blockif
1497 * i/o thread, so the mutex needs to be acquired.
/*
 * Completion callback for disk (ATA) block requests.
 *
 * br  - completed request; br->br_param points back at the ahci_ioreq
 * err - completion status, non-zero on failure
 *
 * With the controller mutex held, the request moves from the busy list back
 * to the free list.  If PRDT entries are still outstanding (aior->prdtl)
 * and there was no error, the transfer is continued via ahci_handle_dma().
 * Otherwise the command completes: success when all bytes are done, else an
 * aborted error task file; the result is posted either as a Set Device Bits
 * FIS (after clearing the slot in p->sact) or as a D2H FIS.  The slot is
 * then cleared from p->pending and ahci_check_stopped() runs.
 * NOTE(review): the tests selecting the SDB vs D2H path are on lines not
 * visible here (presumably the ncq flag derived from cfis[2]).
 */
1500 ata_ioreq_cb(struct blockif_req *br, int err)
1502 struct ahci_cmd_hdr *hdr;
1503 struct ahci_ioreq *aior;
1504 struct ahci_port *p;
1505 struct pci_ahci_softc *sc;
1508 int pending, slot, ncq;
1510 DPRINTF("%s %d\n", __func__, err);
1513 aior = br->br_param;
1517 pending = aior->prdtl;
1519 hdr = (struct ahci_cmd_hdr *)(p->cmd_lst + slot * AHCI_CL_SIZE);
1521 if (cfis[2] == ATA_WRITE_FPDMA_QUEUED ||
1522 cfis[2] == ATA_READ_FPDMA_QUEUED)
1525 pthread_mutex_lock(&sc->mtx);
1528 * Delete the blockif request from the busy list
1530 TAILQ_REMOVE(&p->iobhd, aior, io_blist);
1533 * Move the blockif request back to the free list
1535 STAILQ_INSERT_TAIL(&p->iofhd, aior, io_flist);
/* More PRDT entries to go: resume after the ones already consumed. */
1537 if (pending && !err) {
1538 ahci_handle_dma(p, slot, cfis, aior->done,
1539 hdr->prdtl - pending);
1543 if (!err && aior->done == aior->len) {
1544 tfd = ATA_S_READY | ATA_S_DSC;
1548 hdr->prdbc = aior->len;
1550 tfd = (ATA_E_ABORT << 8) | ATA_S_READY | ATA_S_ERROR;
1553 p->serr |= (1 << slot);
1557 p->sact &= ~(1 << slot);
1558 ahci_write_fis_sdb(p, slot, tfd);
1560 ahci_write_fis_d2h(p, slot, cfis, tfd);
1563 * This command is now complete.
1565 p->pending &= ~(1 << slot);
1567 ahci_check_stopped(p);
1569 pthread_mutex_unlock(&sc->mtx);
1570 DPRINTF("%s exit\n", __func__);
/*
 * Completion callback for ATAPI block requests.
 *
 * br  - completed request; br->br_param points back at the ahci_ioreq
 * err - completion status, non-zero on failure
 *
 * With the controller mutex held, the request moves from the busy list back
 * to the free list.  If PRDT entries are still outstanding and there was no
 * error, the read is continued via atapi_read().  Otherwise the command
 * completes: success (with hdr->prdbc set to the full length) when all
 * bytes are done, else ATA_SENSE_ILLEGAL_REQUEST with an error task file.
 * A D2H FIS is posted, the slot is cleared from p->pending and
 * ahci_check_stopped() runs.
 * NOTE(review): the header lookup uses aior->slot while later lines use a
 * local slot; presumably slot is assigned from aior->slot on a hidden line.
 */
1574 atapi_ioreq_cb(struct blockif_req *br, int err)
1576 struct ahci_cmd_hdr *hdr;
1577 struct ahci_ioreq *aior;
1578 struct ahci_port *p;
1579 struct pci_ahci_softc *sc;
1584 DPRINTF("%s %d\n", __func__, err);
1586 aior = br->br_param;
1590 pending = aior->prdtl;
1592 hdr = (struct ahci_cmd_hdr *)(p->cmd_lst + aior->slot * AHCI_CL_SIZE);
1594 pthread_mutex_lock(&sc->mtx);
1597 * Delete the blockif request from the busy list
1599 TAILQ_REMOVE(&p->iobhd, aior, io_blist);
1602 * Move the blockif request back to the free list
1604 STAILQ_INSERT_TAIL(&p->iofhd, aior, io_flist);
/* More PRDT entries to go: resume after the ones already consumed. */
1606 if (pending && !err) {
1607 atapi_read(p, slot, cfis, aior->done, hdr->prdtl - pending);
1611 if (!err && aior->done == aior->len) {
1612 tfd = ATA_S_READY | ATA_S_DSC;
1613 hdr->prdbc = aior->len;
1615 p->sense_key = ATA_SENSE_ILLEGAL_REQUEST;
1617 tfd = (p->sense_key << 12) | ATA_S_READY | ATA_S_ERROR;
1621 cfis[4] = (cfis[4] & ~7) | ATA_I_CMD | ATA_I_IN;
1622 ahci_write_fis_d2h(p, slot, cfis, tfd);
1625 * This command is now complete.
1627 p->pending &= ~(1 << slot);
1629 ahci_check_stopped(p);
1631 pthread_mutex_unlock(&sc->mtx);
1632 DPRINTF("%s exit\n", __func__);
/*
 * Allocate the I/O request pool of port pr.
 * The pool holds blockif_queuesz() entries, allocated zeroed with calloc().
 * Every entry gets a completion callback (ata_ioreq_cb or atapi_ioreq_cb),
 * has br_param pointed back at itself, and is appended to the free list.
 * The busy list starts out empty.
 * NOTE(review): no check of the calloc() result is visible in this listing.
 * NOTE(review): the test choosing between the two callbacks is on a hidden
 * line (presumably the atapi flag of the port).
 */
1636 pci_ahci_ioreq_init(struct ahci_port *pr)
1638 struct ahci_ioreq *vr;
1641 pr->ioqsz = blockif_queuesz(pr->bctx);
1642 pr->ioreq = calloc(pr->ioqsz, sizeof(struct ahci_ioreq));
1643 STAILQ_INIT(&pr->iofhd);
1646 * Add all i/o request entries to the free queue
1648 for (i = 0; i < pr->ioqsz; i++) {
1652 vr->io_req.br_callback = ata_ioreq_cb;
1654 vr->io_req.br_callback = atapi_ioreq_cb;
1655 vr->io_req.br_param = vr;
1656 STAILQ_INSERT_TAIL(&pr->iofhd, vr, io_flist);
1659 TAILQ_INIT(&pr->iobhd);
/*
 * Handle a guest write to a per-port register.
 *
 * sc     - controller state
 * offset - BAR offset; converted below into a port index and an offset
 *          within the register block of that port
 * value  - value written by the guest
 *
 * Visible behaviour: the interrupt enable register is masked with
 * 0xFDC000FF and interrupts are re-evaluated; a command register write may
 * map the command list (AHCI_CL_SIZE * AHCI_MAX_SLOTS bytes) and the
 * 256-byte received-FIS area from guest memory, updates the CR/FR/CLO
 * status bits and then runs ahci_handle_port(); writes to read-only
 * registers are logged.
 * NOTE(review): the register switch and its case labels are on lines not
 * visible in this listing.
 */
1663 pci_ahci_port_write(struct pci_ahci_softc *sc, uint64_t offset, uint64_t value)
1665 int port = (offset - AHCI_OFFSET) / AHCI_STEP;
1666 offset = (offset - AHCI_OFFSET) % AHCI_STEP;
1667 struct ahci_port *p = &sc->port[port];
1669 DPRINTF("pci_ahci_port %d: write offset 0x%"PRIx64" value 0x%"PRIx64"\n",
1670 port, offset, value);
1689 p->ie = value & 0xFDC000FF;
1690 ahci_generate_intr(sc);
1696 if (!(value & AHCI_P_CMD_ST)) {
1701 p->cmd |= AHCI_P_CMD_CR;
/* Combine the upper and lower halves into a 64-bit guest address. */
1702 clb = (uint64_t)p->clbu << 32 | p->clb;
1703 p->cmd_lst = paddr_guest2host(ahci_ctx(sc), clb,
1704 AHCI_CL_SIZE * AHCI_MAX_SLOTS);
1707 if (value & AHCI_P_CMD_FRE) {
1710 p->cmd |= AHCI_P_CMD_FR;
1711 fb = (uint64_t)p->fbu << 32 | p->fb;
1712 /* we don't support FBSCP, so rfis size is 256Bytes */
1713 p->rfis = paddr_guest2host(ahci_ctx(sc), fb, 256);
1715 p->cmd &= ~AHCI_P_CMD_FR;
1718 if (value & AHCI_P_CMD_CLO) {
1720 p->cmd &= ~AHCI_P_CMD_CLO;
1723 ahci_handle_port(p);
1729 WPRINTF("pci_ahci_port: read only registers 0x%"PRIx64"\n", offset);
1732 if (!(p->cmd & AHCI_P_CMD_ST)) {
1733 if (value & ATA_SC_DET_RESET)
1746 ahci_handle_port(p);
/*
 * Handle a guest write to a controller-wide (host) register.
 * Visible behaviour: writes to read-only registers are only logged; for the
 * global control register, AHCI_GHC_HR is tested first and otherwise
 * AHCI_GHC_IE enables interrupts in sc->ghc and re-evaluates them.
 * NOTE(review): the register switch, the action taken for AHCI_GHC_HR and
 * the path leading to the last ahci_generate_intr() call are on lines not
 * visible in this listing.
 */
1756 pci_ahci_host_write(struct pci_ahci_softc *sc, uint64_t offset, uint64_t value)
1758 DPRINTF("pci_ahci_host: write offset 0x%"PRIx64" value 0x%"PRIx64"\n",
1766 DPRINTF("pci_ahci_host: read only registers 0x%"PRIx64"\n", offset);
1769 if (value & AHCI_GHC_HR)
1771 else if (value & AHCI_GHC_IE) {
1772 sc->ghc |= AHCI_GHC_IE;
1773 ahci_generate_intr(sc);
1778 ahci_generate_intr(sc);
/*
 * BAR write entry point (installed as pe_barwrite).
 * Only BAR 5 is expected (asserted).  With the controller mutex held, the
 * write is routed by offset: below AHCI_OFFSET to the host registers,
 * within the per-port window to the port registers, and anything else is
 * logged as unknown.
 */
1786 pci_ahci_write(struct vmctx *ctx, int vcpu, struct pci_devinst *pi,
1787 int baridx, uint64_t offset, int size, uint64_t value)
1789 struct pci_ahci_softc *sc = pi->pi_arg;
1791 assert(baridx == 5);
1794 pthread_mutex_lock(&sc->mtx);
1796 if (offset < AHCI_OFFSET)
1797 pci_ahci_host_write(sc, offset, value);
1798 else if (offset < AHCI_OFFSET + sc->ports * AHCI_STEP)
1799 pci_ahci_port_write(sc, offset, value);
1801 WPRINTF("pci_ahci: unknown i/o write offset 0x%"PRIx64"\n", offset);
1803 pthread_mutex_unlock(&sc->mtx);
/*
 * Read a controller-wide (host) register.
 * The visible path treats the softc members starting at cap as an array of
 * 32-bit registers and indexes it by (offset - AHCI_CAP) / 4.
 * NOTE(review): this relies on the member order of the softc matching the
 * register layout; the relevant declarations are not visible here.
 */
1807 pci_ahci_host_read(struct pci_ahci_softc *sc, uint64_t offset)
1823 uint32_t *p = &sc->cap;
1824 p += (offset - AHCI_CAP) / sizeof(uint32_t);
1832 DPRINTF("pci_ahci_host: read offset 0x%"PRIx64" value 0x%x\n",
/*
 * Read a per-port register.
 * The BAR offset is converted into a port index and an offset within the
 * register block of that port.  The visible path treats the port members
 * starting at clb as an array of 32-bit registers indexed by
 * (offset - AHCI_P_CLB) / 4.
 * NOTE(review): this relies on the member order of the port structure
 * matching the register layout; the declarations are not visible here.
 */
1839 pci_ahci_port_read(struct pci_ahci_softc *sc, uint64_t offset)
1842 int port = (offset - AHCI_OFFSET) / AHCI_STEP;
1843 offset = (offset - AHCI_OFFSET) % AHCI_STEP;
1863 uint32_t *p= &sc->port[port].clb;
1864 p += (offset - AHCI_P_CLB) / sizeof(uint32_t);
1873 DPRINTF("pci_ahci_port %d: read offset 0x%"PRIx64" value 0x%x\n",
1874 port, offset, value);
/*
 * BAR read entry point (installed as pe_barread).
 * Only BAR 5 is expected (asserted).  With the controller mutex held, the
 * read is routed by offset: below AHCI_OFFSET to the host registers, within
 * the per-port window to the port registers, and anything else is logged
 * as unknown.
 * NOTE(review): the value returned for an unknown offset is set on a line
 * not visible in this listing.
 */
1880 pci_ahci_read(struct vmctx *ctx, int vcpu, struct pci_devinst *pi, int baridx,
1881 uint64_t offset, int size)
1883 struct pci_ahci_softc *sc = pi->pi_arg;
1886 assert(baridx == 5);
1889 pthread_mutex_lock(&sc->mtx);
1891 if (offset < AHCI_OFFSET)
1892 value = pci_ahci_host_read(sc, offset);
1893 else if (offset < AHCI_OFFSET + sc->ports * AHCI_STEP)
1894 value = pci_ahci_port_read(sc, offset);
1897 WPRINTF("pci_ahci: unknown i/o read offset 0x%"PRIx64"\n", offset);
1900 pthread_mutex_unlock(&sc->mtx);
/*
 * Common initialisation for the disk and ATAPI emulations.
 *
 * ctx   - VM context
 * pi    - PCI device instance being initialised
 * opts  - backing device specification passed to blockif_open()
 * atapi - non-zero for an ATAPI device, stored in port 0
 *
 * A softc is allocated, the backing image is opened for port 0, the I/O
 * request pool and mutex are created, the capability registers are filled
 * in, and the PCI identity, MSI capability, BAR 5 and legacy interrupt are
 * set up.  The visible error path closes the block backend.
 * NOTE(review): return values and the remaining cleanup steps are on lines
 * not visible in this listing.
 */
1906 pci_ahci_init(struct vmctx *ctx, struct pci_devinst *pi, char *opts, int atapi)
1908 char bident[sizeof("XX:X:X")];
1909 struct blockif_ctxt *bctxt;
1910 struct pci_ahci_softc *sc;
1916 fprintf(stderr, "pci_ahci: backing device required\n");
/* Debug log target; presumably only compiled in for debug builds. */
1921 dbg = fopen("/tmp/log", "w+");
1924 sc = calloc(1, sizeof(struct pci_ahci_softc));
1927 sc->ports = MAX_PORTS;
1930 * Only use port 0 for a backing device. All other ports will be
1933 sc->port[0].atapi = atapi;
1936 * Attempt to open the backing image. Use the PCI
1937 * slot/func for the identifier string.
1939 snprintf(bident, sizeof(bident), "%d:%d", pi->pi_slot, pi->pi_func);
1940 bctxt = blockif_open(opts, bident);
1941 if (bctxt == NULL) {
1945 sc->port[0].bctx = bctxt;
1946 sc->port[0].pr_sc = sc;
1949 * Allocate blockif request structures and add them
1952 pci_ahci_ioreq_init(&sc->port[0]);
1954 pthread_mutex_init(&sc->mtx, NULL);
1956 /* Intel ICH8 AHCI */
/* Command slot count starts from the request pool size of port 0. */
1957 slots = sc->port[0].ioqsz;
1961 sc->cap = AHCI_CAP_64BIT | AHCI_CAP_SNCQ | AHCI_CAP_SSNTF |
1962 AHCI_CAP_SMPS | AHCI_CAP_SSS | AHCI_CAP_SALP |
1963 AHCI_CAP_SAL | AHCI_CAP_SCLO | (0x3 << AHCI_CAP_ISS_SHIFT)|
1964 AHCI_CAP_PMD | AHCI_CAP_SSC | AHCI_CAP_PSC |
1965 (slots << AHCI_CAP_NCS_SHIFT) | AHCI_CAP_SXS | (sc->ports - 1);
1967 /* Only port 0 implemented */
1970 sc->cap2 = AHCI_CAP2_APST;
/* PCI identity: vendor 0x8086, device 0x2821, SATA AHCI 1.0 storage class. */
1973 pci_set_cfgdata16(pi, PCIR_DEVICE, 0x2821);
1974 pci_set_cfgdata16(pi, PCIR_VENDOR, 0x8086);
1975 pci_set_cfgdata8(pi, PCIR_CLASS, PCIC_STORAGE);
1976 pci_set_cfgdata8(pi, PCIR_SUBCLASS, PCIS_STORAGE_SATA);
1977 pci_set_cfgdata8(pi, PCIR_PROGIF, PCIP_STORAGE_SATA_AHCI_1_0);
1978 pci_emul_add_msicap(pi, 1);
/* BAR 5 covers the host registers plus one register block per port. */
1979 pci_emul_alloc_bar(pi, 5, PCIBAR_MEM32,
1980 AHCI_OFFSET + sc->ports * AHCI_STEP);
1982 pci_lintr_request(pi);
1986 blockif_close(sc->port[0].bctx);
/* Init hook for the disk emulation: pci_ahci_init() with atapi set to 0. */
1994 pci_ahci_hd_init(struct vmctx *ctx, struct pci_devinst *pi, char *opts)
1997 return (pci_ahci_init(ctx, pi, opts, 0));
/* Init hook for the ATAPI emulation: pci_ahci_init() with atapi set to 1. */
2001 pci_ahci_atapi_init(struct vmctx *ctx, struct pci_devinst *pi, char *opts)
2004 return (pci_ahci_init(ctx, pi, opts, 1));
2008 * Use separate emulation names to distinguish drive and atapi devices
/*
 * Device emulation descriptor registered under the name ahci-hd.  It uses
 * the disk init hook and the shared BAR read/write handlers, and is
 * registered with PCI_EMUL_SET().
 */
2010 struct pci_devemu pci_de_ahci_hd = {
2011 .pe_emu = "ahci-hd",
2012 .pe_init = pci_ahci_hd_init,
2013 .pe_barwrite = pci_ahci_write,
2014 .pe_barread = pci_ahci_read
2016 PCI_EMUL_SET(pci_de_ahci_hd);
/*
 * Device emulation descriptor registered under the name ahci-cd.  It uses
 * the ATAPI init hook and the shared BAR read/write handlers, and is
 * registered with PCI_EMUL_SET().
 */
2018 struct pci_devemu pci_de_ahci_cd = {
2019 .pe_emu = "ahci-cd",
2020 .pe_init = pci_ahci_atapi_init,
2021 .pe_barwrite = pci_ahci_write,
2022 .pe_barread = pci_ahci_read
2024 PCI_EMUL_SET(pci_de_ahci_cd);