/* $OpenBSD: bcm2711_pcie.c,v 1.10 2021/12/06 18:02:58 kettenis Exp $ */ /* * Copyright (c) 2020 Mark Kettenis * * Permission to use, copy, modify, and distribute this software for any * purpose with or without fee is hereby granted, provided that the above * copyright notice and this permission notice appear in all copies. * * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. */ #include #include #include #include #include #include #include #include #include #include #include #include #include #include #define PCIE_MISC_CPU_2_PCIE_MEM_WIN0_LO 0x400c #define PCIE_MISC_CPU_2_PCIE_MEM_WIN0_HI 0x4010 #define PCIE_MISC_CPU_2_PCIE_MEM_WIN0_BASE_LIMIT 0x4070 #define PCIE_MISC_CPU_2_PCIE_MEM_WIN0_BASE_HI 0x4080 #define PCIE_MISC_CPU_2_PCIE_MEM_WIN0_LIMIT_HI 0x4084 #define PCIE_EXT_CFG_DATA 0x8000 #define PCIE_EXT_CFG_INDEX 0x9000 #define PCIE_RGR1_SW_INIT_1 0x9210 #define PCIE_RGR1_SW_INIT_1_PERST_MASK (1 << 0) #define PCIE_RGR1_SW_INIT_1_INIT_MASK (1 << 1) #define HREAD4(sc, reg) \ (bus_space_read_4((sc)->sc_iot, (sc)->sc_ioh, (reg))) #define HWRITE4(sc, reg, val) \ bus_space_write_4((sc)->sc_iot, (sc)->sc_ioh, (reg), (val)) struct bcmpcie_range { uint32_t flags; uint64_t pci_base; uint64_t phys_base; uint64_t size; }; struct bcmpcie_softc { struct device sc_dev; bus_space_tag_t sc_iot; bus_space_handle_t sc_ioh; bus_dma_tag_t sc_dmat; int sc_node; int sc_acells; int sc_scells; int sc_pacells; int sc_pscells; struct bcmpcie_range *sc_ranges; int sc_nranges; struct bcmpcie_range *sc_dmaranges; int sc_ndmaranges; struct bus_space sc_bus_iot; struct bus_space sc_bus_memt; struct machine_bus_dma_tag sc_dma; struct machine_pci_chipset sc_pc; int sc_bus; }; int bcmpcie_match(struct device *, void *, void *); void bcmpcie_attach(struct device *, struct device *, void *); struct cfattach bcmpcie_ca = { sizeof (struct bcmpcie_softc), bcmpcie_match, bcmpcie_attach }; struct cfdriver bcmpcie_cd = { NULL, "bcmpcie", DV_DULL }; int bcmpcie_match(struct device *parent, void *match, void *aux) { struct fdt_attach_args *faa = aux; return OF_is_compatible(faa->fa_node, "brcm,bcm2711-pcie"); } void bcmpcie_attach_hook(struct device *, struct device *, struct pcibus_attach_args *); int bcmpcie_bus_maxdevs(void *, int); pcitag_t bcmpcie_make_tag(void *, int, int, int); void bcmpcie_decompose_tag(void *, pcitag_t, int *, int *, int *); int bcmpcie_conf_size(void *, pcitag_t); pcireg_t bcmpcie_conf_read(void *, pcitag_t, int); void bcmpcie_conf_write(void *, pcitag_t, int, pcireg_t); int bcmpcie_probe_device_hook(void *, struct pci_attach_args *); int bcmpcie_intr_map(struct pci_attach_args *, pci_intr_handle_t *); const char *bcmpcie_intr_string(void *, pci_intr_handle_t); void *bcmpcie_intr_establish(void *, pci_intr_handle_t, int, struct cpu_info *, int (*)(void *), void *, char *); void bcmpcie_intr_disestablish(void *, void *); int bcmpcie_bs_iomap(bus_space_tag_t, bus_addr_t, bus_size_t, int, bus_space_handle_t *); int bcmpcie_bs_memmap(bus_space_tag_t, bus_addr_t, bus_size_t, int, bus_space_handle_t *); int bcmpcie_dmamap_load_buffer(bus_dma_tag_t, bus_dmamap_t, void *, bus_size_t, struct proc *, int, paddr_t *, int *, int); int bcmpcie_dmamap_load_raw(bus_dma_tag_t, bus_dmamap_t, bus_dma_segment_t *, int, bus_size_t, int); void bcmpcie_attach(struct device *parent, struct device *self, void *aux) { struct bcmpcie_softc *sc = (struct bcmpcie_softc *)self; struct fdt_attach_args *faa = aux; struct pcibus_attach_args pba; uint32_t *ranges; int i, j, nranges, rangeslen; uint32_t reg; if (faa->fa_nreg < 1) { printf(": no registers\n"); return; } sc->sc_iot = faa->fa_iot; if (bus_space_map(sc->sc_iot, faa->fa_reg[0].addr, faa->fa_reg[0].size, 0, &sc->sc_ioh)) { printf(": can't map registers\n"); return; } reg = HREAD4(sc, PCIE_RGR1_SW_INIT_1); if (reg & PCIE_RGR1_SW_INIT_1_INIT_MASK) { printf(": disabled\n"); return; } sc->sc_node = faa->fa_node; sc->sc_dmat = faa->fa_dmat; sc->sc_acells = OF_getpropint(sc->sc_node, "#address-cells", faa->fa_acells); sc->sc_scells = OF_getpropint(sc->sc_node, "#size-cells", faa->fa_scells); sc->sc_pacells = faa->fa_acells; sc->sc_pscells = faa->fa_scells; /* Memory and IO space translations. */ rangeslen = OF_getproplen(sc->sc_node, "ranges"); if (rangeslen <= 0 || (rangeslen % sizeof(uint32_t)) || (rangeslen / sizeof(uint32_t)) % (sc->sc_acells + sc->sc_pacells + sc->sc_scells)) { printf(": invalid ranges property\n"); return; } ranges = malloc(rangeslen, M_TEMP, M_WAITOK); OF_getpropintarray(sc->sc_node, "ranges", ranges, rangeslen); nranges = (rangeslen / sizeof(uint32_t)) / (sc->sc_acells + sc->sc_pacells + sc->sc_scells); sc->sc_ranges = mallocarray(nranges, sizeof(struct bcmpcie_range), M_DEVBUF, M_WAITOK); sc->sc_nranges = nranges; for (i = 0, j = 0; i < sc->sc_nranges; i++) { sc->sc_ranges[i].flags = ranges[j++]; sc->sc_ranges[i].pci_base = ranges[j++]; if (sc->sc_acells - 1 == 2) { sc->sc_ranges[i].pci_base <<= 32; sc->sc_ranges[i].pci_base |= ranges[j++]; } sc->sc_ranges[i].phys_base = ranges[j++]; if (sc->sc_pacells == 2) { sc->sc_ranges[i].phys_base <<= 32; sc->sc_ranges[i].phys_base |= ranges[j++]; } sc->sc_ranges[i].size = ranges[j++]; if (sc->sc_scells == 2) { sc->sc_ranges[i].size <<= 32; sc->sc_ranges[i].size |= ranges[j++]; } } free(ranges, M_TEMP, rangeslen); /* DMA translations */ rangeslen = OF_getproplen(sc->sc_node, "dma-ranges"); if (rangeslen > 0) { if ((rangeslen % sizeof(uint32_t)) || (rangeslen / sizeof(uint32_t)) % (sc->sc_acells + sc->sc_pacells + sc->sc_scells)) { printf(": invalid dma-ranges property\n"); free(sc->sc_ranges, M_DEVBUF, sc->sc_nranges * sizeof(struct bcmpcie_range)); return; } ranges = malloc(rangeslen, M_TEMP, M_WAITOK); OF_getpropintarray(sc->sc_node, "dma-ranges", ranges, rangeslen); nranges = (rangeslen / sizeof(uint32_t)) / (sc->sc_acells + sc->sc_pacells + sc->sc_scells); sc->sc_dmaranges = mallocarray(nranges, sizeof(struct bcmpcie_range), M_DEVBUF, M_WAITOK); sc->sc_ndmaranges = nranges; for (i = 0, j = 0; i < sc->sc_ndmaranges; i++) { sc->sc_dmaranges[i].flags = ranges[j++]; sc->sc_dmaranges[i].pci_base = ranges[j++]; if (sc->sc_acells - 1 == 2) { sc->sc_dmaranges[i].pci_base <<= 32; sc->sc_dmaranges[i].pci_base |= ranges[j++]; } sc->sc_dmaranges[i].phys_base = ranges[j++]; if (sc->sc_pacells == 2) { sc->sc_dmaranges[i].phys_base <<= 32; sc->sc_dmaranges[i].phys_base |= ranges[j++]; } sc->sc_dmaranges[i].size = ranges[j++]; if (sc->sc_scells == 2) { sc->sc_dmaranges[i].size <<= 32; sc->sc_dmaranges[i].size |= ranges[j++]; } } free(ranges, M_TEMP, rangeslen); } /* * Reprogram the outbound window to match the configuration in * the device tree. This is necessary since the EDK2-based * UEFI firmware reprograms the window. */ for (i = 0; i < sc->sc_nranges; i++) { if ((sc->sc_ranges[i].flags & 0x03000000) == 0x02000000) { uint64_t cpu_base = sc->sc_ranges[i].phys_base; uint64_t cpu_limit = sc->sc_ranges[i].phys_base + sc->sc_ranges[i].size - 1; HWRITE4(sc, PCIE_MISC_CPU_2_PCIE_MEM_WIN0_LO, sc->sc_ranges[i].pci_base); HWRITE4(sc, PCIE_MISC_CPU_2_PCIE_MEM_WIN0_HI, sc->sc_ranges[i].pci_base >> 32); HWRITE4(sc, PCIE_MISC_CPU_2_PCIE_MEM_WIN0_BASE_LIMIT, (cpu_base & PPB_MEM_MASK) >> PPB_MEM_SHIFT | (cpu_limit & PPB_MEM_MASK)); HWRITE4(sc, PCIE_MISC_CPU_2_PCIE_MEM_WIN0_BASE_HI, cpu_base >> 32); HWRITE4(sc, PCIE_MISC_CPU_2_PCIE_MEM_WIN0_LIMIT_HI, cpu_limit >> 32); } } printf("\n"); memcpy(&sc->sc_bus_iot, sc->sc_iot, sizeof(sc->sc_bus_iot)); sc->sc_bus_iot.bus_private = sc; sc->sc_bus_iot._space_map = bcmpcie_bs_iomap; memcpy(&sc->sc_bus_memt, sc->sc_iot, sizeof(sc->sc_bus_memt)); sc->sc_bus_memt.bus_private = sc; sc->sc_bus_memt._space_map = bcmpcie_bs_memmap; memcpy(&sc->sc_dma, sc->sc_dmat, sizeof(sc->sc_dma)); sc->sc_dma._dmamap_load_buffer = bcmpcie_dmamap_load_buffer; sc->sc_dma._dmamap_load_raw = bcmpcie_dmamap_load_raw; sc->sc_dma._cookie = sc; sc->sc_pc.pc_conf_v = sc; sc->sc_pc.pc_attach_hook = bcmpcie_attach_hook; sc->sc_pc.pc_bus_maxdevs = bcmpcie_bus_maxdevs; sc->sc_pc.pc_make_tag = bcmpcie_make_tag; sc->sc_pc.pc_decompose_tag = bcmpcie_decompose_tag; sc->sc_pc.pc_conf_size = bcmpcie_conf_size; sc->sc_pc.pc_conf_read = bcmpcie_conf_read; sc->sc_pc.pc_conf_write = bcmpcie_conf_write; sc->sc_pc.pc_probe_device_hook = bcmpcie_probe_device_hook; sc->sc_pc.pc_intr_v = sc; sc->sc_pc.pc_intr_map = bcmpcie_intr_map; sc->sc_pc.pc_intr_map_msi = _pci_intr_map_msi; sc->sc_pc.pc_intr_map_msix = _pci_intr_map_msix; sc->sc_pc.pc_intr_string = bcmpcie_intr_string; sc->sc_pc.pc_intr_establish = bcmpcie_intr_establish; sc->sc_pc.pc_intr_disestablish = bcmpcie_intr_disestablish; memset(&pba, 0, sizeof(pba)); pba.pba_busname = "pci"; pba.pba_iot = &sc->sc_bus_iot; pba.pba_memt = &sc->sc_bus_memt; pba.pba_dmat = &sc->sc_dma; pba.pba_pc = &sc->sc_pc; pba.pba_domain = pci_ndomains++; pba.pba_bus = 0; config_found(self, &pba, NULL); } void bcmpcie_attach_hook(struct device *parent, struct device *self, struct pcibus_attach_args *pba) { } int bcmpcie_bus_maxdevs(void *v, int bus) { struct bcmpcie_softc *sc = v; if (bus == sc->sc_bus || bus == sc->sc_bus + 1) return 1; return 32; } pcitag_t bcmpcie_make_tag(void *v, int bus, int device, int function) { /* Return ECAM address. */ return ((bus << 20) | (device << 15) | (function << 12)); } void bcmpcie_decompose_tag(void *v, pcitag_t tag, int *bp, int *dp, int *fp) { if (bp != NULL) *bp = (tag >> 20) & 0xff; if (dp != NULL) *dp = (tag >> 15) & 0x1f; if (fp != NULL) *fp = (tag >> 12) & 0x7; } int bcmpcie_conf_size(void *v, pcitag_t tag) { return PCIE_CONFIG_SPACE_SIZE; } pcireg_t bcmpcie_conf_read(void *v, pcitag_t tag, int reg) { struct bcmpcie_softc *sc = v; int bus, dev, fn; bcmpcie_decompose_tag(sc, tag, &bus, &dev, &fn); if (bus == 0) { KASSERT(dev == 0); return HREAD4(sc, tag | reg); } HWRITE4(sc, PCIE_EXT_CFG_INDEX, tag); return HREAD4(sc, PCIE_EXT_CFG_DATA + reg); } void bcmpcie_conf_write(void *v, pcitag_t tag, int reg, pcireg_t data) { struct bcmpcie_softc *sc = v; int bus, dev, fn; bcmpcie_decompose_tag(sc, tag, &bus, &dev, &fn); if (bus == 0) { KASSERT(dev == 0); HWRITE4(sc, tag | reg, data); return; } HWRITE4(sc, PCIE_EXT_CFG_INDEX, tag); HWRITE4(sc, PCIE_EXT_CFG_DATA + reg, data); } int bcmpcie_probe_device_hook(void *v, struct pci_attach_args *pa) { return 0; } int bcmpcie_intr_map(struct pci_attach_args *pa, pci_intr_handle_t *ihp) { int pin = pa->pa_rawintrpin; if (pin == 0 || pin > PCI_INTERRUPT_PIN_MAX) return -1; if (pa->pa_tag == 0) return -1; ihp->ih_pc = pa->pa_pc; ihp->ih_tag = pa->pa_intrtag; ihp->ih_intrpin = pa->pa_intrpin; ihp->ih_type = PCI_INTX; return 0; } const char * bcmpcie_intr_string(void *v, pci_intr_handle_t ih) { switch (ih.ih_type) { case PCI_MSI: return "msi"; case PCI_MSIX: return "msix"; } return "intx"; } void * bcmpcie_intr_establish(void *v, pci_intr_handle_t ih, int level, struct cpu_info *ci, int (*func)(void *), void *arg, char *name) { struct bcmpcie_softc *sc = v; int bus, dev, fn; uint32_t reg[4]; KASSERT(ih.ih_type == PCI_INTX); bcmpcie_decompose_tag(sc, ih.ih_tag, &bus, &dev, &fn); reg[0] = bus << 16 | dev << 11 | fn << 8; reg[1] = reg[2] = 0; reg[3] = ih.ih_intrpin; return fdt_intr_establish_imap_cpu(sc->sc_node, reg, sizeof(reg), level, ci, func, arg, name); } void bcmpcie_intr_disestablish(void *v, void *cookie) { } int bcmpcie_bs_iomap(bus_space_tag_t t, bus_addr_t addr, bus_size_t size, int flags, bus_space_handle_t *bshp) { struct bcmpcie_softc *sc = t->bus_private; int i; for (i = 0; i < sc->sc_nranges; i++) { uint64_t pci_start = sc->sc_ranges[i].pci_base; uint64_t pci_end = pci_start + sc->sc_ranges[i].size; uint64_t phys_start = sc->sc_ranges[i].phys_base; if ((sc->sc_ranges[i].flags & 0x03000000) == 0x01000000 && addr >= pci_start && addr + size <= pci_end) { return bus_space_map(sc->sc_iot, addr - pci_start + phys_start, size, flags, bshp); } } return ENXIO; } int bcmpcie_bs_memmap(bus_space_tag_t t, bus_addr_t addr, bus_size_t size, int flags, bus_space_handle_t *bshp) { struct bcmpcie_softc *sc = t->bus_private; int i; for (i = 0; i < sc->sc_nranges; i++) { uint64_t pci_start = sc->sc_ranges[i].pci_base; uint64_t pci_end = pci_start + sc->sc_ranges[i].size; uint64_t phys_start = sc->sc_ranges[i].phys_base; if ((sc->sc_ranges[i].flags & 0x03000000) == 0x02000000 && addr >= pci_start && addr + size <= pci_end) { return bus_space_map(sc->sc_iot, addr - pci_start + phys_start, size, flags, bshp); } } return ENXIO; } int bcmpcie_dmamap_load_buffer(bus_dma_tag_t t, bus_dmamap_t map, void *buf, bus_size_t buflen, struct proc *p, int flags, paddr_t *lastaddrp, int *segp, int first) { struct bcmpcie_softc *sc = t->_cookie; int seg, firstseg = *segp; int error; error = sc->sc_dmat->_dmamap_load_buffer(sc->sc_dmat, map, buf, buflen, p, flags, lastaddrp, segp, first); if (error) return error; if (sc->sc_dmaranges == NULL) return 0; /* For each segment. */ for (seg = firstseg; seg <= *segp; seg++) { uint64_t addr = map->dm_segs[seg].ds_addr; uint64_t size = map->dm_segs[seg].ds_len; int i; /* For each range. */ for (i = 0; i < sc->sc_ndmaranges; i++) { uint64_t pci_start = sc->sc_dmaranges[i].pci_base; uint64_t phys_start = sc->sc_dmaranges[i].phys_base; uint64_t phys_end = phys_start + sc->sc_dmaranges[i].size; if (addr >= phys_start && addr + size <= phys_end) { map->dm_segs[seg].ds_addr -= phys_start; map->dm_segs[seg].ds_addr += pci_start; break; } } if (i == sc->sc_ndmaranges) return EINVAL; } return 0; } int bcmpcie_dmamap_load_raw(bus_dma_tag_t t, bus_dmamap_t map, bus_dma_segment_t *segs, int nsegs, bus_size_t size, int flags) { struct bcmpcie_softc *sc = t->_cookie; int seg, error; error = sc->sc_dmat->_dmamap_load_raw(sc->sc_dmat, map, segs, nsegs, size, flags); if (error) return error; if (sc->sc_dmaranges == NULL) return 0; /* For each segment. */ for (seg = 0; seg < map->dm_nsegs; seg++) { uint64_t addr = map->dm_segs[seg].ds_addr; uint64_t size = map->dm_segs[seg].ds_len; int i; /* For each range. */ for (i = 0; i < sc->sc_ndmaranges; i++) { uint64_t pci_start = sc->sc_dmaranges[i].pci_base; uint64_t phys_start = sc->sc_dmaranges[i].phys_base; uint64_t phys_end = phys_start + sc->sc_dmaranges[i].size; if (addr >= phys_start && addr + size <= phys_end) { map->dm_segs[seg].ds_addr -= phys_start; map->dm_segs[seg].ds_addr += pci_start; break; } } if (i == sc->sc_ndmaranges) return EINVAL; } return 0; }