Skip site navigation (1)Skip section navigation (2)
Date:      Fri, 3 Jun 2016 10:28:06 +0000 (UTC)
From:      Andrew Turner <andrew@FreeBSD.org>
To:        src-committers@freebsd.org, svn-src-all@freebsd.org, svn-src-head@freebsd.org
Subject:   svn commit: r301265 - in head/sys: arm64/arm64 arm64/include conf
Message-ID:  <201606031028.u53AS64t058415@repo.freebsd.org>

next in thread | raw e-mail | index | archive | help
Author: andrew
Date: Fri Jun  3 10:28:06 2016
New Revision: 301265
URL: https://svnweb.freebsd.org/changeset/base/301265

Log:
  Add the GICv3 ITS intrng driver. As the interface to the interrupt
  framework has significantly changed the driver has moved to a new file.
  While it shares some code with the existing driver this has been modified
  to work better with the intrng framework.
  
  This has been tested on the ThunderX servers in the netperf cluster and has
  been used to boot them for other testing, including DTrace and hwpmc.
  
  With this we can use intrng on all supported arm64 platforms I was able to
  test on. It is expected we will move to intrng soon, and disable the old
  arm64 interrupt framework.
  
  Obtained from:	ABT Systems Ltd
  Sponsored by:	The FreeBSD Foundation
  Differential Revision:	https://reviews.freebsd.org/D6437

Added:
  head/sys/arm64/arm64/gicv3_its.c   (contents, props changed)
Modified:
  head/sys/arm64/arm64/gic_v3.c
  head/sys/arm64/arm64/gic_v3_fdt.c
  head/sys/arm64/arm64/gic_v3_var.h
  head/sys/arm64/include/intr.h
  head/sys/conf/files.arm64

Modified: head/sys/arm64/arm64/gic_v3.c
==============================================================================
--- head/sys/arm64/arm64/gic_v3.c	Fri Jun  3 10:17:19 2016	(r301264)
+++ head/sys/arm64/arm64/gic_v3.c	Fri Jun  3 10:28:06 2016	(r301265)
@@ -63,6 +63,8 @@ __FBSDID("$FreeBSD$");
 #include "gic_v3_reg.h"
 #include "gic_v3_var.h"
 
+static bus_read_ivar_t gic_v3_read_ivar;
+
 #ifdef INTRNG
 static pic_disable_intr_t gic_v3_disable_intr;
 static pic_enable_intr_t gic_v3_enable_intr;
@@ -101,6 +103,9 @@ static device_method_t gic_v3_methods[] 
 	/* Device interface */
 	DEVMETHOD(device_detach,	gic_v3_detach),
 
+	/* Bus interface */
+	DEVMETHOD(bus_read_ivar,	gic_v3_read_ivar),
+
 #ifdef INTRNG
 	/* Interrupt controller interface */
 	DEVMETHOD(pic_disable_intr,	gic_v3_disable_intr),
@@ -179,6 +184,44 @@ static gic_v3_initseq_t gic_v3_secondary
 };
 #endif
 
+#ifdef INTRNG
+uint32_t
+gic_r_read_4(device_t dev, bus_size_t offset)
+{
+	struct gic_v3_softc *sc;
+
+	sc = device_get_softc(dev);
+	return (bus_read_4(sc->gic_redists.pcpu[PCPU_GET(cpuid)], offset));
+}
+
+uint64_t
+gic_r_read_8(device_t dev, bus_size_t offset)
+{
+	struct gic_v3_softc *sc;
+
+	sc = device_get_softc(dev);
+	return (bus_read_8(sc->gic_redists.pcpu[PCPU_GET(cpuid)], offset));
+}
+
+void
+gic_r_write_4(device_t dev, bus_size_t offset, uint32_t val)
+{
+	struct gic_v3_softc *sc;
+
+	sc = device_get_softc(dev);
+	bus_write_4(sc->gic_redists.pcpu[PCPU_GET(cpuid)], offset, val);
+}
+
+void
+gic_r_write_8(device_t dev, bus_size_t offset, uint64_t val)
+{
+	struct gic_v3_softc *sc;
+
+	sc = device_get_softc(dev);
+	bus_write_8(sc->gic_redists.pcpu[PCPU_GET(cpuid)], offset, val);
+}
+#endif
+
 /*
  * Device interface.
  */
@@ -327,17 +370,39 @@ gic_v3_detach(device_t dev)
 	return (0);
 }
 
+static int
+gic_v3_read_ivar(device_t dev, device_t child, int which, uintptr_t *result)
+{
+	struct gic_v3_softc *sc;
+
+	sc = device_get_softc(dev);
+
+	switch (which) {
+	case GICV3_IVAR_NIRQS:
+		*result = sc->gic_nirqs;
+		return (0);
+	case GICV3_IVAR_REDIST_VADDR:
+		*result = (uintptr_t)rman_get_virtual(
+		    sc->gic_redists.pcpu[PCPU_GET(cpuid)]);
+		return (0);
+	}
+
+	return (ENOENT);
+}
+
 #ifdef INTRNG
 int
 arm_gic_v3_intr(void *arg)
 {
 	struct gic_v3_softc *sc = arg;
 	struct gic_v3_irqsrc *gi;
+	struct intr_pic *pic;
 	uint64_t active_irq;
 	struct trapframe *tf;
 	bool first;
 
 	first = true;
+	pic = sc->gic_pic;
 
 	while (1) {
 		if (CPU_MATCH_ERRATA_CAVIUM_THUNDER_1_1) {
@@ -357,6 +422,11 @@ arm_gic_v3_intr(void *arg)
 			active_irq = gic_icc_read(IAR1);
 		}
 
+		if (active_irq >= GIC_FIRST_LPI) {
+			intr_child_irq_handler(pic, active_irq);
+			continue;
+		}
+
 		if (__predict_false(active_irq >= sc->gic_nirqs))
 			return (FILTER_HANDLED);
 
@@ -733,11 +803,12 @@ gic_v3_bind_intr(device_t dev, struct in
 static void
 gic_v3_init_secondary(device_t dev)
 {
+	device_t child;
 	struct gic_v3_softc *sc;
 	gic_v3_initseq_t *init_func;
 	struct intr_irqsrc *isrc;
 	u_int cpu, irq;
-	int err;
+	int err, i;
 
 	sc = device_get_softc(dev);
 	cpu = PCPU_GET(cpuid);
@@ -766,6 +837,11 @@ gic_v3_init_secondary(device_t dev)
 		if (intr_isrc_init_on_cpu(isrc, cpu))
 			gic_v3_enable_intr(dev, isrc);
 	}
+
+	for (i = 0; i < sc->gic_nchildren; i++) {
+		child = sc->gic_children[i];
+		PIC_INIT_SECONDARY(child);
+	}
 }
 
 static void

Modified: head/sys/arm64/arm64/gic_v3_fdt.c
==============================================================================
--- head/sys/arm64/arm64/gic_v3_fdt.c	Fri Jun  3 10:17:19 2016	(r301264)
+++ head/sys/arm64/arm64/gic_v3_fdt.c	Fri Jun  3 10:28:06 2016	(r301265)
@@ -139,7 +139,8 @@ gic_v3_fdt_attach(device_t dev)
 
 #ifdef INTRNG
 	xref = OF_xref_from_node(ofw_bus_get_node(dev));
-	if (intr_pic_register(dev, xref) == NULL) {
+	sc->gic_pic = intr_pic_register(dev, xref);
+	if (sc->gic_pic == NULL) {
 		device_printf(dev, "could not register PIC\n");
 		err = ENXIO;
 		goto error;
@@ -164,6 +165,11 @@ gic_v3_fdt_attach(device_t dev)
 		}
 	}
 
+#ifdef INTRNG
+	if (device_get_children(dev, &sc->gic_children, &sc->gic_nchildren) != 0)
+		sc->gic_nchildren = 0;
+#endif
+
 	return (err);
 
 error:

Modified: head/sys/arm64/arm64/gic_v3_var.h
==============================================================================
--- head/sys/arm64/arm64/gic_v3_var.h	Fri Jun  3 10:17:19 2016	(r301264)
+++ head/sys/arm64/arm64/gic_v3_var.h	Fri Jun  3 10:28:06 2016	(r301265)
@@ -36,10 +36,12 @@
 
 DECLARE_CLASS(gic_v3_driver);
 
+#ifndef INTRNG
 #define	LPI_FLAGS_CONF_FLUSH	(1UL << 0)
 #define	LPI_CONFTAB_SIZE	PAGE_SIZE_64K
 /* 1 bit per LPI + 1 KB more for the obligatory PPI, SGI, SPI stuff */
 #define	LPI_PENDTAB_SIZE	((LPI_CONFTAB_SIZE / 8) + 0x400)
+#endif
 
 #ifdef INTRNG
 struct gic_v3_irqsrc {
@@ -86,6 +88,9 @@ struct gic_v3_softc {
 	boolean_t		gic_registered;
 
 #ifdef INTRNG
+	int			gic_nchildren;
+	device_t		*gic_children;
+	struct intr_pic		*gic_pic;
 	struct gic_v3_irqsrc	*gic_irqs;
 #endif
 };
@@ -96,25 +101,38 @@ struct gic_v3_softc {
 
 MALLOC_DECLARE(M_GIC_V3);
 
+/* ivars */
+enum {
+	GICV3_IVAR_NIRQS,
+	GICV3_IVAR_REDIST_VADDR,
+};
+
+__BUS_ACCESSOR(gicv3, nirqs, GICV3, NIRQS, u_int);
+__BUS_ACCESSOR(gicv3, redist_vaddr, GICV3, REDIST_VADDR, void *);
+
 /* Device methods */
 int gic_v3_attach(device_t dev);
 int gic_v3_detach(device_t dev);
 int arm_gic_v3_intr(void *);
 
+#ifdef INTRNG
+uint32_t gic_r_read_4(device_t, bus_size_t);
+uint64_t gic_r_read_8(device_t, bus_size_t);
+void gic_r_write_4(device_t, bus_size_t, uint32_t var);
+void gic_r_write_8(device_t, bus_size_t, uint64_t var);
+#endif
+
 /*
  * ITS
  */
-#define	GIC_V3_ITS_DEVSTR	"ARM GIC Interrupt Translation Service"
-#define	GIC_V3_ITS_COMPSTR	"arm,gic-v3-its"
-
-DECLARE_CLASS(gic_v3_its_driver);
 
 /* LPI chunk owned by ITS device */
 struct lpi_chunk {
 	u_int	lpi_base;
 	u_int	lpi_free;	/* First free LPI in set */
+#ifndef INTRNG
 	u_int	*lpi_col_ids;
-
+#endif
 	u_int	lpi_num;	/* Total number of LPIs in chunk */
 	u_int	lpi_busy;	/* Number of busy LPIs in chink */
 };
@@ -132,6 +150,7 @@ struct its_dev {
 	vm_offset_t		itt;
 	size_t			itt_size;
 };
+#ifndef INTRNG
 TAILQ_HEAD(its_dev_list, its_dev);
 
 /* ITS private table description */
@@ -152,6 +171,11 @@ struct its_cmd {
 	uint64_t	cmd_dword[4];	/* ITS command double word */
 };
 
+#define	GIC_V3_ITS_DEVSTR	"ARM GIC Interrupt Translation Service"
+#define	GIC_V3_ITS_COMPSTR	"arm,gic-v3-its"
+
+DECLARE_CLASS(gic_v3_its_driver);
+
 /* ITS commands encoding */
 #define	ITS_CMD_MOVI		(0x01)
 #define	ITS_CMD_SYNC		(0x05)
@@ -183,6 +207,7 @@ struct its_cmd {
 /* Valid command bit */
 #define	CMD_VALID_SHIFT		(63)
 #define	CMD_VALID_MASK		(1UL << CMD_VALID_SHIFT)
+#endif /* INTRNG */
 
 /*
  * ITS command descriptor.
@@ -237,13 +262,14 @@ struct its_cmd_desc {
 	};
 };
 
+#define	ITS_TARGET_NONE		0xFBADBEEF
+
+#ifndef INTRNG
 #define	ITS_CMDQ_SIZE		PAGE_SIZE_64K
 #define	ITS_CMDQ_NENTRIES	(ITS_CMDQ_SIZE / sizeof(struct its_cmd))
 
 #define	ITS_FLAGS_CMDQ_FLUSH	(1UL << 0)
 
-#define	ITS_TARGET_NONE		0xFBADBEEF
-
 struct gic_v3_its_softc {
 	device_t		dev;
 	struct resource	*	its_res;
@@ -255,7 +281,9 @@ struct gic_v3_its_softc {
 
 	uint64_t		its_flags;
 
+#ifndef INTRNG
 	struct its_dev_list	its_dev_list;
+#endif
 
 	bitstr_t *		its_lpi_bitmap;
 	uint32_t		its_lpi_maxid;
@@ -290,6 +318,7 @@ int its_init_cpu(struct gic_v3_its_softc
 int lpi_migrate(device_t, uint32_t, u_int);
 void lpi_unmask_irq(device_t, uint32_t);
 void lpi_mask_irq(device_t, uint32_t);
+#endif
 /*
  * GIC Distributor accessors.
  * Notice that only GIC sofc can be passed.

Added: head/sys/arm64/arm64/gicv3_its.c
==============================================================================
--- /dev/null	00:00:00 1970	(empty, because file is newly added)
+++ head/sys/arm64/arm64/gicv3_its.c	Fri Jun  3 10:28:06 2016	(r301265)
@@ -0,0 +1,1585 @@
+/*-
+ * Copyright (c) 2015-2016 The FreeBSD Foundation
+ * All rights reserved.
+ *
+ * This software was developed by Andrew Turner under
+ * the sponsorship of the FreeBSD Foundation.
+ *
+ * This software was developed by Semihalf under
+ * the sponsorship of the FreeBSD Foundation.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ *    notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ *    notice, this list of conditions and the following disclaimer in the
+ *    documentation and/or other materials provided with the distribution.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
+ * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+ * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
+ * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
+ * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
+ * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
+ * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
+ * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
+ * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
+ * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
+ * SUCH DAMAGE.
+ */
+
+#include "opt_platform.h"
+
+#include <sys/cdefs.h>
+__FBSDID("$FreeBSD$");
+
+#include <sys/param.h>
+#include <sys/systm.h>
+#include <sys/bus.h>
+#include <sys/cpuset.h>
+#include <sys/endian.h>
+#include <sys/kernel.h>
+#include <sys/malloc.h>
+#include <sys/module.h>
+#include <sys/proc.h>
+#include <sys/queue.h>
+#include <sys/rman.h>
+#include <sys/smp.h>
+#include <sys/vmem.h>
+
+#include <vm/vm.h>
+#include <vm/pmap.h>
+
+#include <machine/bus.h>
+#include <machine/intr.h>
+
+#include <arm64/arm64/gic_v3_reg.h>
+#include <arm64/arm64/gic_v3_var.h>
+
+#ifdef FDT
+#include <dev/ofw/openfirm.h>
+#include <dev/ofw/ofw_bus.h>
+#include <dev/ofw/ofw_bus_subr.h>
+#endif
+#include <dev/pci/pcireg.h>
+#include <dev/pci/pcivar.h>
+
+#include "pcib_if.h"
+#include "pic_if.h"
+#include "msi_if.h"
+
+MALLOC_DEFINE(M_GICV3_ITS, "GICv3 ITS",
+    "ARM GICv3 Interrupt Translation Service");
+
+#define	LPI_NIRQS		(64 * 1024)
+
+/* The size and alignment of the command circular buffer */
+#define	ITS_CMDQ_SIZE		(64 * 1024)	/* Must be a multiple of 4K */
+#define	ITS_CMDQ_ALIGN		(64 * 1024)
+
+#define	LPI_CONFTAB_SIZE	LPI_NIRQS
+#define	LPI_CONFTAB_ALIGN	(64 * 1024)
+#define	LPI_CONFTAB_MAX_ADDR	((1ul << 48) - 1) /* We need a 47 bit PA */
+
+/* 1 bit per SPI, PPI, and SGI (8k), and 1 bit per LPI (LPI_CONFTAB_SIZE) */
+#define	LPI_PENDTAB_SIZE	((LPI_NIRQS + GIC_FIRST_LPI) / 8)
+#define	LPI_PENDTAB_ALIGN	(64 * 1024)
+#define	LPI_PENDTAB_MAX_ADDR	((1ul << 48) - 1) /* We need a 47 bit PA */
+
+#define	LPI_INT_TRANS_TAB_ALIGN	256
+#define	LPI_INT_TRANS_TAB_MAX_ADDR ((1ul << 48) - 1)
+
+/* ITS commands encoding */
+#define	ITS_CMD_MOVI		(0x01)
+#define	ITS_CMD_SYNC		(0x05)
+#define	ITS_CMD_MAPD		(0x08)
+#define	ITS_CMD_MAPC		(0x09)
+#define	ITS_CMD_MAPTI		(0x0a)
+#define	ITS_CMD_MAPI		(0x0b)
+#define	ITS_CMD_INV		(0x0c)
+#define	ITS_CMD_INVALL		(0x0d)
+/* Command */
+#define	CMD_COMMAND_MASK	(0xFFUL)
+/* PCI device ID */
+#define	CMD_DEVID_SHIFT		(32)
+#define	CMD_DEVID_MASK		(0xFFFFFFFFUL << CMD_DEVID_SHIFT)
+/* Size of IRQ ID bitfield */
+#define	CMD_SIZE_MASK		(0xFFUL)
+/* Virtual LPI ID */
+#define	CMD_ID_MASK		(0xFFFFFFFFUL)
+/* Physical LPI ID */
+#define	CMD_PID_SHIFT		(32)
+#define	CMD_PID_MASK		(0xFFFFFFFFUL << CMD_PID_SHIFT)
+/* Collection */
+#define	CMD_COL_MASK		(0xFFFFUL)
+/* Target (CPU or Re-Distributor) */
+#define	CMD_TARGET_SHIFT	(16)
+#define	CMD_TARGET_MASK		(0xFFFFFFFFUL << CMD_TARGET_SHIFT)
+/* Interrupt Translation Table address */
+#define	CMD_ITT_MASK		(0xFFFFFFFFFF00UL)
+/* Valid command bit */
+#define	CMD_VALID_SHIFT		(63)
+#define	CMD_VALID_MASK		(1UL << CMD_VALID_SHIFT)
+
+/* ITS command. Each command is 32 bytes long */
+struct its_cmd {
+	uint64_t	cmd_dword[4];	/* ITS command double word */
+};
+
+/* An ITS private table */
+struct its_ptable {
+	vm_offset_t	ptab_vaddr;
+	unsigned long	ptab_size;
+};
+
+/* ITS collection description. */
+struct its_col {
+	uint64_t	col_target;	/* Target Re-Distributor */
+	uint64_t	col_id;		/* Collection ID */
+};
+
+struct gicv3_its_irqsrc {
+	struct intr_irqsrc	gi_isrc;
+	u_int			gi_irq;
+	struct its_dev		*gi_its_dev;
+};
+
+struct gicv3_its_softc {
+	struct intr_pic *sc_pic;
+	struct resource *sc_its_res;
+
+	struct its_ptable sc_its_ptab[GITS_BASER_NUM];
+	struct its_col *sc_its_cols[MAXCPU];	/* Per-CPU collections */
+
+	/*
+	 * TODO: We should get these from the parent as we only want a
+	 * single copy of each across the interrupt controller.
+	 */
+	vm_offset_t sc_conf_base;
+	vm_offset_t sc_pend_base[MAXCPU];
+
+	/* Command handling */
+	struct mtx sc_its_cmd_lock;
+	struct its_cmd *sc_its_cmd_base; /* Command circular buffer address */
+	size_t sc_its_cmd_next_idx;
+
+	vmem_t *sc_irq_alloc;
+	struct gicv3_its_irqsrc	*sc_irqs;
+
+	struct mtx sc_its_dev_lock;
+	TAILQ_HEAD(its_dev_list, its_dev) sc_its_dev_list;
+
+#define	ITS_FLAGS_CMDQ_FLUSH		0x00000001
+#define	ITS_FLAGS_LPI_CONF_FLUSH	0x00000002
+#define	ITS_FLAGS_ERRATA_CAVIUM_22375	0x00000004
+	u_int sc_its_flags;
+};
+
+typedef void (its_quirk_func_t)(device_t);
+static its_quirk_func_t its_quirk_cavium_22375;
+
+static const struct {
+	const char *desc;
+	uint32_t iidr;
+	uint32_t iidr_mask;
+	its_quirk_func_t *func;
+} its_quirks[] = {
+	{
+		/* Cavium ThunderX Pass 1.x */
+		.desc = "Cavoum ThunderX errata: 22375, 24313",
+		.iidr = GITS_IIDR_RAW(GITS_IIDR_IMPL_CAVIUM,
+		    GITS_IIDR_PROD_THUNDER, GITS_IIDR_VAR_THUNDER_1, 0),
+		.iidr_mask = ~GITS_IIDR_REVISION_MASK,
+		.func = its_quirk_cavium_22375,
+	},
+};
+
+static u_int gic_irq_cpu;
+
+#define	gic_its_read_4(sc, reg)			\
+    bus_read_4((sc)->sc_its_res, (reg))
+#define	gic_its_read_8(sc, reg)			\
+    bus_read_8((sc)->sc_its_res, (reg))
+
+#define	gic_its_write_4(sc, reg, val)		\
+    bus_write_4((sc)->sc_its_res, (reg), (val))
+#define	gic_its_write_8(sc, reg, val)		\
+    bus_write_8((sc)->sc_its_res, (reg), (val))
+
+static device_attach_t gicv3_its_attach;
+static device_detach_t gicv3_its_detach;
+
+static pic_disable_intr_t gicv3_its_disable_intr;
+static pic_enable_intr_t gicv3_its_enable_intr;
+static pic_map_intr_t gicv3_its_map_intr;
+static pic_setup_intr_t gicv3_its_setup_intr;
+static pic_post_filter_t gicv3_its_post_filter;
+static pic_post_ithread_t gicv3_its_post_ithread;
+static pic_pre_ithread_t gicv3_its_pre_ithread;
+static pic_bind_intr_t gicv3_its_bind_intr;
+#ifdef SMP
+static pic_init_secondary_t gicv3_its_init_secondary;
+#endif
+static msi_alloc_msi_t gicv3_its_alloc_msi;
+static msi_release_msi_t gicv3_its_release_msi;
+static msi_alloc_msix_t gicv3_its_alloc_msix;
+static msi_release_msix_t gicv3_its_release_msix;
+static msi_map_msi_t gicv3_its_map_msi;
+
+static void its_cmd_movi(device_t, struct gicv3_its_irqsrc *);
+static void its_cmd_mapc(device_t, struct its_col *, uint8_t);
+static void its_cmd_mapti(device_t, struct gicv3_its_irqsrc *);
+static void its_cmd_mapd(device_t, struct its_dev *, uint8_t);
+static void its_cmd_inv(device_t, struct its_dev *, struct gicv3_its_irqsrc *);
+static void its_cmd_invall(device_t, struct its_col *);
+
+static device_method_t gicv3_its_methods[] = {
+	/* Device interface */
+	DEVMETHOD(device_detach,	gicv3_its_detach),
+
+	/* Interrupt controller interface */
+	DEVMETHOD(pic_disable_intr,	gicv3_its_disable_intr),
+	DEVMETHOD(pic_enable_intr,	gicv3_its_enable_intr),
+	DEVMETHOD(pic_map_intr,		gicv3_its_map_intr),
+	DEVMETHOD(pic_setup_intr,	gicv3_its_setup_intr),
+	DEVMETHOD(pic_post_filter,	gicv3_its_post_filter),
+	DEVMETHOD(pic_post_ithread,	gicv3_its_post_ithread),
+	DEVMETHOD(pic_pre_ithread,	gicv3_its_pre_ithread),
+#ifdef SMP
+	DEVMETHOD(pic_bind_intr,	gicv3_its_bind_intr),
+	DEVMETHOD(pic_init_secondary,	gicv3_its_init_secondary),
+#endif
+
+	/* MSI/MSI-X */
+	DEVMETHOD(msi_alloc_msi,	gicv3_its_alloc_msi),
+	DEVMETHOD(msi_release_msi,	gicv3_its_release_msi),
+	DEVMETHOD(msi_alloc_msix,	gicv3_its_alloc_msix),
+	DEVMETHOD(msi_release_msix,	gicv3_its_release_msix),
+	DEVMETHOD(msi_map_msi,		gicv3_its_map_msi),
+
+	/* End */
+	DEVMETHOD_END
+};
+
+static DEFINE_CLASS_0(gic, gicv3_its_driver, gicv3_its_methods,
+    sizeof(struct gicv3_its_softc));
+
+static void
+gicv3_its_cmdq_init(struct gicv3_its_softc *sc)
+{
+	vm_paddr_t cmd_paddr;
+	uint64_t reg, tmp;
+
+	/* Set up the command circular buffer */
+	sc->sc_its_cmd_base = contigmalloc(ITS_CMDQ_SIZE, M_GICV3_ITS,
+	    M_WAITOK | M_ZERO, 0, (1ul << 48) - 1, ITS_CMDQ_ALIGN, 0);
+	sc->sc_its_cmd_next_idx = 0;
+
+	cmd_paddr = vtophys(sc->sc_its_cmd_base);
+
+	/* Set the base of the command buffer */
+	reg = GITS_CBASER_VALID |
+	    (GITS_CBASER_CACHE_NIWAWB << GITS_CBASER_CACHE_SHIFT) |
+	    cmd_paddr | (GITS_CBASER_SHARE_IS << GITS_CBASER_SHARE_SHIFT) |
+	    (ITS_CMDQ_SIZE / 4096 - 1);
+	gic_its_write_8(sc, GITS_CBASER, reg);
+
+	/* Read back to check for fixed value fields */
+	tmp = gic_its_read_8(sc, GITS_CBASER);
+
+	if ((tmp & GITS_CBASER_SHARE_MASK) !=
+	    (GITS_CBASER_SHARE_IS << GITS_CBASER_SHARE_SHIFT)) {
+		/* Check if the hardware reported non-shareable */
+		if ((tmp & GITS_CBASER_SHARE_MASK) ==
+		    (GITS_CBASER_SHARE_NS << GITS_CBASER_SHARE_SHIFT)) {
+			/* If so remove the cache attribute */
+			reg &= ~GITS_CBASER_CACHE_MASK;
+			reg &= ~GITS_CBASER_SHARE_MASK;
+			/* Set to Non-cacheable, Non-shareable */
+			reg |= GITS_CBASER_CACHE_NIN << GITS_CBASER_CACHE_SHIFT;
+			reg |= GITS_CBASER_SHARE_NS << GITS_CBASER_SHARE_SHIFT;
+
+			gic_its_write_8(sc, GITS_CBASER, reg);
+		}
+
+		/* The command queue has to be flushed after each command */
+		sc->sc_its_flags |= ITS_FLAGS_CMDQ_FLUSH;
+	}
+
+	/* Get the next command from the start of the buffer */
+	gic_its_write_8(sc, GITS_CWRITER, 0x0);
+}
+
+static int
+gicv3_its_table_init(device_t dev, struct gicv3_its_softc *sc)
+{
+	vm_offset_t table;
+	vm_paddr_t paddr;
+	uint64_t cache, reg, share, tmp, type;
+	size_t esize, its_tbl_size, nidents, nitspages, npages;
+	int i, page_size;
+	int devbits;
+
+	if ((sc->sc_its_flags & ITS_FLAGS_ERRATA_CAVIUM_22375) != 0) {
+		/*
+		 * GITS_TYPER[17:13] of ThunderX reports that device IDs
+		 * are to be 21 bits in length. The entry size of the ITS
+		 * table can be read from GITS_BASERn[52:48] and on ThunderX
+		 * is supposed to be 8 bytes in length (for device table).
+		 * Finally the page size that is to be used by ITS to access
+		 * this table will be set to 64KB.
+		 *
+		 * This gives 0x200000 entries of size 0x8 bytes covered by
+		 * 256 pages each of which 64KB in size. The number of pages
+		 * (minus 1) should then be written to GITS_BASERn[7:0]. In
+		 * that case this value would be 0xFF but on ThunderX the
+		 * maximum value that HW accepts is 0xFD.
+		 *
+		 * Set an arbitrary number of device ID bits to 20 in order
+		 * to limit the number of entries in ITS device table to
+		 * 0x100000 and the table size to 8MB.
+		 */
+		devbits = 20;
+		cache = 0;
+	} else {
+		devbits = GITS_TYPER_DEVB(gic_its_read_8(sc, GITS_TYPER));
+		cache = GITS_BASER_CACHE_WAWB;
+	}
+	share = GITS_BASER_SHARE_IS;
+	page_size = PAGE_SIZE_64K;
+
+	for (i = 0; i < GITS_BASER_NUM; i++) {
+		reg = gic_its_read_8(sc, GITS_BASER(i));
+		/* The type of table */
+		type = GITS_BASER_TYPE(reg);
+		/* The table entry size */
+		esize = GITS_BASER_ESIZE(reg);
+
+		switch(type) {
+		case GITS_BASER_TYPE_DEV:
+			nidents = (1 << devbits);
+			its_tbl_size = esize * nidents;
+			its_tbl_size = roundup2(its_tbl_size, PAGE_SIZE_64K);
+			break;
+		case GITS_BASER_TYPE_VP:
+		case GITS_BASER_TYPE_PP: /* Undocumented? */
+		case GITS_BASER_TYPE_IC:
+			its_tbl_size = page_size;
+			break;
+		default:
+			continue;
+		}
+		npages = howmany(its_tbl_size, PAGE_SIZE);
+
+		/* Allocate the table */
+		table = (vm_offset_t)contigmalloc(npages * PAGE_SIZE,
+		    M_GICV3_ITS, M_WAITOK | M_ZERO, 0, (1ul << 48) - 1,
+		    PAGE_SIZE, 0);
+
+		sc->sc_its_ptab[i].ptab_vaddr = table;
+		sc->sc_its_ptab[i].ptab_size = npages * PAGE_SIZE;
+
+		paddr = vtophys(table);
+
+		while (1) {
+			nitspages = howmany(its_tbl_size, page_size);
+
+			/* Clear the fields we will be setting */
+			reg &= ~(GITS_BASER_VALID |
+			    GITS_BASER_CACHE_MASK | GITS_BASER_TYPE_MASK |
+			    GITS_BASER_ESIZE_MASK | GITS_BASER_PA_MASK |
+			    GITS_BASER_SHARE_MASK | GITS_BASER_PSZ_MASK |
+			    GITS_BASER_SIZE_MASK);
+			/* Set the new values */
+			reg |= GITS_BASER_VALID |
+			    (cache << GITS_BASER_CACHE_SHIFT) |
+			    (type << GITS_BASER_TYPE_SHIFT) |
+			    ((esize - 1) << GITS_BASER_ESIZE_SHIFT) |
+			    paddr | (share << GITS_BASER_SHARE_SHIFT) |
+			    (nitspages - 1);
+
+			switch (page_size) {
+			case PAGE_SIZE:		/* 4KB */
+				reg |=
+				    GITS_BASER_PSZ_4K << GITS_BASER_PSZ_SHIFT;
+				break;
+			case PAGE_SIZE_16K:	/* 16KB */
+				reg |=
+				    GITS_BASER_PSZ_4K << GITS_BASER_PSZ_SHIFT;
+				break;
+			case PAGE_SIZE_64K:	/* 64KB */
+				reg |=
+				    GITS_BASER_PSZ_64K << GITS_BASER_PSZ_SHIFT;
+				break;
+			}
+
+			gic_its_write_8(sc, GITS_BASER(i), reg);
+
+			/* Read back to check */
+			tmp = gic_its_read_8(sc, GITS_BASER(i));
+
+			/* Do the snareability masks line up? */
+			if ((tmp & GITS_BASER_SHARE_MASK) !=
+			    (reg & GITS_BASER_SHARE_MASK)) {
+				share = (tmp & GITS_BASER_SHARE_MASK) >>
+				    GITS_BASER_SHARE_SHIFT;
+				continue;
+			}
+
+			if ((tmp & GITS_BASER_PSZ_MASK) !=
+			    (reg & GITS_BASER_PSZ_MASK)) {
+				switch (page_size) {
+				case PAGE_SIZE_16K:
+					page_size = PAGE_SIZE;
+					continue;
+				case PAGE_SIZE_64K:
+					page_size = PAGE_SIZE_16K;
+					continue;
+				}
+			}
+
+			if (tmp != reg) {
+				device_printf(dev, "GITS_BASER%d: "
+				    "unable to be updated: %lx != %lx\n",
+				    i, reg, tmp);
+				return (ENXIO);
+			}
+
+			/* We should have made all needed changes */
+			break;
+		}
+	}
+
+	return (0);
+}
+
+static void
+gicv3_its_conftable_init(struct gicv3_its_softc *sc)
+{
+
+	sc->sc_conf_base = (vm_offset_t)contigmalloc(LPI_CONFTAB_SIZE,
+	    M_GICV3_ITS, M_WAITOK, 0, LPI_CONFTAB_MAX_ADDR, LPI_CONFTAB_ALIGN,
+	    0);
+
+	/* Set the default configuration */
+	memset((void *)sc->sc_conf_base, GIC_PRIORITY_MAX | LPI_CONF_GROUP1,
+	    LPI_CONFTAB_SIZE);
+
+	/* Flush the table to memory */
+	cpu_dcache_wb_range(sc->sc_conf_base, LPI_CONFTAB_SIZE);
+}
+
+static void
+gicv3_its_pendtables_init(struct gicv3_its_softc *sc)
+{
+	int i;
+
+	for (i = 0; i < mp_ncpus; i++) {
+		if (CPU_ISSET(i, &all_cpus) == 0)
+			continue;
+
+		sc->sc_pend_base[i] = (vm_offset_t)contigmalloc(
+		    LPI_PENDTAB_SIZE, M_GICV3_ITS, M_WAITOK | M_ZERO,
+		    0, LPI_PENDTAB_MAX_ADDR, LPI_PENDTAB_ALIGN, 0);
+
+		/* Flush so the ITS can see the memory */
+		cpu_dcache_wb_range((vm_offset_t)sc->sc_pend_base,
+		    LPI_PENDTAB_SIZE);
+	}
+}
+
+static int
+its_init_cpu(device_t dev, struct gicv3_its_softc *sc)
+{
+	device_t gicv3;
+	vm_paddr_t target;
+	uint64_t xbaser, tmp;
+	uint32_t ctlr;
+	u_int cpuid;
+
+	gicv3 = device_get_parent(dev);
+	cpuid = PCPU_GET(cpuid);
+
+	/* Check if the ITS is enabled on this CPU */
+	if ((gic_r_read_4(gicv3, GICR_TYPER) & GICR_TYPER_PLPIS) == 0) {
+		return (ENXIO);
+	}
+
+	/* Disable LPIs */
+	ctlr = gic_r_read_4(gicv3, GICR_CTLR);
+	ctlr &= ~GICR_CTLR_LPI_ENABLE;
+	gic_r_write_4(gicv3, GICR_CTLR, ctlr);
+
+	/* Make sure changes are observable my the GIC */
+	dsb(sy);
+
+	/*
+	 * Set the redistributor base
+	 */
+	xbaser = vtophys(sc->sc_conf_base) |
+	    (GICR_PROPBASER_SHARE_IS << GICR_PROPBASER_SHARE_SHIFT) |
+	    (GICR_PROPBASER_CACHE_NIWAWB << GICR_PROPBASER_CACHE_SHIFT) |
+	    (flsl(LPI_CONFTAB_SIZE | GIC_FIRST_LPI) - 1);
+	gic_r_write_8(gicv3, GICR_PROPBASER, xbaser);
+
+	/* Check the cache attributes we set */
+	tmp = gic_r_read_8(gicv3, GICR_PROPBASER);
+
+	if ((tmp & GICR_PROPBASER_SHARE_MASK) !=
+	    (xbaser & GICR_PROPBASER_SHARE_MASK)) {
+		if ((tmp & GICR_PROPBASER_SHARE_MASK) ==
+		    (GICR_PROPBASER_SHARE_NS << GICR_PROPBASER_SHARE_SHIFT)) {
+			/* We need to mark as non-cacheable */
+			xbaser &= ~(GICR_PROPBASER_SHARE_MASK |
+			    GICR_PROPBASER_CACHE_MASK);
+			/* Non-cacheable */
+			xbaser |= GICR_PROPBASER_CACHE_NIN <<
+			    GICR_PROPBASER_CACHE_SHIFT;
+			/* Non-sareable */
+			xbaser |= GICR_PROPBASER_SHARE_NS <<
+			    GICR_PROPBASER_SHARE_SHIFT;
+			gic_r_write_8(gicv3, GICR_PROPBASER, xbaser);
+		}
+		sc->sc_its_flags |= ITS_FLAGS_LPI_CONF_FLUSH;
+	}
+
+	/*
+	 * Set the LPI pending table base
+	 */
+	xbaser = vtophys(sc->sc_pend_base[cpuid]) |
+	    (GICR_PENDBASER_CACHE_NIWAWB << GICR_PENDBASER_CACHE_SHIFT) |
+	    (GICR_PENDBASER_SHARE_IS << GICR_PENDBASER_SHARE_SHIFT);
+
+	gic_r_write_8(gicv3, GICR_PENDBASER, xbaser);
+
+	tmp = gic_r_read_8(gicv3, GICR_PENDBASER);
+
+	if ((tmp & GICR_PENDBASER_SHARE_MASK) ==
+	    (GICR_PENDBASER_SHARE_NS << GICR_PENDBASER_SHARE_SHIFT)) {
+		/* Clear the cahce and shareability bits */
+		xbaser &= ~(GICR_PENDBASER_CACHE_MASK |
+		    GICR_PENDBASER_SHARE_MASK);
+		/* Mark as non-shareable */
+		xbaser |= GICR_PENDBASER_SHARE_NS << GICR_PENDBASER_SHARE_SHIFT;
+		/* And non-cacheable */
+		xbaser |= GICR_PENDBASER_CACHE_NIN <<
+		    GICR_PENDBASER_CACHE_SHIFT;
+	}
+
+	/* Enable LPIs */
+	ctlr = gic_r_read_4(gicv3, GICR_CTLR);
+	ctlr |= GICR_CTLR_LPI_ENABLE;
+	gic_r_write_4(gicv3, GICR_CTLR, ctlr);
+
+	/* Make sure the GIC has seen everything */
+	dsb(sy);
+
+	if ((gic_its_read_8(sc, GITS_TYPER) & GITS_TYPER_PTA) != 0) {
+		/* This ITS wants the redistributor physical address */
+		target = vtophys(gicv3_get_redist_vaddr(dev));
+	} else {
+		/* This ITS wants the unique processor number */
+		target = GICR_TYPER_CPUNUM(gic_r_read_8(gicv3, GICR_TYPER));
+	}
+
+	sc->sc_its_cols[cpuid]->col_target = target;
+	sc->sc_its_cols[cpuid]->col_id = cpuid;
+
+	its_cmd_mapc(dev, sc->sc_its_cols[cpuid], 1);
+	its_cmd_invall(dev, sc->sc_its_cols[cpuid]);
+
+	return (0);
+}
+
+static int
+gicv3_its_attach(device_t dev)
+{
+	struct gicv3_its_softc *sc;
+	const char *name;
+	uint32_t iidr;
+	int err, i, rid;
+
+	sc = device_get_softc(dev);
+
+	rid = 0;
+	sc->sc_its_res = bus_alloc_resource_any(dev, SYS_RES_MEMORY, &rid,
+	    RF_ACTIVE);
+	if (sc->sc_its_res == NULL) {
+		device_printf(dev, "Could not allocate memory\n");
+		return (ENXIO);
+	}
+
+	iidr = gic_its_read_4(sc, GITS_IIDR);
+	for (i = 0; i < nitems(its_quirks); i++) {
+		if ((iidr & its_quirks[i].iidr_mask) == its_quirks[i].iidr) {
+			if (bootverbose) {
+				device_printf(dev, "Applying %s\n",
+				    its_quirks[i].desc);
+			}
+			its_quirks[i].func(dev);
+			break;
+		}
+	}
+
+	/* Allocate the private tables */
+	err = gicv3_its_table_init(dev, sc);
+	if (err != 0)
+		return (err);
+
+	/* Protects access to the device list */
+	mtx_init(&sc->sc_its_dev_lock, "ITS device lock", NULL, MTX_SPIN);
+
+	/* Protects access to the ITS command circular buffer. */
+	mtx_init(&sc->sc_its_cmd_lock, "ITS cmd lock", NULL, MTX_SPIN);
+
+	/* Allocate the command circular buffer */
+	gicv3_its_cmdq_init(sc);
+
+	/* Allocate the per-CPU collections */
+	for (int cpu = 0; cpu < mp_ncpus; cpu++)
+		if (CPU_ISSET(cpu, &all_cpus) != 0)
+			sc->sc_its_cols[cpu] = malloc(
+			    sizeof(*sc->sc_its_cols[0]), M_GICV3_ITS,
+			    M_WAITOK | M_ZERO);
+		else
+			sc->sc_its_cols[cpu] = NULL;
+
+	/* Enable the ITS */
+	gic_its_write_4(sc, GITS_CTLR,
+	    gic_its_read_4(sc, GITS_CTLR) | GITS_CTLR_EN);
+
+	/* Create the LPI configuration table */
+	gicv3_its_conftable_init(sc);
+
+	/* And the pending tebles */
+	gicv3_its_pendtables_init(sc);
+
+	/* Enable LPIs on this CPU */
+	its_init_cpu(dev, sc);
+
+	TAILQ_INIT(&sc->sc_its_dev_list);
+
+	/*
+	 * Create the vmem object to allocate IRQs from. We try to use all
+	 * IRQs not already used by the GICv3.
+	 * XXX: This assumes there are no other interrupt controllers in the
+	 * system.
+	 */
+	sc->sc_irq_alloc = vmem_create("GICv3 ITS IRQs", 0,
+	    NIRQ - gicv3_get_nirqs(dev), 1, 1, M_FIRSTFIT | M_WAITOK);
+
+	sc->sc_irqs = malloc(sizeof(*sc->sc_irqs) * LPI_NIRQS, M_GICV3_ITS,
+	    M_WAITOK | M_ZERO);
+	name = device_get_nameunit(dev);
+	for (i = 0; i < LPI_NIRQS; i++) {
+		sc->sc_irqs[i].gi_irq = i;
+		err = intr_isrc_register(&sc->sc_irqs[i].gi_isrc, dev, 0,
+		    "%s,%u", name, i);
+	}
+
+	return (0);
+}
+
+static int
+gicv3_its_detach(device_t dev)
+{
+
+	return (ENXIO);
+}
+
+static void
+its_quirk_cavium_22375(device_t dev)
+{
+	struct gicv3_its_softc *sc;
+
+	sc = device_get_softc(dev);

*** DIFF OUTPUT TRUNCATED AT 1000 LINES ***



Want to link to this message? Use this URL: <https://mail-archive.FreeBSD.org/cgi/mid.cgi?201606031028.u53AS64t058415>