/*      $NetBSD: rmixl_fmn.c,v 1.5 2023/08/11 07:05:39 mrg Exp $        */
/*-
* Copyright (c) 2010 The NetBSD Foundation, Inc.
* All rights reserved.
*
* This code is derived from software contributed to The NetBSD Foundation
* by Cliff Neighbors.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
*    notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
*    notice, this list of conditions and the following disclaimer in the
*    documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
* ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
* TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
* PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
* BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
* INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
* CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
* POSSIBILITY OF SUCH DAMAGE.
*/

#include "opt_ddb.h"

#include <sys/cdefs.h>
#include <sys/param.h>
#include <sys/systm.h>
#include <sys/cpu.h>
#include <mips/cpuregs.h>
#include <mips/rmi/rmixlreg.h>
#include <mips/rmi/rmixlvar.h>
#include <mips/rmi/rmixl_intr.h>
#include <mips/rmi/rmixl_fmnvar.h>

#ifdef FMN_DEBUG
# define DPRINTF(x)     do { printf x ; } while(0)
#else
# define DPRINTF(x)
#endif

#ifdef DIAGNOSTIC
# define DIAG_PRF(x)    do { printf x ; } while(0)
#else
# define DIAG_PRF(x)
#endif



/*
* index CPU-dependent table by (global) bucket ID to obtain logical Station ID
* see Table 12.1 in the XLS PRM
*/
/* use this table for XLS6xx, XLS4xx */
static const int station_xls_4xx[] = {
       [0 ... 7]       = RMIXLS_FMN_STID_CORE0,
       [8 ... 15]      = RMIXLS_FMN_STID_CORE1,
       [16 ... 23]     = RMIXLS_FMN_STID_CORE2,
       [24 ... 31]     = RMIXLS_FMN_STID_CORE3,
       [32 ... 63]     = RMIXLS_FMN_STID_RESERVED,
       [64 ... 71]     = RMIXLS_FMN_STID_PCIE,
       [72 ... 79]     = RMIXLS_FMN_STID_RESERVED,
       [80 ... 87]     = RMIXLS_FMN_STID_GMAC_Q1,
       [88 ... 95]     = RMIXLS_FMN_STID_RESERVED,
       [96 ... 103]    = RMIXLS_FMN_STID_GMAC_Q0,
       [104 ... 107]   = RMIXLS_FMN_STID_DMA,
       [108 ... 109]   = RMIXLS_FMN_STID_CDE,
       [110 ... 119]   = RMIXLS_FMN_STID_RESERVED,
       [120 ... 127]   = RMIXLS_FMN_STID_SAE,
};

/* use this table for XLS408Lite, XLS404Lite */
static const int station_xls_4xx_lite[] = {
       [0 ... 7]       = RMIXLS_FMN_STID_CORE0,
       [8 ... 15]      = RMIXLS_FMN_STID_CORE1,
       [16 ... 23]     = RMIXLS_FMN_STID_CORE2,
       [24 ... 31]     = RMIXLS_FMN_STID_CORE3,
       [32 ... 79]     = RMIXLS_FMN_STID_RESERVED,
       [80 ... 87]     = RMIXLS_FMN_STID_GMAC_Q1,
       [88 ... 95]     = RMIXLS_FMN_STID_RESERVED,
       [96 ... 103]    = RMIXLS_FMN_STID_GMAC_Q0,
       [104 ... 107]   = RMIXLS_FMN_STID_DMA,
       [108 ... 109]   = RMIXLS_FMN_STID_CDE,
       [110 ... 115]   = RMIXLS_FMN_STID_RESERVED,
       [116 ... 119]   = RMIXLS_FMN_STID_PCIE,
       [120 ... 127]   = RMIXLS_FMN_STID_SAE,
};

/* use this table for XLS2xx */
static const int station_xls_2xx[] = {
       [0 ... 7]       = RMIXLS_FMN_STID_CORE0,
       [8 ... 15]      = RMIXLS_FMN_STID_CORE1,
       [16 ... 23]     = RMIXLS_FMN_STID_CORE2,
       [24 ... 31]     = RMIXLS_FMN_STID_CORE3,
       [32 ... 63]     = RMIXLS_FMN_STID_RESERVED,
       [64 ... 71]     = RMIXLS_FMN_STID_PCIE,
       [72 ... 95]     = RMIXLS_FMN_STID_RESERVED,
       [96 ... 103]    = RMIXLS_FMN_STID_GMAC_Q0,
       [104 ... 107]   = RMIXLS_FMN_STID_DMA,
       [108 ... 119]   = RMIXLS_FMN_STID_RESERVED,
       [120 ... 127]   = RMIXLS_FMN_STID_SAE,
};

/* use this table for XLS1xx */
static const int station_xls_1xx[] = {
       [0 ... 7]       = RMIXLS_FMN_STID_CORE0,
       [8 ... 15]      = RMIXLS_FMN_STID_CORE1,
       [16 ... 23]     = RMIXLS_FMN_STID_CORE2,
       [24 ... 31]     = RMIXLS_FMN_STID_CORE3,
       [32 ... 63]     = RMIXLS_FMN_STID_RESERVED,
       [64 ... 71]     = RMIXLS_FMN_STID_PCIE,
       [72 ... 95]     = RMIXLS_FMN_STID_RESERVED,
       [96 ... 101]    = RMIXLS_FMN_STID_GMAC_Q0,
       [102 ... 103]   = RMIXLS_FMN_STID_RESERVED,
       [104 ... 107]   = RMIXLS_FMN_STID_DMA,
       [108 ... 119]   = RMIXLS_FMN_STID_RESERVED,
       [120 ... 127]   = RMIXLS_FMN_STID_SAE,
};

/* use this table for XLRxxx */
static const int station_xlr_xxx[] = {
       [0 ... 7]       = RMIXLR_FMN_STID_CORE0,
       [8 ... 15]      = RMIXLR_FMN_STID_CORE1,
       [16 ... 23]     = RMIXLR_FMN_STID_CORE2,
       [24 ... 31]     = RMIXLR_FMN_STID_CORE3,
       [32 ... 39]     = RMIXLR_FMN_STID_CORE4,
       [40 ... 47]     = RMIXLR_FMN_STID_CORE5,
       [48 ... 55]     = RMIXLR_FMN_STID_CORE6,
       [56 ... 63]     = RMIXLR_FMN_STID_CORE7,
       [64 ... 79]     = RMIXLR_FMN_STID_TXRX_0,
       [80 ... 95]     = RMIXLR_FMN_STID_TXRX_1,
       [96 ... 103]    = RMIXLR_FMN_STID_RGMII,
       [104 ... 107]   = RMIXLR_FMN_STID_DMA,
       [108 ... 111]   = RMIXLR_FMN_STID_RESERVED,
       [112 ... 113]   = RMIXLR_FMN_STID_FREE_0,
       [114 ... 115]   = RMIXLR_FMN_STID_FREE_0,
       [116 ... 119]   = RMIXLR_FMN_STID_RESERVED,
       [120 ... 127]   = RMIXLR_FMN_STID_SAE,
};

typedef struct fmn_station_info {
       const char     *si_name;
       const u_int     si_buckets_max;
       const u_int     si_stid_first;
       const u_int     si_stid_last;
       const u_int     si_bucket_size_dflt;
       const u_int     si_credits_min;
       const u_int     si_regbase;
} fmn_station_info_t;

/* use this table for XLS6xx, XLS4xx */
static const fmn_station_info_t station_info_xls_4xx[RMIXLS_FMN_NSTID] = {
       [RMIXLS_FMN_STID_CORE0]   = { "core0",  8,   0,   7,  32, 4, 0 },
       [RMIXLS_FMN_STID_CORE1]   = { "core1",  8,   8,  15,  32, 4, 0 },
       [RMIXLS_FMN_STID_CORE2]   = { "core2",  8,  16,  23,  32, 4, 0 },
       [RMIXLS_FMN_STID_CORE3]   = { "core3",  8,  24,  31,  32, 4, 0 },
       [RMIXLS_FMN_STID_GMAC_Q0] = { "gmac_q0",        3,  80,  87,  32, 0, RMIXL_IO_DEV_GMAC_0 },
       [RMIXLS_FMN_STID_GMAC_Q1] = { "gmac_q1",        3,  96, 103,  32, 0, RMIXL_IO_DEV_GMAC_4 },
       [RMIXLS_FMN_STID_DMA]     = { "dma",    4, 104, 107,  64, 0, RMIXL_IO_DEV_DMA },
       [RMIXLS_FMN_STID_CDE]     = { "cde",    4, 108, 109, 128, 0, RMIXL_IO_DEV_CDE },
       [RMIXLS_FMN_STID_PCIE]    = { "pcie",   8,  64,  71,  32, 0, RMIXL_IO_DEV_PCIE_BE },
       [RMIXLS_FMN_STID_SAE]     = { "sae",    2, 120, 121, 128, 0, RMIXL_IO_DEV_SAE },
};

/* use this table for XLS4xxLite */
static const fmn_station_info_t station_info_xls_4xx_lite[RMIXLS_FMN_NSTID] = {
       [RMIXLS_FMN_STID_CORE0]   = { "core0",  8,   0,   7,  32, 4, 0 },
       [RMIXLS_FMN_STID_CORE1]   = { "core1",  8,   8,  15,  32, 4, 0 },
       [RMIXLS_FMN_STID_CORE2]   = { "core2",  8,  16,  23,  32, 4, 0 },
       [RMIXLS_FMN_STID_CORE3]   = { "core3",  8,  24,  31,  32, 4, 0 },
       [RMIXLS_FMN_STID_GMAC_Q0] = { "gmac_q0",        3,  80,  87,  32, 0, RMIXL_IO_DEV_GMAC_0 },
       [RMIXLS_FMN_STID_GMAC_Q1] = { "gmac_q1",        3,  96, 103,  32, 0, RMIXL_IO_DEV_GMAC_4 },
       [RMIXLS_FMN_STID_DMA]     = { "dma",    4, 104, 107,  64, 0, RMIXL_IO_DEV_DMA },
       [RMIXLS_FMN_STID_CDE]     = { "cde",    4, 108, 109, 128, 0, RMIXL_IO_DEV_CDE },
       [RMIXLS_FMN_STID_PCIE]    = { "pcie",   4, 116, 119,  64, 0, RMIXL_IO_DEV_PCIE_BE },
       [RMIXLS_FMN_STID_SAE]     = { "sae",    2, 120, 121, 128, 0, RMIXL_IO_DEV_SAE },
};

/* use this table for XLS2xx */
static const fmn_station_info_t station_info_xls_2xx[RMIXLS_FMN_NSTID] = {
       [RMIXLS_FMN_STID_CORE0]   = { "core0",  8,   0,   7,  32, 4, 0 },
       [RMIXLS_FMN_STID_CORE1]   = { "core1",  8,   8,  15,  32, 4, 0 },
       [RMIXLS_FMN_STID_CORE2]   = { "core2",  8,  16,  23,  32, 4, 0 },
       [RMIXLS_FMN_STID_CORE3]   = { "core3",  8,  24,  31,  32, 4, 0 },
       [RMIXLS_FMN_STID_GMAC_Q0] = { "gmac_q0",        3,  96, 103,  32, 0, RMIXL_IO_DEV_GMAC_0 },
       [RMIXLS_FMN_STID_DMA]     = { "dma",    4, 104, 107,  64, 0, RMIXL_IO_DEV_DMA },
       [RMIXLS_FMN_STID_PCIE]    = { "pcie",   8,  64,  71,  32, 0, RMIXL_IO_DEV_PCIE_BE },
       [RMIXLS_FMN_STID_SAE]     = { "sae",    2, 120, 121, 128, 0, RMIXL_IO_DEV_SAE },
};

/* use this table for XLS1xx */
static const fmn_station_info_t station_info_xls_1xx[RMIXLS_FMN_NSTID] = {
       [RMIXLS_FMN_STID_CORE0]   = { "core0",  8,   0,   7,  32, 4, 0 },
       [RMIXLS_FMN_STID_CORE1]   = { "core1",  8,   8,  15,  32, 4, 0 },
       [RMIXLS_FMN_STID_CORE2]   = { "core2",  8,  16,  23,  32, 4, 0 },
       [RMIXLS_FMN_STID_CORE3]   = { "core3",  8,  24,  31,  32, 4, 0 },
       [RMIXLS_FMN_STID_GMAC_Q0] = { "gmac_q0",        3,  96, 101,  32, 0, RMIXL_IO_DEV_GMAC_0 },
       [RMIXLS_FMN_STID_DMA]     = { "dma",    4, 104, 107,  64, 0, RMIXL_IO_DEV_PCIE_BE },
       [RMIXLS_FMN_STID_PCIE]    = { "pcie",   4,  64,  67,  32, 0, RMIXL_IO_DEV_PCIE_BE },
       [RMIXLS_FMN_STID_SAE]     = { "sae",    2, 120, 121, 128, 0, RMIXL_IO_DEV_SAE },
};

/*
* use this table for XLRxxx
* caution:
* - the XGMII/SPI4 stations si_regbase are 'special'
* - the RGMII station si_regbase is 'special'
*/
static const fmn_station_info_t station_info_xlr_xxx[RMIXLR_FMN_NSTID] = {
       [RMIXLR_FMN_STID_CORE0]   = { "core0",  8,   0,   7,  32, 4, 0 },
       [RMIXLR_FMN_STID_CORE1]   = { "core1",  8,   8,  15,  32, 4, 0 },
       [RMIXLR_FMN_STID_CORE2]   = { "core2",  8,  16,  23,  32, 4, 0 },
       [RMIXLR_FMN_STID_CORE3]   = { "core3",  8,  24,  31,  32, 4, 0 },
       [RMIXLR_FMN_STID_CORE4]   = { "core4",  8,  32,  39,  32, 4, 0 },
       [RMIXLR_FMN_STID_CORE5]   = { "core5",  8,  40,  47,  32, 4, 0 },
       [RMIXLR_FMN_STID_CORE6]   = { "core6",  8,  48,  55,  32, 4, 0 },
       [RMIXLR_FMN_STID_CORE7]   = { "core7",  8,  56,  63,  32, 4, 0 },
       [RMIXLR_FMN_STID_TXRX_0]  = { "txrx0",  1,  64,  79,  16, 0, RMIXL_IO_DEV_XGMAC_A },
       [RMIXLR_FMN_STID_TXRX_1]  = { "txrx1",  1,  80,  95,  16, 0, RMIXL_IO_DEV_XGMAC_B },
       [RMIXLR_FMN_STID_RGMII]   = { "rgmii",  8,  96, 103,  32, 0, RMIXL_IO_DEV_GMAC_A },
       [RMIXLR_FMN_STID_DMA]     = { "dma",    4, 104, 107,  64, 0, RMIXL_IO_DEV_DMA },
       [RMIXLR_FMN_STID_FREE_0]  = { "free0",  2, 112, 113, 128, 0, RMIXL_IO_DEV_XGMAC_A },
       [RMIXLR_FMN_STID_FREE_1]  = { "free1",  2, 114, 115, 128, 0, RMIXL_IO_DEV_XGMAC_B },
       [RMIXLR_FMN_STID_SAE]     = { "sae",    5, 120, 124,  32, 0, RMIXL_IO_DEV_SAE },
};


typedef struct fmn_intrhand {
       int             (*ih_func)(void *, rmixl_fmn_rxmsg_t *);
       void            *ih_arg;
       struct evcnt    ih_count;
} fmn_intrhand_t;

/*
* per-core FMN structure
*/
typedef struct fmn {
       kmutex_t                       *fmn_lock;
       u_int                           fmn_core;
       u_int                           fmn_thread;
       u_int                           fmn_nstid;
       const int                      *fmn_stidtab;
       const fmn_station_info_t       *fmn_stinfo;
       void                           *fmn_ih;
       fmn_intrhand_t                  fmn_intrhand[RMIXL_FMN_NSTID];
} fmn_t;

static fmn_t fmn_store[1 << 10];        /* index by cpuid) *//* XXX assumes 1 node */
#define NFMN    (sizeof(fmn_store) / sizeof(fmn_store[0]))

static fmn_t *
fmn_lookup(cpuid_t cpuid)
{
       KASSERT(cpuid < (cpuid_t)NFMN);
       return &fmn_store[cpuid];
}

static void rmixl_fmn_init_core_xlr(fmn_t *);
static void rmixl_fmn_init_core_xls(fmn_t *);
static void     rmixl_fmn_config_noncore(fmn_t *);
static void     rmixl_fmn_config_core(fmn_t *);
#ifdef NOTYET
static int      rmixl_fmn_intr_dispatch(void *);
#endif  /* NOTYET */
static int      rmixl_fmn_msg_recv_subr(u_int, rmixl_fmn_rxmsg_t *);

#ifdef FMN_DEBUG
void    rmixl_fmn_cp2_dump(void);
void    rmixl_fmn_cc_dump(void);
#endif

/*
* macros used because mtc2, mfc2, dmtc2, dmfc2 instructions
* must use literal values for rd and sel operands
* so let the compiler sort it out
*/

/*
* write v to all 8 SELs for given RD
*/
#define FMN_CP2_4SEL_READ(rd, sel, vp)                                  \
       do {                                                            \
               uint32_t *rp = vp;                                      \
               RMIXL_MFC2(rd, sel,   rp[0]);                           \
               RMIXL_MFC2(rd, sel+1, rp[1]);                           \
               RMIXL_MFC2(rd, sel+2, rp[2]);                           \
               RMIXL_MFC2(rd, sel+3, rp[3]);                           \
       } while (0)

/*
* write v to all 8 SELs for given RD
*/
#define FMN_CP2_4SEL_WRITE(rd, sel, v)                                  \
       do {                                                            \
               RMIXL_MTC2(rd, sel,   v);                               \
               RMIXL_MTC2(rd, sel+1, v);                               \
               RMIXL_MTC2(rd, sel+2, v);                               \
               RMIXL_MTC2(rd, sel+3, v);                               \
       } while (0)

#define FMN_CP2_8SEL_WRITE(rd, v)                                       \
       do {                                                            \
               RMIXL_MTC2(rd, 0, v);                                   \
               RMIXL_MTC2(rd, 1, v);                                   \
               RMIXL_MTC2(rd, 2, v);                                   \
               RMIXL_MTC2(rd, 3, v);                                   \
               RMIXL_MTC2(rd, 4, v);                                   \
               RMIXL_MTC2(rd, 5, v);                                   \
               RMIXL_MTC2(rd, 6, v);                                   \
               RMIXL_MTC2(rd, 7, v);                                   \
       } while (0)


#define FMN_CP2_SEL_CASE_READ(rd, sel, v)                               \
       case sel:                                                       \
               RMIXL_MFC2(rd, sel, v);                                 \
               break
#define FMN_CP2_SEL_CASE_WRITE(rd, sel, v)                              \
       case sel:                                                       \
               RMIXL_MTC2(rd, sel, v);                                 \
               break
/*
* read/write a single arbitrary sel for the given rd
*/
#define FMN_CP2_SEL_SWITCH_RW(rw, rd, sel, val)                         \
       do {                                                            \
               switch (sel) {                                          \
                       FMN_CP2_SEL_CASE_ ## rw(rd, 0, val);            \
                       FMN_CP2_SEL_CASE_ ## rw(rd, 1, val);            \
                       FMN_CP2_SEL_CASE_ ## rw(rd, 2, val);            \
                       FMN_CP2_SEL_CASE_ ## rw(rd, 3, val);            \
                       FMN_CP2_SEL_CASE_ ## rw(rd, 4, val);            \
                       FMN_CP2_SEL_CASE_ ## rw(rd, 5, val);            \
                       FMN_CP2_SEL_CASE_ ## rw(rd, 6, val);            \
                       FMN_CP2_SEL_CASE_ ## rw(rd, 7, val);            \
                       default:                                        \
                               panic("%s:%d: bad sel %d\n",            \
                                       __func__, __LINE__, sel);       \
               }                                                       \
       } while (0)

#define FMN_CP2_RD_CASE_RW(rw, rd, sel, val)                            \
       case rd:                                                        \
               FMN_CP2_SEL_SWITCH_RW(rw, rd, sel, val);                \
               break
/*
* read/write a single arbitrary Credit Counter at (rd, sel)
* eg:
*      FMN_CP2_RD_SWITCH_RW(READ,  16, 2, val)
*      FMN_CP2_RD_SWITCH_RW(WRITE, 18, 0, val)
*/
#define FMN_CP2_RD_SWITCH_RW(rw, rd, sel, val)                          \
       do {                                                            \
               switch(rd) {                                            \
                       FMN_CP2_RD_CASE_RW(rw, 0,  sel, val);           \
                       FMN_CP2_RD_CASE_RW(rw, 1,  sel, val);           \
                       FMN_CP2_RD_CASE_RW(rw, 2,  sel, val);           \
                       FMN_CP2_RD_CASE_RW(rw, 3,  sel, val);           \
                       FMN_CP2_RD_CASE_RW(rw, 4,  sel, val);           \
                       FMN_CP2_RD_CASE_RW(rw, 5,  sel, val);           \
                       FMN_CP2_RD_CASE_RW(rw, 6,  sel, val);           \
                       FMN_CP2_RD_CASE_RW(rw, 7,  sel, val);           \
                       FMN_CP2_RD_CASE_RW(rw, 8,  sel, val);           \
                       FMN_CP2_RD_CASE_RW(rw, 9,  sel, val);           \
                       FMN_CP2_RD_CASE_RW(rw, 10, sel, val);           \
                       FMN_CP2_RD_CASE_RW(rw, 11, sel, val);           \
                       FMN_CP2_RD_CASE_RW(rw, 12, sel, val);           \
                       FMN_CP2_RD_CASE_RW(rw, 13, sel, val);           \
                       FMN_CP2_RD_CASE_RW(rw, 14, sel, val);           \
                       FMN_CP2_RD_CASE_RW(rw, 15, sel, val);           \
                       FMN_CP2_RD_CASE_RW(rw, 16, sel, val);           \
                       FMN_CP2_RD_CASE_RW(rw, 17, sel, val);           \
                       FMN_CP2_RD_CASE_RW(rw, 18, sel, val);           \
                       FMN_CP2_RD_CASE_RW(rw, 19, sel, val);           \
                       FMN_CP2_RD_CASE_RW(rw, 20, sel, val);           \
                       FMN_CP2_RD_CASE_RW(rw, 21, sel, val);           \
                       FMN_CP2_RD_CASE_RW(rw, 22, sel, val);           \
                       FMN_CP2_RD_CASE_RW(rw, 23, sel, val);           \
                       FMN_CP2_RD_CASE_RW(rw, 24, sel, val);           \
                       FMN_CP2_RD_CASE_RW(rw, 25, sel, val);           \
                       FMN_CP2_RD_CASE_RW(rw, 26, sel, val);           \
                       FMN_CP2_RD_CASE_RW(rw, 27, sel, val);           \
                       FMN_CP2_RD_CASE_RW(rw, 28, sel, val);           \
                       FMN_CP2_RD_CASE_RW(rw, 29, sel, val);           \
                       FMN_CP2_RD_CASE_RW(rw, 30, sel, val);           \
                       FMN_CP2_RD_CASE_RW(rw, 31, sel, val);           \
                       default:                                        \
                               panic("%s:%d: bad regno %d\n",          \
                                       __func__, __LINE__, rd);        \
               }                                                       \
       } while (0)


void
rmixl_fmn_init(void)
{
       int cpu;
       fmn_t *fmnp;
       static bool once=false;

       KASSERTMSG((CPU_IS_PRIMARY(curcpu())), "ci=%p, index=%d\n",
               curcpu(), cpu_index(curcpu()));
       fmnp = fmn_lookup(curcpu()->ci_cpuid);

       if (once == true)
               panic("%s: call only once!", __func__);
       once = true;

       for (cpu=0; cpu < NFMN; cpu++) {
               fmnp[cpu].fmn_core = RMIXL_CPU_CORE(cpu);
               fmnp[cpu].fmn_thread = RMIXL_CPU_THREAD(cpu);
       }

       rmixl_fmn_init_core();          /* for initial boot cpu (#0) */
       rmixl_fmn_config_noncore(fmnp); /* boot cpu initializes noncore */
}

/*
* link to TX station ID table for RMI XLR type chip
*/
static void
rmixl_fmn_init_core_xlr(fmn_t *fmnp)
{
       fmnp->fmn_nstid = RMIXLR_FMN_NSTID;
       fmnp->fmn_stidtab = station_xlr_xxx;
       fmnp->fmn_stinfo = station_info_xlr_xxx;
}

/*
* link to TX station ID table for RMI XLS type chip
*/
static void
rmixl_fmn_init_core_xls(fmn_t *fmnp)
{
       const fmn_station_info_t *info = NULL;
       const int *tab = NULL;

       switch (MIPS_PRID_IMPL(mips_options.mips_cpu_id)) {
       case MIPS_XLS104:
       case MIPS_XLS108:
               tab = station_xls_1xx;
               info = station_info_xls_1xx;
               break;
       case MIPS_XLS204:
       case MIPS_XLS208:
               tab = station_xls_2xx;
               info = station_info_xls_2xx;
               break;
       case MIPS_XLS404:
       case MIPS_XLS408:
       case MIPS_XLS416:
       case MIPS_XLS608:
       case MIPS_XLS616:
               tab = station_xls_4xx;
               info = station_info_xls_4xx;
               break;
       case MIPS_XLS404LITE:
       case MIPS_XLS408LITE:
               tab = station_xls_4xx_lite;
               info = station_info_xls_4xx_lite;
               break;
       default:
               panic("%s: unknown PRID IMPL %#x\n", __func__,
                       MIPS_PRID_IMPL(mips_options.mips_cpu_id));
       }

       fmnp->fmn_nstid = RMIXLS_FMN_NSTID;
       fmnp->fmn_stidtab = tab;
       fmnp->fmn_stinfo = info;
}

void
rmixl_fmn_init_core(void)
{
       fmn_t *fmnp;
       kmutex_t *lk;

       fmnp = fmn_lookup(curcpu()->ci_cpuid);
       KASSERT(fmnp != NULL);
       KASSERT(fmnp->fmn_core == RMIXL_CPU_CORE(curcpu()->ci_cpuid));
       KASSERT(fmnp->fmn_thread == RMIXL_CPU_THREAD(curcpu()->ci_cpuid));

       lk = mutex_obj_alloc(MUTEX_DEFAULT, RMIXL_FMN_INTR_IPL);
       if (lk == NULL)
               panic("%s: mutex_obj_alloc failed", __func__);
       fmnp->fmn_lock = lk;

       mutex_enter(fmnp->fmn_lock);

       /*
        * do chip-dependent per-core FMN initialization
        */
       switch(cpu_rmixl_chip_type(mips_options.mips_cpu)) {
       case CIDFL_RMI_TYPE_XLR:
               rmixl_fmn_init_core_xlr(fmnp);
               break;
       case CIDFL_RMI_TYPE_XLS:
               rmixl_fmn_init_core_xls(fmnp);
               break;
       case CIDFL_RMI_TYPE_XLP:
               panic("%s: RMI XLP not yet supported", __func__);
       default:
               panic("%s: RMI chip type %#x unknown", __func__,
                       cpu_rmixl_chip_type(mips_options.mips_cpu));
       }

       /*
        * thread #0 for each core owns 'global' CP2 regs
        */
       if (fmnp->fmn_thread == 0)
               rmixl_fmn_config_core(fmnp);

       mutex_exit(fmnp->fmn_lock);
}

/*
* rmixl_fmn_config_noncore
*
*      initialize bucket sizes and (minimum) credits for non-core stations to ZERO
*      configured through memory write operations instead of CP2
*/
static void
rmixl_fmn_config_noncore(fmn_t *fmnp)
{
       for (u_int sid=0; sid < fmnp->fmn_nstid; sid++) {
               u_int regoff = fmnp->fmn_stinfo[sid].si_regbase;
               if (regoff != 0) {
                       u_int buckets_max = fmnp->fmn_stinfo[sid].si_buckets_max;
                       regoff += RMIXL_FMN_BS_FIRST;
                       for (u_int bucket=0; bucket < buckets_max; bucket++) {
                               RMIXL_IOREG_WRITE(regoff, 0);
                               regoff += sizeof(uint32_t);
                       }
               }
       }
}

/*
* rmixl_fmn_config_core
*
*      - assumes fmn_mutex is owned
*      - configure FMN
*      - initialize bucket sizes and (minimum) credits for a core
*/
static void
rmixl_fmn_config_core(fmn_t *fmnp)
{
       const fmn_station_info_t *info = fmnp->fmn_stinfo;
       uint32_t sts1;
       uint32_t cfg;
       uint32_t cp0_status;

       KASSERT(mutex_owned(fmnp->fmn_lock) != 0);
       KASSERT(fmnp->fmn_thread == 0);
       cp0_status = rmixl_cp2_enable();

       /* check/clear any pre-existing status1 error(s) */
       RMIXL_MFC2(RMIXL_COP_2_MSG_STS, 1, sts1);
       if ((sts1 & RMIXL_MSG_STS1_ERRS) != 0)
               RMIXL_MTC2(RMIXL_COP_2_MSG_STS, 1, sts1);

       /* set up MsgConfig reg */
       cfg = ((1 << RMIXL_MSG_CFG0_WMSHIFT)                    /* watermark */
           |  (RMIXL_INTRVEC_FMN << RMIXL_MSG_CFG0_IV_SHIFT)   /* irq */
           |  (1 << RMIXL_MSG_CFG0_ITM_SHIFT)                  /* thread mask */
           |   RMIXL_MSG_CFG0_WIE                              /* watermark intr enb */
           |   RMIXL_MSG_CFG0_EIE);                            /* rx not empty intr enb */
       RMIXL_DMTC2(RMIXL_COP_2_MSG_CFG, 0, cfg);

       /* disable trace mode, credit overrun intr, messaging errors intr */
       RMIXL_DMTC2(RMIXL_COP_2_MSG_CFG, 0, 0);

       /* XXX using 4 buckets per core */
       KASSERT(4 <= info->si_buckets_max);

       /*
        * initialize default sizes for core buckets
        * zero sizes for unused buckets
        */
       KASSERT(info->si_buckets_max == 8);
       uint32_t sz = info->si_bucket_size_dflt;
       KASSERT((sz & ~RMIXL_MSG_BSZ_SIZE) == 0);
       RMIXL_MTC2(RMIXL_COP_2_MSG_BSZ, 0, sz);
       RMIXL_MTC2(RMIXL_COP_2_MSG_BSZ, 1, sz);
       RMIXL_MTC2(RMIXL_COP_2_MSG_BSZ, 2, sz);
       RMIXL_MTC2(RMIXL_COP_2_MSG_BSZ, 3, sz);
       RMIXL_MTC2(RMIXL_COP_2_MSG_BSZ, 4, 0);
       RMIXL_MTC2(RMIXL_COP_2_MSG_BSZ, 5, 0);
       RMIXL_MTC2(RMIXL_COP_2_MSG_BSZ, 6, 0);
       RMIXL_MTC2(RMIXL_COP_2_MSG_BSZ, 7, 0);

       /*
        * configure minimum credits for each core, 4 buckets
        * zero all unused credit counters for this core
        */
       uint32_t cr = info->si_credits_min;

       FMN_CP2_4SEL_WRITE(RMIXL_COP_2_CREDITS,   0, cr);
       FMN_CP2_4SEL_WRITE(RMIXL_COP_2_CREDITS,   4,  0);
       FMN_CP2_4SEL_WRITE(RMIXL_COP_2_CREDITS+1, 0, cr);
       FMN_CP2_4SEL_WRITE(RMIXL_COP_2_CREDITS+1, 4,  0);
       FMN_CP2_4SEL_WRITE(RMIXL_COP_2_CREDITS+2, 0, cr);
       FMN_CP2_4SEL_WRITE(RMIXL_COP_2_CREDITS+2, 4,  0);
       FMN_CP2_4SEL_WRITE(RMIXL_COP_2_CREDITS+3, 0, cr);
       FMN_CP2_4SEL_WRITE(RMIXL_COP_2_CREDITS+3, 4,  0);

       FMN_CP2_8SEL_WRITE(RMIXL_COP_2_CREDITS+4,     0);
       FMN_CP2_8SEL_WRITE(RMIXL_COP_2_CREDITS+5,     0);
       FMN_CP2_8SEL_WRITE(RMIXL_COP_2_CREDITS+6,     0);
       FMN_CP2_8SEL_WRITE(RMIXL_COP_2_CREDITS+7,     0);
       FMN_CP2_8SEL_WRITE(RMIXL_COP_2_CREDITS+8,     0);
       FMN_CP2_8SEL_WRITE(RMIXL_COP_2_CREDITS+9,     0);
       FMN_CP2_8SEL_WRITE(RMIXL_COP_2_CREDITS+10,    0);
       FMN_CP2_8SEL_WRITE(RMIXL_COP_2_CREDITS+11,    0);
       FMN_CP2_8SEL_WRITE(RMIXL_COP_2_CREDITS+12,    0);
       FMN_CP2_8SEL_WRITE(RMIXL_COP_2_CREDITS+13,    0);
       FMN_CP2_8SEL_WRITE(RMIXL_COP_2_CREDITS+14,    0);
       FMN_CP2_8SEL_WRITE(RMIXL_COP_2_CREDITS+15,    0);

       RMIXL_MFC2(RMIXL_COP_2_MSG_STS, 1, sts1);
       KASSERT((sts1 & RMIXL_MSG_STS1_ERRS) == 0);

       rmixl_cp2_restore(cp0_status);
}

void
rmixl_fmn_init_cpu_intr(void)
{
       fmn_t *fmnp;

       fmnp = fmn_lookup(curcpu()->ci_cpuid);
       mutex_enter(fmnp->fmn_lock);

       for (int i=0; i < fmnp->fmn_nstid; i++)
               evcnt_attach_dynamic(&fmnp->fmn_intrhand[i].ih_count,
                       EVCNT_TYPE_INTR, NULL, "rmixl_fmn", fmnp->fmn_stinfo[i].si_name);

#ifdef NOTYET
       /*
        * establish dispatcher for FMN interrupt
        */
       extern kmutex_t rmixl_intr_lock;
       void *ih;

       mutex_enter(&rmixl_intr_lock);
       ih = rmixl_vec_establish(RMIXL_INTRVEC_FMN, -1, RMIXL_FMN_INTR_IPL,
               rmixl_fmn_intr_dispatch, fmnp, "fmn");
       if (ih == NULL)
               panic("%s: rmixl_vec_establish failed", __func__);
       mutex_exit(&rmixl_intr_lock);
       fmnp->fmn_ih = ih;
#endif

       mutex_exit(fmnp->fmn_lock);
}

void *
rmixl_fmn_intr_establish(int txstid, int (*func)(void *, rmixl_fmn_rxmsg_t *), void *arg)
{
       fmn_t *fmnp;
       fmn_intrhand_t *ih;

       fmnp = fmn_lookup(curcpu()->ci_cpuid);

       mutex_enter(fmnp->fmn_lock);

       ih = &fmnp->fmn_intrhand[txstid];

       if (ih->ih_func != NULL) {
#ifdef DEBUG
               panic("%s: intrhand[%d] busy", __func__, txstid);
#endif
               ih = NULL;
       }  else {
               ih->ih_func = func;
               ih->ih_arg = arg;
       }

       mutex_exit(fmnp->fmn_lock);

       return ih;
}

void
rmixl_fmn_intr_disestablish(void *cookie)
{
       fmn_t *fmnp;
       fmn_intrhand_t *ih = cookie;

       fmnp = fmn_lookup(curcpu()->ci_cpuid);
       mutex_enter(fmnp->fmn_lock);

       if (ih->ih_func != NULL) {
               ih->ih_func = NULL;
               ih->ih_arg = NULL;
       }
#ifdef DEBUG
       else {
               panic("%s: intrhand[%ld] not in use",
                       __func__, ih - &fmnp->fmn_intrhand[0]);
       }
#endif

       mutex_exit(fmnp->fmn_lock);
}

void
rmixl_fmn_intr_poll(u_int bucket, rmixl_fmn_rxmsg_t *rxmsg)
{
       uint32_t bit = 1 << bucket;
       uint32_t cp0_status;

       KASSERT(bucket < 8);

       cp0_status = rmixl_cp2_enable();

       for(;;) {
               rmixl_fmn_msgwait(bit);
               if (rmixl_fmn_msg_recv(bucket, rxmsg) == 0)
                       break;
               DELAY(10);              /* XXX */
       }

       rmixl_cp2_restore(cp0_status);
}

#ifdef NOTYET
static int
rmixl_fmn_intr_dispatch(void *arg)
{
       fmn_t *fmnp = arg;
       uint32_t msg_status;
       uint32_t cp0_status;
       uint32_t rfbne;
       int txstid;
       int rv = 0;

       mutex_enter(fmnp->fmn_lock);
       cp0_status = rmixl_cp2_enable();

       RMIXL_MFC2(RMIXL_COP_2_MSG_STS, 0, msg_status);
       rfbne = (~msg_status) >> RMIXL_MSG_STS0_RFBE_SHIFT;

       if (rfbne != 0) {
               DPRINTF(("%s: rfbne %#x\n", __func__, rfbne));
               for (u_int bucket=0; bucket < 8; bucket++) {
                       rmixl_fmn_rxmsg_t rxmsg;
                       fmn_intrhand_t *ih;

                       if ((rfbne & (1 << bucket)) == 0)
                               continue;
                       if (rmixl_fmn_msg_recv_subr(bucket, &rxmsg) != 0)
                               continue;
                       rv = 1;
                       txstid = fmnp->fmn_stidtab[rxmsg.rxsid];
                       ih = &fmnp->fmn_intrhand[txstid];
                       if (ih->ih_func != NULL)
                               if ((ih->ih_func)(ih->ih_arg, &rxmsg) != 0)
                                       ih->ih_count.ev_count++;
               }

       }
       rmixl_cp2_restore(cp0_status);
       mutex_exit(fmnp->fmn_lock);

       return rv;
}
#endif  /* NOTYET */

int
rmixl_fmn_msg_send(u_int size, u_int code, u_int dest_id, rmixl_fmn_msg_t *msg)
{
       fmn_t *fmnp;
       uint32_t cp0_status;
       uint32_t msg_status;
       uint32_t msg_status1;
       uint32_t desc;
       int rv = 0;

       KASSERT((size >= 1) && size <= 4);
       KASSERT(code <= 0xff);
       KASSERT(dest_id <= 0xff);

       fmnp = fmn_lookup(curcpu()->ci_cpuid);
       mutex_enter(fmnp->fmn_lock);
       cp0_status = rmixl_cp2_enable();

       switch(size) {
       case 1:
               RMIXL_DMTC2(RMIXL_COP_2_TXBUF, 0, msg->data[0]);
               break;
       case 2:
               RMIXL_DMTC2(RMIXL_COP_2_TXBUF, 0, msg->data[0]);
               RMIXL_DMTC2(RMIXL_COP_2_TXBUF, 1, msg->data[1]);
               break;
       case 3:
               RMIXL_DMTC2(RMIXL_COP_2_TXBUF, 0, msg->data[0]);
               RMIXL_DMTC2(RMIXL_COP_2_TXBUF, 1, msg->data[1]);
               RMIXL_DMTC2(RMIXL_COP_2_TXBUF, 2, msg->data[2]);
               break;
       case 4:
               RMIXL_DMTC2(RMIXL_COP_2_TXBUF, 0, msg->data[0]);
               RMIXL_DMTC2(RMIXL_COP_2_TXBUF, 1, msg->data[1]);
               RMIXL_DMTC2(RMIXL_COP_2_TXBUF, 2, msg->data[2]);
               RMIXL_DMTC2(RMIXL_COP_2_TXBUF, 3, msg->data[3]);
               break;
       default:
               DIAG_PRF(("%s: bad size %d", __func__, size));
               rv = -1;
               goto out;
       }

       for (int try=16; try--; ) {
               RMIXL_MFC2(RMIXL_COP_2_MSG_STS, 0, msg_status);
               if ((msg_status & (RMIXL_MSG_STS0_LPF|RMIXL_MSG_STS0_SPF|RMIXL_MSG_STS0_SMP)) == 0)
                       goto send;
               DELAY(10);              /* XXX ??? */
       }
       DIAG_PRF(("%s: cpu%u, msg %p, dst_id=%d, sts=%#x: can't send\n",
               __func__, cpu_number(), msg, dest_id, msg_status));
       rv = -1;
       goto out;
send:
       desc = RMIXL_MSGSND_DESC(size, code, dest_id);
       DPRINTF(("%s: cpu%u, desc %#x\n", __func__, cpu_number(), desc));
       for (int try=16; try--; ) {
               rmixl_msgsnd(desc);
               RMIXL_MFC2(RMIXL_COP_2_MSG_STS, 0, msg_status);
               RMIXL_MFC2(RMIXL_COP_2_MSG_STS, 1, msg_status1);
               if (((msg_status  & RMIXL_MSG_STS0_SCF) == 0)
               &&  ((msg_status1 & RMIXL_MSG_STS1_ERRS) == 0))
                       goto out;
#if 0
#ifdef DEBUG
               if ((msg_status & RMIXL_MSG_STS0_SCF) != 0) {
                       uint32_t r;
                       u_int regno = RMIXL_COP_2_CREDITS+fmnp->fmn_core;
                       u_int sel = fmnp->fmn_thread;
                       printf("%s: CC[%d,%d]=", __func__, regno, sel);
                       FMN_CP2_RD_SWITCH_RW(READ, regno, sel, r);
                       printf("%s: CC[%d,%d]=%d\n", __func__, regno, sel, r);
               }
#endif  /* DEBUG */
#endif  /* 0 */
               /* clear status1 error(s) */
               if ((msg_status1 & RMIXL_MSG_STS1_ERRS) != 0) {
                       RMIXL_MFC2(RMIXL_COP_2_MSG_STS, 1, msg_status1);
                       RMIXL_MTC2(RMIXL_COP_2_MSG_STS, 1, msg_status1);
               }
               DIAG_PRF(("%s: src=%ld, dst=%d, sts=%#x, %#x: send error, try %d\n",
                       __func__, curcpu()->ci_cpuid, dest_id, msg_status, msg_status1, try));
               DELAY(10);
       }
       rv = -1;
out:
       rmixl_cp2_restore(cp0_status);
       mutex_exit(fmnp->fmn_lock);

       return rv;
}

/*
* rmixl_fmn_msg_recv
*
*      - grab fmn_lock and call rmixl_fmn_msg_recv_subr to do the real work
*      - assume cp2 access is already enabled
*/
int
rmixl_fmn_msg_recv(u_int bucket, rmixl_fmn_rxmsg_t *rxmsg)
{
       fmn_t *fmnp;
       int rv;

       fmnp = fmn_lookup(curcpu()->ci_cpuid);
       mutex_enter(fmnp->fmn_lock);
       rv = rmixl_fmn_msg_recv_subr(bucket, rxmsg);
       mutex_exit(fmnp->fmn_lock);

       return rv;
}

/*
* rmixl_fmn_msg_recv_subr
*
*      - assume fmn_lock is owned
*      - assume cp2 access is already enabled
*/
static int
rmixl_fmn_msg_recv_subr(u_int bucket, rmixl_fmn_rxmsg_t *rxmsg)
{
       fmn_t *fmnp;
       uint32_t msg_status = 0 /* XXXGCC12 */;
       int rv;

       fmnp = fmn_lookup(curcpu()->ci_cpuid);
       KASSERT(mutex_owned(fmnp->fmn_lock) != 0);

       for (int try=16; try--; ) {
               RMIXL_MFC2(RMIXL_COP_2_MSG_STS, 0, msg_status);
               if ((msg_status & (RMIXL_MSG_STS0_LPF)) == 0)
                       goto recv;
       }
       DIAG_PRF(("%s: cpu%u, bucket=%d, sts=%#x: Load Pending Fail\n",
               __func__, cpu_number(), bucket, msg_status));
       rv = -1;
       goto out;
recv:
       rmixl_msgld(bucket);
       RMIXL_MFC2(RMIXL_COP_2_MSG_STS, 0, msg_status);
       DPRINTF(("%s: cpu%u, bucket=%d, sts=%#x\n",
               __func__, cpu_number(), bucket, msg_status));
       rv = msg_status & (RMIXL_MSG_STS0_LEF|RMIXL_MSG_STS0_LPF);
       if (rv == 0) {
               rxmsg->rxsid = (msg_status & RMIXL_MSG_STS0_RMSID)
                               >> RMIXL_MSG_STS0_RMSID_SHIFT;
               rxmsg->code = (msg_status & RMIXL_MSG_STS0_RMSC)
                               >> RMIXL_MSG_STS0_RMSC_SHIFT;
               rxmsg->size = ((msg_status & RMIXL_MSG_STS0_RMS)
                               >> RMIXL_MSG_STS0_RMS_SHIFT) + 1;
               switch(rxmsg->size) {
               case 1:
                       RMIXL_DMFC2(RMIXL_COP_2_RXBUF, 0, rxmsg->msg.data[0]);
                       break;
               case 2:
                       RMIXL_DMFC2(RMIXL_COP_2_RXBUF, 0, rxmsg->msg.data[0]);
                       RMIXL_DMFC2(RMIXL_COP_2_RXBUF, 1, rxmsg->msg.data[1]);
                       break;
               case 3:
                       RMIXL_DMFC2(RMIXL_COP_2_RXBUF, 0, rxmsg->msg.data[0]);
                       RMIXL_DMFC2(RMIXL_COP_2_RXBUF, 1, rxmsg->msg.data[1]);
                       RMIXL_DMFC2(RMIXL_COP_2_RXBUF, 2, rxmsg->msg.data[2]);
                       break;
               case 4:
                       RMIXL_DMFC2(RMIXL_COP_2_RXBUF, 0, rxmsg->msg.data[0]);
                       RMIXL_DMFC2(RMIXL_COP_2_RXBUF, 1, rxmsg->msg.data[1]);
                       RMIXL_DMFC2(RMIXL_COP_2_RXBUF, 2, rxmsg->msg.data[2]);
                       RMIXL_DMFC2(RMIXL_COP_2_RXBUF, 3, rxmsg->msg.data[3]);
                       break;
               default:
                       /* "impossible" due to bitfield width */
                       panic("%s: bad size %d", __func__, rxmsg->size);
               }
       }
out:

       return rv;
}

#ifdef FMN_DEBUG
void
rmixl_fmn_cp2_dump(void)
{
       uint32_t cp0_status;

       cp0_status = rmixl_cp2_enable();

       CPU2_PRINT_8(RMIXL_COP_2_TXBUF, 0);
       CPU2_PRINT_8(RMIXL_COP_2_TXBUF, 1);
       CPU2_PRINT_8(RMIXL_COP_2_TXBUF, 2);
       CPU2_PRINT_8(RMIXL_COP_2_TXBUF, 3);

       CPU2_PRINT_8(RMIXL_COP_2_RXBUF, 0);
       CPU2_PRINT_8(RMIXL_COP_2_RXBUF, 1);
       CPU2_PRINT_8(RMIXL_COP_2_RXBUF, 2);
       CPU2_PRINT_8(RMIXL_COP_2_RXBUF, 3);

       CPU2_PRINT_4(RMIXL_COP_2_MSG_STS, 0);
       CPU2_PRINT_4(RMIXL_COP_2_MSG_STS, 1);

       CPU2_PRINT_4(RMIXL_COP_2_MSG_CFG, 0);
       CPU2_PRINT_4(RMIXL_COP_2_MSG_CFG, 1);

       CPU2_PRINT_4(RMIXL_COP_2_MSG_BSZ, 0);
       CPU2_PRINT_4(RMIXL_COP_2_MSG_BSZ, 1);
       CPU2_PRINT_4(RMIXL_COP_2_MSG_BSZ, 2);
       CPU2_PRINT_4(RMIXL_COP_2_MSG_BSZ, 3);
       CPU2_PRINT_4(RMIXL_COP_2_MSG_BSZ, 4);
       CPU2_PRINT_4(RMIXL_COP_2_MSG_BSZ, 5);
       CPU2_PRINT_4(RMIXL_COP_2_MSG_BSZ, 6);
       CPU2_PRINT_4(RMIXL_COP_2_MSG_BSZ, 7);

       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 0, 0);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 0, 1);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 0, 2);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 0, 3);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 0, 4);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 0, 5);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 0, 6);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 0, 7);

       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 1, 0);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 1, 1);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 1, 2);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 1, 3);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 1, 4);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 1, 5);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 1, 6);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 1, 7);

       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 2, 0);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 2, 1);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 2, 2);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 2, 3);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 2, 4);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 2, 5);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 2, 6);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 2, 7);

       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 3, 0);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 3, 1);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 3, 2);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 3, 3);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 3, 4);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 3, 5);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 3, 6);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 3, 7);

       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 4, 0);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 4, 1);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 4, 2);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 4, 3);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 4, 4);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 4, 5);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 4, 6);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 4, 7);

       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 5, 0);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 5, 1);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 5, 2);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 5, 3);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 5, 4);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 5, 5);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 5, 6);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 5, 7);

       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 6, 0);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 6, 1);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 6, 2);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 6, 3);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 6, 4);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 6, 5);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 6, 6);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 6, 7);

       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 7, 0);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 7, 1);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 7, 2);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 7, 3);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 7, 4);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 7, 5);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 7, 6);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 7, 7);

       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 8, 0);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 8, 1);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 8, 2);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 8, 3);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 8, 4);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 8, 5);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 8, 6);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 8, 7);

       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 9, 0);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 9, 1);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 9, 2);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 9, 3);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 9, 4);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 9, 5);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 9, 6);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 9, 7);

       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 10, 0);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 10, 1);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 10, 2);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 10, 3);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 10, 4);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 10, 5);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 10, 6);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 10, 7);

       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 11, 0);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 11, 1);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 11, 2);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 11, 3);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 11, 4);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 11, 5);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 11, 6);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 11, 7);

       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 12, 0);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 12, 1);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 12, 2);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 12, 3);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 12, 4);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 12, 5);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 12, 6);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 12, 7);

       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 13, 0);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 13, 1);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 13, 2);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 13, 3);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 13, 4);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 13, 5);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 13, 6);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 13, 7);

       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 14, 0);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 14, 1);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 14, 2);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 14, 3);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 14, 4);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 14, 5);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 14, 6);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 14, 7);

       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 15, 0);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 15, 1);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 15, 2);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 15, 3);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 15, 4);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 15, 5);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 15, 6);
       CPU2_PRINT_4(RMIXL_COP_2_CREDITS + 15, 7);

       rmixl_cp2_restore(cp0_status);
}


void
rmixl_fmn_cc_dump(void)
{
       uint32_t cc[4][8];

       FMN_CP2_4SEL_READ(RMIXL_COP_2_CREDITS,   0, &cc[0][0]);
       FMN_CP2_4SEL_READ(RMIXL_COP_2_CREDITS,   4, &cc[0][4]);
       FMN_CP2_4SEL_READ(RMIXL_COP_2_CREDITS+1, 0, &cc[1][0]);
       FMN_CP2_4SEL_READ(RMIXL_COP_2_CREDITS+1, 4, &cc[1][4]);
       FMN_CP2_4SEL_READ(RMIXL_COP_2_CREDITS+2, 0, &cc[2][0]);
       FMN_CP2_4SEL_READ(RMIXL_COP_2_CREDITS+2, 4, &cc[2][4]);
       FMN_CP2_4SEL_READ(RMIXL_COP_2_CREDITS+3, 0, &cc[3][0]);
       FMN_CP2_4SEL_READ(RMIXL_COP_2_CREDITS+3, 4, &cc[3][4]);

       printf("%s: cpu%u\n", __func__, cpu_number());
       for (int i=0; i < 4; i++) {
               for (int j=0; j < 8; j++)
                       printf(" %#x,", cc[i][j]);
               printf("\n");
       }
}

#endif  /* FMN_DEBUG */