#include <stdlib.h>
#include "asm.h"
#include "processor.h"
#include "spinlock.h"
#include "irq.h"
#include "exi.h"
#include "cache.h"
#include "ogcsys.h"
#include "lwp.h"
#include "lwp_threads.h"
#include "lwp_watchdog.h"
#include "lwip/debug.h"
#include "lwip/opt.h"
#include "lwip/def.h"
#include "lwip/mem.h"
#include "lwip/pbuf.h"
#include "lwip/sys.h"
#include "netif/etharp.h"

#include "netif/gcif/gcif.h"

//#define _BBA_DEBUG

#define IFNAME0		'e'
#define IFNAME1		'0'

#define GCIF_TX_TQ				8
#define GCIF_EXI_TQ				9

#define BBA_MINPKTSIZE			60

#define BBA_CID					0x04020200

#define BBA_CMD_IRMASKALL		0x00
#define BBA_CMD_IRMASKNONE		0xF8

#define BBA_NCRA				0x00		/* Network Control Register A, RW */
#define BBA_NCRA_RESET			(1<<0)	/* RESET */
#define BBA_NCRA_ST0			(1<<1)	/* ST0, Start transmit command/status */
#define BBA_NCRA_ST1			(1<<2)	/* ST1,  " */
#define BBA_NCRA_SR				(1<<3)	/* SR, Start Receive */

#define BBA_NCRB				0x01		/* Network Control Register B, RW */
#define BBA_NCRB_PR				(1<<0)	/* PR, Promiscuous Mode */
#define BBA_NCRB_CA				(1<<1)	/* CA, Capture Effect Mode */
#define BBA_NCRB_PM				(1<<2)	/* PM, Pass Multicast */
#define BBA_NCRB_PB				(1<<3)	/* PB, Pass Bad Frame */
#define BBA_NCRB_AB				(1<<4)	/* AB, Accept Broadcast */
#define BBA_NCRB_HBD			(1<<5)	/* HBD, reserved */
#define BBA_NCRB_RXINTC0		(1<<6)	/* RXINTC, Receive Interrupt Counter */
#define BBA_NCRB_RXINTC1		(1<<7)	/*  " */
#define BBA_NCRB_1_PACKET_PER_INT  (0<<6)	/* 0 0 */
#define BBA_NCRB_2_PACKETS_PER_INT (1<<6)	/* 0 1 */
#define BBA_NCRB_4_PACKETS_PER_INT (2<<6)	/* 1 0 */
#define BBA_NCRB_8_PACKETS_PER_INT (3<<6)	/* 1 1 */

#define BBA_LTPS 0x04		/* Last Transmitted Packet Status, RO */
#define BBA_LRPS 0x05		/* Last Received Packet Status, RO */

#define BBA_IMR 0x08		/* Interrupt Mask Register, RW, 00h */
#define   BBA_IMR_FRAGIM     (1<<0)	/* FRAGIM, Fragment Counter Int Mask */
#define   BBA_IMR_RIM        (1<<1)	/* RIM, Receive Interrupt Mask */
#define   BBA_IMR_TIM        (1<<2)	/* TIM, Transmit Interrupt Mask */
#define   BBA_IMR_REIM       (1<<3)	/* REIM, Receive Error Interrupt Mask */
#define   BBA_IMR_TEIM       (1<<4)	/* TEIM, Transmit Error Interrupt Mask */
#define   BBA_IMR_FIFOEIM    (1<<5)	/* FIFOEIM, FIFO Error Interrupt Mask */
#define   BBA_IMR_BUSEIM     (1<<6)	/* BUSEIM, BUS Error Interrupt Mask */
#define   BBA_IMR_RBFIM      (1<<7)	/* RBFIM, RX Buffer Full Interrupt Mask */

#define BBA_IR 0x09		/* Interrupt Register, RW, 00h */
#define   BBA_IR_FRAGI       (1<<0)	/* FRAGI, Fragment Counter Interrupt */
#define   BBA_IR_RI          (1<<1)	/* RI, Receive Interrupt */
#define   BBA_IR_TI          (1<<2)	/* TI, Transmit Interrupt */
#define   BBA_IR_REI         (1<<3)	/* REI, Receive Error Interrupt */
#define   BBA_IR_TEI         (1<<4)	/* TEI, Transmit Error Interrupt */
#define   BBA_IR_FIFOEI      (1<<5)	/* FIFOEI, FIFO Error Interrupt */
#define   BBA_IR_BUSEI       (1<<6)	/* BUSEI, BUS Error Interrupt */
#define   BBA_IR_RBFI        (1<<7)	/* RBFI, RX Buffer Full Interrupt */

#define BBA_BP   0x0a/*+0x0b*/	/* Boundary Page Pointer Register */
#define BBA_TLBP 0x0c/*+0x0d*/	/* TX Low Boundary Page Pointer Register */
#define BBA_TWP  0x0e/*+0x0f*/	/* Transmit Buffer Write Page Pointer Register */
#define BBA_TRP  0x12/*+0x13*/	/* Transmit Buffer Read Page Pointer Register */
#define BBA_RWP  0x16/*+0x17*/	/* Receive Buffer Write Page Pointer Register */
#define BBA_RRP  0x18/*+0x19*/	/* Receive Buffer Read Page Pointer Register */
#define BBA_RHBP 0x1a/*+0x1b*/	/* Receive High Boundary Page Pointer Register */

#define BBA_RXINTT    0x14/*+0x15*/	/* Receive Interrupt Timer Register */

#define BBA_NAFR_PAR0 0x20	/* Physical Address Register Byte 0 */
#define BBA_NAFR_PAR1 0x21	/* Physical Address Register Byte 1 */
#define BBA_NAFR_PAR2 0x22	/* Physical Address Register Byte 2 */
#define BBA_NAFR_PAR3 0x23	/* Physical Address Register Byte 3 */
#define BBA_NAFR_PAR4 0x24	/* Physical Address Register Byte 4 */
#define BBA_NAFR_PAR5 0x25	/* Physical Address Register Byte 5 */

#define BBA_NWAYC 0x30		/* NWAY Configuration Register, RW, 84h */
#define   BBA_NWAYC_FD       (1<<0)	/* FD, Full Duplex Mode */
#define   BBA_NWAYC_PS100    (1<<1)	/* PS100/10, Port Select 100/10 */
#define   BBA_NWAYC_ANE      (1<<2)	/* ANE, Autonegotiation Enable */
#define   BBA_NWAYC_ANS_RA   (1<<3)	/* ANS, Restart Autonegotiation */
#define   BBA_NWAYC_LTE      (1<<7)	/* LTE, Link Test Enable */

#define	BBA_HALF_100		 (BBA_NWAYC_PS100)
#define	BBA_FULL_100		 (BBA_NWAYC_PS100|BBA_NWAYC_FD)
#define	BBA_HALF_10 		 (BBA_NWAYC_ANE)
#define	BBA_FULL_10 		 (BBA_NWAYC_FD)

#define BBA_NWAYS 0x31
#define   BBA_NWAYS_LS10	 (1<<0)
#define   BBA_NWAYS_LS100	 (1<<1)
#define   BBA_NWAYS_LPNWAY   (1<<2)
#define   BBA_NWAYS_ANCLPT	 (1<<3)
#define   BBA_NWAYS_100TXF	 (1<<4)
#define   BBA_NWAYS_100TXH	 (1<<5)
#define   BBA_NWAYS_10TXF	 (1<<6)
#define   BBA_NWAYS_10TXH	 (1<<7)

#define BBA_GCA 0x32			/* GMAC Configuration A Register, RW, 00h */
#define   BBA_GCA_ARXERRB		(1<<3)	/* ARXERRB, Accept RX packet with error */
#define   BBA_GCA_TXFIFOCNTEN   (1<<6)	/* TX FIFO cnt enable */

#define BBA_MISC 0x3d		/* MISC Control Register 1, RW, 3ch */
#define   BBA_MISC_BURSTDMA  (1<<0)
#define   BBA_MISC_DISLDMA   (1<<1)

#define BBA_TXFIFOCNT 0x3e/*0x3f*/	/* Transmit FIFO Counter Register */
#define BBA_WRTXFIFOD 0x48/*-0x4b*/	/* Write TX FIFO Data Port Register */

#define BBA_MISC2 0x50		/* MISC Control Register 2, RW, 00h */
#define   BBA_MISC2_HBRLEN0		(1<<0)	/* HBRLEN, Host Burst Read Length */
#define   BBA_MISC2_HBRLEN1		(1<<1)	/*  " */
#define   BBA_MISC2_RUNTSIZE	(1<<2)	/*  " */
#define   BBA_MISC2_DREQBCTRL	(1<<3)	/*  " */
#define   BBA_MISC2_RINTSEL		(1<<4)	/*  " */
#define   BBA_MISC2_ITPSEL		(3<<5)	/*  " */
#define   BBA_MISC2_AUTORCVR	(1<<7)	/* Auto RX Full Recovery */

#define BBA_RX_STATUS_BF      (1<<0)
#define BBA_RX_STATUS_CRC     (1<<1)
#define BBA_RX_STATUS_FAE     (1<<2)
#define BBA_RX_STATUS_FO      (1<<3)
#define BBA_RX_STATUS_RW      (1<<4)
#define BBA_RX_STATUS_MF      (1<<5)
#define BBA_RX_STATUS_RF      (1<<6)
#define BBA_RX_STATUS_RERR    (1<<7)

#define BBA_TX_STATUS_CC0     (1<<0)
#define BBA_TX_STATUS_CC1     (1<<1)
#define BBA_TX_STATUS_CC2     (1<<2)
#define BBA_TX_STATUS_CC3     (1<<3)
#define  BBA_TX_STATUS_CCMASK (0x0f)
#define BBA_TX_STATUS_CRSLOST (1<<4)
#define BBA_TX_STATUS_UF      (1<<5)
#define BBA_TX_STATUS_OWC     (1<<6)
#define BBA_TX_STATUS_OWN     (1<<7)
#define BBA_TX_STATUS_TERR    (1<<7)

#define BBA_SI_ACTRL	0x5c
#define BBA_SI_STATUS	0x5d
#define BBA_SI_ACTRL2	0x60

#define BBA_INIT_TLBP	0x00
#define BBA_INIT_BP		0x01
#define BBA_INIT_RHBP	0x0f
#define BBA_INIT_RWP	BBA_INIT_BP
#define BBA_INIT_RRP	BBA_INIT_BP

#define BBA_TX_MAX_PACKET_SIZE	(1518)									/* 14+1500+4 */
#define BBA_RX_MAX_PACKET_SIZE	(1536)									/* 6 pages * 256 bytes */

#define BBA_NAPI_WEIGHT 16

#define X(a,b)  b,a
struct bba_descr {
	u32 X(X(next_packet_ptr:12, packet_len:12), status:8);
} __attribute((packed));

#define _SHIFTL(v, s, w)	\
    ((u32) (((u32)(v) & ((0x01 << (w)) - 1)) << (s)))
#define _SHIFTR(v, s, w)	\
    ((u32)(((u32)(v) >> (s)) & ((0x01 << (w)) - 1)))

struct bba_priv {
	u8 flag;
	u8 revid;
	u16 devid;
	u8 acstart;
	u8 linkstate;
	lwpq_t tq_xmit;
	err_t state;
	struct eth_addr *ethaddr;
	struct dev_stats {
		u32 rx_errors,rx_overerrors,rx_crcerrors;
		u32 rx_fifoerrors,rx_lengtherrors,rx_frameerrors;
		u32 rx_bytes,rx_packets;
		u32 tx_errors,tx_carriererrors,tx_fifoerrors;
		u32 tx_windowerrors,tx_collisions;
	} txrx_stats;
};

static lwpq_t wait_exi_queue;
static struct bba_descr cur_descr;
static struct netif *gc_netif = NULL;
static const struct eth_addr ethbroadcast = {{0xffU,0xffU,0xffU,0xffU,0xffU,0xffU}};

static err_t __bba_link_tx(struct netif *dev,struct pbuf *p);
static u32 __bba_rx_err(u8 status,struct bba_priv *priv);

extern void udelay(int us);

/* new functions */
#define bba_select()		EXI_Select(EXI_CHANNEL_0,EXI_DEVICE_2,EXI_SPEED32MHZ)
#define bba_deselect()		EXI_Deselect(EXI_CHANNEL_0)
#define bba_sync()			EXI_Sync(EXI_CHANNEL_0)

#define bba_in12(reg)		((bba_in8((reg))&0xff)|((bba_in8(((reg)+1))&0x0f)<<8))
#define bba_out12(reg,val)	do { \
									bba_out8((reg),((val)&0xff)); \
									bba_out8(((reg)+1),(((val)&0x0f00)>>8)); \
							} while(0)
#define bba_in16(reg)		((bba_in8((reg))&0xff)|((bba_in8(((reg)+1))&0xff)<<8))
#define bba_out16(reg,val)	do { \
									bba_out8((reg),((val)&0xff)); \
									bba_out8(((reg)+1),(((val)&0xff00)>>8)); \
							} while(0)

static __inline__ void bba_cmd_insnosel(u32 reg,void *val,u32 len)
{
	u16 req;
	req = reg<<8;
	EXI_Imm(EXI_CHANNEL_0,&req,sizeof(req),EXI_WRITE,NULL);
	EXI_Sync(EXI_CHANNEL_0);
	EXI_ImmEx(EXI_CHANNEL_0,val,len,EXI_READ);
}

static __inline__ void bba_cmd_outsnosel(u32 reg,void *val,u32 len)
{
	u16 req;
	req = (reg<<8)|0x4000;
	EXI_Imm(EXI_CHANNEL_0,&req,sizeof(req),EXI_WRITE,NULL);
	EXI_Sync(EXI_CHANNEL_0);
	EXI_ImmEx(EXI_CHANNEL_0,val,len,EXI_WRITE);
}

static __inline__ void bba_insnosel(u32 reg,void *val,u32 len)
{
	u32 req;
	req = (reg<<8)|0x80000000;
	EXI_Imm(EXI_CHANNEL_0,&req,sizeof(req),EXI_WRITE,NULL);
	EXI_Sync(EXI_CHANNEL_0);
	EXI_ImmEx(EXI_CHANNEL_0,val,len,EXI_READ);
}

static __inline__ void bba_outsnosel(u32 reg,void *val,u32 len)
{
	u32 req;
	req = (reg<<8)|0xC0000000;
	EXI_Imm(EXI_CHANNEL_0,&req,sizeof(req),EXI_WRITE,NULL);
	EXI_Sync(EXI_CHANNEL_0);
	EXI_ImmEx(EXI_CHANNEL_0,val,len,EXI_WRITE);
}

static __inline__ void bba_insregister(u32 reg)
{
	u32 req;
	req = (reg<<8)|0x80000000;
	EXI_Imm(EXI_CHANNEL_0,&req,sizeof(req),EXI_WRITE,NULL);
	EXI_Sync(EXI_CHANNEL_0);
}

static __inline__ void bba_insdata(void *val,u32 len)
{
	EXI_ImmEx(EXI_CHANNEL_0,val,len,EXI_READ);
}

static __inline__ void bba_insdmadata(void *val,u32 len,s32 (*dmasubrcv)(s32 chn,s32 dev))
{
	EXI_Dma(EXI_CHANNEL_0,val,len,EXI_READ,dmasubrcv);
}

static void bba_insdata_fast(void *val,s32 len)
{
	u32 roundlen;
	s32 missalign;
	u8 *ptr = val;

	if(!val || len<=0) return;

	missalign = -((u32)val)&0x1f;
	if((s32)(len-missalign)<32) {
		bba_insdata(val,len);
		return;
	}

	if(missalign>0) {
		bba_insdata(ptr,missalign);
		len -= missalign;
		ptr += missalign;
	}

	roundlen = (len&~0x1f);
	DCInvalidateRange(ptr,roundlen);
	bba_insdmadata(ptr,roundlen,NULL);
	bba_sync();

	len -= roundlen;
	ptr += roundlen;
	if(len>0) bba_insdata(ptr,len);
}

static __inline__ void bba_outsregister(u32 reg)
{
	u32 req;
	req = (reg<<8)|0xC0000000;
	EXI_Imm(EXI_CHANNEL_0,&req,sizeof(req),EXI_WRITE,NULL);
	EXI_Sync(EXI_CHANNEL_0);
}

static __inline__ void bba_outsdata(void *val,u32 len)
{
	EXI_ImmEx(EXI_CHANNEL_0,val,len,EXI_WRITE);
}

static __inline__ void bba_outsdmadata(void *val,u32 len,s32 (*dmasubsnd)(s32 chn,s32 dev))
{
	EXI_Dma(EXI_CHANNEL_0,val,len,EXI_WRITE,dmasubsnd);
}

static void bba_outsdata_fast(void *val,s32 len)
{
	u32 roundlen;
	s32 missalign;
	u8 *ptr = val;

	if(!val || len<=0) return;

	missalign = -((u32)val)&0x1f;
	if((s32)(len-missalign)<32) {
		bba_outsdata(val,len);
		return;
	}

	if(missalign>0) {
		bba_outsdata(ptr,missalign);
		len -= missalign;
		ptr += missalign;
	}

	roundlen = (len&~0x1f);
	DCStoreRange(ptr,roundlen);
	bba_outsdmadata(ptr,roundlen,NULL);
	bba_sync();

	len -= roundlen;
	ptr += roundlen;
	if(len>0) bba_outsdata(ptr,len);
}

static inline void bba_cmd_ins(u32 reg,void *val,u32 len)
{
	bba_select();
	bba_cmd_insnosel(reg,val,len);
	bba_deselect();
}

static inline void bba_cmd_outs(u32 reg,void *val,u32 len)
{
	bba_select();
	bba_cmd_outsnosel(reg,val,len);
	bba_deselect();
}

static inline u8 bba_cmd_in8(u32 reg)
{
	u8 val;
	bba_cmd_ins(reg,&val,sizeof(val));
	return val;
}

static inline u8 bba_cmd_in8_slow(u32 reg)
{
	u8 val;
	bba_select();
	bba_cmd_insnosel(reg,&val,sizeof(val));
	udelay(200);			//usleep doesn't work on this amount, decrementer is based on 10ms, wait is 200us
	bba_deselect();
	return val;
}

static inline void bba_cmd_out8(u32 reg,u8 val)
{
	bba_cmd_outs(reg,&val,sizeof(val));
}

static inline void bba_ins(u32 reg,void *val,u32 len)
{
	bba_select();
	bba_insnosel(reg,val,len);
	bba_deselect();
}

static inline void bba_outs(u32 reg,void *val,u32 len)
{
	bba_select();
	bba_outsnosel(reg,val,len);
	bba_deselect();
}

static inline u8 bba_in8(u32 reg)
{
	u8 val;
	bba_ins(reg,&val,sizeof(val));
	return val;
}

static inline void bba_out8(u32 reg,u8 val)
{
	bba_outs(reg,&val,sizeof(val));
}

static s32 __bba_exi_unlockcb(s32 chn,s32 dev)
{
	LWP_ThreadBroadcast(wait_exi_queue);
	return 1;
}

static __inline__ void __bba_exi_stop(struct bba_priv *priv)
{
	u32 level;

	_CPU_ISR_Disable(level);
	while(EXI_Lock(EXI_CHANNEL_0,EXI_DEVICE_2,__bba_exi_unlockcb)==0) {
		LWIP_DEBUGF(NETIF_DEBUG|1,("__bba_exi_wait(exi locked)\n"));
		LWP_ThreadSleep(wait_exi_queue);
	}
	_CPU_ISR_Restore(level);
}

static __inline__ void __bba_exi_wake(struct bba_priv *priv)
{
	EXI_Unlock(EXI_CHANNEL_0);
}

static __inline__ void __bba_tx_stop(struct bba_priv *priv)
{
	u32 level;

	_CPU_ISR_Disable(level);
	while(priv->state==ERR_TXPENDING) {
		LWIP_DEBUGF(NETIF_DEBUG,("__bba_tx_stop(pending tx)\n"));
		LWP_ThreadSleep(priv->tq_xmit);
	}
	priv->state = ERR_TXPENDING;
	_CPU_ISR_Restore(level);
}

static __inline__ void __bba_tx_wake(struct bba_priv *priv)
{
	u32 level;

	_CPU_ISR_Disable(level);
	if(priv->state==ERR_TXPENDING) {
		priv->state = ERR_OK;
		LWP_ThreadBroadcast(priv->tq_xmit);
	}
	_CPU_ISR_Restore(level);
}

static __inline__ u8 __linkstate(struct bba_priv *priv)
{
	u8 nways = 0;

	nways = bba_in8(BBA_NWAYS);
	priv->linkstate = nways;
	if(nways&BBA_NWAYS_LS10 || nways&BBA_NWAYS_LS100) return nways;
	return 0;
}

static bool __bba_get_linkstateasync(struct bba_priv *priv)
{
	u32 ret,cnt,sec;

	for(cnt=0;cnt<10000;cnt++) {
		udelay(500);
		ret = __linkstate(priv);

		if(ret&0xf0 && ret&0x08) break;
	}

	// only sleep for additional 2 seconds if linkstate is ok
	if(cnt<10000) {
		sec = 1;
		if(!(ret&0x04)) sec = 2;
		udelay(sec*TB_USPERSEC);
	}

	return (cnt<10000);
}

static u32 __bba_read_cid()
{
	u16 cmd = 0;
	u32 cid = 0;

	bba_select();
	EXI_Imm(EXI_CHANNEL_0,&cmd,2,EXI_WRITE,NULL);
	EXI_Sync(EXI_CHANNEL_0);
	EXI_Imm(EXI_CHANNEL_0,&cid,4,EXI_READ,NULL);
	EXI_Sync(EXI_CHANNEL_0);
	bba_deselect();

	return cid;
}

static void __bba_reset()
{
	bba_out8(0x60,0x00);
	udelay(10000);
	bba_cmd_in8_slow(0x0F);
	udelay(10000);
	bba_out8(BBA_NCRA,BBA_NCRA_RESET);
	udelay(100);
	bba_out8(BBA_NCRA,0x00);
	udelay(100);
}

static void __bba_recv_init()
{
	bba_out8(BBA_NCRB,(BBA_NCRB_AB|BBA_NCRB_CA|BBA_NCRB_2_PACKETS_PER_INT));
	bba_out8(BBA_SI_ACTRL2,0x74);
	bba_out8(BBA_RXINTT, 0x00);
	bba_out8(BBA_RXINTT+1, 0x06); /* 0x0600 = 61us */

	bba_out8(BBA_MISC2,BBA_MISC2_AUTORCVR);

	bba_out12(BBA_TLBP, BBA_INIT_TLBP);
	bba_out12(BBA_BP,BBA_INIT_BP);
	bba_out12(BBA_RHBP,BBA_INIT_RHBP);
	bba_out12(BBA_RWP,BBA_INIT_RWP);
	bba_out12(BBA_RRP,BBA_INIT_RRP);

	bba_out8(BBA_GCA,BBA_GCA_ARXERRB);
	bba_out8(BBA_NCRA,BBA_NCRA_SR);
}

static u32 __bba_tx_err(u8 status,struct bba_priv *priv)
{
	u32 last_errors = priv->txrx_stats.tx_errors;

	if(status&BBA_TX_STATUS_TERR) {
		priv->txrx_stats.tx_errors++;
		if(status&BBA_TX_STATUS_CCMASK)
			priv->txrx_stats.tx_collisions += (status&BBA_TX_STATUS_CCMASK);

		if(status&BBA_TX_STATUS_CRSLOST)
			priv->txrx_stats.tx_carriererrors++;

		if(status&BBA_TX_STATUS_UF)
			priv->txrx_stats.tx_fifoerrors++;

		if(status&BBA_TX_STATUS_OWC)
			priv->txrx_stats.tx_windowerrors++;
	}
	if(last_errors!=priv->txrx_stats.tx_errors)
		LWIP_ERROR(("__bba_tx_err(%02x)\n",status));

	return priv->txrx_stats.tx_errors;
}

static u32 __bba_rx_err(u8 status,struct bba_priv *priv)
{
	u32 last_errors = priv->txrx_stats.tx_errors;

	if(status&0xff) {
		priv->txrx_stats.rx_overerrors++;
		priv->txrx_stats.rx_errors++;
	} else {
		if(status&BBA_RX_STATUS_RERR) {
			priv->txrx_stats.rx_errors++;
			if(status&BBA_RX_STATUS_BF)
				priv->txrx_stats.rx_overerrors++;

			if(status&BBA_RX_STATUS_CRC)
				priv->txrx_stats.rx_crcerrors++;

			if(status&BBA_RX_STATUS_FO)
				priv->txrx_stats.rx_fifoerrors++;

			if(status&BBA_RX_STATUS_RW)
				priv->txrx_stats.rx_lengtherrors++;

			if(status&BBA_RX_STATUS_RF)
				priv->txrx_stats.rx_lengtherrors++;

			if(status&BBA_RX_STATUS_BF)
				priv->txrx_stats.rx_overerrors++;
		}
		if(status&BBA_RX_STATUS_FAE) {
			priv->txrx_stats.rx_errors++;
			priv->txrx_stats.rx_frameerrors++;
		}
	}
	if(last_errors!=priv->txrx_stats.rx_errors)
		LWIP_ERROR(("__bba_rx_err(%02x)\n",status));

	return priv->txrx_stats.rx_errors;
}

void bba_process(struct pbuf *p,struct netif *dev)
{
	struct eth_hdr *ethhdr = NULL;
	struct bba_priv *priv = (struct bba_priv*)dev->state;
	const s32 hlen = sizeof(struct eth_hdr);

	if(p) {
		ethhdr = p->payload;
		switch(htons(ethhdr->type)) {
			case ETHTYPE_IP:
				LWIP_DEBUGF(NETIF_DEBUG,("bba_process: passing packet up to IP layer\n"));

				etharp_ip_input(dev,p);
				pbuf_header(p,-(hlen));
				ip_input(p,dev);
				break;
			case ETHTYPE_ARP:
				/* pass p to ARP module, get ARP reply or ARP queued packet */
				LWIP_DEBUGF(NETIF_DEBUG,("bba_process: passing packet up to ARP layer\n"));
				etharp_arp_input(dev, priv->ethaddr, p);
				break;
			/* unsupported Ethernet packet type */
			default:
				/* free pbuf */
				pbuf_free(p);
				break;
		}
	}
}

static err_t __bba_link_tx(struct netif *dev,struct pbuf *p)
{
	u8 tmpbuf[BBA_MINPKTSIZE];
	struct pbuf *tmp;
	struct bba_priv *priv = (struct bba_priv*)dev->state;

	__bba_tx_stop(priv);
	__bba_exi_stop(priv);

	if(p->tot_len>BBA_TX_MAX_PACKET_SIZE) {
		LWIP_ERROR(("__bba_link_tx(%d,%p) pkt_size\n",p->tot_len,LWP_GetSelf()));
		__bba_tx_wake(priv);
		__bba_exi_wake(priv);
		return ERR_PKTSIZE;
	}

	if(!__linkstate(priv)) {
		LWIP_ERROR(("__bba_link_tx(error link state)\n"));
		__bba_tx_wake(priv);
		__bba_exi_wake(priv);
		return ERR_ABRT;
	}

	LWIP_DEBUGF(NETIF_DEBUG,("__bba_link_tx(%d,%p)\n",p->tot_len,LWP_GetSelf()));

	bba_out12(BBA_TXFIFOCNT,p->tot_len);

	bba_select();
	bba_outsregister(BBA_WRTXFIFOD);
	for(tmp=p;tmp!=NULL;tmp=tmp->next) {
		bba_outsdata_fast(tmp->payload,tmp->len);
	}
	if(p->tot_len<BBA_MINPKTSIZE) bba_outsdata(tmpbuf,(BBA_MINPKTSIZE-p->tot_len));
	bba_deselect();

	bba_out8(BBA_NCRA,((bba_in8(BBA_NCRA)&~BBA_NCRA_ST0)|BBA_NCRA_ST1));		//&~BBA_NCRA_ST0
	__bba_exi_wake(priv);
	return ERR_OK;
}

static err_t __bba_start_tx(struct netif *dev,struct pbuf *p,struct ip_addr *ipaddr)
{
	LWIP_DEBUGF(NETIF_DEBUG,("__bba_start_tx(%p)\n",LWP_GetSelf()));
	return etharp_output(dev,ipaddr,p);
}

static err_t bba_start_rx(struct netif *dev,u32 budget)
{
	s32 size;
	u16 top,pos,rrp,rwp;
	u32 pkt_status,recvd;
	struct pbuf *tmp,*p = NULL;
	struct bba_priv *priv = (struct bba_priv*)dev->state;

	LWIP_DEBUGF(NETIF_DEBUG,("bba_start_rx()\n"));

	recvd = 0;
	rwp = bba_in12(BBA_RWP);
	rrp = bba_in12(BBA_RRP);
	while(recvd<budget && rrp!=rwp) {
		LWIP_DEBUGF(NETIF_DEBUG,("bba_start_rx(%04x,%04x)\n",rrp,rwp));
		bba_ins(rrp<<8,(void*)(&cur_descr),sizeof(struct bba_descr));
		le32_to_cpus((u32*)((void*)(&cur_descr)));

		size = (cur_descr.packet_len-4);
		pkt_status = cur_descr.status;
		if(size>(BBA_RX_MAX_PACKET_SIZE+4)) {
			LWIP_DEBUGF(NETIF_DEBUG|2,("bba_start_rx(size>BBA_RX_MAX_PACKET_SIZE)\n"));
			continue;
		}

		if(pkt_status&(BBA_RX_STATUS_RERR|BBA_RX_STATUS_FAE)) {
			LWIP_DEBUGF(NETIF_DEBUG|2,("bba_start_rx(pkt_status = 02x)\n",pkt_status));
			__bba_rx_err(pkt_status,priv);
			rwp = bba_in12(BBA_RWP);
			rrp = bba_in12(BBA_RRP);
			continue;
		}

		pos = ((rrp<<8)+4);
		top = ((BBA_INIT_RHBP+1)<<8);
		LWIP_DEBUGF(NETIF_DEBUG,("bba_start_rx(%04x,%d,%04x)\n",pos,size,top));

		p = pbuf_alloc(PBUF_RAW,size,PBUF_POOL);
		if(p) {
			for(tmp=p;tmp!=NULL;tmp=tmp->next) {
				size = tmp->len;

				bba_select();
				bba_insregister(pos);
				if((pos+size)<top) {
					bba_insdata_fast(tmp->payload,size);
				} else {
					s32 chunk_size = (top-pos);

					size -= chunk_size;
					pos = (BBA_INIT_RRP<<8);
					bba_insdata_fast(tmp->payload,chunk_size);
					bba_deselect();
					bba_select();
					bba_insregister(pos);
					bba_insdata_fast(tmp->payload+chunk_size,size);
				}
				bba_deselect();
				pos += size;
			}
			dev->input(p,dev);
		} else
			break;

		recvd++;
		bba_out12(BBA_RRP,(rrp=cur_descr.next_packet_ptr));
		rwp = bba_in12(BBA_RWP);
	}
	if(priv->flag&BBA_IR_RBFI) {
		priv->flag &= ~BBA_IR_RBFI;
		bba_out8(BBA_IMR,(bba_in8(BBA_IMR)|BBA_IMR_RBFIM));
	}

	LWIP_DEBUGF(NETIF_DEBUG,("bba_start_rx(rx interrupt close)\n"));
	return ERR_OK;
}

static inline void bba_interrupt(struct netif *dev)
{
	u8 ir,imr,status,lrps,ltps;
	struct bba_priv *priv = (struct bba_priv*)dev->state;

	ir = bba_in8(BBA_IR);
	imr = bba_in8(BBA_IMR);
	status = ir&imr;
	while(status) {
		LWIP_DEBUGF(NETIF_DEBUG,("bba_interrupt(%02x)\n",status));
		bba_out8(BBA_IR,status);
		if(status&BBA_IR_RBFI) {
			bba_out8(BBA_IMR,(bba_in8(BBA_IMR)&~BBA_IMR_RBFIM));
			priv->flag |= BBA_IMR_RBFIM;
		}
		if(status&(BBA_IR_RI|BBA_IR_RBFI)) {
			bba_start_rx(dev,0x20);
		}
		if(status&(BBA_IR_TI|BBA_IR_FIFOEI)) {
			__bba_tx_wake(priv);
		}
		if(status&(BBA_IR_RBFI|BBA_IR_REI)) {
			lrps = bba_in8(BBA_LRPS);
			__bba_rx_err(lrps,priv);
		}
		if(status&BBA_IR_TEI) {
			ltps = bba_in8(BBA_LTPS);
			__bba_tx_err(ltps,priv);
			__bba_tx_wake(priv);
		}
		if(status&BBA_IR_FRAGI) {
			LWIP_DEBUGF(NETIF_DEBUG,("bba_interrupt(BBA_IR_FRAGI)\n"));
		}
		if(status&BBA_IR_FIFOEI) {
			LWIP_DEBUGF(NETIF_DEBUG,("bba_interrupt(BBA_IR_FIFOEI)\n"));
		}
		if(status&BBA_IR_BUSEI) {
			LWIP_DEBUGF(NETIF_DEBUG,("bba_interrupt(BBA_IR_BUSEI)\n"));
		}

		ir = bba_in8(BBA_IR);
		imr = bba_in8(BBA_IMR);
		status = ir&imr;
	}
	LWIP_DEBUGF(NETIF_DEBUG,("bba_interrupt(exit)\n"));
}

static err_t __bba_init(struct netif *dev)
{
	u8 nwayc;
	struct bba_priv *priv = (struct bba_priv*)dev->state;

	if(!priv) return ERR_IF;

	LWIP_DEBUGF(NETIF_DEBUG,("initializing BBA...\n"));
	bba_cmd_out8(0x02,BBA_CMD_IRMASKALL);

	__bba_reset();

	priv->revid = bba_cmd_in8(0x01);

	bba_cmd_outs(0x04,&priv->devid,2);
	bba_cmd_out8(0x05,priv->acstart);

	/* Assume you are being started by something which has fucked NWAY!
	   So reset to power on defaults for SIACTRL/SIACONN */
	bba_out8(0x58, 0x80);
	bba_out8(0x59, 0x00);
	bba_out8(0x5a, 0x03);
	bba_out8(0x5b, 0x83);
	bba_out8(0x5c, 0x32);
	bba_out8(0x5d, 0xfe);
	bba_out8(0x5e, 0x1f);
	bba_out8(0x5f, 0x1f);
	udelay(100);

	__bba_recv_init();

	/* This doesn't set the speed anymore - it simple kicks off NWAY */
	nwayc = bba_in8(BBA_NWAYC)&0xc0;
	bba_out8(BBA_NWAYC,nwayc);
	udelay(100);
	nwayc |= 0x04;
	bba_out8(BBA_NWAYC,nwayc);
	udelay(100);
	nwayc |= 0x08;
	bba_out8(BBA_NWAYC,nwayc);
	udelay(100);

	bba_ins(BBA_NAFR_PAR0,priv->ethaddr->addr, 6);
	LWIP_DEBUGF(NETIF_DEBUG,("MAC ADDRESS %02x:%02x:%02x:%02x:%02x:%02x\n",
		priv->ethaddr->addr[0], priv->ethaddr->addr[1], priv->ethaddr->addr[2],
		priv->ethaddr->addr[3], priv->ethaddr->addr[4], priv->ethaddr->addr[5]));

	bba_out8(BBA_IR,0xFF);
	bba_out8(BBA_IMR,0xFF&~BBA_IMR_FIFOEIM);

	bba_cmd_out8(0x02,BBA_CMD_IRMASKNONE);

	return ERR_OK;
}

static err_t bba_init_one(struct netif *dev)
{
	struct bba_priv *priv = (struct bba_priv*)dev->state;

	if(!priv) return ERR_IF;

	priv->revid = 0xf0;
	priv->devid = 0xD107;
	priv->acstart = 0x4E;

	__bba_init(dev);

	return ERR_OK;
}

static err_t bba_probe(struct netif *dev)
{
	u32 cid;
	err_t ret;

	cid = __bba_read_cid();
	if(cid!=BBA_CID) return ERR_NODEV;

	ret = bba_init_one(dev);
	return ret;
}

static u32 bba_calc_response(struct bba_priv *priv,u32 val)
{
	u8 i0,i1,i2,i3;
	u8 c0,c1,c2,c3;
	u8 revid_0,revid_eth_0,revid_eth_1;

	revid_0 = priv->revid;
	revid_eth_0 = _SHIFTR(priv->devid,8,8);
	revid_eth_1 = _SHIFTR(priv->devid,0,8);

	i0 = _SHIFTR(val,24,8);
	i1 = _SHIFTR(val,16,8);
	i2 = _SHIFTR(val, 8,8);
	i3 = _SHIFTR(val, 0,8);

	c0 = ((i0+i1*0xc1+0x18+revid_0)^(i3*i2+0x90))&0xff;
	c1 = ((i1+i2+0x90)^(c0+i0-0xc1))&0xff;
	c2 = ((i2+0xc8)^(c0+((revid_eth_0+revid_0*0x23)^0x19)))&0xff;
	c3 = ((i0+0xc1)^(i3+((revid_eth_1+0xc8)^0x90)))&0xff;

	return ((c0<<24)|(c1<<16)|(c2<<8)|c3);
}

static s32 bba_event_handler(s32 nChn,s32 nDev)
{
	u8 status;
	struct bba_priv *priv = (struct bba_priv*)gc_netif->state;

	if(EXI_Lock(EXI_CHANNEL_0,EXI_DEVICE_2,bba_event_handler)==0) {
		LWIP_DEBUGF(NETIF_DEBUG|1,("bba_event_handler(exi locked)\n"));
		return 1;
	}

	status = bba_cmd_in8(0x03);
	bba_cmd_out8(0x02,BBA_CMD_IRMASKALL);

	LWIP_DEBUGF(NETIF_DEBUG,("bba_event_handler(status(%02x))\n",status));

	if(status&0x80) {
		LWIP_DEBUGF(NETIF_DEBUG,("bba_event_handler(bba_interrupt(%02x))\n",status));
		bba_interrupt(gc_netif);
		bba_cmd_out8(0x03,0x80);
		bba_cmd_out8(0x02,BBA_CMD_IRMASKNONE);
		EXI_Unlock(EXI_CHANNEL_0);
		return 1;
	}
	if(status&0x40) {
		LWIP_ERROR(("bba_event_handler(bba_reset(%02x))\n",status));
		__bba_init(gc_netif);
		bba_cmd_out8(0x03, 0x40);
		bba_cmd_out8(0x02, BBA_CMD_IRMASKNONE);
		EXI_Unlock(EXI_CHANNEL_0);
		return 1;
	}
	if(status&0x20) {
		LWIP_DEBUGF(NETIF_DEBUG,("bba_event_handler(unknown(%02x))\n",status));
		bba_cmd_out8(0x03, 0x20);
		bba_cmd_out8(0x02, BBA_CMD_IRMASKNONE);
		EXI_Unlock(EXI_CHANNEL_0);
		return 1;
	}
	if(status&0x10) {
		u32 response,challange;
		LWIP_DEBUGF(NETIF_DEBUG,("bba_event_handler(challange/response(%02x))\n",status));
		bba_cmd_out8(0x05,priv->acstart);
		bba_cmd_ins(0x08,&challange,sizeof(challange));
		response = bba_calc_response(priv,challange);
		bba_cmd_outs(0x09,&response,sizeof(response));

		bba_cmd_out8(0x03, 0x10);
		bba_cmd_out8(0x02, BBA_CMD_IRMASKNONE);
		EXI_Unlock(EXI_CHANNEL_0);
		return 1;
	}
	if(status&0x08) {
		LWIP_DEBUGF(NETIF_DEBUG,("bba_event_handler(challange/response status(%02x))\n",bba_cmd_in8(0x0b)));
		bba_cmd_out8(0x03, 0x08);
		bba_cmd_out8(0x02, BBA_CMD_IRMASKNONE);
		EXI_Unlock(EXI_CHANNEL_0);
		return 1;
	}
	LWIP_ERROR(("GCIF - EXI - ?? %02x\n", status));
	bba_interrupt(gc_netif);
	bba_cmd_out8(0x02,BBA_CMD_IRMASKNONE);
	EXI_Unlock(EXI_CHANNEL_0);
	return 1;
}

err_t bba_init(struct netif *dev)
{
	err_t ret;
	struct bba_priv *priv = (struct bba_priv*)dev->state;

	__bba_exi_stop(priv);

	LWIP_DEBUGF(NETIF_DEBUG, ("bba_init(call EXI_RegisterEXICallback())\n"));
	EXI_RegisterEXICallback(EXI_CHANNEL_2,bba_event_handler);

	ret = bba_probe(dev);
	if(ret!=ERR_OK) {
		EXI_RegisterEXICallback(EXI_CHANNEL_2,NULL);
		__bba_exi_wake(priv);
		return ret;
	}

	ret = __bba_get_linkstateasync(priv);
	if(ret) {
		dev->flags |= NETIF_FLAG_LINK_UP;
		ret = ERR_OK;
	} else {
		EXI_RegisterEXICallback(EXI_CHANNEL_2,NULL);
		ret = ERR_IF;
	}

	__bba_exi_wake(priv);
	return ret;
}

dev_s bba_create(struct netif *dev)
{
	struct bba_priv *priv = NULL;

	LWIP_DEBUGF(NETIF_DEBUG, ("bba_create()\n"));

	priv = (struct bba_priv*)mem_malloc(sizeof(struct bba_priv));
	if(!priv) {
		LWIP_ERROR(("bba_create: out of memory for bba_priv\n"));
		return NULL;
	}
	memset(priv,0,sizeof(struct bba_priv));

	LWP_InitQueue(&priv->tq_xmit);
	LWP_InitQueue(&wait_exi_queue);

	dev->name[0] = IFNAME0;
	dev->name[1] = IFNAME1;
	dev->output = __bba_start_tx;
	dev->linkoutput = __bba_link_tx;
	dev->mtu = 1500;
	dev->flags = NETIF_FLAG_BROADCAST;
	dev->hwaddr_len = 6;

	priv->ethaddr = (struct eth_addr*)&(dev->hwaddr[0]);
	priv->state = ERR_OK;

	gc_netif = dev;
	return priv;
}