#include <linux/init.h>
#include <linux/module.h>
#include <linux/device.h>
#include <linux/interrupt.h>
#include <linux/mutex.h>
#include <linux/delay.h>
#include <linux/sched.h>
#include <linux/slab.h>
#include <linux/mtd/mtd.h>
#include <linux/mtd/map.h>
#include <linux/mtd/partitions.h>
#include <linux/spi/flash.h>
#include <linux/version.h>
#include "bspchip.h"

#define SPI_FEAT_0705	0

#define SFCR_DIV(x)	  ((x&7) << 29)
#define SFCR_RBO_BE	  (1 << 28)
#define SFCR_WBO_BE	  (1 << 27)
#define SFCR_TCS(x)   (((x)&0x1f) << 22)

#define CSNONE		  3
#define CS0			  1
#define CS1			  2

#define SFCSR_CS(x)	  ((x) << 30)
#define SFCSR_LEN(x)  (((x)&3) << 28)
#define SFCSR_RDY     (1<<27)
#define SFCSR_IDLE    (1<<4)

/* REVISION
   1.0.000 
     Initial version
 */
#define SPI_DRV_VERSION "1.0.000"


#define dbg(fmt, arg...) //printk(fmt, ##arg)
/* Flash opcodes. */
#define	OPCODE_RDSR		0x05	/* Read status register */
#define	OPCODE_WRSR		0x01	/* Write status register 1 byte */
#define	OPCODE_RDID		0x9f	/* Read JEDEC ID */

/* Used for Macronix flashes only. */
#define OPCODE_EN4B             0xb7    /* Enter 4-byte mode */
#define OPCODE_EX4B             0xe9    /* Exit 4-byte mode */

/* Status Register bits. */
#define	SR_WIP			1	/* Write in progress */
#define	SR_WEL			2	/* Write enable latch */

#define	MAX_READY_WAIT_JIFFIES	(10 * HZ)

#define CS_LOW_DELAY (udelay(3)) /* 2.4us is the worst case scenario according to designer's calculation */
#define JEDEC_MFR(_jedec_id)    ((_jedec_id) >> 16)
#define ADDR4B_OP(f)	((f)&6)
/****************************************************************************/

struct flash_info;
struct rtk_flash_dev;

struct spi_chip_cmd {
	u8 cREAD;
	u8 cFREAD;
	u8 cPP;
	u8 cSE;
	u8 cBE32K;
	u8 cBE;
	u8 cCE;
	u8 cWREN;
	u8 cWRDI;
	/* special 4B commands */
	u8 cREAD4;
	u8 cFREAD4;
	u8 cPP4;
	u8 cSE4;
	u8 cBE32K4;
	u8 cBE4;	
};

/* Generic Command Sets */
static const struct spi_chip_cmd generic_cmd = {
	/* READ  */.cREAD = 0x03, .cFREAD = 0x0B,
	           .cREAD4 = 0x13, .cFREAD4 = 0x0C,
	/* WRITE */.cPP = 0x02, 
	           .cPP4 = 0x12,
	/* ERASE */.cSE = 0x20, .cBE32K = 0x52, .cBE = 0xD8, .cCE = 0xC7,
	           .cSE4 = 0x21, .cBE32K4 = 0x5C, .cBE4 = 0xDC, 
	/* OTHER */.cWREN = 0x06, .cWRDI = 0x04
};

static const struct spi_chip_cmd generic_cmd3 = {
	/* READ  */.cREAD = 0x03, .cFREAD = 0x0B,	           
	/* WRITE */.cPP = 0x02, 	           
	/* ERASE */.cSE = 0x20, .cBE32K = 0x52, .cBE = 0xD8, .cCE = 0xC7,	           
	/* OTHER */.cWREN = 0x06, .cWRDI = 0x04
};


struct spi_chip_ops {
	int (*read)(struct rtk_flash_dev *, u32 from, u8 *buf, u32 buflen);	
	int (*write)(struct rtk_flash_dev *, u32 to, const u8 *buf, u32 buflen);
	int (*erase_4k)(struct rtk_flash_dev *, u32 addr);
	int (*erase_32k)(struct rtk_flash_dev *, u32 addr);
	int (*erase)(struct rtk_flash_dev *, u32 addr);
	int (*erase_chip)(struct rtk_flash_dev *);
	int (*switch_4b)(struct rtk_flash_dev *, int);
	int (*read_status)(struct rtk_flash_dev *, u8 *status);
	int (*write_status)(struct rtk_flash_dev *, u8 *status);
	int (*write_enable)(struct rtk_flash_dev *, int);
};

#define GEN_INFO(_name, _jedec_id, _ext_id, _sector_size, _n_sectors)	{\
	.name = (_name),				\
	.jedec_id = (_jedec_id),		\
	.ext_id = (_ext_id),			\
	.sector_size = (_sector_size),	\
	.n_sectors = (_n_sectors),		\
	.page_size = 256,				\
	.cmd = &generic_cmd3,			\
	.ops = &generic_ops				\
}

#define GEN_INFO_1(_name, _jedec_id, _ext_id, _sector_size, _n_sectors, cmdtbl)	{\
	.name = (_name),				\
	.jedec_id = (_jedec_id),		\
	.ext_id = (_ext_id),			\
	.sector_size = (_sector_size),	\
	.n_sectors = (_n_sectors),		\
	.page_size = 256,				\
	.cmd = &cmdtbl,			\
	.ops = &generic_ops				\
}

struct flash_info {
	char		*name;
	u32	 jedec_id;
	u16  ext_id;
	u32	 sector_size;
	u16	 n_sectors;
	u16  page_size;

	const struct spi_chip_cmd *cmd;
	const struct spi_chip_ops *ops;	
};

struct spi_req {
	u8		chip;
	u8 		cmd;	
	u8		dummy_len;
	u8		is_read;
	u8 		addr_len;
	u32 	addr;	
	u8		*data;
	u32 	data_len;
};

struct rtk_flash_dev {
	int chip;
	struct mutex	 lock;
	struct mtd_info	 mtd;
	u16				 page_size;
	u8               addr_width;
	
	u8				 op_read;
	u8				 op_write;
	u8				 op_erase4k;
	u8				 op_erase32k;
	u8				 op_erase;
	u8				 op_erase_chip;
	
	u8				 read_dummy;
	u8			     command[8];
	
	char			 allow_mode;
	char			 use_quadio;
	
	const struct spi_chip_cmd *cmd;
	const struct spi_chip_ops *ops;
};

static inline struct rtk_flash_dev *mtd_to_flashinfo(struct mtd_info *mtd)
{
	return container_of(mtd, struct rtk_flash_dev, mtd);
}

static void rtk_spi_reg_init(void) {
	#if 0 
	REG32(BSP_SFCR) = (REG32(BSP_SFCR) & 0x3fffff) | SFCR_RBO_BE | SFCR_WBO_BE |
		SFCR_DIV(2) |  /* SPI_clock = DRAM clock(e.g.166)/DIV  */
		SFCR_TCS(15);
	#endif
	/* Assume bootloader or other has setup for us */
	
	printk("SFCR: %08x  SFCR2: %08x\n", REG32(BSP_SFCR), REG32(BSP_SFCR2));
}

static void rspi_busy_wait_ready(void) {
	#if SPI_FEAT_0705
	unsigned int total = 0;
	#define READY_MASK (SFCSR_IDLE|SFCSR_RDY)
	while ((REG32(BSP_SFCSR)&READY_MASK)!=READY_MASK) {
		total++;
		if (unlikely(total >= 1000000)) {
			printk("SPI jam? RDY=0 for too long\n"); 
			BUG();
		}
	}
	#else
	/* Need to get 100 consecutive RDY before we know HW is really ready */
	int i = 0, ready = 0, total = 0;
	while (!ready) {
		
		if ((REG32(BSP_SFCSR) & SFCSR_RDY)) {
			i++;
		} else {
			i = 0;
		}
		total++;		
		if (unlikely(total >= 1000000)) {
			printk("SPI jam? RDY=0 for too long\n"); 
			BUG();
		}		
		if (unlikely(i >= 100))
			ready = 1;
	}	
	#endif
}

u32 __attribute__((weak)) bsp_spif_mmio_copy(void* to, loff_t from, u32 len) {
	printk_once("rtk_spi: missing bsp_spif_mmio_copy\n");
	return 0;
}

void __attribute__((weak)) bsp_spif_mmio_inv(u32 from, u32 len) {
	printk_once("rtk_spi: missing bsp_spif_mmio_inv\n");
}

static void flush_prediction(volatile unsigned int x) {
	if (x>1)
		flush_prediction(x-1);
}

#define DEBUG_CMD 0
static inline void debug_print_cmd(u8 *cmd, int cmdlen, const char *msg) {
	int i;
	if (DEBUG_CMD) {
		if (cmdlen > 16)
			cmdlen = 16;
		printk("%s CMD: ", msg);
		for (i=0; i<cmdlen; i++)
			printk("%02x ", cmd[i]);
		printk("\n");
	}
}

static inline void debug_print_request(struct spi_req *req) {	
	if (DEBUG_CMD) {
		printk("Req %02x ",req->cmd);
		if (req->addr_len)
			printk(" addr=%x(%d) ",req->addr,req->addr_len);
		if (req->dummy_len)
			printk(" dummy=%d ",req->dummy_len);
		printk("\n");
	}
}

static void rtk_spi_pio(void) {	
	flush_prediction(10);
	rspi_busy_wait_ready();	
	REG32(BSP_SFCSR) = SFCSR_LEN(0) | SFCSR_CS(CSNONE) | SFCSR_RDY;
	rspi_busy_wait_ready();	
	REG32(BSP_SFCSR) = SFCSR_LEN(0) | SFCSR_CS(0) | SFCSR_RDY;
	CS_LOW_DELAY; 
	REG32(BSP_SFCSR) = SFCSR_LEN(0) | SFCSR_CS(CSNONE) | SFCSR_RDY;			
	rspi_busy_wait_ready();	
}

static int rtkspi_request(struct spi_req *req) {
	/* sanity check */
	if (req->addr_len && ((req->addr_len > 4) || (req->addr_len < 3))) {
		printk("Invalide address length(%d)\n",req->addr_len);
		return -1;
	}
	
	if (req->dummy_len > 4) {
		printk("Dummy length not supported(%d)\n",req->dummy_len);
		return -1;
	}
	
	debug_print_request(req);
	
	rtk_spi_pio();
	/* command phase */
	REG32(BSP_SFCSR) = SFCSR_CS(req->chip) | SFCSR_LEN(0) | SFCSR_RDY;
	rspi_busy_wait_ready();	
	REG32(BSP_SFDR) = req->cmd << 24;
	rspi_busy_wait_ready();	
	
	/* address phase */
	if (req->addr_len) {		
		REG32(BSP_SFCSR) = SFCSR_CS(req->chip) | SFCSR_LEN(req->addr_len - 1) | SFCSR_RDY;
		rspi_busy_wait_ready();	
		REG32(BSP_SFDR) = (req->addr_len==3) ? (req->addr << 8) : req->addr;		
		rspi_busy_wait_ready();	
	}
	
	if (req->dummy_len) {				
		REG32(BSP_SFCSR) = SFCSR_CS(req->chip) | SFCSR_LEN(req->dummy_len - 1) | SFCSR_RDY;
		rspi_busy_wait_ready();	
		REG32(BSP_SFDR) = 0;
		rspi_busy_wait_ready();	
	}
	
	/* data phase */
	if (req->data_len) {
		u32 len = req->data_len;
		u8  *buf = req->data;

		while (len) {
			u32 word, to_access;
			to_access = (len > 4) ? 4 : len;
			REG32(BSP_SFCSR) = SFCSR_CS(req->chip) | SFCSR_LEN(to_access - 1) | SFCSR_RDY;
			word = 0;
			rspi_busy_wait_ready();	
			if (req->is_read) {
				word = REG32(BSP_SFDR);				
				memcpy(buf, &word, to_access);
			} else {
				memcpy(&word, buf, to_access);
				REG32(BSP_SFDR) = word;
			}			
			buf += to_access;
			len -= to_access;
			rspi_busy_wait_ready();	
		}
	}
	
	/* close */
	CS_LOW_DELAY;//rspi_busy_wait_ready();
	REG32(BSP_SFCSR) = SFCSR_CS(CSNONE);
	return 0;
}

static int rtkspi_cmd(struct rtk_flash_dev *f, u8 cmd)  {
	struct spi_req req;
	memset(&req, 0, sizeof(req));
	req.chip = f->chip;
	req.cmd  = cmd;
	return rtkspi_request(&req);
}

static int rtkspi_cmd_addr(struct rtk_flash_dev *f, u8 cmd, u32 addr) {
	struct spi_req req;
	memset(&req, 0, sizeof(req));
		
	req.chip = f->chip;
	req.cmd  = cmd;
	req.addr = addr;
	req.addr_len  = f->addr_width;
	//req.dummy_len = f->read_dummy;	
	req.data_len = 0;
	
	return rtkspi_request(&req);
}

static int rtkspi_cmd_read(struct rtk_flash_dev *f, u8 cmd, u8 *data, u32 data_len) {
	struct spi_req req;
	memset(&req, 0, sizeof(req));
		
	req.chip = f->chip;
	req.cmd  = cmd;
	req.data = data;
	req.data_len = data_len;
	req.is_read = 1;
	
	return rtkspi_request(&req);
}

static int rtkspi_cmd_addr_write(struct rtk_flash_dev *f, u8 cmd, u32 addr, const u8 *data, u32 data_len) {
	struct spi_req req;
	memset(&req, 0, sizeof(req));
		
	req.chip = f->chip;
	req.cmd  = cmd;
	req.addr = addr;
	req.addr_len  = f->addr_width;	
	req.data = (u8 *)data;
	req.data_len = data_len;	
	return rtkspi_request(&req);
}

/***************************************************************************
GENERIC TEMPLATES - MXIC like 
***************************************************************************/
static inline int setup_cmd_addr_dummy(struct rtk_flash_dev *f, u8 cmd, u32 addr, int dummy) {
	int cmdsiz = 0;
	
	f->command[cmdsiz++] = cmd; 
	if (4==f->addr_width) 
		f->command[cmdsiz++] = (0xff & (addr >> 24)); 
	f->command[cmdsiz++] = (0xff & (addr >> 16)); 
	f->command[cmdsiz++] = (0xff & (addr >> 8)); 
	f->command[cmdsiz++] = (0xff & (addr >> 0)); 
	if (dummy)
		f->command[cmdsiz++] = 0; 
	return cmdsiz;
}


static int generic_wait_till_ready(struct rtk_flash_dev *f)
{
	unsigned long deadline;
	u8 status;
	deadline = jiffies + MAX_READY_WAIT_JIFFIES;

	do {
		if (f->ops->read_status(f, &status) != 0)
			break;
		else if (!(status & SR_WIP))
			return 0;

		cond_resched();

	} while (!time_after_eq(jiffies, deadline));

	return 1;
}

static int generic_read(struct rtk_flash_dev *f, u32 from, u8 *buf, u32 buflen) {
	struct spi_req req;
	memset(&req, 0, sizeof(req));
		
	if ((from + buflen) > f->mtd.size) { /* trim extra */
		buflen = f->mtd.size - from;
	}
	req.chip = f->chip;
	req.cmd  = f->op_read;
	req.addr = from;
	req.addr_len  = f->addr_width;
	req.dummy_len = f->read_dummy ? 1 : 0;
	req.data = buf;
	req.data_len = buflen;
	req.is_read = 1;
		
	if (!rtkspi_request(&req)) {
		return buflen;
	}
	return 0;	
}

static int generic_write(struct rtk_flash_dev *f, u32 to, const u8 *buf, u32 buflen) {	
	u32 page_offset, page_size;
	struct spi_req req;
		
	if ((to + buflen) > f->mtd.size) { /* trim extra */
		buflen = f->mtd.size - to;
	}
	
	memset(&req, 0, sizeof(req));
	
	/* what page do we start with? */
	page_offset = to & (f->page_size - 1);	
	f->ops->write_enable(f, 1);
	
	/* do all the bytes fit onto one page? */
	if (page_offset + buflen <= f->page_size) {			
		rtkspi_cmd_addr_write(f, f->op_write, to, buf, buflen);
		generic_wait_till_ready(f);
	} else {
		u32 i;
		
		/* the size of data remaining on the first page */
		page_size = f->page_size - page_offset;		
		rtkspi_cmd_addr_write(f, f->op_write, to, buf, page_size);
		
		/* write everything in PAGESIZE chunks */
		for (i = page_size; i < buflen; i += page_size) {
			page_size = buflen - i;
			if (page_size > f->page_size)
				page_size = f->page_size;
						
			generic_wait_till_ready(f);			
			f->ops->write_enable(f, 1);			
			rtkspi_cmd_addr_write(f, f->op_write, to+i, buf+i, page_size);			
		}
		generic_wait_till_ready(f);
	}	

	return buflen;
}

static int __generic_erase_xxk(struct rtk_flash_dev *f, u8 code, u32 addr) {
	f->ops->write_enable(f, 1);
	rtkspi_cmd_addr(f, code, addr);
	if (generic_wait_till_ready(f))
		return -1;
	
	return 0;
}

static int generic_erase_4k(struct rtk_flash_dev *f, u32 addr) {	
	return __generic_erase_xxk(f, f->op_erase4k, addr);	
}

static int generic_erase_32k(struct rtk_flash_dev *f, u32 addr) {
	return __generic_erase_xxk(f, f->op_erase32k, addr);
}

static int generic_erase(struct rtk_flash_dev *f, u32 addr) {
	return __generic_erase_xxk(f, f->op_erase, addr);	
}

static int generic_erase_chip(struct rtk_flash_dev *f) {
		
	if (generic_wait_till_ready(f))
		return 1;	
	f->ops->write_enable(f, 1);
	rtkspi_cmd(f, f->op_erase_chip);
	return 0;
}

static int generic_read_status(struct rtk_flash_dev *f, u8 *status) {
	int retval;
	retval = rtkspi_cmd_read(f, OPCODE_RDSR, status, 1);

	if (retval < 0) {
		printk(KERN_ERR "error %d reading SR\n",
				(int) retval);
		return 1;
	}

	return 0;	
}

static int generic_switch_4b(struct rtk_flash_dev *f, int to4b) {
	u8	code = to4b ? OPCODE_EN4B : OPCODE_EX4B;

	return rtkspi_cmd(f, code);
}

static int generic_write_enable(struct rtk_flash_dev *f, int enable)
{
	u8	code = enable ? f->cmd->cWREN : f->cmd->cWRDI;

	return rtkspi_cmd(f, code);
}


static const struct spi_chip_ops generic_ops = {
	.read 	= generic_read,
	.write 	= generic_write,
	.erase_4k = generic_erase_4k,
	.erase_32k = generic_erase_32k,
	.erase = generic_erase,
	.erase_chip = generic_erase_chip,
	.read_status = generic_read_status,	
	.write_enable = generic_write_enable,
	.switch_4b = generic_switch_4b,
};

/****************************************************************************/

 
/****************************************************************************/

/*
 * MTD implementation
 */
static int rtk_mtd_erase(struct mtd_info *mtd, struct erase_info *instr)
{
	struct rtk_flash_dev *flash = mtd_to_flashinfo(mtd);
	u32 addr,len;
	uint32_t rem;
	
	pr_debug("%s %s 0x%llx, len %lld\n",
	      __func__, "at", (long long)instr->addr, (long long)instr->len);

	/* sanity checks */
	if (instr->addr + instr->len > flash->mtd.size)
		return -EINVAL;
	rem = instr->len & (mtd->erasesize - 1);
	if (rem) {
		printk("Warning: %lld not multiple of erase size %d. Will pad to erase size\n", instr->len, mtd->erasesize);
		instr->len = (instr->len + (mtd->erasesize - 1)) & ~(mtd->erasesize - 1);
		//return -EINVAL;
	}

	addr = instr->addr;
	len = instr->len;
	
	mutex_lock(&flash->lock);

	/* whole-chip erase? */
	if (len == flash->mtd.size) {
		if (flash->ops->erase_chip(flash)) {
			instr->state = MTD_ERASE_FAILED;
			mutex_unlock(&flash->lock);
			return -EIO;
		}	
	} else {
		
		while (len) {
			u32 incr;
			int ret;
			ret = -1;
			if (flash->ops->erase && (len >= 0x10000) && (0==(addr & 0xffff))) { /* can block erase */
				incr = 0x10000;
				ret = flash->ops->erase(flash, addr);
			}
			#if 0 /* Winbond erase_32k command isn't well supported */
			else if (flash->ops->erase_32k && (len >= 0x8000) && (0==(addr & 0x7fff))) {
				incr = 0x8000;
				ret = flash->ops->erase_32k(flash, addr);
			} 
			#endif
			else if (flash->ops->erase_4k && (len >= 0x1000) && (0==(addr & 0xfff))) {
				incr = 0x1000;
				ret = flash->ops->erase_4k(flash, addr);				
			}		
			
			if (ret) {
				instr->state = MTD_ERASE_FAILED;
				mutex_unlock(&flash->lock);
				return -EIO;
			}

			addr +=incr;
			len -= incr;
		}
	}

	bsp_spif_mmio_inv(instr->addr, instr->len);
	mutex_unlock(&flash->lock);	
	instr->state = MTD_ERASE_DONE;
	mtd_erase_callback(instr);

	return 0;
}

static int rtk_mtd_read(struct mtd_info *mtd, loff_t from, size_t len,
	size_t *retlen, u_char *buf)
{
	struct rtk_flash_dev *flash = mtd_to_flashinfo(mtd);
	size_t ret;	
			
	pr_debug("%s %s 0x%llx, len %lld\n",
	      __func__, "from", (long long)from, (long long)len);

	/* sanity checks */
	if (!len)
		return 0;

	if (from + len > flash->mtd.size)
		return -EINVAL;

	if (retlen)
		*retlen = 0;

	mutex_lock(&flash->lock);/* Wait till previous write/erase is done. */
		
	/* let HW do partial work for us */	
	ret = bsp_spif_mmio_copy(buf, from, len);	
	//printk("%llx: %02x %02x %02x %02x \n",from,buf[0],buf[1],buf[2],buf[3]);
	if (unlikely(ret<len)) {				
		len  -= ret;
		from += ret;
		buf  += ret;
		ret  += flash->ops->read(flash, from, buf, len);
	}
	
	*retlen = ret;

	mutex_unlock(&flash->lock);

	return 0;
}
 
static int rtk_mtd_write(struct mtd_info *mtd, loff_t to, size_t len,
	size_t *retlen, const u_char *buf)
{
	struct rtk_flash_dev *flash = mtd_to_flashinfo(mtd);
	size_t ret;

	dbg("%s %s 0x%llx, len %lld\n",
	      __func__, "to", (long long)to, (long long)len);
		  
	if (retlen)
		*retlen = 0;

	/* sanity checks */
	if (!len)
		return(0);

	if (to + len > flash->mtd.size)
		return -EINVAL;

	mutex_lock(&flash->lock);

	/* Wait until finished previous write command. */
	if (generic_wait_till_ready(flash)) {
		mutex_unlock(&flash->lock);
		return 1;
	}
	
	ret = flash->ops->write(flash, to, buf, len);
	*retlen = ret;
	bsp_spif_mmio_inv((u32)to, ret);
	mutex_unlock(&flash->lock);

	return 0;
}

static struct flash_info /*__initdata*/ rtk_flash_data [] = {
	/* Mxic */
	GEN_INFO  ("MX25L64" , 0xc22017, 0, 64*1024, 128),
	GEN_INFO  ("MX25L128", 0xc22018, 0, 64*1024, 256), /* checked */
	GEN_INFO_1("MX25L256", 0xc22019, 0, 64*1024, 512, generic_cmd), /* MX25L256F */
	//GEN_INFO_1("MX25L256", 0xc22019, 0, 64*1024, 512, generic_cmd3),	/* MX25L256E - not recommended */

	/* Winbond */
	GEN_INFO  ("W25Q64",   0xef4017, 0, 64*1024, 128),
	GEN_INFO  ("W25Q128",  0xef4018, 0, 64*1024, 256),
	GEN_INFO_1("W25Q256",  0xef4019, 0, 64*1024, 512, generic_cmd), /* W25Q256JV */
	
	/* Gigadevice */
	GEN_INFO_1("GD25Q512MC", 0xc84020, 0, 64*1024, 512, generic_cmd),

	/* Micron */
	GEN_INFO_1("MT25QL256", 0x20ba19, 0, 64*1024, 512, generic_cmd),
};

static struct flash_info *__init flash_id_probe(struct rtk_flash_dev *f)
{
	int			tmp;
	u8			id[5];
	u32			flash_id;
	u16                     ext_jedec;
	struct flash_info	*info;
	
	static struct flash_info	s_info;
	static char s_name[32];
	
	rtkspi_cmd_read(f, OPCODE_RDID, id, sizeof(id));
	
	flash_id = (id[0] << 16) | (id[1] << 8) | id[2];
	ext_jedec = id[3] << 8 | id[4];
	
	for (tmp = 0, info = rtk_flash_data;
			tmp < ARRAY_SIZE(rtk_flash_data);
			tmp++, info++) {
		if (info->jedec_id == flash_id) {
			if (info->ext_id != 0 && info->ext_id != ext_jedec)
				continue;
			return info;
		}
	}
	
	/* try our best guess here. */
	info = NULL;
	memset((void*)&s_info, 0,sizeof(s_info)); 
	s_name[0]='\0';	
	switch (id[0]) {
	case 0xc2: /* MXIC */
		snprintf(s_name, sizeof(s_name)-1, "MXIC-%02x%02x%02x(auto)",id[0],id[1],id[2]);
		info = &s_info;
		break;
	case 0xef: /* Winbond */
		if (id[2]>=0x19) /* need to check if 32M+ is supported. */
			break;
		snprintf(s_name, sizeof(s_name)-1, "Winbond-%02x%02x%02x(auto)",id[0],id[1],id[2]);
		info = &s_info;
		break;	
	}
	
	if (info) {
		info->name = s_name;		
		info->jedec_id = flash_id;
		info->sector_size = 64*1024;
		info->n_sectors = 1 << (id[2] - 16); 
		info->page_size = 256;
		info->ops = &generic_ops;
		info->cmd = (info->n_sectors>=512) ? &generic_cmd : &generic_cmd3;
		return info;
	}
	
	printk("unrecognized flash id %06x\n", flash_id);
	return NULL;
}

static int is_support_4b_cmd(struct flash_info *info) {	
	if ((0==info->cmd->cREAD4) || (0==info->cmd->cBE4) || (0==info->cmd->cPP4))
		return 0;
	return 1;
}

static struct mtd_info * rtk_spi_probe(struct map_info *map)
{
	struct rtk_flash_dev			*flash;
	struct flash_info		*info;
	unsigned			i;

	rtk_spi_reg_init();
	rtk_spi_pio();

	flash = kzalloc(sizeof *flash, GFP_KERNEL);
	if (!flash)
		return 0;

	mutex_init(&flash->lock);
	map->fldrv_priv = (void *)flash;
		
	flash->chip = CS0;
	
	info = flash_id_probe(flash);

	if (!info) {
		kfree(flash);
		return 0;
	}
	
	flash->mtd.name = map->name;
	flash->mtd.type = MTD_NORFLASH;
	flash->mtd.writesize = 1;
	flash->mtd.flags = MTD_CAP_NORFLASH;
	flash->mtd.size = info->sector_size * info->n_sectors;
	#if (LINUX_VERSION_CODE >= KERNEL_VERSION(3,0,0))
	flash->mtd._erase = rtk_mtd_erase;
	flash->mtd._write = rtk_mtd_write;
	flash->mtd._read  = rtk_mtd_read;
	#else
	flash->mtd.erase = rtk_mtd_erase;
	flash->mtd.write = rtk_mtd_write;
	flash->mtd.read  = rtk_mtd_read;
	#endif
	
	flash->page_size  = info->page_size;
	
	flash->ops = info->ops;
	flash->cmd = info->cmd;
	
	/* 4b address for 16M+ flash */
	flash->addr_width = (flash->mtd.size > 0x1000000) ? 4 : 3;
	// flash->allow_mode = 1;
	printk("%s (%lld Kbytes) ", info->name, (long long)flash->mtd.size >> 10);	
	
	/* select process - */
	flash->op_erase_chip = flash->cmd->cCE;	
	if ((4==flash->addr_width) && is_support_4b_cmd(info)) {
		printk("using 4B command set.\n");
		if (flash->cmd->cFREAD4) {
			flash->read_dummy = 1;
			flash->op_read = flash->cmd->cFREAD4;
		} else {
			flash->read_dummy = 0;
			flash->op_read = flash->cmd->cREAD4;
		}			
		flash->op_write = flash->cmd->cPP4;
		flash->op_erase = flash->cmd->cBE4;
		flash->op_erase32k = flash->cmd->cBE32K4;
		flash->op_erase4k = flash->cmd->cSE4;			
	} else {
		if (4==flash->addr_width) {
			if (!flash->allow_mode) {
				printk("4B mode not allowed!\n");
				return NULL;
			}
			if ((NULL==flash->ops->switch_4b) || (flash->ops->switch_4b(flash, 1))){
				printk("switch to 4B mode failed!\n");
				return NULL;
			}
			printk("switched to 4B mode.\n");
		} else {
			printk("using 3B command set.\n");
		}
		if (flash->cmd->cFREAD) {
			flash->read_dummy = 1;
			flash->op_read = flash->cmd->cFREAD;
		} else {
			flash->read_dummy = 0;
			flash->op_read = flash->cmd->cREAD;
		}
		flash->op_write = flash->cmd->cPP;
		flash->op_erase = flash->cmd->cBE;
		flash->op_erase32k = flash->cmd->cBE32K;
		flash->op_erase4k = flash->cmd->cSE;		
	}
		
	if (flash->ops->erase_4k) 
		flash->mtd.erasesize = 0x1000;
	else if (flash->ops->erase_32k)
		flash->mtd.erasesize = 0x8000;
	else if (flash->ops->erase)
		flash->mtd.erasesize = 0x10000;		

	pr_debug(
		"mtd .name = %s, .size = 0x%llx (%lldMiB) "
			".erasesize = 0x%.8x (%uKiB) .numeraseregions = %d\n",
		flash->mtd.name,
		(long long)flash->mtd.size, (long long)(flash->mtd.size >> 20),
		flash->mtd.erasesize, flash->mtd.erasesize / 1024,
		flash->mtd.numeraseregions);

	if (flash->mtd.numeraseregions)
		for (i = 0; i < flash->mtd.numeraseregions; i++)
			pr_debug(
				"mtd.eraseregions[%d] = { .offset = 0x%llx, "
				".erasesize = 0x%.8x (%uKiB), "
				".numblocks = %d }\n",
				i, (long long)flash->mtd.eraseregions[i].offset,
				flash->mtd.eraseregions[i].erasesize,
				flash->mtd.eraseregions[i].erasesize / 1024,
				flash->mtd.eraseregions[i].numblocks);

	return &flash->mtd;
}



static struct mtd_chip_driver rtkspi_driver = {
	.probe  = rtk_spi_probe,
	.name   = "rtkspi_probe",
	.module = THIS_MODULE
};


static int __init rtk_spi_init(void)
{
	printk("SPI Flash Driver for RTK SoC, Version " SPI_DRV_VERSION "\n");
	register_mtd_chip_driver(&rtkspi_driver);	
	return 0;
}


static void __exit rtk_spi_exit(void)
{
	unregister_mtd_chip_driver(&rtkspi_driver);	
}


module_init(rtk_spi_init);
module_exit(rtk_spi_exit);

MODULE_LICENSE("GPL");
MODULE_AUTHOR("Andrew Chang <yachang@realtek.com>");
MODULE_DESCRIPTION("SPI driver for Realtek SoC");