Excel转化成DataTable实现:NPOI和OLEDb

Posted 二奎

tags:

篇首语:本文由小常识网(cha138.com)小编为大家整理,主要介绍了Excel转化成DataTable实现:NPOI和OLEDb相关的知识,希望对你有一定的参考价值。

使用两种方式实现的excel数据转化成DataSet,再结合前一篇的DataTable转化为实体,就可以解决excel到实体之间的转化。

代码如下:

首先定义一个接口:

    public interface IExcelAccess
    {
        DataSet Load(ExcelConfig config);
    }
public class ExcelConfig
    {
        /// <summary>
        /// 文件存储路径
        /// </summary>
        public string Path { get; set; }

        /// <summary>
        /// 文件表头所在行索引
        /// </summary>
        public int HeaderIndex { get; set; }
    }

再来看一下使用NPOI的实现:

public class NpoiExcelAccess : IExcelAccess
    {
        /// <summary>
        /// 根据文件扩展名,获取workbook实例
        /// </summary>
        /// <param name="ext"></param>
        /// <returns></returns>
        private IWorkbook GetWorkBook(string ext, Stream stream)
        {
            IWorkbook workbook = null;

            switch (ext)
            {
                case ".xlsx":
                    workbook = new XSSFWorkbook(stream);
                    break;
                case ".xls":
                    workbook = new HSSFWorkbook(stream);
                    break;
                default:
                    break;
            }

            return workbook;
        }

        /// <summary>
        /// 加载数据,可设置跳过前几行
        /// </summary>
        /// <param name="path"></param>
        /// <param name="skipRows"></param>
        /// <returns></returns>
        public DataSet Load(ExcelConfig config)
        {
            using (var fileStream = new FileStream(config.Path, FileMode.Open, FileAccess.Read))
            {
                var ds = new DataSet();
                var ext = Path.GetExtension(config.Path);

                // 新建IWorkbook对象 
                var workbook = this.GetWorkBook(ext, fileStream);

                for (int i = 0; i < workbook.NumberOfSheets; i++)
                {
                    ISheet sheet = workbook.GetSheetAt(i);
                    DataTable dt = GetDataTable(sheet, config.HeaderIndex);
                    ds.Tables.Add(dt);
                }

                return ds;
            }
        }

        private DataTable GetDataTable(ISheet sheet, int headerIndex)
        {
            var dt = new DataTable();
            // 获取表头行
            var headerRow = sheet.GetRow(headerIndex);
            var cellCount = GetCellCount(sheet, headerIndex);

            // 设置表头
            for (int i = 0; i < cellCount; i++)
            {
                if (headerRow.GetCell(i) != null)
                {
                    dt.Columns.Add(headerRow.GetCell(i).StringCellValue, typeof(string));
                }
            }
            
            for (int i = headerIndex + 1; i <= sheet.LastRowNum; i++)
            {
                IRow row = sheet.GetRow(i);
                DataRow dr = dt.NewRow();
                FillDataRow(row, ref dr);
                dt.Rows.Add(dr);
            }

            dt.TableName = sheet.SheetName;
            return dt;

        }

        private void FillDataRow(IRow row, ref DataRow dr)
        {
            if (row != null)
            {
                for (int j = 0; j < dr.Table.Columns.Count; j++)
                {
                    ICell cell = row.GetCell(j);

                    if (cell != null)
                    {
                        switch (cell.CellType)
                        {
                            case CellType.Blank:
                                dr[j] = DBNull.Value;
                                break;
                            case CellType.Boolean:
                                dr[j] = cell.BooleanCellValue;
                                break;
                            case CellType.Numeric:
                                if (DateUtil.IsCellDateFormatted(cell))
                                {
                                    dr[j] = cell.DateCellValue;
                                }
                                else
                                {
                                    dr[j] = cell.NumericCellValue;
                                }
                                break;
                            case CellType.String:
                                dr[j] = cell.StringCellValue;
                                break;
                            case CellType.Error:
                                dr[j] = cell.ErrorCellValue;
                                break;
                            case CellType.Formula:
                                // cell = evaluator.EvaluateInCell(cell) as HSSFCell;
                                dr[j] = cell.ToString();
                                break;
                            default:
                                throw new NotSupportedException(string.Format("Catched unhandle CellType[{0}]", cell.CellType));
                        }
                    }
                }
            }
        }

        /// <summary>
        /// 获取表头列数
        /// </summary>
        /// <param name="sheet"></param>
        /// <param name="skipRows"></param>
        /// <returns></returns>
        private int GetCellCount(ISheet sheet, int headerIndex)
        {
            var headerRow = sheet.GetRow(headerIndex);

            return headerRow.LastCellNum;
        }
    }

 

最后看一下使用OLEDB的实现,这里,我只实现了excel2003的版本,07版本的总是失败,查了原因,是需要在本机安装一个组件才能支持导入.xlsx文件。

 public class OleDbExcelAccess : IExcelAccess
    {
        private string strConn;

        public OleDbExcelAccess()
        {
            //TODO 需要根据扩展名,来决定 使用哪一种连接字符串
            strConn = " Provider = Microsoft.Jet.OLEDB.4.0 ; Data Source = {0};Extended Properties=‘Excel 8.0;IMEX=1;HDR=NO‘";
        }

        public DataSet Load(ExcelConfig config)
        {
            var ds = new DataSet();
            var sheets = GetSheetNames(config.Path);
            var strConnTmp = string.Format(strConn, config.Path);

            foreach (string sheet in sheets)
            {
                using (var oleConn = new OleDbConnection(strConnTmp))
                {
                    var strsql = "SELECT * FROM [" + sheet + "]";
                    var oleDaExcel = new OleDbDataAdapter(strsql, oleConn);
                    oleConn.Open();
                    oleDaExcel.Fill(ds, sheet);
                }
            }

            return ds;
        }

        /// <summary>
        /// 获取Excel的所有的sheet
        /// </summary>
        /// <param name="path"></param>
        /// <returns></returns>
        private string[] GetSheetNames(string path)
        {
            DataTable dt = new DataTable();
            if (File.Exists(path))
            {
                string strConnTmp = string.Format(strConn, path);
                using (var conn = new OleDbConnection(strConnTmp))
                {
                    conn.Open();
                    //返回Excel的架构,包括各个sheet表的名称,类型,创建时间和修改时间等    
                    dt = conn.GetOleDbSchemaTable(OleDbSchemaGuid.Tables, new object[] { null, null, null, "Table" });
                }
                //包含excel中表名的字符串数组
                var sheetNames = new List<string>();
                for (int k = 0; k < dt.Rows.Count; k++)
                {
                    string tableName = dt.Rows[k]["TABLE_NAME"].ToString();
                    //修正出现兼容性视图名称时过滤表名
                    if (!tableName.Substring(tableName.Length - 1).Equals("_"))
                    {
                        sheetNames.Add(tableName);
                    }
                }
                return sheetNames.ToArray();

            }
            return null;

        }
    }

 

最后看一下客户端的调用 :

 private void TestExcelImport()
        {
            var excelFile = Path.Combine("C:\\Users\\hankk\\Desktop\\ICON", "2003版本.xls");

            ExcelConfig config = new ExcelConfig()
            {
                Path = excelFile,
                HeaderIndex = 1
            };

            IExcelAccess npoiAccess = new NpoiExcelAccess();
            var npoiDs = npoiAccess.Load(config);

            IExcelAccess oleDbAccess = new OleDbExcelAccess();
            var oleDs = oleDbAccess.Load(config);
        }

 

代码已上传到github: https://github.com/hankuikuide/ExcelAccessor

 

以上是关于Excel转化成DataTable实现:NPOI和OLEDb的主要内容,如果未能解决你的问题,请参考以下文章

NPOI DataTable转Excel ,Excel转DataTable

使用NPOI读取Excel到DataTable

datatable导出excel---NPOI

NPOI DataTable导出excel

Excel操作--使用NPOI导入导出Excel为DataTable

NPOI 将excel转换为datatable或者将datatable转换为excel