NET CORE讀取Excel.xlsx單元格圖片的場景,一般是批量導入業務數據,例如:藥品的圖片,醫師資格證,商品上架、商家營業資質、水果信息、用戶頭像等等
這里我截個圖,圖文并茂更好理解
特別聲明:粘貼圖片,直接復制在excel里,和在單元格嵌圖片資源是兩回事的。
上面這個圖片是怎么來的呢?步驟如下:
沒錯,我講的技術實現方案,是基于這樣的嵌入單元格的圖片。
代碼的實現是:excel其實是一個壓縮包,把后綴xlsx改成zip就可以解壓。這里必須是新版的xlsx格式;老版的excel(xls)我研究了,發現它的存儲邏輯和新版本的excel不一樣。自己可以修改后綴,解壓出來看看。
解壓完zip的包之后,開始讀取指定的文件,圖片路徑都是固定的。excel里有你的業務id,根據當前行圖片所在的單元格,就可以在excel解壓出來的文件里找到對應的標識,再通過標識找到圖片。excel解壓出來的文件都是xml,所以學習xml也是有必要的,要不然,你玩不明白。
處理完數據后,記得刪除zip文件。其實你可以解壓zip流,在內存中操作,操作完釋放zip流,這里我為了簡單直白,是解壓到服務器指定位置的,方便處理完后刪文件。
整體原理就是如此。
下面我上代碼:新建一個 net core api 解決方案,引用一下 NPOI Nuget包。本地創建一個 .xlsx 格式的excel文件,當然你也可以用其他操作excel的Nuget包。
我直接把所有的代碼整理好了,粘貼復制,直接可以使用,代碼里有注釋。
我是一個不愛說廢話的程序員,一言不合就是反手扔代碼。
using ICSharpCode.SharpZipLib.Zip;
using Microsoft.AspNetCore.Mvc;
using NPOI.HSSF.UserModel;
using NPOI.SS.UserModel;
using NPOI.XSSF.UserModel;
using System.Data;
using System.Xml;

namespace ExcelOption.Controllers
{
    /// <summary>
    /// Imports an uploaded .xlsx workbook and resolves the pictures that are embedded
    /// inside cells (cells whose value is a <c>_xlfn.DISPIMG("ID_...",1)</c> formula).
    /// The workbook is treated as a zip package: it is extracted next to the content
    /// root, <c>xl/cellimages.xml</c> and its <c>.rels</c> file are read to map each
    /// picture id to an extracted image file, and the work files are removed afterwards.
    /// </summary>
    /// <remarks>
    /// NOTE(review): the work files use fixed names under the content root, so two
    /// imports running at the same time would overwrite each other's files.
    /// </remarks>
    [ApiController]
    [Route("[controller]")]
    public class ImportExcelController : ControllerBase
    {
        /// <summary>Name of the zip copy of the uploaded workbook.</summary>
        private const string ZipFileName = "filezip" + ".zip";

        /// <summary>Name of the saved workbook.</summary>
        private const string XlsxFileName = "filexlsx" + ".xlsx";

        /// <summary>Folder the zip copy is extracted into (zip file name without extension).</summary>
        private const string UnzipFolderName = "filezip";

        /// <summary>Namespace of the <c>r:embed</c> attribute that links a picture to its relationship id.</summary>
        private const string RelationshipNamespace = "http://schemas.openxmlformats.org/officeDocument/2006/relationships";

        private readonly Microsoft.AspNetCore.Hosting.IHostingEnvironment _hostingEnvironment;

        /// <summary>Creates the controller.</summary>
        /// <param name="hostingEnvironment">Supplies the content root used as the working directory.</param>
        public ImportExcelController(Microsoft.AspNetCore.Hosting.IHostingEnvironment hostingEnvironment)
        {
            _hostingEnvironment = hostingEnvironment;
        }

        /// <summary>
        /// Deletes the saved workbook, its zip copy and the extraction folder.
        /// Missing files or folders are ignored.
        /// </summary>
        /// <returns>Always <c>true</c>.</returns>
        [HttpGet(Name = "dele")]
        public bool dele()
        {
            DeleteWorkFiles(_hostingEnvironment.ContentRootPath);
            return true;
        }

        /// <summary>
        /// Imports the first uploaded file: reads its rows into a <see cref="DataTable"/>,
        /// extracts the package and matches every row's picture formula to an extracted image.
        /// </summary>
        /// <param name="files">Uploaded files; only the first one is processed.</param>
        /// <returns>
        /// <c>false</c> when the file is not an .xlsx workbook or cannot be read/extracted;
        /// <c>true</c> otherwise (including when no file was uploaded).
        /// </returns>
        [HttpPost(Name = "ImportExcel_Img")]
        public bool ImportExcel_Img(IFormFileCollection files)
        {
            if (files == null || files.Count == 0)
            {
                return true;
            }

            var file = files[0];

            // Path.GetExtension copes with names that contain no dot at all.
            var fileExt = Path.GetExtension(file.FileName);
            if (!string.Equals(fileExt, ".xlsx", StringComparison.OrdinalIgnoreCase))
            {
                return false;
            }

            var mapPath = _hostingEnvironment.ContentRootPath;
            var xlsxPath = Path.Combine(mapPath, XlsxFileName);
            var zipPath = Path.Combine(mapPath, ZipFileName);

            // Remove leftovers of an earlier run so stale images are never matched.
            DeleteWorkFiles(mapPath);

            try
            {
                // FileMode.Create truncates; the copy is synchronous so the stream is
                // complete before it is disposed.
                using (var stream = new FileStream(xlsxPath, FileMode.Create, FileAccess.Write))
                {
                    file.CopyTo(stream);
                }

                // The zip copy is byte-identical to the workbook.
                System.IO.File.Copy(xlsxPath, zipPath, true);

                var dt = ExcelHelper.ExcelToDataTable(xlsxPath);
                if (dt == null)
                {
                    return false;
                }

                if (!UnZipFile(zipPath, out string path))
                {
                    return false;
                }

                List<o_ExcelImgModel> o_ExcelImgModelList;
                try
                {
                    o_ExcelImgModelList = ReadCellImages(path);
                }
                catch (XmlException ex)
                {
                    Console.WriteLine("Exception: " + ex.Message);
                    return false;
                }

                // Each entry's PathOfPicture now points at an extracted image file;
                // this is the place to store or upload the pictures.

                bool hasUserName = dt.Columns.Contains("用戶名");
                bool hasImage = dt.Columns.Contains("IMG");
                foreach (DataRow item in dt.Rows)
                {
                    // Sample business column, e.g. "zhao1".
                    var userName = hasUserName ? item["用戶名"].ToString() : null;

                    // The picture cell holds a formula such as
                    // _xlfn.DISPIMG("ID_CD49305586E940EF8F78CD3B54A4BCD3",1);
                    // the text between the first pair of quotes is the picture id.
                    var cellText = hasImage ? item["IMG"].ToString() : string.Empty;
                    var breakApart = MidStrEx(cellText, "\"", "\"");
                    var imgPath = breakApart.Length == 0
                        ? null
                        : o_ExcelImgModelList.FirstOrDefault(x => x.Name == breakApart);

                    // Upload/persist imgPath together with the row's business data here.
                }

                return true;
            }
            finally
            {
                // Work files are removed on every exit path, including failures.
                DeleteWorkFiles(mapPath);
            }
        }

        /// <summary>
        /// Returns the text located between the first occurrence of <paramref name="startstr"/>
        /// and the next occurrence of <paramref name="endstr"/>.
        /// </summary>
        /// <param name="sourse">Text to search.</param>
        /// <param name="startstr">Marker that precedes the wanted text.</param>
        /// <param name="endstr">Marker that follows the wanted text.</param>
        /// <returns>The enclosed text, or an empty string when an argument is null or a marker is not found.</returns>
        public static string MidStrEx(string sourse, string startstr, string endstr)
        {
            if (sourse == null || startstr == null || endstr == null)
            {
                return string.Empty;
            }

            int startindex = sourse.IndexOf(startstr, StringComparison.Ordinal);
            if (startindex == -1)
            {
                return string.Empty;
            }

            string tmpstr = sourse.Substring(startindex + startstr.Length);
            int endindex = tmpstr.IndexOf(endstr, StringComparison.Ordinal);
            return endindex == -1 ? string.Empty : tmpstr.Remove(endindex);
        }

        /// <summary>
        /// Reads <c>xl/cellimages.xml</c> and <c>xl/_rels/cellimages.xml.rels</c> from an
        /// extracted workbook and pairs every cell picture with its image file.
        /// </summary>
        /// <param name="path">Root folder of the extracted workbook.</param>
        /// <returns>
        /// One entry per picture whose relationship id is found in the .rels file; empty when
        /// the workbook has no <c>xl/media</c> folder or no cell-image parts.
        /// </returns>
        private static List<o_ExcelImgModel> ReadCellImages(string path)
        {
            var result = new List<o_ExcelImgModel>();

            var xlFolder = Path.Combine(path, "xl");
            var cellImagesFile = Path.Combine(xlFolder, "cellimages.xml");
            var relationsFile = Path.Combine(xlFolder, "_rels", "cellimages.xml.rels");

            // A workbook without pictures has no media folder; one with only floating
            // pictures has a media folder but no cellimages parts.
            if (!Directory.Exists(Path.Combine(xlFolder, "media"))
                || !System.IO.File.Exists(cellImagesFile)
                || !System.IO.File.Exists(relationsFile))
            {
                return result;
            }

            // Relationship id -> target, first occurrence wins.
            var targets = new Dictionary<string, string>();
            var relationsRoot = LoadXml(relationsFile).DocumentElement;
            if (relationsRoot != null)
            {
                foreach (var relation in relationsRoot.ChildNodes.OfType<XmlElement>())
                {
                    targets.TryAdd(relation.GetAttribute("Id"), relation.GetAttribute("Target"));
                }
            }

            var cellImagesRoot = LoadXml(cellImagesFile).DocumentElement;
            if (cellImagesRoot == null)
            {
                return result;
            }

            foreach (var cellImage in cellImagesRoot.ChildNodes.OfType<XmlElement>())
            {
                // Matching on local names keeps the lookup independent of the prefixes
                // the producing application chose.
                var properties = cellImage.SelectSingleNode(".//*[local-name()='cNvPr']") as XmlElement;
                var blip = cellImage.SelectSingleNode(".//*[local-name()='blip']") as XmlElement;
                if (properties == null || blip == null)
                {
                    continue;
                }

                string name = properties.GetAttribute("name");
                string id = blip.GetAttribute("embed", RelationshipNamespace);
                if (id.Length == 0)
                {
                    id = blip.GetAttribute("r:embed");
                }

                if (!targets.TryGetValue(id, out var target))
                {
                    continue;
                }

                // Targets are relative to the xl folder; ".." segments are dropped so the
                // resolved file always stays inside it.
                var relative = target.Replace("..", "").Replace('\\', '/').TrimStart('/');
                result.Add(new o_ExcelImgModel
                {
                    ID = id,
                    Name = name,
                    PathOfPicture = Path.Combine(xlFolder, relative.Replace('/', Path.DirectorySeparatorChar))
                });
            }

            return result;
        }

        /// <summary>Loads an XML file with DTD processing disabled (the file comes from an upload).</summary>
        /// <param name="filePath">File to load.</param>
        /// <returns>The parsed document.</returns>
        private static XmlDocument LoadXml(string filePath)
        {
            var settings = new XmlReaderSettings
            {
                DtdProcessing = DtdProcessing.Prohibit,
                XmlResolver = null
            };

            using (var reader = XmlReader.Create(filePath, settings))
            {
                var doc = new XmlDocument();
                doc.Load(reader);
                return doc;
            }
        }

        /// <summary>Removes the extraction folder, the saved workbook and its zip copy if they exist.</summary>
        /// <param name="root">Directory that contains the work files.</param>
        private static void DeleteWorkFiles(string root)
        {
            var unzipFolder = Path.Combine(root, UnzipFolderName);
            if (Directory.Exists(unzipFolder))
            {
                Directory.Delete(unzipFolder, true);
            }

            // File.Delete is a no-op for a file that does not exist.
            System.IO.File.Delete(Path.Combine(root, XlsxFileName));
            System.IO.File.Delete(Path.Combine(root, ZipFileName));
        }

        /// <summary>
        /// Extracts a zip archive.
        /// </summary>
        /// <param name="zipFilePath">Path of the archive.</param>
        /// <param name="path">Receives the extraction folder (with a trailing separator), or <c>null</c> on failure.</param>
        /// <param name="unZipDir">
        /// Target folder; when empty, a folder named after the archive (without extension)
        /// next to the archive is used.
        /// </param>
        /// <returns><c>true</c> when every entry was extracted; otherwise <c>false</c>.</returns>
        private bool UnZipFile(string zipFilePath, out string path, string unZipDir = null)
        {
            path = null;

            if (string.IsNullOrEmpty(zipFilePath) || !System.IO.File.Exists(zipFilePath))
            {
                return false;
            }

            if (string.IsNullOrWhiteSpace(unZipDir))
            {
                var archiveFolder = Path.GetDirectoryName(Path.GetFullPath(zipFilePath)) ?? string.Empty;
                unZipDir = Path.Combine(archiveFolder, Path.GetFileNameWithoutExtension(zipFilePath));
            }

            var targetRoot = Path.GetFullPath(unZipDir);
            if (!targetRoot.EndsWith(Path.DirectorySeparatorChar))
            {
                targetRoot += Path.DirectorySeparatorChar;
            }

            try
            {
                Directory.CreateDirectory(targetRoot);

                using (ZipInputStream s = new ZipInputStream(System.IO.File.OpenRead(zipFilePath)))
                {
                    byte[] data = new byte[4096];
                    ZipEntry theEntry;
                    while ((theEntry = s.GetNextEntry()) != null)
                    {
                        // Reject entries that would land outside the target folder
                        // ("..", rooted names): the archive is untrusted input.
                        var destination = Path.GetFullPath(Path.Combine(targetRoot, theEntry.Name));
                        if (!destination.StartsWith(targetRoot, StringComparison.Ordinal))
                        {
                            Console.WriteLine("Exception: zip entry outside of target folder: " + theEntry.Name);
                            return false;
                        }

                        if (theEntry.IsDirectory || Path.GetFileName(destination).Length == 0)
                        {
                            Directory.CreateDirectory(destination);
                            continue;
                        }

                        var folder = Path.GetDirectoryName(destination);
                        if (!string.IsNullOrEmpty(folder))
                        {
                            Directory.CreateDirectory(folder);
                        }

                        using (FileStream streamWriter = System.IO.File.Create(destination))
                        {
                            int size;
                            while ((size = s.Read(data, 0, data.Length)) > 0)
                            {
                                streamWriter.Write(data, 0, size);
                            }
                        }
                    }
                }
            }
            catch (Exception ex)
            {
                // Keep the bool contract, but leave a trace of what went wrong.
                Console.WriteLine("Exception: " + ex.Message);
                return false;
            }

            path = targetRoot;
            return true;
        }
    }

    /// <summary>
    /// Describes one picture embedded in a worksheet cell.
    /// </summary>
    public class o_ExcelImgModel
    {
        /// <summary>
        /// Relationship id of the picture (the <c>r:embed</c> value in cellimages.xml).
        /// </summary>
        public string ID { get; set; }

        /// <summary>
        /// Picture name from cellimages.xml; it is compared with the id inside the
        /// cell's DISPIMG formula.
        /// </summary>
        public string Name { get; set; }

        /// <summary>
        /// Path of the extracted image file.
        /// </summary>
        public string PathOfPicture { get; set; }
    }

    /// <summary>
    /// Reads worksheets into <see cref="DataTable"/> instances with NPOI.
    /// </summary>
    public class ExcelHelper
    {
        /// <summary>
        /// Loads a worksheet into a <see cref="DataTable"/>; every cell is stored as text.
        /// </summary>
        /// <param name="fileName">Path of the workbook (.xlsx or .xls).</param>
        /// <param name="sheetName">Sheet to read; the first sheet is used when null or not found.</param>
        /// <param name="isFirstRowColumn">
        /// When true, the first row supplies the column names and data starts on the following row;
        /// otherwise columns are named after their cell index.
        /// </param>
        /// <returns>The table, or <c>null</c> when the file type is unsupported or reading fails.</returns>
        public static DataTable ExcelToDataTable(string fileName, string sheetName = null, bool isFirstRowColumn = true)
        {
            DataTable data = new DataTable();

            try
            {
                // The stream is local and disposed here so the file is not left locked.
                using (var fs = new FileStream(fileName, FileMode.Open, FileAccess.Read, FileShare.Read))
                {
                    IWorkbook workbook;
                    var extension = Path.GetExtension(fileName);
                    if (string.Equals(extension, ".xlsx", StringComparison.OrdinalIgnoreCase))
                    {
                        workbook = new XSSFWorkbook(fs); // 2007+ format
                    }
                    else if (string.Equals(extension, ".xls", StringComparison.OrdinalIgnoreCase))
                    {
                        workbook = new HSSFWorkbook(fs); // 2003 format
                    }
                    else
                    {
                        return null;
                    }

                    ISheet sheet = sheetName != null ? workbook.GetSheet(sheetName) : null;
                    if (sheet == null)
                    {
                        sheet = workbook.GetSheetAt(0);
                    }

                    if (sheet == null)
                    {
                        return data;
                    }

                    IRow firstRow = sheet.GetRow(0);
                    if (firstRow == null || firstRow.FirstCellNum < 0)
                    {
                        return data;
                    }

                    // LastCellNum is the index after the last cell, i.e. the column count.
                    int cellCount = firstRow.LastCellNum;

                    // Sheet cell index -> table column, so that header gaps or a header
                    // that does not start in column A cannot shift the data.
                    var columnsByCell = new Dictionary<int, DataColumn>();
                    int startRow;

                    if (isFirstRowColumn)
                    {
                        for (int i = firstRow.FirstCellNum; i < cellCount; ++i)
                        {
                            ICell cell = firstRow.GetCell(i);
                            if (cell == null)
                            {
                                continue;
                            }

                            // ToString also works for non-text header cells.
                            DataColumn column = new DataColumn(cell.ToString());
                            data.Columns.Add(column);
                            columnsByCell[i] = column;
                        }

                        startRow = sheet.FirstRowNum + 1;
                    }
                    else
                    {
                        for (int i = firstRow.FirstCellNum; i < cellCount; i++)
                        {
                            DataColumn column = new DataColumn(i.ToString());
                            data.Columns.Add(column);
                            columnsByCell[i] = column;
                        }

                        startRow = sheet.FirstRowNum;
                    }

                    // Index of the last row.
                    int rowCount = sheet.LastRowNum;
                    for (int i = startRow; i <= rowCount; ++i)
                    {
                        IRow row = sheet.GetRow(i);
                        if (row == null)
                        {
                            continue; // rows without data are null
                        }

                        DataRow dataRow = data.NewRow();
                        foreach (var pair in columnsByCell)
                        {
                            ICell cell = row.GetCell(pair.Key);
                            if (cell != null) // cells without data are null
                            {
                                dataRow[pair.Value] = cell.ToString();
                            }
                        }

                        data.Rows.Add(dataRow);
                    }
                }

                return data;
            }
            catch (Exception ex)
            {
                Console.WriteLine("Exception: " + ex.Message);
                return null;
            }
        }
    }
}
如果你看完了,就點贊轉發一下唄,給小編打打氣。我發技術文章的目的就是給自己的技術生涯留下點痕跡、或者蛛絲馬跡,畢竟互聯網是有記憶的,將來我五六十、七八十了,希望我長命百歲,還能搜到我曾經年輕時分享的技術文章,或者我的后代能看到他們的爸爸、爺爺、姥爺或者太爺爺留下來的【財富】。