All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.dromara.hutool.poi.excel.sax.ExcelSaxUtil Maven / Gradle / Ivy

/*
 * Copyright (c) 2013-2024 Hutool Team and hutool.cn
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.dromara.hutool.poi.excel.sax;

import org.dromara.hutool.core.date.DateTime;
import org.dromara.hutool.core.date.DateUtil;
import org.dromara.hutool.core.exception.DependencyException;
import org.dromara.hutool.core.io.IORuntimeException;
import org.dromara.hutool.core.text.CharUtil;
import org.dromara.hutool.core.text.StrUtil;
import org.dromara.hutool.core.util.ObjUtil;
import org.dromara.hutool.poi.excel.ExcelDateUtil;
import org.dromara.hutool.poi.excel.sax.handler.RowHandler;
import org.dromara.hutool.poi.POIException;
import org.apache.poi.hssf.eventusermodel.FormatTrackingHSSFListener;
import org.apache.poi.hssf.record.CellValueRecordInterface;
import org.apache.poi.ss.usermodel.DataFormatter;
import org.apache.poi.util.XMLHelper;
import org.apache.poi.xssf.model.SharedStrings;
import org.apache.poi.xssf.usermodel.XSSFRichTextString;
import org.xml.sax.ContentHandler;
import org.xml.sax.InputSource;
import org.xml.sax.SAXException;
import org.xml.sax.XMLReader;

import javax.xml.parsers.ParserConfigurationException;
import java.io.IOException;
import java.io.InputStream;

/**
 * Sax方式读取Excel相关工具类
 *
 * @author looly
 */
public class ExcelSaxUtil {

	/**
	 * 填充字符串
 	 */
	public static final char CELL_FILL_CHAR = '@';
	/**
	 * 列的最大位数
	 */
	public static final int MAX_CELL_BIT = 3;

	/**
	 * 创建 {@link ExcelSaxReader}
	 *
	 * @param isXlsx     是否为xlsx格式(07格式)
	 * @param rowHandler 行处理器
	 * @return {@link ExcelSaxReader}
	 * @since 5.4.4
	 */
	public static ExcelSaxReader createSaxReader(final boolean isXlsx, final RowHandler rowHandler) {
		return isXlsx
				? new Excel07SaxReader(rowHandler)
				: new Excel03SaxReader(rowHandler);
	}

	/**
	 * 根据数据类型获取数据
	 *
	 * @param cellDataType  数据类型枚举
	 * @param value         数据值
	 * @param sharedStrings {@link SharedStrings}
	 * @param numFmtString  数字格式名
	 * @return 数据值
	 */
	public static Object getDataValue(CellDataType cellDataType, final String value, final SharedStrings sharedStrings, final String numFmtString) {
		if (null == value) {
			return null;
		}

		if (null == cellDataType) {
			cellDataType = CellDataType.NULL;
		}

		Object result = null;
		switch (cellDataType) {
			case BOOL:
				result = (value.charAt(0) != '0');
				break;
			case ERROR:
				result = StrUtil.format("\\\"ERROR: {} ", value);
				break;
			case FORMULA:
				result = StrUtil.format("\"{}\"", value);
				break;
			case INLINESTR:
				result = new XSSFRichTextString(value).toString();
				break;
			case SSTINDEX:
				try {
					final int index = Integer.parseInt(value);
					result = sharedStrings.getItemAt(index).getString();
				} catch (final NumberFormatException e) {
					result = value;
				}
				break;
			case DATE:
				try {
					result = getDateValue(value);
				} catch (final Exception e) {
					result = value;
				}
				break;
			default:
				try {
					result = getNumberValue(value, numFmtString);
				} catch (final NumberFormatException ignore) {
				}

				if(null == result){
					result = value;
				}
				break;
		}
		return result;
	}

	/**
	 * 格式化数字或日期值
	 *
	 * @param value        值
	 * @param numFmtIndex  数字格式索引
	 * @param numFmtString 数字格式名
	 * @return 格式化后的值
	 */
	public static String formatCellContent(String value, final int numFmtIndex, final String numFmtString) {
		if (null != numFmtString) {
			try {
				value = new DataFormatter().formatRawCellContents(Double.parseDouble(value), numFmtIndex, numFmtString);
			} catch (final NumberFormatException e) {
				// ignore
			}
		}
		return value;
	}

	/**
	 * 计算两个单元格之间的单元格数目(同一行)
	 *
	 * @param preRef 前一个单元格位置,例如A1
	 * @param ref    当前单元格位置,例如A8
	 * @return 同一行中两个单元格之间的空单元格数
	 */
	public static int countNullCell(final String preRef, final String ref) {
		// excel2007最大行数是1048576,最大列数是16384,最后一列列名是XFD
		// 数字代表列,去掉列信息
		String preXfd = ObjUtil.defaultIfNull(preRef, "@").replaceAll("\\d+", "");
		String xfd = ObjUtil.defaultIfNull(ref, "@").replaceAll("\\d+", "");

		// A表示65,@表示64,如果A算作1,那@代表0
		// 填充最大位数3
		preXfd = StrUtil.fillBefore(preXfd, CELL_FILL_CHAR, MAX_CELL_BIT);
		xfd = StrUtil.fillBefore(xfd, CELL_FILL_CHAR, MAX_CELL_BIT);

		final char[] preLetter = preXfd.toCharArray();
		final char[] letter = xfd.toCharArray();
		// 用字母表示则最多三位,每26个字母进一位
		final int res = (letter[0] - preLetter[0]) * 26 * 26 + (letter[1] - preLetter[1]) * 26 + (letter[2] - preLetter[2]);
		return res - 1;
	}

	/**
	 * 从Excel的XML文档中读取内容,并使用{@link ContentHandler}处理
	 *
	 * @param xmlDocStream Excel的XML文档流
	 * @param handler      文档内容处理接口,实现此接口用于回调处理数据
	 * @throws DependencyException 依赖异常
	 * @throws POIException        POI异常,包装了SAXException
	 * @throws IORuntimeException  IO异常,如流关闭或异常等
	 * @since 5.1.4
	 */
	public static void readFrom(final InputStream xmlDocStream, final ContentHandler handler) throws DependencyException, POIException, IORuntimeException {
		final XMLReader xmlReader;
		try {
			xmlReader = XMLHelper.newXMLReader();
		} catch (final SAXException | ParserConfigurationException e) {
			if (e.getMessage().contains("org.apache.xerces.parsers.SAXParser")) {
				throw new DependencyException(e, "You need to add 'xerces:xercesImpl' to your project and version >= 2.11.0");
			} else {
				throw new POIException(e);
			}
		}
		xmlReader.setContentHandler(handler);
		try {
			xmlReader.parse(new InputSource(xmlDocStream));
		} catch (final IOException e) {
			throw new IORuntimeException(e);
		} catch (final SAXException e) {
			throw new POIException(e);
		}
	}

	/**
	 * 判断数字Record中是否为日期格式
	 *
	 * @param cell           单元格记录
	 * @param formatListener {@link FormatTrackingHSSFListener}
	 * @return 是否为日期格式
	 * @since 5.4.8
	 */
	public static boolean isDateFormat(final CellValueRecordInterface cell, final FormatTrackingHSSFListener formatListener) {
		final int formatIndex = formatListener.getFormatIndex(cell);
		final String formatString = formatListener.getFormatString(cell);
		return isDateFormat(formatIndex, formatString);
	}

	/**
	 * 判断日期格式
	 *
	 * @param formatIndex  格式索引,一般用于内建格式
	 * @param formatString 格式字符串
	 * @return 是否为日期格式
	 * @see ExcelDateUtil#isDateFormat(int, String)
	 * @since 5.5.3
	 */
	public static boolean isDateFormat(final int formatIndex, final String formatString) {
		return ExcelDateUtil.isDateFormat(formatIndex, formatString);
	}

	/**
	 * 获取日期
	 *
	 * @param value 单元格值
	 * @return 日期
	 * @since 5.3.6
	 */
	public static DateTime getDateValue(final String value) {
		return getDateValue(Double.parseDouble(value));
	}

	/**
	 * 获取日期
	 *
	 * @param value 单元格值
	 * @return 日期
	 * @since 4.1.0
	 */
	public static DateTime getDateValue(final double value) {
		return DateUtil.date(org.apache.poi.ss.usermodel.DateUtil.getJavaDate(value, false));
	}

	/**
	 * 在Excel03 sax读取中获取日期或数字类型的结果值
	 *
	 * @param cell           记录单元格
	 * @param value          值
	 * @param formatListener {@link FormatTrackingHSSFListener}
	 * @return 值,可能为Date或Double或Long
	 * @since 5.5.0
	 */
	public static Object getNumberOrDateValue(final CellValueRecordInterface cell, final double value, final FormatTrackingHSSFListener formatListener) {
		if (isDateFormat(cell, formatListener)) {
			// 可能为日期格式
			return getDateValue(value);
		}
		return getNumberValue(value, formatListener.getFormatString(cell));
	}

	/**
	 * 获取数字类型值
	 *
	 * @param value        值
	 * @param numFmtString 格式
	 * @return 数字,可以是Double、Long
	 * @since 4.1.0
	 */
	private static Number getNumberValue(final String value, final String numFmtString) {
		if (StrUtil.isBlank(value)) {
			return null;
		}
		return getNumberValue(Double.parseDouble(value), numFmtString);
	}

	/**
	 * 获取数字类型值,除非格式中明确数字保留小数,否则无小数情况下按照long返回
	 *
	 * @param numValue     值
	 * @param numFmtString 格式
	 * @return 数字,可以是Double、Long
	 * @since 5.5.3
	 */
	private static Number getNumberValue(final double numValue, final String numFmtString) {
		// 普通数字
		if (null != numFmtString && !StrUtil.contains(numFmtString, CharUtil.DOT)) {
			final long longPart = (long) numValue;
			//noinspection RedundantIfStatement
			if (longPart == numValue) {
				// 对于无小数部分的数字类型,转为Long
				return longPart;
			}
		}
		return numValue;
	}
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy