You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

188 lines
7.5 KiB

8 months ago
package com.dsideal.base.Tools.Test;
8 months ago
import com.dsideal.base.Tools.FillData.ExcelKit.ExcelKit;
8 months ago
import com.jfinal.kit.StrKit;
8 months ago
import org.apache.poi.openxml4j.exceptions.InvalidFormatException;
import org.dom4j.Document;
import org.dom4j.DocumentException;
import org.dom4j.Element;
import org.dom4j.io.SAXReader;
import org.xml.sax.SAXException;
import javax.xml.parsers.ParserConfigurationException;
import javax.xml.xpath.XPathExpressionException;
import java.io.File;
import java.io.FileInputStream;
import java.io.FileOutputStream;
import java.io.IOException;
8 months ago
import java.util.ArrayList;
8 months ago
import java.util.HashMap;
8 months ago
import java.util.List;
8 months ago
import java.util.Map;
8 months ago
import java.util.zip.ZipEntry;
import java.util.zip.ZipInputStream;
public class TestOutSideExcel {
/**
*
*
* @throws IOException
*/
8 months ago
public static void UnCompress(String wordPath, String workingPath) throws IOException {
8 months ago
workingPath = workingPath.replace("\\", "/");
if (!workingPath.endsWith("/")) workingPath += "/";
8 months ago
File file = new File(wordPath);//取得word文件
8 months ago
FileInputStream inputStream = new FileInputStream(file);
ZipInputStream zipInputStream = new ZipInputStream(inputStream);
ZipEntry entry;
8 months ago
byte[] ch = new byte[256];
8 months ago
while ((entry = zipInputStream.getNextEntry()) != null) {
8 months ago
File zFile = new File(workingPath + entry.getName());
8 months ago
if (entry.isDirectory()) {
if (!zFile.exists()) {
zFile.mkdirs();
}
zipInputStream.closeEntry();
} else {
File fpath = new File(zFile.getParent());
if (!fpath.exists()) {
fpath.mkdirs();
}
FileOutputStream outputStream = new FileOutputStream(zFile);
int i;
while ((i = zipInputStream.read(ch)) != -1) {
outputStream.write(ch, 0, i);
}
zipInputStream.closeEntry();
outputStream.close();
}
}
inputStream.close();
}
8 months ago
/**
* Chart
*
* @param workingPath
* @param chartNumber
*/
8 months ago
public static List<List<String>> readChar(String workingPath, int chartNumber) throws DocumentException {
8 months ago
List<List<String>> matrix = new ArrayList<>();
8 months ago
String xml = workingPath + "\\word\\charts\\chart" + chartNumber + ".xml";
if (!(new File(xml).exists())) {
System.out.println("没有找到第" + chartNumber + "个图表");
8 months ago
return matrix ;
8 months ago
}
//3、开始读取
8 months ago
// 创建 SAXReader 对象,读取 XML 文件
8 months ago
SAXReader reader = new SAXReader();
Document document = reader.read(new File(xml));
// 获取根元素
Element root = document.getRootElement();
//折线图
//将xml用IDEA打开搜索关键的数据值然后右键查看XPATH完整路径可以获取到下面的路径
///c:chartSpace/c:chart/c:plotArea/c:lineChart/c:ser/c:cat/c:numRef/c:numCache/c:pt/c:v
8 months ago
//在每个已知的图表类型中查找,找到后跳出循环
//声明一个数组,图表的所有类型
String[] CHART_TYPES = {"lineChart", "barChart"};//折线,柱状
String type = "";
for (String chartType : CHART_TYPES) {
if (root.element("chart").element("plotArea")
.element(chartType) != null) {
type = chartType;
break;
}
}
if (StrKit.isBlank(type)) {
System.out.println("没有找到图表类型,请扩充图表类型");
System.out.println(root.element("chart").element("plotArea"));
System.exit(-1);
}
8 months ago
List<Element> xList = root.element("chart").element("plotArea")
8 months ago
.element(type).element("ser").element("cat")
8 months ago
.element("numRef").element("numCache").elements("pt");
8 months ago
8 months ago
List<Object> allValueList = new ArrayList<>();
8 months ago
///c:chartSpace/c:chart/c:plotArea/c:lineChart/c:ser/c:val/c:numRef/c:numCache
8 months ago
for (Element ser : root.element("chart").element("plotArea")
.element(type).elements("ser")) {
8 months ago
List<Element> yList = ser.element("val").element("numRef").element("numCache").elements("pt");
//记录都有哪些有效数值和索引号
Map<Integer, Element> map = new HashMap<>();
for (Element e : yList) {
map.put(Integer.parseInt(e.attribute("idx").getValue()), e);
}
List<Object> lo = new ArrayList<>();
for (int i = 0; i < xList.size(); i++) {
if (map.containsKey(i)) {
lo.add(map.get(i));
} else {
lo.add(null);
}
}
allValueList.add(lo);
8 months ago
}
8 months ago
8 months ago
for (int i = 0; i < allValueList.size(); i++) {
8 months ago
List<String> row = new ArrayList<>();
8 months ago
List<Element> lo = (List<Element>) allValueList.get(i);
for (Element e : lo) {
if (e == null) {
8 months ago
row.add(null);
} else {
8 months ago
row.add(e.element("v").getText());
8 months ago
}
8 months ago
}
8 months ago
matrix.add(row);
8 months ago
}
8 months ago
//上面生成的数据格式需要行转列,横坐标是年份,纵坐标是数据
// 计算行数和列数
int rowCount = matrix.size();
int colCount = matrix.getFirst().size();
// 创建一个一维列表,用于存储转换后的列
List<List<String>> transposed = new ArrayList<>();
// 遍历每一列
for (int col = 0; col < colCount; col++) {
// 创建一个新的内部列表,用于存储当前列的所有行
List<String> column = new ArrayList<>();
// 遍历每一行,将当前列的值添加到新的内部列表中
for (int row = 0; row < rowCount; row++) {
column.add(matrix.get(row).get(col));
}
// 将当前列添加到结果列表中
transposed.add(column);
}
// 在每一行的第一列插入序号
for (int i = 0; i < transposed.size(); i++) {
List<String> column = transposed.get(i);
column.addFirst(xList.get(i).element("v").getText()); // 在每行的开始插入序号
}
return transposed;
8 months ago
}
public static void main(String[] args) throws IOException, InvalidFormatException, InterruptedException, ParserConfigurationException, SAXException, XPathExpressionException, DocumentException {
String sourceDoc = "c:/西双版纳州人口变化及其对教育的影响20240420.docx";
//1、将word文件解压缩
String workingPath = "C:\\zipFile";
UnCompress(sourceDoc, workingPath);
//2、我们需要第几个图表
8 months ago
for (int chartNumber = 4; chartNumber <= 4; chartNumber++) {
System.out.println("正在处理第" + chartNumber + "个图表的信息~");
//读取图表
List<List<String>> list = readChar(workingPath, chartNumber);
ExcelKit.printTable(list);
System.out.println("=========================================================");
}
8 months ago
}
}