From 885d76dcc2c5136e83b749a2000c18cddf67b5b3 Mon Sep 17 00:00:00 2001 From: 0007 <0007@qq.com> Date: Wed, 27 Aug 2025 19:59:17 +0800 Subject: [PATCH] Add File --- .../document/parser/PoiDocumentParser.java | 36 +++++++++++++++++++ 1 file changed, 36 insertions(+) create mode 100644 agents-flex-document-parser/agents-flex-document-parser-poi/src/main/java/com/agentsflex/document/parser/PoiDocumentParser.java diff --git a/agents-flex-document-parser/agents-flex-document-parser-poi/src/main/java/com/agentsflex/document/parser/PoiDocumentParser.java b/agents-flex-document-parser/agents-flex-document-parser-poi/src/main/java/com/agentsflex/document/parser/PoiDocumentParser.java new file mode 100644 index 0000000..d83d812 --- /dev/null +++ b/agents-flex-document-parser/agents-flex-document-parser-poi/src/main/java/com/agentsflex/document/parser/PoiDocumentParser.java @@ -0,0 +1,36 @@ +/* + * Copyright (c) 2023-2025, Agents-Flex (fuhai999@gmail.com). + *
+ * Licensed under the Apache License, Version 2.0 (the "License"); + * you may not use this file except in compliance with the License. + * You may obtain a copy of the License at + *
+ * http://www.apache.org/licenses/LICENSE-2.0 + *
+ * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ +package com.agentsflex.document.parser; + +import com.agentsflex.core.document.Document; +import com.agentsflex.core.document.DocumentParser; +import org.apache.poi.extractor.ExtractorFactory; +import org.apache.poi.extractor.POITextExtractor; + +import java.io.IOException; +import java.io.InputStream; + +public class PoiDocumentParser implements DocumentParser { + @Override + public Document parse(InputStream stream) { + try (POITextExtractor extractor = ExtractorFactory.createExtractor(stream)) { + String text = extractor.getText(); + return new Document(text); + } catch (IOException e) { + throw new RuntimeException(e); + } + } +}