diff --git a/agents-flex-document-parser/agents-flex-document-parser-poi/src/main/java/com/agentsflex/document/parser/PoiDocumentParser.java b/agents-flex-document-parser/agents-flex-document-parser-poi/src/main/java/com/agentsflex/document/parser/PoiDocumentParser.java new file mode 100644 index 0000000..d83d812 --- /dev/null +++ b/agents-flex-document-parser/agents-flex-document-parser-poi/src/main/java/com/agentsflex/document/parser/PoiDocumentParser.java @@ -0,0 +1,36 @@ +/* + * Copyright (c) 2023-2025, Agents-Flex (fuhai999@gmail.com). + *

+ * Licensed under the Apache License, Version 2.0 (the "License"); + * you may not use this file except in compliance with the License. + * You may obtain a copy of the License at + *

+ * http://www.apache.org/licenses/LICENSE-2.0 + *

+ * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ +package com.agentsflex.document.parser; + +import com.agentsflex.core.document.Document; +import com.agentsflex.core.document.DocumentParser; +import org.apache.poi.extractor.ExtractorFactory; +import org.apache.poi.extractor.POITextExtractor; + +import java.io.IOException; +import java.io.InputStream; + +public class PoiDocumentParser implements DocumentParser { + @Override + public Document parse(InputStream stream) { + try (POITextExtractor extractor = ExtractorFactory.createExtractor(stream)) { + String text = extractor.getText(); + return new Document(text); + } catch (IOException e) { + throw new RuntimeException(e); + } + } +}