java - Android + Apache POI 我需要读取 .docx 并转换为文本

标签 java android apache-poi

我需要阅读 .docx 并转换为文本。我正在尝试使用 Apache POI 库,但出现了一些错误

构建.gradle

apply plugin: 'com.android.application'

apply plugin: 'kotlin-android'

apply plugin: 'kotlin-android-extensions'

android {
    compileSdkVersion 29
    defaultConfig {
        applicationId "by.roman.irtov.apachepoi"
        minSdkVersion 23
        targetSdkVersion 29
        versionCode 1
        versionName "1.0"
        multiDexEnabled true
    }
    buildTypes {
        release {
            minifyEnabled false
            proguardFiles getDefaultProguardFile('proguard-android-optimize.txt'), 'proguard-rules.pro'
        }
    }

    compileOptions {
        sourceCompatibility = 1.8
        targetCompatibility = 1.8
    }

}

dependencies {
    implementation fileTree(dir: 'libs', include: ['*.jar'])
    implementation "org.jetbrains.kotlin:kotlin-stdlib-jdk7:$kotlin_version"
    implementation 'androidx.appcompat:appcompat:1.0.2'
    implementation 'androidx.core:core-ktx:1.0.2'
    implementation 'androidx.constraintlayout:constraintlayout:1.1.3'
    implementation 'com.android.support:multidex:1.0.3'
    implementation 'org.apache.poi:poi:4.1.0'
    implementation 'org.apache.poi:poi-ooxml:4.1.0'
}

申请

class App : MultiDexApplication() {

    override fun onCreate() {
        super.onCreate()
        MultiDex.install(this)
    }
}

block 正在读取 docx

private fun readDocx(){
        try {
            val dir = Environment.getExternalStorageDirectory()
            val yourFile = File(dir, "test.docx")
            val opcPackage = OPCPackage.open(yourFile, PackageAccess.READ)
            val docx = XWPFDocument(opcPackage)
            val wx = XWPFWordExtractor(docx)
            val text = wx.text
        } catch (ex: Exception) {
            ex.printStackTrace()
        }
    }

在线 - val docx = XWPFDocument(opcPackage) 我发现错误 ->

FATAL EXCEPTION: main
    Process: by.roman.irtov.apachepoi, PID: 8158
    java.lang.NoClassDefFoundError: Failed resolution of: Ljavax/xml/stream/XMLStreamReader;
        at org.apache.xmlbeans.XmlBeans.buildStreamToNodeMethod(XmlBeans.java:251)
        at org.apache.xmlbeans.XmlBeans.<clinit>(XmlBeans.java:138)
        at org.apache.xmlbeans.XmlBeans.typeLoaderForClassLoader(XmlBeans.java:719)
        at org.openxmlformats.schemas.wordprocessingml.x2006.main.DocumentDocument$Factory.getTypeLoader(Unknown Source:25)
        at org.openxmlformats.schemas.wordprocessingml.x2006.main.DocumentDocument$Factory.parse(Unknown Source:0)
        at org.apache.poi.xwpf.usermodel.XWPFDocument.onDocumentRead(XWPFDocument.java:178)
        at org.apache.poi.ooxml.POIXMLDocument.load(POIXMLDocument.java:184)
        at org.apache.poi.xwpf.usermodel.XWPFDocument.<init>(XWPFDocument.java:138)
        at by.roman.irtov.apachepoi.MainActivity.openOpenPDF(MainActivity.kt:50)
        at by.roman.irtov.apachepoi.MainActivity.access$openOpenPDF(MainActivity.kt:15)
        at by.roman.irtov.apachepoi.MainActivity$onCreate$1.onClick(MainActivity.kt:22)
        at android.view.View.performClick(View.java:6608)
        at android.view.View.performClickInternal(View.java:6585)
        at android.view.View.access$3100(View.java:785)
        at android.view.View$PerformClick.run(View.java:25921)
        at android.os.Handler.handleCallback(Handler.java:873)
        at android.os.Handler.dispatchMessage(Handler.java:99)
        at android.os.Looper.loop(Looper.java:201)
        at android.app.ActivityThread.main(ActivityThread.java:6810)
        at java.lang.reflect.Method.invoke(Native Method)
        at com.android.internal.os.RuntimeInit$MethodAndArgsCaller.run(RuntimeInit.java:547)
        at com.android.internal.os.ZygoteInit.main(ZygoteInit.java:873)
     Caused by: java.lang.ClassNotFoundException: Didn't find class "javax.xml.stream.XMLStreamReader" on path: DexPathList[[zip file "/data/app/by.roman.irtov.apachepoi-dz-oAIxqfj8GBAesyNnFKA==/base.apk"],nativeLibraryDirectories=[/data/app/by.roman.irtov.apachepoi-dz-oAIxqfj8GBAesyNnFKA==/lib/arm64, /system/lib64]]
        at dalvik.system.BaseDexClassLoader.findClass(BaseDexClassLoader.java:134)
        at java.lang.ClassLoader.loadClass(ClassLoader.java:379)
        at java.lang.ClassLoader.loadClass(ClassLoader.java:312)
        at org.apache.xmlbeans.XmlBeans.buildStreamToNodeMethod(XmlBeans.java:251) 
        at org.apache.xmlbeans.XmlBeans.<clinit>(XmlBeans.java:138) 
        at org.apache.xmlbeans.XmlBeans.typeLoaderForClassLoader(XmlBeans.java:719) 
        at org.openxmlformats.schemas.wordprocessingml.x2006.main.DocumentDocument$Factory.getTypeLoader(Unknown Source:25) 
        at org.openxmlformats.schemas.wordprocessingml.x2006.main.DocumentDocument$Factory.parse(Unknown Source:0) 
        at org.apache.poi.xwpf.usermodel.XWPFDocument.onDocumentRead(XWPFDocument.java:178) 
        at org.apache.poi.ooxml.POIXMLDocument.load(POIXMLDocument.java:184) 
        at org.apache.poi.xwpf.usermodel.XWPFDocument.<init>(XWPFDocument.java:138) 
        at by.roman.irtov.apachepoi.MainActivity.openOpenPDF(MainActivity.kt:50) 
        at by.roman.irtov.apachepoi.MainActivity.access$openOpenPDF(MainActivity.kt:15) 
        at by.roman.irtov.apachepoi.MainActivity$onCreate$1.onClick(MainActivity.kt:22) 
        at android.view.View.performClick(View.java:6608) 
        at android.view.View.performClickInternal(View.java:6585) 
        at android.view.View.access$3100(View.java:785) 
        at android.view.View$PerformClick.run(View.java:25921) 
        at android.os.Handler.handleCallback(Handler.java:873) 
        at android.os.Handler.dispatchMessage(Handler.java:99) 
        at android.os.Looper.loop(Looper.java:201) 
        at android.app.ActivityThread.main(ActivityThread.java:6810) 
        at java.lang.reflect.Method.invoke(Native Method) 
        at com.android.internal.os.RuntimeInit$MethodAndArgsCaller.run(RuntimeInit.java:547) 
        at com.android.internal.os.ZygoteInit.main(ZygoteInit.java:873) 

然后我尝试添加库 -> 实现 'javax.xml.stream:stax-api:1.0' 现在我发现错误 ->

 java.lang.RuntimeException: http://xml.org/sax/properties/declaration-handler
        at org.apache.xmlbeans.impl.store.Locale$SaxLoader.<init>(Locale.java:3397)
        at org.apache.xmlbeans.impl.store.Locale$XmlReaderSaxLoader.<init>(Locale.java:3087)
        at org.apache.xmlbeans.impl.store.Locale.getSaxLoader(Locale.java:3072)
        at org.apache.xmlbeans.impl.store.Locale.parseToXmlObject(Locale.java:1272)
        at org.apache.xmlbeans.impl.store.Locale.parseToXmlObject(Locale.java:1259)
        at org.apache.xmlbeans.impl.schema.SchemaTypeLoaderBase.parse(SchemaTypeLoaderBase.java:345)
        at org.openxmlformats.schemas.wordprocessingml.x2006.main.DocumentDocument$Factory.parse(Unknown Source:6)
        at org.apache.poi.xwpf.usermodel.XWPFDocument.onDocumentRead(XWPFDocument.java:178)
        at org.apache.poi.ooxml.POIXMLDocument.load(POIXMLDocument.java:184)
        at org.apache.poi.xwpf.usermodel.XWPFDocument.<init>(XWPFDocument.java:138)
        at by.roman.irtov.apachepoi.MainActivity.openOpenPDF(MainActivity.kt:50)
        at by.roman.irtov.apachepoi.MainActivity.access$openOpenPDF(MainActivity.kt:15)
        at by.roman.irtov.apachepoi.MainActivity$onCreate$1.onClick(MainActivity.kt:22)
        at android.view.View.performClick(View.java:6608)
        at android.view.View.performClickInternal(View.java:6585)
        at android.view.View.access$3100(View.java:785)
        at android.view.View$PerformClick.run(View.java:25921)
        at android.os.Handler.handleCallback(Handler.java:873)
        at android.os.Handler.dispatchMessage(Handler.java:99)
        at android.os.Looper.loop(Looper.java:201)
        at android.app.ActivityThread.main(ActivityThread.java:6810)
        at java.lang.reflect.Method.invoke(Native Method)
        at com.android.internal.os.RuntimeInit$MethodAndArgsCaller.run(RuntimeInit.java:547)
        at com.android.internal.os.ZygoteInit.main(ZygoteInit.java:873)
     Caused by: org.xml.sax.SAXNotRecognizedException: http://xml.org/sax/properties/declaration-handler
        at org.apache.harmony.xml.ExpatReader.setProperty(ExpatReader.java:162)
        at org.apache.xmlbeans.impl.store.Locale$SaxLoader.<init>(Locale.java:3391)
        at org.apache.xmlbeans.impl.store.Locale$XmlReaderSaxLoader.<init>(Locale.java:3087) 
        at org.apache.xmlbeans.impl.store.Locale.getSaxLoader(Locale.java:3072) 
        at org.apache.xmlbeans.impl.store.Locale.parseToXmlObject(Locale.java:1272) 
        at org.apache.xmlbeans.impl.store.Locale.parseToXmlObject(Locale.java:1259) 
        at org.apache.xmlbeans.impl.schema.SchemaTypeLoaderBase.parse(SchemaTypeLoaderBase.java:345) 
        at org.openxmlformats.schemas.wordprocessingml.x2006.main.DocumentDocument$Factory.parse(Unknown Source:6) 
        at org.apache.poi.xwpf.usermodel.XWPFDocument.onDocumentRead(XWPFDocument.java:178) 
        at org.apache.poi.ooxml.POIXMLDocument.load(POIXMLDocument.java:184) 
        at org.apache.poi.xwpf.usermodel.XWPFDocument.<init>(XWPFDocument.java:138) 
        at by.roman.irtov.apachepoi.MainActivity.openOpenPDF(MainActivity.kt:50) 
        at by.roman.irtov.apachepoi.MainActivity.access$openOpenPDF(MainActivity.kt:15) 
        at by.roman.irtov.apachepoi.MainActivity$onCreate$1.onClick(MainActivity.kt:22) 
        at android.view.View.performClick(View.java:6608) 
        at android.view.View.performClickInternal(View.java:6585) 
        at android.view.View.access$3100(View.java:785) 
        at android.view.View$PerformClick.run(View.java:25921) 
        at android.os.Handler.handleCallback(Handler.java:873) 
        at android.os.Handler.dispatchMessage(Handler.java:99) 
        at android.os.Looper.loop(Looper.java:201) 
        at android.app.ActivityThread.main(ActivityThread.java:6810) 
        at java.lang.reflect.Method.invoke(Native Method) 
        at com.android.internal.os.RuntimeInit$MethodAndArgsCaller.run(RuntimeInit.java:547) 
        at com.android.internal.os.ZygoteInit.main(ZygoteInit.java:873) 

谁知道如何正确使用 Apache Poi? 安卓上可以吗? 有工作示例吗? (Apache POI 用于 .docx 到文本)

最佳答案

关于java - Android + Apache POI 我需要读取 .docx 并转换为文本,我们在Stack Overflow上找到一个类似的问题: https://stackoverflow.com/questions/57871093/

相关文章:

java - 如何通过 HSSFWorkbook 设置图像大小

java - 如何使用 Apache POI 设置漂亮的浮点值?

java - kie workbench部署 war 不工作(tomcat)

java - 实体方面( Spring )

javascript - Canvas获取图像的触摸事件

java - 当我尝试删除 Activity 上的操作栏时,为什么会出现此异常?

java - 数组上的 Wordsearch 难题 nullpointerException

java - 问 : Rental Car Calculator | Use a sentinel value loop

java - OpenCV + Android + 车牌识别

java - 使用 apache poi 或 docx4j 基于页脚分割 docx