实现将 Word 文档转换为 XML list 数据。
在 Ubuntu 或 CentOS 7 上,需安装如下依赖(以下 apt-get 命令适用于 Ubuntu;CentOS 7 请改用 yum 安装对应的软件包):
sudo apt-get install poppler-utils wv unrtf tidy
go get github.com/JalfResi/justext
GitHub Actions 配置 Docker 参数:USERNAME, PASSWORD, REGISTRY, GITHUB_RUN_NUMBER
useradd -u 5678 wordtohtml
docker pull ccr.ccs.tencentyun.com/jianboy/wordtohtml:v1.0.5
docker run -it --rm -v /data/wordtohtml:/app ccr.ccs.tencentyun.com/jianboy/wordtohtml:v1.0.5
alias wordtohtml='docker run -it --rm -v /data:/app jianboy/wordtohtml'
alias pdf2htmlEX='docker run -ti --rm -v `pwd`:/pdf bwits/pdf2htmlex pdf2htmlEX'
pdf2htmlEX --zoom 1 test.pdf