在项目中遇到一个需求：需要将 doc（.docx）文档转为 HTML 格式。
最终觉得 mammoth.js 是一个非常好用的库。但是下面的写法目前仅支持本地文件，网络地址不能直接识别。
<!DOCTYPE html>
<html lang="en">
<head>
<meta charset="UTF-8">
<meta name="viewport" content="width=device-width, initial-scale=1.0">
<meta http-equiv="X-UA-Compatible" content="ie=edge">
<title>test</title>
</head>
<body>
<div class="container">
<input id="document" type="file" />
<div class="row" style="width: 100%;">
<div class="span8">
<div id="output" class="well"></div>
</div>
</div>
</div>
<script src="./jquery.min.js"></script>
<!-- The tag above loads a local copy of jQuery; the inline script below does not reference it. -->
<script src="https://cdn.bootcss.com/mammoth/1.4.8/mammoth.browser.js"></script>
<!-- The tag above loads the mammoth browser build (v1.4.8) from a CDN. -->
<script type="text/javascript">
// Wire the file picker (#document) to the converter: every "change" event on
// the input is handed to readFileInputEventAsArrayBuffer.
const fileInput = document.getElementById("document");
fileInput.addEventListener("change", readFileInputEventAsArrayBuffer, false);
/**
 * Show a conversion result inside the #output element.
 *
 * The generated markup gets inline styles through plain string replacement:
 * the first <h1> is centred, every bare <table>, <tr>, <td> and <p> tag
 * receives a fixed style attribute. Tags that already carry attributes do not
 * match the patterns and are left untouched.
 *
 * @param {{value: string}} result - Conversion result; `value` is the HTML string.
 * @returns {void}
 */
function displayResult(result) {
  const html = result.value;
  console.log(html);
  // NOTE(review): the original chain began with `html.replace(//g, '')`. The
  // character inside that pattern was lost, so `//g, '')` was parsed as a line
  // comment and the script failed with a SyntaxError. The call is dropped
  // here; if a specific glyph has to be stripped from the output, add it back
  // as an explicit \uXXXX escape so it survives copy/paste.
  const newHTML = html
    // String pattern on purpose: only the first <h1> is centred.
    .replace('<h1>', '<h1 style="text-align: center;">')
    .replace(/<table>/g, '<table style="border-collapse: collapse;">')
    .replace(/<tr>/g, '<tr style="height: 30px;">')
    .replace(/<td>/g, '<td style="border: 1px solid pink;">')
    .replace(/<p>/g, '<p style="text-indent: 2em;">');
  document.getElementById("output").innerHTML = newHTML;
}
/**
 * "change" handler for the file input: reads the first selected file into an
 * ArrayBuffer and hands it to mammoth.convertToHtml; the result is passed on
 * to displayResult.
 *
 * @param {Event} event - Change event whose `target.files` holds the selection.
 * @returns {void}
 */
function readFileInputEventAsArrayBuffer(event) {
  const file = event.target.files[0];
  // files[0] is undefined when the list is empty; there is nothing to read.
  if (!file) {
    return;
  }
  // The original code redefined `file.name` as writable and overwrote it with
  // a URL. Only the file's bytes are passed to mammoth below, so the name has
  // no influence on the conversion; the mutation of the File object is dropped.
  const reader = new FileReader();
  reader.onload = function (loadEvent) {
    const arrayBuffer = loadEvent.target.result;
    mammoth.convertToHtml({ arrayBuffer: arrayBuffer })
      .then(displayResult)
      .done();
  };
  reader.readAsArrayBuffer(file);
}
</script>
</body>
</html>