search
Home > Web Front-end > HTML Tutorial > word转html(一)_html/css_WEB-ITnose

一、依赖的包,部署环境

二、后台代码实现

import com.jacob.activeX.ActiveXComponent;import com.jacob.com.Dispatch;import com.jacob.com.Variant;/**	 *	 * <p>【导入word文件,解析word文件转换成HTML】</p>	 * <p>条件:</p>	 * <p>备注:</p>	 * <p>例子:</p>	 * <p>日志:</p>	 *	 * @author:zhu  [2016年1月29日 下午2:50:28]	 */	public void importDocToHtml() {		//启动word		ActiveXComponent axc = new ActiveXComponent("Word.Application");		StringWriter stringWriter = null;		try {			// doc临时存放文件夹路径			String realpath = ServletActionContext.getServletContext().getRealPath("/UserUploadFile/WordToHTML");			File tempfile = null;			if (docFile != null) {				String tempName = String.valueOf((new Date()).getTime());				tempfile = new File(new File(realpath), tempName + ".doc");				//判断文件是否存在				if (!tempfile.getParentFile().exists()) {					//创建文件					tempfile.getParentFile().mkdirs();				}				//copy文件的创建的文件上				FileUtils.copyFile(docFile, tempfile);				//设置word不可见				axc.setProperty("Visible", new Variant(false));				Dispatch docs = axc.getProperty("Documents").toDispatch();				//打开word文档				Dispatch doc = Dispatch.invoke(docs, "Open", Dispatch.Method,						new Object[] { docFile.getPath(), new Variant(false), new Variant(true) }, new int[1])						.toDispatch();				String htmlUrl = tempfile.getPath().substring(0, tempfile.getPath().lastIndexOf(".") + 1) + "html";				//作为html格式保存到临时文件				Dispatch.invoke(doc, "SaveAs", Dispatch.Method, new Object[] { htmlUrl, new Variant(8) }, new int[1]);				Variant f = new Variant(false);				Dispatch.call(doc, "Close", f);				//删除文件				//FileUtils.forceDelete(tempfile);				File file = new File(htmlUrl);				//读取需要注意编码				InputStreamReader isr = new InputStreamReader(new FileInputStream(file), "gb2312");				BufferedReader br = new BufferedReader(isr);				String s = null;				StringBuffer html = new StringBuffer();				while ((s = br.readLine()) != null) {//使用readLine方法,一次读一行					html.append(s);				}				br.close();				Map<String, Object> result = new HashMap<String, Object>();				//因为一次读一行的原因,可以标签和属性之间没间隔,所以需要格式化				
result.put("html", formatHTML(html.toString(), tempName));				// 操作成功的话,将文档id返回				Struts2Utils.outJSON(result);			}		} catch (Exception e) {			setErrMessage("导入Excel数据错误,请检查数据!");		} finally {			axc.invoke("Quit", new Variant[] {});		}	}	/**	 * 	 * <p>【对当前html进行处理】</p>	 * <p>条件:</p>	 * <p>备注:如果有图片会在html同目录下生成一个存放图片的文件夹</p>	 * <p>例子:</p>	 * <p>日志:</p>	 *	 * @param html			html的内容	 * @param htmlName		html文件名	 * @return	 * @author:zhu  [2016年2月3日 下午5:01:36]	 */	private String formatHTML(String html, String htmlName) {		//对src进行处理,可能和标签链接紧密		html = html.replaceAll("src", "\t src");		org.jsoup.nodes.Document doc = Jsoup.parse(html);		//只需要body内的html代码,style不要,如果html在转成doc会出现问题		Element body = doc.body();		//对style进行处理,可能和标签链接紧密		body = body.html(body.html().replaceAll("style", "\t style").replaceAll("lang", "\t lang"));		//span标签的lang 有些情况下双引号会把style包掉,特殊处理下,不处理也没关系,没发现样式乱的情况		/*Elements spans = body.getElementsByTag("span");		for (Element ele : spans) {			String span = ele.attr("lang");			if (!span.isEmpty()) {				if (span.length() > 5) {					ele.removeAttr("lang");					ele.attr("style", span.substring(span.indexOf("\'"), span.lastIndexOf("\'")));				} else {					ele.removeAttr("lang");				}			}		}		*/		String bodyContent = body.html();		//图片需要真是的路径		bodyContent = bodyContent.replaceAll(htmlName, "../../UserUploadFile/WordToHTML/" + htmlName);		return bodyContent;	}

三、前台实现

     前台主要是一个上传功能,以及获取html代码后直接赋值到编辑器上的功能。

    我使用uploadify实现上传,核心代码如下:

$(function() {
	// Push the HTML returned by the server into the eWebEditor body
	// (the editor lives inside nested frames).
	function handleUploadSuccess(file, data, response) {
		var payload = $.parseJSON(data);
		var outerBody = $("#eWebEditor1").contents().find("body");
		var editorBody = outerBody.find("#eWebEditor").contents().find("body");
		editorBody.html(payload.html);
	}

	// NOTE(review): looks like a callback name from an older Uploadify API - confirm it is still invoked.
	function handleError(event, queueID, fileObj) {
		alert("文件:" + fileObj.name + "上传失败!");
	}

	// Fired when a file fails to upload (once per failing file).
	function handleUploadError(file, errorCode, errorMsg, errorString, swfuploadifyQueue) {
		var report = [
			'上传文件出错,id: ' + file.id,
			' \r\n- 索引: ' + file.index,
			' \r\n- 文件名: ' + file.name,
			' \r\n- 文件大小: ' + file.size,
			' \r\n- 类型: ' + file.type,
			' \r\n- 创建日期: ' + file.creationdate,
			' \r\n- 修改日期: ' + file.modificationdate,
			' \r\n- 文件状态: ' + file.filestatus,
			' \r\n- 错误代码: ' + errorCode,
			' \r\n- 错误描述: ' + errorMsg,
			' \r\n- 简要错误描述: ' + errorString,
			' \r\n- 出错的文件数: ' + swfuploadifyQueue.filesErrored,
			' \r\n- 错误信息: ' + swfuploadifyQueue.errorMsg,
			' \r\n- 要添加至队列的数量: ' + swfuploadifyQueue.filesSelected,
			' \r\n- 添加至对立的数量: ' + swfuploadifyQueue.filesQueued,
			' \r\n- 队列长度: ' + swfuploadifyQueue.queueLength
		];
		alert(report.join(''));
	}

	// Intentionally a no-op; cancelling an upload needs no feedback.
	function handleCancel(event, queueID, fileObj) {
	}

	var uploadOptions = {
		swf             : '${request.contextPath}/resources/uploadify/uploadify.swf',
		uploader        : 'hdAction!importDocToHtml.shtml', // action that receives the uploaded file
		auto            : true,                             // start uploading automatically
		buttonText      : '导入Word',                        // text shown on the button
		debug           : false,                            // debug mode off
		fileObjName     : 'docFile',                        // name of the file object in the action
		fileSizeLimit   : (100*1024*1024),                  // per-file size limit in bytes (100 MB)
		fileTypeDesc    : '支持格式:*.doc',                   // description shown for the allowed types
		fileTypeExts    : '*.doc',                          // allowed extensions, e.g. *.jpg;*.gif;*.png
		method          : 'post',                           // HTTP method used for the upload
		multi           : true,                             // allow selecting several files
		onUploadSuccess : handleUploadSuccess,
		onError         : handleError,
		onUploadError   : handleUploadError,
		onCancel        : handleCancel
	};

	$("#fileUp").uploadify(uploadOptions);
})
<!-- Table row holding the file input with id "fileUp". -->
<tr>
	<th></th>
	<td><input type='file' id='fileUp' name='fileUp' /></td>
</tr>


Statement
The content of this article is voluntarily contributed by netizens, and the copyright belongs to the original author. This site does not assume corresponding legal responsibility. If you find any content suspected of plagiarism or infringement, please contact admin@php.cn
Difficulty in updating caching of official account web pages: How to avoid the old cache affecting the user experience after version update?Difficulty in updating caching of official account web pages: How to avoid the old cache affecting the user experience after version update?Mar 04, 2025 pm 12:32 PM

Updating the cache of official-account web pages sounds simple, but it is complicated enough to cause real headaches. You work hard to update an official-account article, yet users still open the old version. Who can put up with that? This article looks at the twists and turns behind the problem and how to solve it gracefully. After reading it, you will be able to handle all kinds of caching problems with ease, so that your users always see the freshest content. Let's start with the basics. Put simply, to improve access speed, the browser or server stores some static resources (such as images, CSS, JS) or page content. The next time they are requested, they are served directly from the cache without being downloaded again, which is naturally fast. But this is also a double-edged sword. The new version is online,

How to efficiently add stroke effects to PNG images on web pages?How to efficiently add stroke effects to PNG images on web pages?Mar 04, 2025 pm 02:39 PM

This article demonstrates efficient PNG border addition to webpages using CSS. It argues that CSS offers superior performance compared to JavaScript or libraries, detailing how to adjust border width, style, and color for subtle or prominent effect

How do I use HTML5 form validation attributes to validate user input?How do I use HTML5 form validation attributes to validate user input?Mar 17, 2025 pm 12:27 PM

The article discusses using HTML5 form validation attributes like required, pattern, min, max, and length limits to validate user input directly in the browser.

What is the purpose of the <datalist> element?What is the purpose of the <datalist> element?Mar 21, 2025 pm 12:33 PM

The article discusses the HTML <datalist> element, which enhances forms by providing autocomplete suggestions, improving user experience and reducing errors.Character count: 159

What is the purpose of the <progress> element?What is the purpose of the <progress> element?Mar 21, 2025 pm 12:34 PM

The article discusses the HTML <progress> element, its purpose, styling, and differences from the <meter> element. The main focus is on using <progress> for task completion and <meter> for stati

What are the best practices for cross-browser compatibility in HTML5?What are the best practices for cross-browser compatibility in HTML5?Mar 17, 2025 pm 12:20 PM

Article discusses best practices for ensuring HTML5 cross-browser compatibility, focusing on feature detection, progressive enhancement, and testing methods.

What is the purpose of the <meter> element?What is the purpose of the <meter> element?Mar 21, 2025 pm 12:35 PM

The article discusses the HTML <meter> element, used for displaying scalar or fractional values within a range, and its common applications in web development. It differentiates <meter> from <progress> and ex

What is the purpose of the <iframe> tag? What are the security considerations when using it?What is the purpose of the <iframe> tag? What are the security considerations when using it?Mar 20, 2025 pm 06:05 PM

The article discusses the <iframe> tag's purpose in embedding external content into webpages, its common uses, security risks, and alternatives like object tags and APIs.

See all articles

Hot AI Tools

Undresser.AI Undress

Undresser.AI Undress

AI-powered app for creating realistic nude photos

AI Clothes Remover

AI Clothes Remover

Online AI tool for removing clothes from photos.

Undress AI Tool

Undress AI Tool

Undress images for free

Clothoff.io

Clothoff.io

AI clothes remover

AI Hentai Generator

AI Hentai Generator

Generate AI Hentai for free.

Hot Article

Repo: How To Revive Teammates
1 months agoBy尊渡假赌尊渡假赌尊渡假赌
R.E.P.O. Energy Crystals Explained and What They Do (Yellow Crystal)
2 weeks agoBy尊渡假赌尊渡假赌尊渡假赌
Hello Kitty Island Adventure: How To Get Giant Seeds
1 months agoBy尊渡假赌尊渡假赌尊渡假赌

Hot Tools

Atom editor mac version download

Atom editor mac version download

The most popular open source editor

mPDF

mPDF

mPDF is a PHP library that can generate PDF files from UTF-8 encoded HTML. The original author, Ian Back, wrote mPDF to output PDF files "on the fly" from his website and handle different languages. It is slower than original scripts like HTML2FPDF and produces larger files when using Unicode fonts, but supports CSS styles etc. and has a lot of enhancements. Supports almost all languages, including RTL (Arabic and Hebrew) and CJK (Chinese, Japanese and Korean). Supports nested block-level elements (such as P, DIV),

SublimeText3 Linux new version

SublimeText3 Linux new version

SublimeText3 Linux latest version

VSCode Windows 64-bit Download

VSCode Windows 64-bit Download

A free and powerful IDE editor launched by Microsoft

ZendStudio 13.5.1 Mac

ZendStudio 13.5.1 Mac

Powerful PHP integrated development environment