In this article, we will be exporting HTML to Word doc file with images using jQuery plugin or without using any plugin, with pure javascript. Although there are many plugin available on internet which converts html page into word document but we will be using jquery.wordexport.js which also requires filesaver.js to save files on client browser, using HTML 5 Localstorage.
HTML page to Word Doc with images using Javascript
In the method, we will not be using any jquery plugin, we will be converting complete HTML with image into doc using javascript code.
1. Create the javascript function to export to doc
function ExportToDoc(filename = ''){
var HtmlHead = "<html xmlns:o='urn:schemas-microsoft-com:office:office' xmlns:w='urn:schemas-microsoft-com:office:word' xmlns='http://www.w3.org/TR/REC-html40'><head><meta charset='utf-8'><title>Export HTML To Doc</title></head><body>";
var EndHtml = "</body></html>";
//complete html
var html = HtmlHead +document.getElementById("MainHTML").innerHTML+EndHtml;
//specify the type
var blob = new Blob(['\ufeff', html], {
type: 'application/msword'
});
// Specify link url
var url = 'data:application/vnd.ms-word;charset=utf-8,' + encodeURIComponent(html);
// Specify file name
filename = filename?filename+'.doc':'document.doc';
// Create download link element
var downloadLink = document.createElement("a");
document.body.appendChild(downloadLink);
if(navigator.msSaveOrOpenBlob ){
navigator.msSaveOrOpenBlob(blob, filename);
}else{
// Create a link to the file
downloadLink.href = url;
// Setting the file name
downloadLink.download = filename;
//triggering the function
downloadLink.click();
}
document.body.removeChild(downloadLink);
}
In the above code, we are getting contents of element with id "MainHTML" and then converting it into blob of type MSWord. You can also modify code to pass element dynamically by adding an argument in "ExportToDoc" function and then passing that element's html.
2. Let's create the HTML which we will export
<div id="MainHTML">
<h1>
<center>Centered HTML H1 Heading</center>
</h1>
<h2>
Heading 2
</h2>
<p>
Some text inside paragraph.
</p>
<p>
<img src="https://res.cloudinary.com/dmsxwwfb5/image/upload/v1580916756/buy-me-min.png">
</p>
</div>
<div>
<a class="word-export" href="javascript:void(0)" onclick="ExportToDoc()">Export to Doc</a>
</div>
Codepen sample
Output:
HTML page to word doc with images using jQuery plugin
Let's create a simple HTML page with image, which we will be using to convert to MS word Document.
<div id="MainHTML">
<h1>
<center>Centered HTML H1 Heading</center>
</h1>
<h2>
Heading 2
</h2>
<p>
Some text inside paragraph.
</p>
<p>
<img src=" ">
</p>
</div>
<div>
<a class="word-export" href="javascript:void(0)">Export to Doc</a>
</div>
In the above code, we have simply added few headings and a image file in base64 format.
Now, let's add the required plugins, which is filesaver.js, jquery.js
<script src="https://cdnjs.cloudflare.com/ajax/libs/jquery/3.3.1/jquery.js"></script>
<script src="https://cdnjs.cloudflare.com/ajax/libs/FileSaver.js/1.3.8/FileSaver.min.js"></script>
I have not added link to jQuery.wordexport.js, as we will be using direct plugin code because it is not available on cdn as of now, and here the complete function code
// jQuery html to word plugin function
if (typeof jQuery !== "undefined" && typeof saveAs !== "undefined") {
(function($) {
$.fn.wordExport = function(fileName) {
fileName = typeof fileName !== 'undefined' ? fileName : "jQuery-Word-Export";
var static = {
mhtml: {
top: "Mime-Version: 1.0\nContent-Base: " + location.href + "\nContent-Type: Multipart/related; boundary=\"NEXT.ITEM-BOUNDARY\";type=\"text/html\"\n\n--NEXT.ITEM-BOUNDARY\nContent-Type: text/html; charset=\"utf-8\"\nContent-Location: " + location.href + "\n\n<!DOCTYPE html>\n<html>\n_html_</html>",
head: "<head>\n<meta http-equiv=\"Content-Type\" content=\"text/html; charset=utf-8\">\n<style>\n_styles_\n</style>\n</head>\n",
body: "<body>_body_</body>"
}
};
var options = {
maxWidth: 624
};
// Clone selected element before manipulating it
var markup = $(this).clone();
// Remove hidden elements from the output
markup.each(function() {
var self = $(this);
if (self.is(':hidden'))
self.remove();
});
// Embed all images using Data URLs
var images = Array();
var img = markup.find('img');
for (var i = 0; i < img.length; i++) {
// Calculate dimensions of output image
var w = Math.min(img[i].width, options.maxWidth);
var h = img[i].height * (w / img[i].width);
// Create canvas for converting image to data URL
var canvas = document.createElement("CANVAS");
canvas.width = w;
canvas.height = h;
// Draw image to canvas
var context = canvas.getContext('2d');
context.drawImage(img[i], 0, 0, w, h);
// Get data URL encoding of image
var uri = canvas.toDataURL("image/png");
$(img[i]).attr("src", img[i].src);
img[i].width = w;
img[i].height = h;
// Save encoded image to array
images[i] = {
type: uri.substring(uri.indexOf(":") + 1, uri.indexOf(";")),
encoding: uri.substring(uri.indexOf(";") + 1, uri.indexOf(",")),
location: $(img[i]).attr("src"),
data: uri.substring(uri.indexOf(",") + 1)
};
}
// Prepare bottom of mhtml file with image data
var mhtmlBottom = "\n";
for (var i = 0; i < images.length; i++) {
mhtmlBottom += "--NEXT.ITEM-BOUNDARY\n";
mhtmlBottom += "Content-Location: " + images[i].location + "\n";
mhtmlBottom += "Content-Type: " + images[i].type + "\n";
mhtmlBottom += "Content-Transfer-Encoding: " + images[i].encoding + "\n\n";
mhtmlBottom += images[i].data + "\n\n";
}
mhtmlBottom += "--NEXT.ITEM-BOUNDARY--";
//TODO: load css from included stylesheet
var styles = "";
// Aggregate parts of the file together
var fileContent = static.mhtml.top.replace("_html_", static.mhtml.head.replace("_styles_", styles) + static.mhtml.body.replace("_body_", markup.html())) + mhtmlBottom;
// Create a Blob with the file contents
var blob = new Blob([fileContent], {
type: "application/msword;charset=utf-8"
});
saveAs(blob, fileName + ".doc");
};
})(jQuery);
} else {
if (typeof jQuery === "undefined") {
console.error("jQuery Word Export: missing dependency (jQuery)");
}
if (typeof saveAs === "undefined") {
console.error("jQuery Word Export: missing dependency (FileSaver.js)");
}
}
Now, add the jQuery code to call the above function on click and convert html to doc
jQuery(document).ready(function($) {
$("a.word-export").click(function(event) {
$("#MainHTML").wordExport();
});
});
That's, it, we are ready, here is the Codepen sample
Output is same as above, but in this approach we are using jQuery plugin and also converting image into base64 to get it work.
You may also to read:
Export html table to excel using jQuery / Javascript
How to get user location using Javascript / HTML5 Geolocation?
vikas_jk
Hello, I am not sure how big is your images, but I tried 2.5 mb image and converted it HTML to word using Javascript, which works for me.
Here is the sample fiddle link, which has 2.5 MB image converted into base 64 and it works.
https://jsfiddle.net/7dxe5tm1/
Take a look. If your images are bigger than 5 mb reduce file size while uploading if possible.
Edited at :- 6/17/2020 8:31:50 AM
AleksandraŻełubowska
Thank you for your answer.
I tried for images 5.75MB, when the image have more than 5.5 there is a problem.
vikas_jk
Then you should reduce image file 5.5 MB is already too large , try checking this JS based solution to compress image before upload.
https://github.com/brunobar79/J-I-C
Note: You need to use .jpg as output so it can work properly.
https://stackoverflow.com/a/9949679/3559462
Hope it helps.