Import of Word Documents to ServiceNow Knowledge base

welterp · ‎02-10-2014

I am trying to import Word Documents to ServiceNow Knowledge Articles with out losing any images. I have tried using the Word Cleaner and SED installs without any success. Is there any fix that works?

conmic · ‎09-09-2014

IMPORTANT UPDATE - 03/03/2016:

I updated the entire script as I ran into some errors. And now it can also be used with journal fields!

See my reply: Re: Import of Word Documents to ServiceNow Knowledge base

You can also read more about it here: Create Knowledge Base Article (HTML field) or Comments (Journal field) from Email

you corrected the thrown exception errors on 4 of the lines in the script.

example on your line 18 with the part:

while(match == regex.exec(searchBody)){

the actual script is

while(match = regex.exec(searchBody)){

I know it throws an errors, but that's somehow required for the script to work. Because later you're going to use the value in the variable 'match' that has been set in line 18... If somebody has any idea how to formulate this correctly, you're welcome to help out.

Here is the full script that I use:

var gdt = new GlideDate();

gdt.addDays(2);

//current.valid_to = gdt;

var desc = email.subject;

desc = desc.replace("Knowledge:","");

current.short_description = desc.trim();

current.workflow_state = "draft";

current.topic = "General";

//current.category = "";

current.roles = "knowledge";



//Find and replace the image tags with the proper source.

//Get the number of attachments so the loop can be exited

//so it will stop no mater what.

var currentCount = 0;

var newBody = email.body_html;

var searchBody = email.body_html.replace(/\n/g, " ");



var regex = /<img(.*?)>/ig;

var match;

var match2;

while(match = regex.exec(searchBody)){

   //Add a style float tag next to the align tag.

   var alignText = match[0].replace(/align=['"]?left['"]?/gi, 'align="left" style="FLOAT: left"');

   alignText = alignText.replace(/align=['"]?right['"]?/gi, 'align="right" style="FLOAT: right"');

   searchBody = searchBody.replace(match[0], alignText);

   var regex2 = /src=("(.)*?"|'(.)*?'|(.)*?\s+$)?/ig;

   while(match2 = regex2.exec(alignText)){

   findAndReplaceImage(match2[1].replace(/\s+$/,"").replace(/"+/g,"").replace(/'+/g,""));

   }

   currentCount += 1;

   if(currentCount >= 100)

   break;

}

searchBody = searchBody.replace(/<o:p>(.*?)<\/o:p>/ig, "");

currentCount = 0;

var regex2 = /<!--\[if(.*?)<!\[endif\]-->/ig;

while(match = regex2.exec(searchBody)){

   searchBody = searchBody.replace(match[0], "");

   currentCount += 1;

   if(currentCount >= 100)

   break;

}

currentCount = 0;

var regex2 = /<!\[if !vml\]>(.*?)<!\[endif\]>/ig;

while(match = regex2.exec(searchBody)){

   searchBody = searchBody.replace(match[0], match[1]);

   currentCount += 1;

   if(currentCount >= 100)

   break;

}



//gs.log("Create Morning Post: " + searchBody);



current.text = searchBody;



current.insert();



event.state="stop_processing";



function getEmailSYSID(emailuid) {

   var em = new GlideRecord('sys_email');

   em.addQuery('uid', emailuid);

   em.query();

   while(em.next()) {

   //we execute the return only within a certain time difference between the creation of the attachment and now (in seconds)

   var dif = gs.dateDiff(em.sys_created_on, gs.nowNoTZ(), true);

   //gs.log("difference: " + dif + "eid: " + em.sys_id + " uid: " + em.uid); //debug

   if(dif < 300 && dif > -300){

   //gs.log('passed dif if: ' + em.sys_id + " uid: " + em.uid); //debug

   return em.sys_id;

   }

   }

   return "";

}




function findAndReplaceImage(imageText){

   var img = imageText;

   var imgName = img.substring(4, img.search(/@/i));

   var imgCode = "sys_attachment.do?sys_id=";

   //Get the sys_id of the attachment

   var gr = new GlideRecord("sys_attachment");

   gr.addQuery("file_name", imgName);

   gr.addQuery("table_sys_id", getEmailSYSID(email.uid));

   gr.query();

   if (gr.next()) {

   imgCode += gr.sys_id;

   }

   searchBody = searchBody.replace(img, imgCode);

}

View solution in original post

DrewW · ‎03-03-2016

Nice to see people are keeping up on this code but with the new word doc import in the KB I cannot help but think this no longer needed.

conmic · ‎03-03-2016

Hi Drew,

I agree and I don't. It depends on the situation.

Our users prefer to write an email. We also publish communications and news in the Knowledge Base, therefore an email is way more effective. I am even building a logic that depending to which email address you send the email, it will put it in the according knowledge base.

And as said, this code now also works for Journal fields if you add the processed data between [code][/code] tags.