(JavaScript) Scrub Xml
Demonstrates the Scrub method for some common XML cleaning needs.
Note: This example requires Chilkat v9.5.0.77 or greater.
var success = false;
// The Scrub method has options for trimming whitespace from the ends of attributes and content,
// trimming inside whitespace, and for case conversion for tags and attribute names.
// Trimming inside whitespace is defined as replacing CR, LF, and tab chars with SPACE chars, and
// removing extra SPACE chars so that at most one SPACE separates non-SPACE chars.
// For example, load the following XML:
var s = "<xyz><td class=\" colHoldingPercent col7\" style=\"border-bottom-color: rgb(221, 221, 221); border-image-outset: 0; \"> abc\r\n123 456</td></xyz>";
var xml = new CkXml();
success = xml.LoadXml(s);
console.log(xml.GetXml());
// The XML before scrubbing is:
// <xyz>
// <td class=" colHoldingPercent col7" style="border-bottom-color: rgb(221, 221, 221); border-image-outset: 0; ">abc
// 123 456</td>
// </xyz>
xml.Scrub("AttrTrimEnds,AttrTrimInside,ContentTrimEnds,ContentTrimInside");
console.log(xml.GetXml());
// The XML after scrubbing is:
// <?xml version="1.0" encoding="utf-8"?>
// <xyz>
// <td class="colHoldingPercent col7" style="border-bottom-color: rgb(221, 221, 221); border-image-outset: 0;">abc 123 456</td>
// </xyz>
|