You cannot select more than 25 topics.
			Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
		
		
		
		
		
			
		
			
				
					
					
						
							1566 lines
						
					
					
						
							42 KiB
						
					
					
				
			
		
		
	
	
							1566 lines
						
					
					
						
							42 KiB
						
					
					
				| ;(function (sax) { // wrapper for non-node envs
 | |
// Public entry points: a factory for parsers, the two constructors,
// and the stream factory.
sax.parser = function (strict, opt) {
  return new SAXParser(strict, opt)
}
sax.SAXParser = SAXParser
sax.SAXStream = SAXStream
sax.createStream = createStream
 | |
| 
 | |
// Buffer overrun policy.
// Once the parse position passes MAX_BUFFER_LENGTH the buffers start being
// checked. After each check the next one is scheduled for
// MAX_BUFFER_LENGTH - (length of the longest buffer), which is the earliest
// point at which an overrun could happen; checks are therefore as rare as
// possible while still guaranteeing the bound is never crossed.
// Buffers are tested at most once per write(), so a single huge string
// passed to write() can exceed the limit. That is left to the caller to
// manage; in the extreme case one write() may end up holding one complete
// copy of the string it was given.
// Set to Infinity for unlimited buffers.
sax.MAX_BUFFER_LENGTH = 64 * 1024

// Names of the parser properties that accumulate characters and are
// subject to the length check above.
var buffers = [
  'comment',
  'sgmlDecl',
  'textNode',
  'tagName',
  'doctype',
  'procInstName',
  'procInstBody',
  'entity',
  'attribName',
  'attribValue',
  'cdata',
  'script'
]
 | |
| 
 | |
// Every event name a parser can report. The matching handler property on a
// parser is the name prefixed with "on" (e.g. 'text' -> parser.ontext).
sax.EVENTS = [
  'text', 'processinginstruction', 'sgmldeclaration', 'doctype', 'comment',
  'opentagstart', 'attribute', 'opentag', 'closetag',
  'opencdata', 'cdata', 'closecdata',
  'error', 'end', 'ready',
  'script',
  'opennamespace', 'closenamespace'
]
 | |
| 
 | |
// Parser constructor; works with or without `new`.
//   strict - truthy for strict mode (also forces `noscript` on)
//   opt    - optional settings object; the fields read here are lowercase,
//            lowercasetags, noscript, strictEntities, xmlns and position.
//            Note that the object is stored on the parser and its
//            `lowercase` field is written back.
// Resets every buffer and state field, then fires the 'onready' handler.
function SAXParser (strict, opt) {
  if (!(this instanceof SAXParser)) {
    return new SAXParser(strict, opt)
  }

  var parser = this
  var options = opt || {}

  clearBuffers(parser)
  parser.c = ''
  parser.q = ''
  parser.bufferCheckPosition = sax.MAX_BUFFER_LENGTH

  parser.opt = options
  options.lowercase = options.lowercase || options.lowercasetags
  parser.looseCase = options.lowercase ? 'toLowerCase' : 'toUpperCase'

  parser.tags = []
  parser.sawRoot = false
  parser.closedRoot = false
  parser.closed = false
  parser.error = null
  parser.tag = null

  parser.strict = !!strict
  parser.noscript = !!(strict || options.noscript)
  parser.state = S.BEGIN

  // strictEntities restricts the entity table to the five XML built-ins.
  parser.strictEntities = options.strictEntities
  parser.ENTITIES = Object.create(
    parser.strictEntities ? sax.XML_ENTITIES : sax.ENTITIES
  )
  parser.attribList = []

  // Namespaces form a prototype chain: each tag's `ns` object inherits
  // from its parent's, and the parser's own `ns` inherits from rootNS.
  if (options.xmlns) {
    parser.ns = Object.create(rootNS)
  }

  // Position tracking is on unless explicitly disabled with position: false.
  // It is mostly useful for error reporting.
  parser.trackPosition = options.position !== false
  if (parser.trackPosition) {
    parser.column = 0
    parser.line = 0
    parser.position = 0
  }

  emit(parser, 'onready')
}
 | |
| 
 | |
// Fallback for environments without Object.create: builds an object whose
// prototype is `o`. Only the single-argument form is provided.
if (!Object.create) {
  Object.create = function (o) {
    var F = function () {}
    F.prototype = o
    return new F()
  }
}
 | |
| 
 | |
// Fallback for environments without Object.keys: collects the object's own
// enumerable property names.
if (!Object.keys) {
  Object.keys = function (o) {
    var names = []
    for (var name in o) {
      if (o.hasOwnProperty(name)) {
        names.push(name)
      }
    }
    return names
  }
}
 | |
| 
 | |
// Enforces sax.MAX_BUFFER_LENGTH (with a floor of 10) across all buffers.
// Oversized text, cdata and script buffers are emitted early so they stop
// growing; any other oversized buffer is reported as an error.
// Afterwards the next check is scheduled via parser.bufferCheckPosition.
function checkBufferLength (parser) {
  var limit = Math.max(sax.MAX_BUFFER_LENGTH, 10)
  var longest = 0

  buffers.forEach(function (name) {
    var size = parser[name].length
    if (size > limit) {
      // Text/cdata/script nodes are buffered and can legitimately get big,
      // so hitting the limit for them is normal: flush what we have.
      if (name === 'textNode') {
        closeText(parser)
      } else if (name === 'cdata') {
        emitNode(parser, 'oncdata', parser.cdata)
        parser.cdata = ''
      } else if (name === 'script') {
        emitNode(parser, 'onscript', parser.script)
        parser.script = ''
      } else {
        error(parser, 'Max buffer length exceeded: ' + name)
      }
    }
    // Uses the length measured before any flush above.
    longest = Math.max(longest, size)
  })

  // The earliest position at which some buffer could overrun.
  parser.bufferCheckPosition = sax.MAX_BUFFER_LENGTH - longest + parser.position
}
 | |
| 
 | |
// Resets every accumulation buffer listed in `buffers` to the empty string.
function clearBuffers (parser) {
  buffers.forEach(function (name) {
    parser[name] = ''
  })
}
 | |
| 
 | |
// Emits whatever is pending in the text, cdata and script buffers (in that
// order) and empties them. Empty cdata/script buffers emit nothing.
function flushBuffers (parser) {
  closeText(parser)

  var pending = [
    ['cdata', 'oncdata'],
    ['script', 'onscript']
  ]
  for (var k = 0; k < pending.length; k++) {
    var prop = pending[k][0]
    if (parser[prop] !== '') {
      emitNode(parser, pending[k][1], parser[prop])
      parser[prop] = ''
    }
  }
}
 | |
| 
 | |
// Instance methods shared by all parsers.
SAXParser.prototype = {
  // Finish the document.
  end: function () {
    end(this)
  },

  write: write,

  // Clear a recorded error so that writing can continue; chainable.
  resume: function () {
    this.error = null
    return this
  },

  // Writing null is how the parser is told that input is finished.
  close: function () {
    return this.write(null)
  },

  // Emit any buffered text/cdata/script immediately.
  flush: function () {
    flushBuffers(this)
  }
}
 | |
| 
 | |
// Base class for SAXStream: the 'stream' module's Stream when it can be
// loaded, otherwise an empty stand-in constructor.
var Stream
try {
  Stream = require('stream').Stream
} catch (ex) {
  // `require` is missing or failed to load the module.
  Stream = function () {}
}
 | |
| 
 | |
// Events that SAXStream proxies through `on<event>` accessors. 'error' and
// 'end' are left out because SAXStream installs its own handlers for them.
var streamWraps = sax.EVENTS.filter(function (ev) {
  return !(ev === 'error' || ev === 'end')
})
 | |
| 
 | |
// Factory form of `new SAXStream(strict, opt)`.
function createStream (strict, opt) {
  var stream = new SAXStream(strict, opt)
  return stream
}
 | |
| 
 | |
// Stream wrapper around a SAXParser; works with or without `new`.
// Parser 'end' and 'error' are re-emitted as stream events, and every event
// in `streamWraps` gets an `on<event>` accessor on the stream.
function SAXStream (strict, opt) {
  if (!(this instanceof SAXStream)) {
    return new SAXStream(strict, opt)
  }

  Stream.apply(this)

  var me = this
  me._parser = new SAXParser(strict, opt)
  me.writable = true
  me.readable = true

  me._parser.onend = function () {
    me.emit('end')
  }

  me._parser.onerror = function (er) {
    me.emit('error', er)

    // Reaching this line means emit() did not throw, i.e. the error was
    // handled; clear it so the parser accepts further writes.
    me._parser.error = null
  }

  // Created on demand by write() when binary data arrives.
  me._decoder = null

  streamWraps.forEach(function (ev) {
    var handlerName = 'on' + ev
    Object.defineProperty(me, handlerName, {
      configurable: false,
      enumerable: true,
      // Reading returns whatever handler the parser currently holds.
      get: function () {
        return me._parser[handlerName]
      },
      // A truthy handler is registered as a listener; a falsy value drops
      // all listeners for the event and is stored on the parser.
      set: function (h) {
        if (h) {
          me.on(ev, h)
          return
        }
        me.removeAllListeners(ev)
        me._parser[handlerName] = h
        return h
      }
    })
  })
}
 | |
| 
 | |
// SAXStream inherits from Stream; `constructor` is restored as a
// non-enumerable, read-only property.
SAXStream.prototype = Object.create(Stream.prototype, {
  constructor: {
    value: SAXStream,
    enumerable: false,
    writable: false,
    configurable: false
  }
})
 | |
| 
 | |
// Feeds a chunk to the parser and re-emits it as a 'data' event.
// Buffer chunks are first decoded as UTF-8 through a StringDecoder that is
// created on first use and then reused for later chunks. Always returns true.
SAXStream.prototype.write = function (data) {
  var isBinary = typeof Buffer === 'function' &&
    typeof Buffer.isBuffer === 'function' &&
    Buffer.isBuffer(data)

  if (isBinary) {
    if (!this._decoder) {
      var SD = require('string_decoder').StringDecoder
      this._decoder = new SD('utf8')
    }
    data = this._decoder.write(data)
  }

  var text = data.toString()
  this._parser.write(text)
  this.emit('data', data)
  return true
}
 | |
| 
 | |
// Writes an optional final (non-empty) chunk, then ends the underlying
// parser. Always returns true.
SAXStream.prototype.end = function (chunk) {
  var hasFinalChunk = chunk && chunk.length
  if (hasFinalChunk) {
    this.write(chunk)
  }
  this._parser.end()
  return true
}
 | |
| 
 | |
// Registers a listener. The first time a proxied event (one listed in
// `streamWraps`) is subscribed to while the parser has no handler for it,
// a forwarding handler is installed on the parser that re-emits the event
// on the stream with the same arguments.
SAXStream.prototype.on = function (ev, handler) {
  var me = this
  var handlerName = 'on' + ev

  if (!me._parser[handlerName] && streamWraps.indexOf(ev) !== -1) {
    me._parser[handlerName] = function () {
      // Build [ev, ...arguments] by hand; this also avoids Array's
      // single-numeric-argument behaviour.
      var args = [ev]
      for (var k = 0; k < arguments.length; k++) {
        args.push(arguments[k])
      }
      me.emit.apply(me, args)
    }
  }

  return Stream.prototype.on.call(me, ev, handler)
}
 | |
| 
 | |
// Literal markers and namespace URIs.
var CDATA = '[CDATA['
var DOCTYPE = 'DOCTYPE'
var XML_NAMESPACE = 'http://www.w3.org/XML/1998/namespace'
var XMLNS_NAMESPACE = 'http://www.w3.org/2000/xmlns/'
// Root of the namespace prototype chain: the two predefined prefixes.
var rootNS = { xml: XML_NAMESPACE, xmlns: XMLNS_NAMESPACE }

// Name character classes, after http://www.w3.org/TR/REC-xml/#NT-NameStartChar
// The parser examines strings one UTF-16 code unit at a time, so these
// classes cannot cover astral-plane characters (10000-EFFFF); supporting
// them would need a significant breaking change to the parser.
// Ideally these would be replaced with proper character classes, since XML
// permits a very wide range of letters and digits.
var nameStart = /[:_A-Za-z\u00C0-\u00D6\u00D8-\u00F6\u00F8-\u02FF\u0370-\u037D\u037F-\u1FFF\u200C-\u200D\u2070-\u218F\u2C00-\u2FEF\u3001-\uD7FF\uF900-\uFDCF\uFDF0-\uFFFD]/

// nameStart plus the characters allowed after the first one.
var nameBody = /[:_A-Za-z\u00C0-\u00D6\u00D8-\u00F6\u00F8-\u02FF\u0370-\u037D\u037F-\u1FFF\u200C-\u200D\u2070-\u218F\u2C00-\u2FEF\u3001-\uD7FF\uF900-\uFDCF\uFDF0-\uFFFD\u00B7\u0300-\u036F\u203F-\u2040.\d-]/

// Same two classes with '#' added, for entity references such as &#38;
var entityStart = /[#:_A-Za-z\u00C0-\u00D6\u00D8-\u00F6\u00F8-\u02FF\u0370-\u037D\u037F-\u1FFF\u200C-\u200D\u2070-\u218F\u2C00-\u2FEF\u3001-\uD7FF\uF900-\uFDCF\uFDF0-\uFFFD]/
var entityBody = /[#:_A-Za-z\u00C0-\u00D6\u00D8-\u00F6\u00F8-\u02FF\u0370-\u037D\u037F-\u1FFF\u200C-\u200D\u2070-\u218F\u2C00-\u2FEF\u3001-\uD7FF\uF900-\uFDCF\uFDF0-\uFFFD\u00B7\u0300-\u036F\u203F-\u2040.\d-]/
 | |
| 
 | |
// True for exactly one of: space, line feed, carriage return, tab.
function isWhitespace (c) {
  switch (c) {
    case ' ':
    case '\n':
    case '\r':
    case '\t':
      return true
    default:
      return false
  }
}
 | |
| 
 | |
// True for a single or a double quote character.
function isQuote (c) {
  if (c === '\'') {
    return true
  }
  return c === '"'
}
 | |
| 
 | |
// True when `c` terminates an unquoted attribute value: whitespace or '>'.
function isAttribEnd (c) {
  if (c === '>') {
    return true
  }
  return isWhitespace(c)
}
 | |
| 
 | |
// Tests `c` against `regex`.
function isMatch (regex, c) {
  var matched = regex.test(c)
  return matched
}
 | |
| 
 | |
// Negation of isMatch.
function notMatch (regex, c) {
  return isMatch(regex, c) ? false : true
}
 | |
| 
 | |
// Tokenizer states, numbered consecutively from 0 in declaration order.
// `S` is used here only as the counter. Each comment shows the input
// consumed so far when the parser is in that state.
var S = 0
sax.STATE = {
  BEGIN: S++, // start of input: byte order mark or whitespace may follow
  BEGIN_WHITESPACE: S++, // whitespace before the first tag
  TEXT: S++, // ordinary character data
  TEXT_ENTITY: S++, // an entity reference inside text: &amp and the like
  OPEN_WAKA: S++, // just saw <
  SGML_DECL: S++, // <!BLARG
  SGML_DECL_QUOTED: S++, // <!BLARG foo "bar
  DOCTYPE: S++, // <!DOCTYPE
  DOCTYPE_QUOTED: S++, // <!DOCTYPE "//blah
  DOCTYPE_DTD: S++, // <!DOCTYPE "//blah" [ ...
  DOCTYPE_DTD_QUOTED: S++, // <!DOCTYPE "//blah" [ "foo
  COMMENT_STARTING: S++, // <!-
  COMMENT: S++, // <!--
  COMMENT_ENDING: S++, // <!-- blah -
  COMMENT_ENDED: S++, // <!-- blah --
  CDATA: S++, // <![CDATA[ something
  CDATA_ENDING: S++, // ]
  CDATA_ENDING_2: S++, // ]]
  PROC_INST: S++, // <?hi
  PROC_INST_BODY: S++, // <?hi there
  PROC_INST_ENDING: S++, // <?hi "there" ?
  OPEN_TAG: S++, // <strong
  OPEN_TAG_SLASH: S++, // <strong /
  ATTRIB: S++, // <a
  ATTRIB_NAME: S++, // <a foo
  ATTRIB_NAME_SAW_WHITE: S++, // <a foo _
  ATTRIB_VALUE: S++, // <a foo=
  ATTRIB_VALUE_QUOTED: S++, // <a foo="bar
  ATTRIB_VALUE_CLOSED: S++, // <a foo="bar"
  ATTRIB_VALUE_UNQUOTED: S++, // <a foo=bar
  ATTRIB_VALUE_ENTITY_Q: S++, // <foo bar="&quot;"
  ATTRIB_VALUE_ENTITY_U: S++, // <foo bar=&quot
  CLOSE_TAG: S++, // </a
  CLOSE_TAG_SAW_WHITE: S++, // </a   >
  SCRIPT: S++, // <script> ...
  SCRIPT_ENDING: S++ // <script> ... <
}
 | |
| 
 | |
// The five predefined XML entities; the only named entities available to
// parsers created with the strictEntities option.
sax.XML_ENTITIES = {
  'amp': '&', 'gt': '>', 'lt': '<',
  'quot': '"', 'apos': "'"
}
 | |
| 
 | |
// Named entities recognised outside strictEntities mode. Values are listed
// either as the replacement string or as a numeric character code; the
// loop below the table converts every numeric code into its character.
sax.ENTITIES = {
  // XML built-ins
  'amp': '&', 'gt': '>', 'lt': '<', 'quot': '"', 'apos': "'",

  // Latin-1 capital letters
  'AElig': 198, 'Aacute': 193, 'Acirc': 194, 'Agrave': 192, 'Aring': 197,
  'Atilde': 195, 'Auml': 196, 'Ccedil': 199, 'ETH': 208, 'Eacute': 201,
  'Ecirc': 202, 'Egrave': 200, 'Euml': 203, 'Iacute': 205, 'Icirc': 206,
  'Igrave': 204, 'Iuml': 207, 'Ntilde': 209, 'Oacute': 211, 'Ocirc': 212,
  'Ograve': 210, 'Oslash': 216, 'Otilde': 213, 'Ouml': 214, 'THORN': 222,
  'Uacute': 218, 'Ucirc': 219, 'Ugrave': 217, 'Uuml': 220, 'Yacute': 221,

  // Latin-1 small letters
  'aacute': 225, 'acirc': 226, 'aelig': 230, 'agrave': 224, 'aring': 229,
  'atilde': 227, 'auml': 228, 'ccedil': 231, 'eacute': 233, 'ecirc': 234,
  'egrave': 232, 'eth': 240, 'euml': 235, 'iacute': 237, 'icirc': 238,
  'igrave': 236, 'iuml': 239, 'ntilde': 241, 'oacute': 243, 'ocirc': 244,
  'ograve': 242, 'oslash': 248, 'otilde': 245, 'ouml': 246, 'szlig': 223,
  'thorn': 254, 'uacute': 250, 'ucirc': 251, 'ugrave': 249, 'uuml': 252,
  'yacute': 253, 'yuml': 255,

  // Latin-1 symbols and punctuation
  'copy': 169, 'reg': 174, 'nbsp': 160, 'iexcl': 161, 'cent': 162,
  'pound': 163, 'curren': 164, 'yen': 165, 'brvbar': 166, 'sect': 167,
  'uml': 168, 'ordf': 170, 'laquo': 171, 'not': 172, 'shy': 173,
  'macr': 175, 'deg': 176, 'plusmn': 177, 'sup1': 185, 'sup2': 178,
  'sup3': 179, 'acute': 180, 'micro': 181, 'para': 182, 'middot': 183,
  'cedil': 184, 'ordm': 186, 'raquo': 187, 'frac14': 188, 'frac12': 189,
  'frac34': 190, 'iquest': 191, 'times': 215, 'divide': 247,

  // Extended Latin letters and spacing modifiers
  'OElig': 338, 'oelig': 339, 'Scaron': 352, 'scaron': 353, 'Yuml': 376,
  'fnof': 402, 'circ': 710, 'tilde': 732,

  // Greek capital letters
  'Alpha': 913, 'Beta': 914, 'Gamma': 915, 'Delta': 916, 'Epsilon': 917,
  'Zeta': 918, 'Eta': 919, 'Theta': 920, 'Iota': 921, 'Kappa': 922,
  'Lambda': 923, 'Mu': 924, 'Nu': 925, 'Xi': 926, 'Omicron': 927,
  'Pi': 928, 'Rho': 929, 'Sigma': 931, 'Tau': 932, 'Upsilon': 933,
  'Phi': 934, 'Chi': 935, 'Psi': 936, 'Omega': 937,

  // Greek small letters and variant forms
  'alpha': 945, 'beta': 946, 'gamma': 947, 'delta': 948, 'epsilon': 949,
  'zeta': 950, 'eta': 951, 'theta': 952, 'iota': 953, 'kappa': 954,
  'lambda': 955, 'mu': 956, 'nu': 957, 'xi': 958, 'omicron': 959,
  'pi': 960, 'rho': 961, 'sigmaf': 962, 'sigma': 963, 'tau': 964,
  'upsilon': 965, 'phi': 966, 'chi': 967, 'psi': 968, 'omega': 969,
  'thetasym': 977, 'upsih': 978, 'piv': 982,

  // Spaces, directional marks, dashes, quotes and other punctuation
  'ensp': 8194, 'emsp': 8195, 'thinsp': 8201, 'zwnj': 8204, 'zwj': 8205,
  'lrm': 8206, 'rlm': 8207, 'ndash': 8211, 'mdash': 8212, 'lsquo': 8216,
  'rsquo': 8217, 'sbquo': 8218, 'ldquo': 8220, 'rdquo': 8221, 'bdquo': 8222,
  'dagger': 8224, 'Dagger': 8225, 'bull': 8226, 'hellip': 8230,
  'permil': 8240, 'prime': 8242, 'Prime': 8243, 'lsaquo': 8249,
  'rsaquo': 8250, 'oline': 8254, 'frasl': 8260,

  // Currency and letter-like symbols
  'euro': 8364, 'image': 8465, 'weierp': 8472, 'real': 8476, 'trade': 8482,
  'alefsym': 8501,

  // Arrows
  'larr': 8592, 'uarr': 8593, 'rarr': 8594, 'darr': 8595, 'harr': 8596,
  'crarr': 8629, 'lArr': 8656, 'uArr': 8657, 'rArr': 8658, 'dArr': 8659,
  'hArr': 8660,

  // Mathematical operators
  'forall': 8704, 'part': 8706, 'exist': 8707, 'empty': 8709, 'nabla': 8711,
  'isin': 8712, 'notin': 8713, 'ni': 8715, 'prod': 8719, 'sum': 8721,
  'minus': 8722, 'lowast': 8727, 'radic': 8730, 'prop': 8733, 'infin': 8734,
  'ang': 8736, 'and': 8743, 'or': 8744, 'cap': 8745, 'cup': 8746,
  'int': 8747, 'there4': 8756, 'sim': 8764, 'cong': 8773, 'asymp': 8776,
  'ne': 8800, 'equiv': 8801, 'le': 8804, 'ge': 8805, 'sub': 8834,
  'sup': 8835, 'nsub': 8836, 'sube': 8838, 'supe': 8839, 'oplus': 8853,
  'otimes': 8855, 'perp': 8869, 'sdot': 8901,

  // Brackets, shapes and card suits
  'lceil': 8968, 'rceil': 8969, 'lfloor': 8970, 'rfloor': 8971,
  'lang': 9001, 'rang': 9002, 'loz': 9674, 'spades': 9824, 'clubs': 9827,
  'hearts': 9829, 'diams': 9830
}

// Replace each numeric code in the table with the character it denotes;
// entries that are already strings are stored back unchanged.
Object.keys(sax.ENTITIES).forEach(function (name) {
  var value = sax.ENTITIES[name]
  if (typeof value === 'number') {
    value = String.fromCharCode(value)
  }
  sax.ENTITIES[name] = value
})
 | |
| 
 | |
// Make the state table two-way: besides NAME -> number, also store
// number -> NAME so a numeric state can be turned back into its name.
for (var s in sax.STATE) {
  sax.STATE[sax.STATE[s]] = s
}

// From here on `S` is a shorthand for the state table rather than a counter.
S = sax.STATE
 | |
| 
 | |
// Calls the handler stored under `event` on the parser (e.g. 'ontext') with
// `data`, if such a handler is set.
function emit (parser, event, data) {
  if (parser[event]) {
    parser[event](data)
  }
}
 | |
| 
 | |
// Emits a node event, first flushing any pending text so that the text
// event is delivered ahead of the node that follows it.
function emitNode (parser, nodeType, data) {
  if (parser.textNode) {
    closeText(parser)
  }
  emit(parser, nodeType, data)
}
 | |
| 
 | |
// Applies the trim/normalize options to the buffered text, emits it as an
// 'ontext' event when anything is left, and empties the text buffer.
function closeText (parser) {
  var text = textopts(parser.opt, parser.textNode)
  // Store the processed text before emitting so handlers see it too.
  parser.textNode = text
  if (text) {
    emit(parser, 'ontext', parser.textNode)
  }
  parser.textNode = ''
}
 | |
| 
 | |
// Post-processes text according to the options: `trim` strips leading and
// trailing whitespace, `normalize` collapses each whitespace run into one
// space. Trimming is applied before normalizing.
function textopts (opt, text) {
  var result = text
  if (opt.trim) {
    result = result.trim()
  }
  if (opt.normalize) {
    result = result.replace(/\s+/g, ' ')
  }
  return result
}
 | |
| 
 | |
// Records and reports a parse error. Pending text is flushed first; when
// position tracking is on, the line, column and current character are
// appended to the message. The resulting Error is stored on parser.error
// and passed to the 'onerror' handler. Returns the parser.
function error (parser, er) {
  closeText(parser)

  var message = er
  if (parser.trackPosition) {
    message += '\nLine: ' + parser.line +
      '\nColumn: ' + parser.column +
      '\nChar: ' + parser.c
  }

  var failure = new Error(message)
  parser.error = failure
  emit(parser, 'onerror', failure)
  return parser
}
 | |
| 
 | |
// Finishes the document: reports an unclosed root (strict mode only) and an
// unexpected end when input stops in the middle of a construct, flushes
// text, fires 'onend', and then re-runs the constructor on the same object
// so the parser is reset. Returns the parser.
function end (parser) {
  if (parser.sawRoot && !parser.closedRoot) {
    strictFail(parser, 'Unclosed root tag')
  }

  // Only these three states are valid places for the input to stop.
  var state = parser.state
  var atRest = state === S.BEGIN ||
    state === S.BEGIN_WHITESPACE ||
    state === S.TEXT
  if (!atRest) {
    error(parser, 'Unexpected end')
  }

  closeText(parser)
  parser.c = ''
  parser.closed = true
  emit(parser, 'onend')

  // Re-initialise in place, keeping the same strictness and options.
  SAXParser.call(parser, parser.strict, parser.opt)
  return parser
}
 | |
| 
 | |
// Reports `message` as an error only when the parser is in strict mode;
// in loose mode the problem is silently tolerated.
// Throws if the first argument is not a SAXParser instance.
function strictFail (parser, message) {
  var isParser = typeof parser === 'object' && parser instanceof SAXParser
  if (!isParser) {
    throw new Error('bad call to strictFail')
  }
  if (!parser.strict) {
    return
  }
  error(parser, message)
}
 | |
| 
 | |
// Starts a new tag record from the buffered tag name (case-folded in loose
// mode), clears the deferred attribute list and fires 'onopentagstart'.
function newTag (parser) {
  if (!parser.strict) {
    parser.tagName = parser.tagName[parser.looseCase]()
  }

  var openTags = parser.tags
  var parent = openTags[openTags.length - 1] || parser
  var tag = { name: parser.tagName, attributes: {} }
  parser.tag = tag

  // Inherit the parent's namespace scope; this is replaced if the tag
  // contains an xmlns="foo" or xmlns:foo="bar" attribute.
  if (parser.opt.xmlns) {
    tag.ns = parent.ns
  }

  parser.attribList.length = 0
  emitNode(parser, 'onopentagstart', tag)
}
 | |
| 
 | |
// Splits a qualified name into { prefix, local }. A name without a colon
// has an empty prefix. For attributes, the bare name `xmlns` (as in
// <x xmlns="http://foo">) is reported as prefix 'xmlns' with an empty local
// part.
function qname (name, attribute) {
  var parts = name.indexOf(':') < 0 ? [ '', name ] : name.split(':')

  if (attribute && name === 'xmlns') {
    return { prefix: 'xmlns', local: '' }
  }

  return { prefix: parts[0], local: parts[1] }
}
 | |
| 
 | |
// Finalises the attribute currently held in parser.attribName /
// parser.attribValue and resets both buffers.
//
// - In loose mode the name is case-folded first.
// - A repeated attribute name on the same tag is dropped; the first
//   occurrence wins.
// - Without the xmlns option the attribute is stored on the tag and
//   'onattribute' fires immediately.
// - With the xmlns option, xmlns / xmlns:prefix attributes update the tag's
//   namespace scope, and the attribute is queued on parser.attribList so
//   its event can be emitted once all bindings of the tag are known.
//
// Fixes over the previous version:
// - Duplicate detection in xmlns mode now works. The queue holds
//   [name, value] pairs, so searching it for the bare name could never
//   match and duplicates were emitted twice.
// - The own-property test no longer calls a method looked up on the
//   attributes object itself, which threw once an attribute literally
//   named "hasOwnProperty" had been stored.
function attrib (parser) {
  if (!parser.strict) {
    parser.attribName = parser.attribName[parser.looseCase]()
  }

  var name = parser.attribName
  var isDuplicate =
    Object.prototype.hasOwnProperty.call(parser.tag.attributes, name)
  for (var k = 0; !isDuplicate && k < parser.attribList.length; k++) {
    isDuplicate = parser.attribList[k][0] === name
  }

  if (isDuplicate) {
    parser.attribName = parser.attribValue = ''
    return
  }

  if (parser.opt.xmlns) {
    var qn = qname(parser.attribName, true)
    var prefix = qn.prefix
    var local = qn.local

    if (prefix === 'xmlns') {
      // namespace binding attribute. push the binding into scope
      if (local === 'xml' && parser.attribValue !== XML_NAMESPACE) {
        strictFail(parser,
          'xml: prefix must be bound to ' + XML_NAMESPACE + '\n' +
          'Actual: ' + parser.attribValue)
      } else if (local === 'xmlns' && parser.attribValue !== XMLNS_NAMESPACE) {
        strictFail(parser,
          'xmlns: prefix must be bound to ' + XMLNS_NAMESPACE + '\n' +
          'Actual: ' + parser.attribValue)
      } else {
        var tag = parser.tag
        var parent = parser.tags[parser.tags.length - 1] || parser
        // Still sharing the parent's scope object: fork a child scope so
        // the new binding does not leak into the parent.
        if (tag.ns === parent.ns) {
          tag.ns = Object.create(parent.ns)
        }
        tag.ns[local] = parser.attribValue
      }
    }

    // defer onattribute events until all attributes have been seen
    // so any new bindings can take effect. preserve attribute order
    // so deferred events can be emitted in document order
    parser.attribList.push([parser.attribName, parser.attribValue])
  } else {
    // in non-xmlns mode, we can emit the event right away
    parser.tag.attributes[parser.attribName] = parser.attribValue
    emitNode(parser, 'onattribute', {
      name: parser.attribName,
      value: parser.attribValue
    })
  }

  parser.attribName = parser.attribValue = ''
}
 | |
| 
 | |
// Completes the tag being opened: resolves namespaces and emits the
// deferred attribute events (xmlns mode only), pushes the tag on the stack
// and fires 'onopentag'. Unless the tag is self-closing, the parser then
// moves on to TEXT (or SCRIPT for <script> when script handling is enabled).
function openTag (parser, selfClosing) {
  if (parser.opt.xmlns) {
    var tag = parser.tag

    // Namespace information for the element itself.
    var tagQName = qname(parser.tagName)
    tag.prefix = tagQName.prefix
    tag.local = tagQName.local
    tag.uri = tag.ns[tagQName.prefix] || ''

    if (tag.prefix && !tag.uri) {
      strictFail(parser, 'Unbound namespace prefix: ' +
        JSON.stringify(parser.tagName))
      tag.uri = tagQName.prefix
    }

    // The tag has its own scope object only if it declared bindings;
    // announce each of them.
    var parent = parser.tags[parser.tags.length - 1] || parser
    if (tag.ns && parent.ns !== tag.ns) {
      Object.keys(tag.ns).forEach(function (p) {
        emitNode(parser, 'onopennamespace', {
          prefix: p,
          uri: tag.ns[p]
        })
      })
    }

    // Emit the attribute events queued by attrib(), in document order.
    // The default namespace is deliberately not applied to attributes:
    //   http://www.w3.org/TR/REC-xml-names/#defaulting
    for (var i = 0, l = parser.attribList.length; i < l; i++) {
      var pair = parser.attribList[i]
      var name = pair[0]
      var value = pair[1]
      var attrQName = qname(name, true)
      var prefix = attrQName.prefix
      var local = attrQName.local
      var uri = prefix === '' ? '' : (tag.ns[prefix] || '')
      var a = {
        name: name,
        value: value,
        prefix: prefix,
        local: local,
        uri: uri
      }

      // A prefixed attribute whose prefix has no binding is a strict-mode
      // failure; fall back to using the prefix as the uri.
      if (prefix && prefix !== 'xmlns' && !uri) {
        strictFail(parser, 'Unbound namespace prefix: ' +
          JSON.stringify(prefix))
        a.uri = prefix
      }
      parser.tag.attributes[name] = a
      emitNode(parser, 'onattribute', a)
    }
    parser.attribList.length = 0
  }

  parser.tag.isSelfClosing = !!selfClosing

  // The tag is now officially open.
  parser.sawRoot = true
  parser.tags.push(parser.tag)
  emitNode(parser, 'onopentag', parser.tag)

  if (!selfClosing) {
    // <script> content gets its own state unless noscript is set
    // (noscript is always set in strict mode).
    var isScript = !parser.noscript &&
      parser.tagName.toLowerCase() === 'script'
    parser.state = isScript ? S.SCRIPT : S.TEXT
    parser.tag = null
    parser.tagName = ''
  }

  parser.attribName = parser.attribValue = ''
  parser.attribList.length = 0
}
 | |
| 
 | |
// Handles a complete closing tag whose name is in parser.tagName.
//
// - An empty name (</>) is a strict failure and is kept as literal text.
// - While script content is buffered, any closing tag other than `script`
//   is appended to the script text; the matching one emits 'onscript'.
// - Otherwise the open-tag stack is searched from the top for the name.
//   Every tag above the match is closed as well (each mismatch is a strict
//   failure). If nothing matches, the closing tag is kept as text.
// - For each tag closed, 'onclosetag' fires, followed (xmlns mode) by
//   'onclosenamespace' for every binding that tag introduced.
//
// Change from the previous version: the loop no longer copies tag.ns into
// a scratch object that was never read.
function closeTag (parser) {
  if (!parser.tagName) {
    strictFail(parser, 'Weird empty close tag.')
    parser.textNode += '</>'
    parser.state = S.TEXT
    return
  }

  if (parser.script) {
    if (parser.tagName !== 'script') {
      parser.script += '</' + parser.tagName + '>'
      parser.tagName = ''
      parser.state = S.SCRIPT
      return
    }
    emitNode(parser, 'onscript', parser.script)
    parser.script = ''
  }

  // first make sure that the closing tag actually exists.
  // <a><b></c></b></a> will close everything, otherwise.
  var t = parser.tags.length
  var tagName = parser.tagName
  if (!parser.strict) {
    tagName = tagName[parser.looseCase]()
  }
  var closeTo = tagName
  while (t--) {
    var close = parser.tags[t]
    if (close.name !== closeTo) {
      // fail the first time in strict mode
      strictFail(parser, 'Unexpected close tag')
    } else {
      break
    }
  }

  // didn't find it.  we already failed for strict, so just abort.
  if (t < 0) {
    strictFail(parser, 'Unmatched closing tag: ' + parser.tagName)
    parser.textNode += '</' + parser.tagName + '>'
    parser.state = S.TEXT
    return
  }
  parser.tagName = tagName

  // Pop and close everything from the top of the stack down to index t.
  var s = parser.tags.length
  while (s-- > t) {
    var tag = parser.tag = parser.tags.pop()
    parser.tagName = parser.tag.name
    emitNode(parser, 'onclosetag', parser.tagName)

    var parent = parser.tags[parser.tags.length - 1] || parser
    if (parser.opt.xmlns && tag.ns !== parent.ns) {
      // remove namespace bindings introduced by tag
      Object.keys(tag.ns).forEach(function (p) {
        var n = tag.ns[p]
        emitNode(parser, 'onclosenamespace', { prefix: p, uri: n })
      })
    }
  }

  // Index 0 is the root element.
  if (t === 0) parser.closedRoot = true
  parser.tagName = parser.attribValue = parser.attribName = ''
  parser.attribList.length = 0
  parser.state = S.TEXT
}
 | |
| 
 | |
// Resolves the entity name buffered in parser.entity (without the leading
// '&' and trailing ';') to its replacement text.
//
// - Named entities are looked up in parser.ENTITIES, first as written and
//   then lower-cased.
// - "#123" and "#x7B" are decimal and hexadecimal character references.
// - Anything else is a strict-mode failure and is returned as the literal
//   text "&name;".
//
// Fixes over the previous version:
// - Numeric references outside 0..0x10FFFF (e.g. "&#x110000;", "&#-5;") are
//   reported as invalid instead of making String.fromCodePoint throw a
//   RangeError.
// - Only string or number table values count as named entities, so members
//   inherited from Object.prototype (e.g. "&constructor;") are no longer
//   returned as replacement text.
function parseEntity (parser) {
  var entity = parser.entity
  var entityLC = entity.toLowerCase()
  var num
  var numStr = ''

  // Truthy string/number value for `name`, or undefined.
  function lookup (name) {
    var value = parser.ENTITIES[name]
    var kind = typeof value
    return value && (kind === 'string' || kind === 'number') ? value : undefined
  }

  var named = lookup(entity) || lookup(entityLC)
  if (named) {
    return named
  }

  entity = entityLC
  if (entity.charAt(0) === '#') {
    if (entity.charAt(1) === 'x') {
      entity = entity.slice(2)
      num = parseInt(entity, 16)
      numStr = num.toString(16)
    } else {
      entity = entity.slice(1)
      num = parseInt(entity, 10)
      numStr = num.toString(10)
    }
  }

  // Leading zeros are allowed; after removing them the digits must
  // round-trip exactly, which rejects trailing garbage such as "#12ab".
  entity = entity.replace(/^0+/, '')
  if (isNaN(num) ||
    numStr.toLowerCase() !== entity ||
    num < 0 ||
    num > 0x10FFFF) {
    strictFail(parser, 'Invalid character entity')
    return '&' + parser.entity + ';'
  }

  return String.fromCodePoint(num)
}
 | |
| 
 | |
|   function beginWhiteSpace (parser, c) {
 | |
|     if (c === '<') {
 | |
|       parser.state = S.OPEN_WAKA
 | |
|       parser.startTagPosition = parser.position
 | |
|     } else if (!isWhitespace(c)) {
 | |
|       // have to process this as a text node.
 | |
|       // weird, but happens.
 | |
|       strictFail(parser, 'Non-whitespace before first tag.')
 | |
|       parser.textNode = c
 | |
|       parser.state = S.TEXT
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   function charAt (chunk, i) {
 | |
|     var result = ''
 | |
|     if (i < chunk.length) {
 | |
|       result = chunk.charAt(i)
 | |
|     }
 | |
|     return result
 | |
|   }
 | |
| 
 | |
|   function write (chunk) {
 | |
|     var parser = this
 | |
|     if (this.error) {
 | |
|       throw this.error
 | |
|     }
 | |
|     if (parser.closed) {
 | |
|       return error(parser,
 | |
|         'Cannot write after close. Assign an onready handler.')
 | |
|     }
 | |
|     if (chunk === null) {
 | |
|       return end(parser)
 | |
|     }
 | |
|     if (typeof chunk === 'object') {
 | |
|       chunk = chunk.toString()
 | |
|     }
 | |
|     var i = 0
 | |
|     var c = ''
 | |
|     while (true) {
 | |
|       c = charAt(chunk, i++)
 | |
|       parser.c = c
 | |
| 
 | |
|       if (!c) {
 | |
|         break
 | |
|       }
 | |
| 
 | |
|       if (parser.trackPosition) {
 | |
|         parser.position++
 | |
|         if (c === '\n') {
 | |
|           parser.line++
 | |
|           parser.column = 0
 | |
|         } else {
 | |
|           parser.column++
 | |
|         }
 | |
|       }
 | |
| 
 | |
|       switch (parser.state) {
 | |
|         case S.BEGIN:
 | |
|           parser.state = S.BEGIN_WHITESPACE
 | |
|           if (c === '\uFEFF') {
 | |
|             continue
 | |
|           }
 | |
|           beginWhiteSpace(parser, c)
 | |
|           continue
 | |
| 
 | |
|         case S.BEGIN_WHITESPACE:
 | |
|           beginWhiteSpace(parser, c)
 | |
|           continue
 | |
| 
 | |
|         case S.TEXT:
 | |
|           if (parser.sawRoot && !parser.closedRoot) {
 | |
|             var starti = i - 1
 | |
|             while (c && c !== '<' && c !== '&') {
 | |
|               c = charAt(chunk, i++)
 | |
|               if (c && parser.trackPosition) {
 | |
|                 parser.position++
 | |
|                 if (c === '\n') {
 | |
|                   parser.line++
 | |
|                   parser.column = 0
 | |
|                 } else {
 | |
|                   parser.column++
 | |
|                 }
 | |
|               }
 | |
|             }
 | |
|             parser.textNode += chunk.substring(starti, i - 1)
 | |
|           }
 | |
|           if (c === '<' && !(parser.sawRoot && parser.closedRoot && !parser.strict)) {
 | |
|             parser.state = S.OPEN_WAKA
 | |
|             parser.startTagPosition = parser.position
 | |
|           } else {
 | |
|             if (!isWhitespace(c) && (!parser.sawRoot || parser.closedRoot)) {
 | |
|               strictFail(parser, 'Text data outside of root node.')
 | |
|             }
 | |
|             if (c === '&') {
 | |
|               parser.state = S.TEXT_ENTITY
 | |
|             } else {
 | |
|               parser.textNode += c
 | |
|             }
 | |
|           }
 | |
|           continue
 | |
| 
 | |
|         case S.SCRIPT:
 | |
|           // only non-strict
 | |
|           if (c === '<') {
 | |
|             parser.state = S.SCRIPT_ENDING
 | |
|           } else {
 | |
|             parser.script += c
 | |
|           }
 | |
|           continue
 | |
| 
 | |
|         case S.SCRIPT_ENDING:
 | |
|           if (c === '/') {
 | |
|             parser.state = S.CLOSE_TAG
 | |
|           } else {
 | |
|             parser.script += '<' + c
 | |
|             parser.state = S.SCRIPT
 | |
|           }
 | |
|           continue
 | |
| 
 | |
|         case S.OPEN_WAKA:
 | |
|           // either a /, ?, !, or text is coming next.
 | |
|           if (c === '!') {
 | |
|             parser.state = S.SGML_DECL
 | |
|             parser.sgmlDecl = ''
 | |
|           } else if (isWhitespace(c)) {
 | |
|             // wait for it...
 | |
|           } else if (isMatch(nameStart, c)) {
 | |
|             parser.state = S.OPEN_TAG
 | |
|             parser.tagName = c
 | |
|           } else if (c === '/') {
 | |
|             parser.state = S.CLOSE_TAG
 | |
|             parser.tagName = ''
 | |
|           } else if (c === '?') {
 | |
|             parser.state = S.PROC_INST
 | |
|             parser.procInstName = parser.procInstBody = ''
 | |
|           } else {
 | |
|             strictFail(parser, 'Unencoded <')
 | |
|             // if there was some whitespace, then add that in.
 | |
|             if (parser.startTagPosition + 1 < parser.position) {
 | |
|               var pad = parser.position - parser.startTagPosition
 | |
|               c = new Array(pad).join(' ') + c
 | |
|             }
 | |
|             parser.textNode += '<' + c
 | |
|             parser.state = S.TEXT
 | |
|           }
 | |
|           continue
 | |
| 
 | |
|         case S.SGML_DECL:
 | |
|           if ((parser.sgmlDecl + c).toUpperCase() === CDATA) {
 | |
|             emitNode(parser, 'onopencdata')
 | |
|             parser.state = S.CDATA
 | |
|             parser.sgmlDecl = ''
 | |
|             parser.cdata = ''
 | |
|           } else if (parser.sgmlDecl + c === '--') {
 | |
|             parser.state = S.COMMENT
 | |
|             parser.comment = ''
 | |
|             parser.sgmlDecl = ''
 | |
|           } else if ((parser.sgmlDecl + c).toUpperCase() === DOCTYPE) {
 | |
|             parser.state = S.DOCTYPE
 | |
|             if (parser.doctype || parser.sawRoot) {
 | |
|               strictFail(parser,
 | |
|                 'Inappropriately located doctype declaration')
 | |
|             }
 | |
|             parser.doctype = ''
 | |
|             parser.sgmlDecl = ''
 | |
|           } else if (c === '>') {
 | |
|             emitNode(parser, 'onsgmldeclaration', parser.sgmlDecl)
 | |
|             parser.sgmlDecl = ''
 | |
|             parser.state = S.TEXT
 | |
|           } else if (isQuote(c)) {
 | |
|             parser.state = S.SGML_DECL_QUOTED
 | |
|             parser.sgmlDecl += c
 | |
|           } else {
 | |
|             parser.sgmlDecl += c
 | |
|           }
 | |
|           continue
 | |
| 
 | |
|         case S.SGML_DECL_QUOTED:
 | |
|           if (c === parser.q) {
 | |
|             parser.state = S.SGML_DECL
 | |
|             parser.q = ''
 | |
|           }
 | |
|           parser.sgmlDecl += c
 | |
|           continue
 | |
| 
 | |
|         case S.DOCTYPE:
 | |
|           if (c === '>') {
 | |
|             parser.state = S.TEXT
 | |
|             emitNode(parser, 'ondoctype', parser.doctype)
 | |
|             parser.doctype = true // just remember that we saw it.
 | |
|           } else {
 | |
|             parser.doctype += c
 | |
|             if (c === '[') {
 | |
|               parser.state = S.DOCTYPE_DTD
 | |
|             } else if (isQuote(c)) {
 | |
|               parser.state = S.DOCTYPE_QUOTED
 | |
|               parser.q = c
 | |
|             }
 | |
|           }
 | |
|           continue
 | |
| 
 | |
|         case S.DOCTYPE_QUOTED:
 | |
|           parser.doctype += c
 | |
|           if (c === parser.q) {
 | |
|             parser.q = ''
 | |
|             parser.state = S.DOCTYPE
 | |
|           }
 | |
|           continue
 | |
| 
 | |
|         case S.DOCTYPE_DTD:
 | |
|           parser.doctype += c
 | |
|           if (c === ']') {
 | |
|             parser.state = S.DOCTYPE
 | |
|           } else if (isQuote(c)) {
 | |
|             parser.state = S.DOCTYPE_DTD_QUOTED
 | |
|             parser.q = c
 | |
|           }
 | |
|           continue
 | |
| 
 | |
|         case S.DOCTYPE_DTD_QUOTED:
 | |
|           parser.doctype += c
 | |
|           if (c === parser.q) {
 | |
|             parser.state = S.DOCTYPE_DTD
 | |
|             parser.q = ''
 | |
|           }
 | |
|           continue
 | |
| 
 | |
|         case S.COMMENT:
 | |
|           if (c === '-') {
 | |
|             parser.state = S.COMMENT_ENDING
 | |
|           } else {
 | |
|             parser.comment += c
 | |
|           }
 | |
|           continue
 | |
| 
 | |
|         case S.COMMENT_ENDING:
 | |
|           if (c === '-') {
 | |
|             parser.state = S.COMMENT_ENDED
 | |
|             parser.comment = textopts(parser.opt, parser.comment)
 | |
|             if (parser.comment) {
 | |
|               emitNode(parser, 'oncomment', parser.comment)
 | |
|             }
 | |
|             parser.comment = ''
 | |
|           } else {
 | |
|             parser.comment += '-' + c
 | |
|             parser.state = S.COMMENT
 | |
|           }
 | |
|           continue
 | |
| 
 | |
|         case S.COMMENT_ENDED:
 | |
|           if (c !== '>') {
 | |
|             strictFail(parser, 'Malformed comment')
 | |
|             // allow <!-- blah -- bloo --> in non-strict mode,
 | |
|             // which is a comment of " blah -- bloo "
 | |
|             parser.comment += '--' + c
 | |
|             parser.state = S.COMMENT
 | |
|           } else {
 | |
|             parser.state = S.TEXT
 | |
|           }
 | |
|           continue
 | |
| 
 | |
|         case S.CDATA:
 | |
|           if (c === ']') {
 | |
|             parser.state = S.CDATA_ENDING
 | |
|           } else {
 | |
|             parser.cdata += c
 | |
|           }
 | |
|           continue
 | |
| 
 | |
|         case S.CDATA_ENDING:
 | |
|           if (c === ']') {
 | |
|             parser.state = S.CDATA_ENDING_2
 | |
|           } else {
 | |
|             parser.cdata += ']' + c
 | |
|             parser.state = S.CDATA
 | |
|           }
 | |
|           continue
 | |
| 
 | |
|         case S.CDATA_ENDING_2:
 | |
|           if (c === '>') {
 | |
|             if (parser.cdata) {
 | |
|               emitNode(parser, 'oncdata', parser.cdata)
 | |
|             }
 | |
|             emitNode(parser, 'onclosecdata')
 | |
|             parser.cdata = ''
 | |
|             parser.state = S.TEXT
 | |
|           } else if (c === ']') {
 | |
|             parser.cdata += ']'
 | |
|           } else {
 | |
|             parser.cdata += ']]' + c
 | |
|             parser.state = S.CDATA
 | |
|           }
 | |
|           continue
 | |
| 
 | |
|         case S.PROC_INST:
 | |
|           if (c === '?') {
 | |
|             parser.state = S.PROC_INST_ENDING
 | |
|           } else if (isWhitespace(c)) {
 | |
|             parser.state = S.PROC_INST_BODY
 | |
|           } else {
 | |
|             parser.procInstName += c
 | |
|           }
 | |
|           continue
 | |
| 
 | |
|         case S.PROC_INST_BODY:
 | |
|           if (!parser.procInstBody && isWhitespace(c)) {
 | |
|             continue
 | |
|           } else if (c === '?') {
 | |
|             parser.state = S.PROC_INST_ENDING
 | |
|           } else {
 | |
|             parser.procInstBody += c
 | |
|           }
 | |
|           continue
 | |
| 
 | |
|         case S.PROC_INST_ENDING:
 | |
|           if (c === '>') {
 | |
|             emitNode(parser, 'onprocessinginstruction', {
 | |
|               name: parser.procInstName,
 | |
|               body: parser.procInstBody
 | |
|             })
 | |
|             parser.procInstName = parser.procInstBody = ''
 | |
|             parser.state = S.TEXT
 | |
|           } else {
 | |
|             parser.procInstBody += '?' + c
 | |
|             parser.state = S.PROC_INST_BODY
 | |
|           }
 | |
|           continue
 | |
| 
 | |
|         case S.OPEN_TAG:
 | |
|           if (isMatch(nameBody, c)) {
 | |
|             parser.tagName += c
 | |
|           } else {
 | |
|             newTag(parser)
 | |
|             if (c === '>') {
 | |
|               openTag(parser)
 | |
|             } else if (c === '/') {
 | |
|               parser.state = S.OPEN_TAG_SLASH
 | |
|             } else {
 | |
|               if (!isWhitespace(c)) {
 | |
|                 strictFail(parser, 'Invalid character in tag name')
 | |
|               }
 | |
|               parser.state = S.ATTRIB
 | |
|             }
 | |
|           }
 | |
|           continue
 | |
| 
 | |
|         case S.OPEN_TAG_SLASH:
 | |
|           if (c === '>') {
 | |
|             openTag(parser, true)
 | |
|             closeTag(parser)
 | |
|           } else {
 | |
|             strictFail(parser, 'Forward-slash in opening tag not followed by >')
 | |
|             parser.state = S.ATTRIB
 | |
|           }
 | |
|           continue
 | |
| 
 | |
|         case S.ATTRIB:
 | |
|           // haven't read the attribute name yet.
 | |
|           if (isWhitespace(c)) {
 | |
|             continue
 | |
|           } else if (c === '>') {
 | |
|             openTag(parser)
 | |
|           } else if (c === '/') {
 | |
|             parser.state = S.OPEN_TAG_SLASH
 | |
|           } else if (isMatch(nameStart, c)) {
 | |
|             parser.attribName = c
 | |
|             parser.attribValue = ''
 | |
|             parser.state = S.ATTRIB_NAME
 | |
|           } else {
 | |
|             strictFail(parser, 'Invalid attribute name')
 | |
|           }
 | |
|           continue
 | |
| 
 | |
|         case S.ATTRIB_NAME:
 | |
|           if (c === '=') {
 | |
|             parser.state = S.ATTRIB_VALUE
 | |
|           } else if (c === '>') {
 | |
|             strictFail(parser, 'Attribute without value')
 | |
|             parser.attribValue = parser.attribName
 | |
|             attrib(parser)
 | |
|             openTag(parser)
 | |
|           } else if (isWhitespace(c)) {
 | |
|             parser.state = S.ATTRIB_NAME_SAW_WHITE
 | |
|           } else if (isMatch(nameBody, c)) {
 | |
|             parser.attribName += c
 | |
|           } else {
 | |
|             strictFail(parser, 'Invalid attribute name')
 | |
|           }
 | |
|           continue
 | |
| 
 | |
|         case S.ATTRIB_NAME_SAW_WHITE:
 | |
|           if (c === '=') {
 | |
|             parser.state = S.ATTRIB_VALUE
 | |
|           } else if (isWhitespace(c)) {
 | |
|             continue
 | |
|           } else {
 | |
|             strictFail(parser, 'Attribute without value')
 | |
|             parser.tag.attributes[parser.attribName] = ''
 | |
|             parser.attribValue = ''
 | |
|             emitNode(parser, 'onattribute', {
 | |
|               name: parser.attribName,
 | |
|               value: ''
 | |
|             })
 | |
|             parser.attribName = ''
 | |
|             if (c === '>') {
 | |
|               openTag(parser)
 | |
|             } else if (isMatch(nameStart, c)) {
 | |
|               parser.attribName = c
 | |
|               parser.state = S.ATTRIB_NAME
 | |
|             } else {
 | |
|               strictFail(parser, 'Invalid attribute name')
 | |
|               parser.state = S.ATTRIB
 | |
|             }
 | |
|           }
 | |
|           continue
 | |
| 
 | |
|         case S.ATTRIB_VALUE:
 | |
|           if (isWhitespace(c)) {
 | |
|             continue
 | |
|           } else if (isQuote(c)) {
 | |
|             parser.q = c
 | |
|             parser.state = S.ATTRIB_VALUE_QUOTED
 | |
|           } else {
 | |
|             strictFail(parser, 'Unquoted attribute value')
 | |
|             parser.state = S.ATTRIB_VALUE_UNQUOTED
 | |
|             parser.attribValue = c
 | |
|           }
 | |
|           continue
 | |
| 
 | |
|         case S.ATTRIB_VALUE_QUOTED:
 | |
|           if (c !== parser.q) {
 | |
|             if (c === '&') {
 | |
|               parser.state = S.ATTRIB_VALUE_ENTITY_Q
 | |
|             } else {
 | |
|               parser.attribValue += c
 | |
|             }
 | |
|             continue
 | |
|           }
 | |
|           attrib(parser)
 | |
|           parser.q = ''
 | |
|           parser.state = S.ATTRIB_VALUE_CLOSED
 | |
|           continue
 | |
| 
 | |
|         case S.ATTRIB_VALUE_CLOSED:
 | |
|           if (isWhitespace(c)) {
 | |
|             parser.state = S.ATTRIB
 | |
|           } else if (c === '>') {
 | |
|             openTag(parser)
 | |
|           } else if (c === '/') {
 | |
|             parser.state = S.OPEN_TAG_SLASH
 | |
|           } else if (isMatch(nameStart, c)) {
 | |
|             strictFail(parser, 'No whitespace between attributes')
 | |
|             parser.attribName = c
 | |
|             parser.attribValue = ''
 | |
|             parser.state = S.ATTRIB_NAME
 | |
|           } else {
 | |
|             strictFail(parser, 'Invalid attribute name')
 | |
|           }
 | |
|           continue
 | |
| 
 | |
|         case S.ATTRIB_VALUE_UNQUOTED:
 | |
|           if (!isAttribEnd(c)) {
 | |
|             if (c === '&') {
 | |
|               parser.state = S.ATTRIB_VALUE_ENTITY_U
 | |
|             } else {
 | |
|               parser.attribValue += c
 | |
|             }
 | |
|             continue
 | |
|           }
 | |
|           attrib(parser)
 | |
|           if (c === '>') {
 | |
|             openTag(parser)
 | |
|           } else {
 | |
|             parser.state = S.ATTRIB
 | |
|           }
 | |
|           continue
 | |
| 
 | |
|         case S.CLOSE_TAG:
 | |
|           if (!parser.tagName) {
 | |
|             if (isWhitespace(c)) {
 | |
|               continue
 | |
|             } else if (notMatch(nameStart, c)) {
 | |
|               if (parser.script) {
 | |
|                 parser.script += '</' + c
 | |
|                 parser.state = S.SCRIPT
 | |
|               } else {
 | |
|                 strictFail(parser, 'Invalid tagname in closing tag.')
 | |
|               }
 | |
|             } else {
 | |
|               parser.tagName = c
 | |
|             }
 | |
|           } else if (c === '>') {
 | |
|             closeTag(parser)
 | |
|           } else if (isMatch(nameBody, c)) {
 | |
|             parser.tagName += c
 | |
|           } else if (parser.script) {
 | |
|             parser.script += '</' + parser.tagName
 | |
|             parser.tagName = ''
 | |
|             parser.state = S.SCRIPT
 | |
|           } else {
 | |
|             if (!isWhitespace(c)) {
 | |
|               strictFail(parser, 'Invalid tagname in closing tag')
 | |
|             }
 | |
|             parser.state = S.CLOSE_TAG_SAW_WHITE
 | |
|           }
 | |
|           continue
 | |
| 
 | |
|         case S.CLOSE_TAG_SAW_WHITE:
 | |
|           if (isWhitespace(c)) {
 | |
|             continue
 | |
|           }
 | |
|           if (c === '>') {
 | |
|             closeTag(parser)
 | |
|           } else {
 | |
|             strictFail(parser, 'Invalid characters in closing tag')
 | |
|           }
 | |
|           continue
 | |
| 
 | |
|         case S.TEXT_ENTITY:
 | |
|         case S.ATTRIB_VALUE_ENTITY_Q:
 | |
|         case S.ATTRIB_VALUE_ENTITY_U:
 | |
|           var returnState
 | |
|           var buffer
 | |
|           switch (parser.state) {
 | |
|             case S.TEXT_ENTITY:
 | |
|               returnState = S.TEXT
 | |
|               buffer = 'textNode'
 | |
|               break
 | |
| 
 | |
|             case S.ATTRIB_VALUE_ENTITY_Q:
 | |
|               returnState = S.ATTRIB_VALUE_QUOTED
 | |
|               buffer = 'attribValue'
 | |
|               break
 | |
| 
 | |
|             case S.ATTRIB_VALUE_ENTITY_U:
 | |
|               returnState = S.ATTRIB_VALUE_UNQUOTED
 | |
|               buffer = 'attribValue'
 | |
|               break
 | |
|           }
 | |
| 
 | |
|           if (c === ';') {
 | |
|             parser[buffer] += parseEntity(parser)
 | |
|             parser.entity = ''
 | |
|             parser.state = returnState
 | |
|           } else if (isMatch(parser.entity.length ? entityBody : entityStart, c)) {
 | |
|             parser.entity += c
 | |
|           } else {
 | |
|             strictFail(parser, 'Invalid character in entity name')
 | |
|             parser[buffer] += '&' + parser.entity + c
 | |
|             parser.entity = ''
 | |
|             parser.state = returnState
 | |
|           }
 | |
| 
 | |
|           continue
 | |
| 
 | |
|         default:
 | |
|           throw new Error(parser, 'Unknown state: ' + parser.state)
 | |
|       }
 | |
|     } // while
 | |
| 
 | |
|     if (parser.position >= parser.bufferCheckPosition) {
 | |
|       checkBufferLength(parser)
 | |
|     }
 | |
|     return parser
 | |
|   }
 | |
| 
 | |
|   /*! http://mths.be/fromcodepoint v0.1.0 by @mathias */
 | |
|   /* istanbul ignore next */
 | |
|   if (!String.fromCodePoint) {
 | |
|     (function () {
 | |
|       var stringFromCharCode = String.fromCharCode
 | |
|       var floor = Math.floor
 | |
|       var fromCodePoint = function () {
 | |
|         var MAX_SIZE = 0x4000
 | |
|         var codeUnits = []
 | |
|         var highSurrogate
 | |
|         var lowSurrogate
 | |
|         var index = -1
 | |
|         var length = arguments.length
 | |
|         if (!length) {
 | |
|           return ''
 | |
|         }
 | |
|         var result = ''
 | |
|         while (++index < length) {
 | |
|           var codePoint = Number(arguments[index])
 | |
|           if (
 | |
|             !isFinite(codePoint) || // `NaN`, `+Infinity`, or `-Infinity`
 | |
|             codePoint < 0 || // not a valid Unicode code point
 | |
|             codePoint > 0x10FFFF || // not a valid Unicode code point
 | |
|             floor(codePoint) !== codePoint // not an integer
 | |
|           ) {
 | |
|             throw RangeError('Invalid code point: ' + codePoint)
 | |
|           }
 | |
|           if (codePoint <= 0xFFFF) { // BMP code point
 | |
|             codeUnits.push(codePoint)
 | |
|           } else { // Astral code point; split in surrogate halves
 | |
|             // http://mathiasbynens.be/notes/javascript-encoding#surrogate-formulae
 | |
|             codePoint -= 0x10000
 | |
|             highSurrogate = (codePoint >> 10) + 0xD800
 | |
|             lowSurrogate = (codePoint % 0x400) + 0xDC00
 | |
|             codeUnits.push(highSurrogate, lowSurrogate)
 | |
|           }
 | |
|           if (index + 1 === length || codeUnits.length > MAX_SIZE) {
 | |
|             result += stringFromCharCode.apply(null, codeUnits)
 | |
|             codeUnits.length = 0
 | |
|           }
 | |
|         }
 | |
|         return result
 | |
|       }
 | |
|       /* istanbul ignore next */
 | |
|       if (Object.defineProperty) {
 | |
|         Object.defineProperty(String, 'fromCodePoint', {
 | |
|           value: fromCodePoint,
 | |
|           configurable: true,
 | |
|           writable: true
 | |
|         })
 | |
|       } else {
 | |
|         String.fromCodePoint = fromCodePoint
 | |
|       }
 | |
|     }())
 | |
|   }
 | |
| })(typeof exports === 'undefined' ? this.sax = {} : exports)
 |