vue.js 源代码学习笔记 ----- html-parse.js

/**

 * Not type-checking this file because it's mostly vendor code.

 */

/*!

 * HTML Parser By John Resig (ejohn.org)

 * Modified by Juriy "kangax" Zaytsev

 * Original code by Erik Arvidsson, Mozilla Public License

 * http://erik.eae.net/simplehtmlparser/simplehtmlparser.js

 */

import { makeMap, no } from 'shared/util'

import { isNonPhrasingTag, canBeLeftOpenTag } from 'web/util/index'

// Regular expressions for parsing tags and attributes.
//
// The attribute matcher is assembled from three pieces so each can be read on
// its own: the attribute name, the "=" sign, and the accepted value forms.

// Attribute name: a run of characters other than whitespace, quotes, angle
// brackets, "/" and "=".
const singleAttrIdentifier = /([^\s"'<>/=]+)/

// The "=" between name and value.
const singleAttrAssign = /(?:=)/

// Pattern sources for the value forms; each one has its own capture group.
const singleAttrValues = [
  /"([^"]*)"+/, // double-quoted value
  /'([^']*)'+/, // single-quoted value
  /([^\s"'=<>`]+)/ // unquoted value
].map(pattern => pattern.source)

// Resulting capture groups: 1 = name, 2 = "=", 3 = double-quoted value,
// 4 = single-quoted value, 5 = unquoted value. The "= value" part is optional.
const attribute = new RegExp([
  '^\\s*',
  singleAttrIdentifier.source,
  '(?:\\s*(',
  singleAttrAssign.source,
  ')',
  '\\s*(?:',
  singleAttrValues.join('|'),
  '))?'
].join(''))

// Tag-name grammar. The XML QName production
// (https://www.w3.org/TR/1999/REC-xml-names-19990114/#NT-QName) could be used,
// but for Vue templates a simple charset is enforced instead.
const ncname = '[a-zA-Z_][\\w\\-\\.]*'

// An optional "prefix:" followed by a name, captured as a single group.
const qnameCapture = `((?:${ncname}\\:)?${ncname})`

// "<name" at the start of the input; group 1 is the tag name.
const startTagOpen = new RegExp(`^<${qnameCapture}`)

// The end of a start tag; group 1 is "/" for a self-closing tag, else "".
const startTagClose = /^\s*(\/?)>/

// A complete end tag at the start of the input; group 1 is the tag name.
const endTag = new RegExp(`^<\\/${qnameCapture}[^>]*>`)

// Openers of constructs that are recognised and skipped by the parser.
const doctype = /^<!DOCTYPE [^>]+>/i
const comment = /^<!--/
const conditionalComment = /^<!\[/

// Probe how this engine passes an optional capture group that did not
// participate in the match to a replace callback: the flag becomes true when
// the group arrives as '' and stays false otherwise.
let IS_REGEX_CAPTURING_BROKEN = false
'x'.replace(/x(.)?/g, (wholeMatch, optionalGroup) => {
  IS_REGEX_CAPTURING_BROKEN = optionalGroup === ''
})

// Special elements (can contain anything): built from the names "script" and
// "style". isSpecialTag() calls this with a tag name and returns true when the
// result is truthy.
// NOTE(review): makeMap comes from shared/util; the meaning of its second
// argument (`true`) is not visible here — presumably it makes the lookup
// case-insensitive. Confirm against the helper.

const isScriptOrStyle = makeMap('script,style', true)

// Predicate over a `{ name, value }` attribute: true only for a `lang`
// attribute whose value is something other than "html".
const hasLang = attr => {
  if (attr.name !== 'lang') {
    return false
  }
  return attr.value !== 'html'
}

/**
 * Decide whether the content of the currently open element `tag` must be
 * consumed as raw text instead of being parsed as markup.
 *
 * - script/style (per isScriptOrStyle) are always special.
 * - When `isSFC` is truthy and exactly one element is open, that element is
 *   special unless it is a `template` whose attributes (read from
 *   `stack[0].attrs`) contain no `lang` other than "html".
 *
 * @param {string} tag - name of the innermost open element
 * @param {*} isSFC - truthy when parsing in single-file-component mode
 * @param {Array<{tag: string, attrs: Array}>} stack - currently open elements
 * @returns {boolean}
 */
const isSpecialTag = (tag, isSFC, stack) => {
  if (isScriptOrStyle(tag)) {
    return true
  }

  const isTopLevelBlock = isSFC && stack.length === 1
  if (!isTopLevelBlock) {
    return false
  }

  // top-level template that has no pre-processor is parsed normally
  const isPlainTemplate = tag === 'template' && !stack[0].attrs.some(hasLang)
  return !isPlainTemplate
}

// Cache of lazily built regexes, keyed by lower-cased tag name.
const reCache = {}

// Patterns for the character references that may need decoding in attribute
// values. All are global so a single replace() handles every occurrence.
const ltRE = /&lt;/g
const gtRE = /&gt;/g
// Newline character reference. It must be spelled as the entity text: a raw
// line break inside a regex literal is a syntax error, and matching "\n" only
// to replace it with "\n" would do nothing.
const nlRE = /&#10;/g
const ampRE = /&amp;/g
const quoteRE = /&quot;/g

// Character references decoded in attribute values, and what each becomes.
const attrEntityMap = {
  '&lt;': '<',
  '&gt;': '>',
  '&quot;': '"',
  '&amp;': '&',
  '&#10;': '\n'
}
const encodedAttr = /&(?:lt|gt|quot|amp);/g
const encodedAttrWithNewLines = /&(?:lt|gt|quot|amp|#10);/g

/**
 * Decode the character references &lt; &gt; &amp; &quot; (and &#10; when
 * requested) in an attribute value.
 *
 * Decoding happens in a single left-to-right pass, so text produced by one
 * replacement is never decoded again: "&amp;quot;" yields the literal text
 * "&quot;", not a double quote.
 *
 * @param {string} value - raw attribute value as written in the markup
 * @param {*} shouldDecodeNewlines - when truthy, "&#10;" is also decoded to "\n"
 * @returns {string} the decoded value
 */
function decodeAttr (value, shouldDecodeNewlines) {
  const re = shouldDecodeNewlines ? encodedAttrWithNewLines : encodedAttr
  return value.replace(re, entity => attrEntityMap[entity])
}

/**
 * Scan an HTML string from left to right and report what is found through
 * optional callbacks on `options`. Nothing is returned.
 *
 * Callbacks (each one is skipped when absent):
 *   - options.start(tagName, attrs, unary, start, end): a start tag. `attrs`
 *     is an array of `{ name, value }` with decoded values; `start`/`end` are
 *     offsets into the original input.
 *   - options.end(tagName, start, end): an element being closed, either by
 *     its own end tag or implicitly.
 *   - options.chars(text): text content.
 *
 * Other options read here:
 *   - options.expectHTML: when truthy, <p> and left-open tags are closed
 *     implicitly (see handleStartTag).
 *   - options.isUnaryTag: predicate for tags without content; falls back to
 *     the imported `no`.
 *   - options.sfc: forwarded to isSpecialTag.
 *   - options.shouldDecodeNewlines: forwarded to decodeAttr.
 *
 * @param {string} html - markup to parse
 * @param {Object} options - callbacks and flags described above
 */
export function parseHTML (html, options) {
  // Currently open elements, innermost last: { tag, attrs }.
  const stack = []
  const expectHTML = options.expectHTML
  const isUnaryTag = options.isUnaryTag || no
  // Offset of `html` (the unparsed remainder) within the original input.
  let index = 0
  let last, lastTag
  while (html) {
    last = html
    // Make sure we're not in a script or style element
    if (!lastTag || !isSpecialTag(lastTag, options.sfc, stack)) {
      let textEnd = html.indexOf('<')
      if (textEnd === 0) {
        // Comment:
        if (comment.test(html)) {
          const commentEnd = html.indexOf('-->')

          if (commentEnd >= 0) {
            advance(commentEnd + 3)
            continue
          }
        }

        // http://en.wikipedia.org/wiki/Conditional_comment#Downlevel-revealed_conditional_comment
        if (conditionalComment.test(html)) {
          const conditionalEnd = html.indexOf(']>')

          if (conditionalEnd >= 0) {
            advance(conditionalEnd + 2)
            continue
          }
        }

        // Doctype:
        const doctypeMatch = html.match(doctype)
        if (doctypeMatch) {
          advance(doctypeMatch[0].length)
          continue
        }

        // End tag:
        const endTagMatch = html.match(endTag)
        if (endTagMatch) {
          const curIndex = index
          advance(endTagMatch[0].length)
          parseEndTag(endTagMatch[0], endTagMatch[1], curIndex, index)
          continue
        }

        // Start tag:
        const startTagMatch = parseStartTag()
        if (startTagMatch) {
          handleStartTag(startTagMatch)
          continue
        }
      }

      let text, rest, next
      if (textEnd > 0) {
        rest = html.slice(textEnd)
        while (
          !endTag.test(rest) &&
          !startTagOpen.test(rest) &&
          !comment.test(rest) &&
          !conditionalComment.test(rest)
        ) {
          // < in plain text, be forgiving and treat it as text
          next = rest.indexOf('<', 1)
          if (next < 0) break
          textEnd += next
          rest = html.slice(textEnd)
        }
        text = html.substring(0, textEnd)
        advance(textEnd)
      }

      if (textEnd < 0) {
        // No "<" left at all: everything that remains is text.
        text = html
        html = ''
      }

      if (options.chars && text) {
        options.chars(text)
      }
    } else {
      // Inside a special element: take everything up to its closing tag as
      // one text chunk instead of parsing it as markup.
      const stackedTag = lastTag.toLowerCase()
      const reStackedTag = reCache[stackedTag] || (reCache[stackedTag] = new RegExp('([\\s\\S]*?)(</' + stackedTag + '[^>]*>)', 'i'))
      let endTagLength = 0
      const rest = html.replace(reStackedTag, function (all, text, closingTag) {
        endTagLength = closingTag.length
        if (stackedTag !== 'script' && stackedTag !== 'style' && stackedTag !== 'noscript') {
          // Unwrap comments and CDATA sections, keeping their content.
          text = text
            .replace(/<!--([\s\S]*?)-->/g, '$1')
            .replace(/<!\[CDATA\[([\s\S]*?)]]>/g, '$1')
        }
        if (options.chars) {
          options.chars(text)
        }
        return ''
      })
      index += html.length - rest.length
      html = rest
      parseEndTag('</' + stackedTag + '>', stackedTag, index - endTagLength, index)
    }

    if (html === last) {
      // Nothing was consumed in this iteration: report the remainder as text
      // and stop. The break must not depend on a chars handler being present,
      // otherwise unparseable input (e.g. a lone "<") would loop forever.
      if (options.chars) {
        options.chars(html)
      }
      break
    }
  }

  // Clean up any remaining tags
  parseEndTag()

  // Drop the first `n` characters of the remaining input and keep `index`
  // in sync with the position in the original string.
  function advance (n) {
    index += n
    html = html.substring(n)
  }

  // Try to consume a complete start tag at the current position. Returns
  // { tagName, attrs, start, unarySlash, end } where `attrs` holds the raw
  // regex matches, or undefined when no start tag opens here or it is never
  // closed by ">" (input consumed so far is NOT restored in the latter case).
  function parseStartTag () {
    const start = html.match(startTagOpen)
    if (start) {
      const match = {
        tagName: start[1],
        attrs: [],
        start: index
      }
      advance(start[0].length)
      let end, attr
      while (!(end = html.match(startTagClose)) && (attr = html.match(attribute))) {
        advance(attr[0].length)
        match.attrs.push(attr)
      }
      if (end) {
        match.unarySlash = end[1]
        advance(end[0].length)
        match.end = index
        return match
      }
    }
  }

  // Turn a parseStartTag() result into a start() callback, closing elements
  // implicitly where `expectHTML` asks for it and pushing non-unary elements
  // onto the stack.
  function handleStartTag (match) {
    const tagName = match.tagName
    const unarySlash = match.unarySlash

    if (expectHTML) {
      if (lastTag === 'p' && isNonPhrasingTag(tagName)) {
        parseEndTag('', lastTag)
      }
      if (canBeLeftOpenTag(tagName) && lastTag === tagName) {
        parseEndTag('', tagName)
      }
    }

    const unary = isUnaryTag(tagName) || tagName === 'html' && lastTag === 'head' || !!unarySlash

    const l = match.attrs.length
    const attrs = new Array(l)
    for (let i = 0; i < l; i++) {
      const args = match.attrs[i]
      // hackish work around FF bug https://bugzilla.mozilla.org/show_bug.cgi?id=369778
      if (IS_REGEX_CAPTURING_BROKEN && args[0].indexOf('""') === -1) {
        if (args[3] === '') { delete args[3] }
        if (args[4] === '') { delete args[4] }
        if (args[5] === '') { delete args[5] }
      }
      // Groups 3/4/5 are the double-quoted / single-quoted / unquoted value.
      const value = args[3] || args[4] || args[5] || ''
      attrs[i] = {
        name: args[1],
        value: decodeAttr(
          value,
          options.shouldDecodeNewlines
        )
      }
    }

    if (!unary) {
      stack.push({ tag: tagName, attrs: attrs })
      lastTag = tagName
    }

    if (options.start) {
      options.start(tagName, attrs, unary, match.start, match.end)
    }
  }

  // Close elements. With a `tagName`, closes the nearest open element of that
  // name (compared case-insensitively) and everything opened after it; with
  // no `tagName`, closes every open element. `start`/`end` default to the
  // current index. An unmatched </br> is reported as a unary start tag and an
  // unmatched </p> as an empty element; other unmatched end tags are ignored.
  function parseEndTag (tag, tagName, start, end) {
    let pos
    if (start == null) start = index
    if (end == null) end = index

    // Find the closest opened tag of the same type
    if (tagName) {
      const needle = tagName.toLowerCase()
      for (pos = stack.length - 1; pos >= 0; pos--) {
        if (stack[pos].tag.toLowerCase() === needle) {
          break
        }
      }
    } else {
      // If no tag name is provided, clean shop
      pos = 0
    }

    if (pos >= 0) {
      // Close all the open elements, up the stack
      for (let i = stack.length - 1; i >= pos; i--) {
        if (options.end) {
          options.end(stack[i].tag, start, end)
        }
      }

      // Remove the open elements from the stack
      stack.length = pos
      // Falsy (0) when the stack is now empty.
      lastTag = pos && stack[pos - 1].tag
    } else if (tagName.toLowerCase() === 'br') {
      if (options.start) {
        options.start(tagName, [], true, start, end)
      }
    } else if (tagName.toLowerCase() === 'p') {
      if (options.start) {
        options.start(tagName, [], false, start, end)
      }
      if (options.end) {
        options.end(tagName, start, end)
      }
    }
  }
}

vue.js 源代码学习笔记 ----- html-parse.js的更多相关文章

vue.js 源代码学习笔记 ----- core scheduler.js
/* @flow */ import type Watcher from './watcher' import config from '../config' import { callHook } ...
vue.js 源代码学习笔记 ----- core array.js
/* * not type checking this file because flow doesn't play well with * dynamically accessing methods ...
node.js day01学习笔记:认识node.js
Node.js(JavaScript,everywhere) 1.Node.js 介绍 1.1. 为什么要学习Node.js 企业需求 + 具有服务端开发经验更好 + front-end + back ...
vue.js 源代码学习笔记 ----- 工具方法 lang
/* @flow */ // Object.freeze 使得这个对象不能增加属性, 修改属性, 这样就保证了这个对象在任何时候都是空的 export const emptyObject = Obje ...
vue.js 源代码学习笔记 ----- 工具方法 env
/* @flow */ /* globals MutationObserver */ import { noop } from 'shared/util' // can we use __proto_ ...
vue.js 源代码学习笔记 ----- helpers.js
/* @flow */ import { parseFilters } from './parser/filter-parser' export function baseWarn (msg: str ...
vue.js 源代码学习笔记 ----- 工具方法 share
/* @flow */ /** * Convert a value to a string that is actually rendered. { .. } [ .. ] 2 => '' */ ...
vue.js 源代码学习笔记 ----- instance render
/* @flow */ import { warn, nextTick, toNumber, _toString, looseEqual, emptyObject, handleError, loos ...
vue.js 源代码学习笔记 ----- instance event
/* @flow */ import { updateListeners } from '../vdom/helpers/index' import { toArray, tip, hyphenate ...

随机推荐

Java压缩多个文件并导出
controller层: /** * 打包压缩下载文件 */ @RequestMapping(value = "/downLoadZipFile") public void dow ...
Openstack（五）Memcache- repcached集群
5.1.1下载Memcache- repcached并解压 # wget http://downloads.sourceforge.net/repcached/memcached-1.2.8-repc ...
（转）SpringBoot非官方教程 | 第七篇：springboot开启声明式事务
springboot开启事务很简单,只需要一个注解@Transactional 就可以了.因为在springboot中已经默认对jpa.jdbc.mybatis开启了事务,引入它们依赖的时候,事务就 ...
基因芯片与NGS区别[转载]
转自:http://blog.sina.com.cn/s/blog_40d4ae110101fjzy.html 1 二代测序与基因芯片的区别与优缺点. 生物芯片相对第二代测序而言,优势在于价格便宜,便 ...
linux系统进入单用户模式
进入单用户模式可进行root账户和其他普通账户的密码的修改 1)Ubuntu 开机到grub时(在开机时长按shift键),用上下键移到第二行的恢复模式(recovery mode),按e(注意不是回 ...
Django之MTV
一.MTV模型 Django的MTV分别代表: Model(模型):负责业务对象与数据库的对象(ORM) Template(模版):负责如何把页面展示给用户 View(视图):负责业务逻辑,并在适当的 ...
html 音频
<!DOCTYPE html><meta charset="utf-8"><video src="movie.webm" cont ...
HDU5183 hash 表
做题的时候忘了数据结构老师说的hash表了, 用二分找,还好过了, hash 表对这题更快一些 #include <iostream> #include <algorithm& ...
一次频繁Full GC问题排查过程分享
问题描述应用收到频繁Full GC告警问题排查登录到对应机器上去,查看GC日志,发现YGC一分钟已经达到了15次,比Full GC还要频繁一些,其中Full GC平均10分钟超过了4次,如下图 ...
Windows10系统远程桌面连接出现卡顿如何解决
最新的windows10系统下,用户只要开启远程桌面连接,就能够轻松地操控其他电脑.但是,最近部分用户在win10中启用远程连接时,发现电脑窗口变得非常缓慢卡顿,这是怎么回事呢?其实,该问题与系统的设 ...

vue.js 源代码学习笔记 ----- html-parse.js

vue.js 源代码学习笔记 ----- html-parse.js的更多相关文章

随机推荐

热门专题