blob: 8702379e2e438e8fa8f96fce8864a4c01a37151d [file] [log] [blame]
# -*- coding: utf-8 -*- #
module Rouge
module Lexers
class XML < RegexLexer
title "XML"
desc %q(<desc for="this-lexer">XML</desc>)
tag 'xml'
filenames *%w(*.xml *.xsl *.rss *.xslt *.xsd *.wsdl)
mimetypes *%w(
text/xml
application/xml
image/svg+xml
application/rss+xml
application/atom+xml
)
def self.analyze_text(text)
return 0.9 if text.doctype?
return 0.8 if text =~ /\A<\?xml\b/
start = text[0..1000]
return 0.6 if start =~ %r(<xml\b)
return 0.3 if start =~ %r(<.+?>.*?</.+?>)m
end
state :root do
rule /[^<&]+/, Text
rule /&\S*?;/, Name::Entity
rule /<!\[CDATA\[.*?\]\]\>/, Comment::Preproc
rule /<!--/, Comment, :comment
rule /<\?.*?\?>/, Comment::Preproc
rule /<![^>]*>/, Comment::Preproc
# open tags
rule %r(<\s*[\w:.-]+)m, Name::Tag, :tag
# self-closing tags
rule %r(<\s*/\s*[\w:.-]+\s*>)m, Name::Tag
end
state :comment do
rule /[^-]+/m, Comment
rule /-->/, Comment, :pop!
rule /-/, Comment
end
state :tag do
rule /\s+/m, Text
rule /[\w.:-]+\s*=/m, Name::Attribute, :attr
rule %r(/?\s*>), Name::Tag, :pop!
end
state :attr do
rule /\s+/m, Text
rule /".*?"|'.*?'|[^\s>]+/, Str, :pop!
end
end
end
end