Class | FeedParser::SGMLParser |
In: | lib/feedparser/sgml-parser.rb |
Parent: | Object |
Interesting | = | /[&<]/ | Regular expressions used for parsing: | |
Incomplete | = | Regexp.compile('&([a-zA-Z][a-zA-Z0-9]*|#[0-9]*)?|' + '<([a-zA-Z][^<>]*|/([a-zA-Z][^<>]*)?|' + '![^<>]*)?') | ||
Entityref | = | /&([a-zA-Z][-.a-zA-Z0-9]*);/ | ||
Charref | = | /&#([0-9]+);/ | ||
Starttagopen | = | /<[>a-zA-Z]/ | ||
Endtagopen | = | /<\/[<>a-zA-Z]/ | ||
Endbracket | = | /[<>]/ | ||
Special | = | /<![^<>]*>/ | ||
Commentopen | = | /<!--/ | ||
Commentclose | = | /--[ \t\n]*>/ | ||
Tagfind | = | /[a-zA-Z][a-zA-Z0-9.-]*/ | ||
Attrfind | = | Regexp.compile('[\s,]*([a-zA-Z_][a-zA-Z_0-9.-]*)' + '(\s*=\s*' + "('[^']*'" + '|"[^"]*"' + '|[-~a-zA-Z0-9,./:+*%?!()_#=]*))?') | ||
Entitydefs | = | {'lt'=>'<', 'gt'=>'>', 'amp'=>'&', 'quot'=>'"', 'apos'=>'\''} |