How to use Regular Expressions with HTML

by Ovid (Cardinal)
on Aug 16, 2003

    $data =~ s{(<a\s(?:[^>](?!href))*href\s*)(&(&[^;]+;)?(?:.(?!\3))+(?:\3
    <p class="foo" name="bar">
    <p name="bar" CLASS="ovid has no class">
    <p NAME="bar" class="ovid has no class">
    <p name="bar" class="ovid has no class">
    package HTML::Token;
            return $tag;
    my $html = <<END_HTML;
    <h1>This is a test</h1>
        push @tokens => HTML::Token->new($token);
    push @tokens => (qw[* . *]); # make the (p) tag zero or more, followed by anything
    use Token::Regex;
    my $regex = Token::Regex->new('HTML::Token');
    my $tokens = html_tokens(<<END_HTML);
    <h1>This is html</h1>
        return \@tokens;

