Beefy Boxes and Bandwidth Generously Provided by pair Networks
Perl Monk, Perl Meditation
 
PerlMonks  

Re: How to recognize url in text and convert to hyperlink, unless already in anchor

by pizza_milkshake (Monk)
on Oct 11, 2004 at 23:19 UTC ( #398331=note: print w/ replies, xml ) Need Help??


in reply to How to recognize url in text and convert to hyperlink, unless already in anchor

$ cat no_href.pl

#!perl -l # ex: set ts=4: use strict; use warnings; use HTML::Parser; use URI; my (@tagstack, $BUF); sub start { # enter into tags my ($tag, $attr, $text) = @_; $tag .= " href" if ($tag eq "a" && defined $attr->{"href"}); push @tagstack, $tag; output($text); } sub end { # escape out of tags my ($tag, $text) = @_; shift @tagstack while (scalar @tagstack && $tagstack[0] ne $tag); shift @tagstack if scalar @tagstack; # actually nuke element we're + looking for output($text); } sub text { # handle everything inside and around tags my ($text) = @_; if (unlinked()) { # replace URLs with their linked equivalent if we're not withi +n a link $text =~ s{ \b(http://\S+) }{ "<a href=\"" . URI->new($1)->can +onical . "\">$1</a>" }gex; } output($text); } # are we inside a link right now? sub unlinked { return not scalar grep { /^a href$/ } @tagstack; } # add to output buffer sub output { $BUF .= shift @_; } # start code my $p = HTML::Parser->new( "start_h" => [ \&start, "tagname, attr, text" ] ,"end_h" => [ \&end, "tagname, text" ] ,"text_h" => [ \&text, "dtext" ] ); $p->parse(do{ local $/; <DATA> }); print $BUF; __DATA__ <a href="">http://linked1.com</a> <a style="" href='bob'>http://linked2.com</a> <a href="whatever">http://linked3.com</a> <a nolink>http://linked4.com</a> http://unlinked1 http://unlinked2.com
$ perl no_href.pl
<a href="">http://linked1.com</a> <a style="" href='bob'>http://linked2.com</a> <a href="whatever">http://linked3.com</a> <a nolink><a href="http://linked4.com/">http://linked4.com</a></a> <a href="http://unlinked1/">http://unlinked1</a> <a href="http://unlinked2.com/">http://unlinked2.com</a>

perl -e"\$_=qq/nwdd\x7F^n\x7Flm{{llql0}qs\x14/;s/./chr(ord$&^30)/ge;print"


Comment on Re: How to recognize url in text and convert to hyperlink, unless already in anchor
Select or Download Code

Log In?
Username:
Password:

What's my password?
Create A New User
Node Status?
node history
Node Type: note [id://398331]
help
Chatterbox?
and the web crawler heard nothing...

How do I use this? | Other CB clients
Other Users?
Others rifling through the Monastery: (6)
As of 2015-07-04 18:27 GMT
Sections?
Information?
Find Nodes?
Leftovers?
    Voting Booth?

    The top three priorities of my open tasks are (in descending order of likelihood to be worked on) ...









    Results (60 votes), past polls