comment on

Well, I have a first release of my rhyme generator done. The dictionary module can be found here. I would welcome any comments on style, efficiency, room for improvement, etc.

package Lingua::EN::Rhyme;
use strict;
use Lingua::EN::Rhyme::Dictionary qw/%dict %reversedict/;
require Exporter;

# Exporter configuration.
#   @EXPORT      - symbols imported by a plain "use Lingua::EN::Rhyme;"
#   @EXPORT_OK   - symbols imported only when asked for by name
#   %EXPORT_TAGS - ":default" names the same set as @EXPORT
our @ISA = qw/Exporter/;
our @EXPORT = qw/
  variants pronounce syllables accent
  endrhyme beginrhyme visualrhyme
/;
our @EXPORT_OK = qw/endsylrhyme beginsylrhyme/;
# Built from @EXPORT so the two lists cannot drift apart.
our %EXPORT_TAGS = ( default => [ @EXPORT ] );
# Quoted so the version string is kept exactly as written.
our $VERSION = '0.01';

# pronounce($word [, $variant])
#
# Looks $word up (case-insensitively) in %dict and returns the stored
# pronunciation string.  When $variant is defined and greater than 1 the
# lookup key becomes "WORD($variant)"; otherwise the plain "WORD" key is
# used.
#
# Returns the sentinel string "** unknown word **" when %dict has no
# defined value for the key.  Other routines in this file detect the
# sentinel with /^\*\*/ or /unknown word/, so the literal must stay on a
# single line.
sub pronounce {
  my ($word, $variant) = @_;
  $word = '' unless defined $word;   # an undefined word is simply unknown
  $word .= "($variant)" if defined($variant) and $variant > 1;
  my $pron = $dict{uc($word)};
  return defined($pron) ? $pron : "** unknown word **";
}

# syllables($word [, $variant])
#
# Returns the number of syllables in $word, obtained by counting the
# stress digits (0, 1 or 2) in the string returned by pronounce().
#
# For a word pronounce() does not know, returns "" in scalar context and
# the empty list in list context -- the same "nothing found" convention
# the rhyme routines in this file use.
sub syllables {
  my ($word, $variant) = @_;
  my $pron = pronounce(uc($word), $variant);

  # The unknown-word sentinel starts with "**"; endsylrhyme and
  # beginsylrhyme test for it the same way.
  return wantarray() ? () : "" if $pron =~ /^\*\*/;

  # Count on a lexical: assigning to the global $_ would overwrite the
  # caller's topic variable.
  my $count = ($pron =~ tr/012//);
  return $count;
}

# accent($word [, $variant])
#
# Returns the stress digits found in the pronunciation of $word, in
# order of appearance.  In list context the digits come back as a list;
# in scalar context they are joined into one string (e.g. "010").
#
# The unknown-word sentinel returned by pronounce() contains none of the
# digits 0, 1 or 2, so an unknown word yields the empty list / "".
sub accent {
  my ($word, $variant) = @_;
  my $pron = pronounce(uc($word), $variant);

  # Match against the lexical directly instead of copying it into the
  # global $_, which would overwrite the caller's topic variable.
  my @stress = $pron =~ /([012])/g;
  return wantarray() ? @stress : join('', @stress);
}

# sylpron($pron)
#
# Internal helper: returns how many of the characters 0, 1 and 2 occur
# in the string $pron.  The callers in this file pass it a pronunciation
# string and use the result as a syllable count.  An undefined argument
# counts as 0.
sub sylpron {
  my ($pron) = @_;
  return 0 unless defined $pron;

  # tr/// with an empty replacement only counts; it leaves $pron and the
  # caller's $_ untouched.
  my $count = ($pron =~ tr/012//);
  return $count;
}

# beginrhyme($word [, $variant [, $syl]])
#
# Finds words that start like $word.  beginsylrhyme() is tried with $syl
# syllables first, then with one syllable fewer each time, and the first
# non-empty result wins.  $syl defaults to, and is capped at, the number
# of stress digits in the pronunciation.  A $word containing a space is
# used as the pronunciation string itself when counting.
#
# Returns the whole result list in list context, or one randomly chosen
# element in scalar context.  When nothing is found: () or "".
sub beginrhyme {
  my ($word,$variant,$syl) = @_;

  my $sounds = pronounce(uc($word),$variant);
  $sounds = $word if $word =~ / /;

  my $available = sylpron($sounds);
  if (!defined($syl) || $syl > $available) {
    $syl = $available;
  }

  my $want = $syl;
  while ($want > 0) {
    my @found = beginsylrhyme($word,$variant,$want);
    if (@found) {
      return @found if wantarray();
      return $found[int(rand(@found))];
    }
    $want--;
  }

  return wantarray() ? () : "";
}

# variants($word)
#
# Returns how many pronunciations %dict holds for $word (looked up in
# upper case): 0 when there is no plain entry, otherwise 1 plus the
# number of consecutive "WORD(2)", "WORD(3)", ... entries.
sub variants {
  my $entry = uc(shift);
  return 0 unless defined $dict{$entry};

  # The plain entry is variant 1; keep counting while the next numbered
  # key has a defined value.
  my $count = 1;
  $count++ while defined $dict{ $entry . '(' . ($count + 1) . ')' };
  return $count;
}

# visualrhyme($word [, $letters])
#
# Finds keys of %dict whose spelling ends in the same letters as $word.
# The longest ending is tried first ($letters characters, default
# length($word) - 1), then one character fewer each time; the first
# ending that produces any match wins.  A candidate must be longer than
# the ending being compared, must differ from $word, and must not be a
# variant key such as "WORD(2)".
#
# Returns the matches in list context, or one randomly chosen match in
# scalar context.  When nothing is found: () or "".
sub visualrhyme {
  my $word = uc(shift);
  my $letters = shift;
  $letters = length($word) - 1 if !defined($letters);

  # An ending longer than the word itself can never match (candidates
  # must be longer than the ending), so skip those passes entirely.
  $letters = length($word) if $letters > length($word);

  # Filter out $word and the variant keys once, not on every pass.
  my @candidates = grep { $_ ne $word and !/\(\d+\)/ } keys %dict;

  for (my $i = $letters; $i > 0; $i--) {
    my $ending = substr($word, -$i);
    my @results =
      grep { length($_) > $i and substr($_, -$i) eq $ending } @candidates;
    if (@results) {
      return wantarray() ? @results : $results[int(rand(@results))];
    }
  }
  return wantarray() ? () : "";
}


# endrhyme($word [, $variant [, $syl]])
#
# Finds words that end like $word.  endsylrhyme() is asked for a match
# on $syl syllables, then $syl - 1, and so on down to 1; the first
# non-empty answer is used.  $syl defaults to, and is capped at, the
# number of stress digits in the pronunciation.  A $word containing a
# space is used as the pronunciation string itself when counting.
#
# Returns the whole result list in list context, or one randomly chosen
# element in scalar context.  When nothing is found: () or "".
sub endrhyme {
  my ($word,$variant,$syl) = @_;

  my $phonemes = pronounce(uc($word),$variant);
  $phonemes = $word if $word =~ / /;

  my $limit = sylpron($phonemes);
  $syl = (!defined($syl) || $syl > $limit) ? $limit : $syl;

  for (my $n = $syl; $n > 0; --$n) {
    my @hits = endsylrhyme($word,$variant,$n);
    next unless @hits;
    return wantarray() ? @hits : $hits[int(rand(@hits))];
  }

  return wantarray() ? () : "";
}

# endsylrhyme($word, $variant, $syl)
#
# Returns the values of %reversedict whose keys end with the last $syl
# syllables of the pronunciation of $word.  %reversedict presumably maps
# pronunciation strings to dictionary words -- confirm against
# Lingua::EN::Rhyme::Dictionary.
#
# A $word containing a space is treated as a pronunciation string and
# used directly.  Entries that are $word itself, or "WORD(n)" variants of
# it, are left out.  With $syl undefined the whole tail from the first
# vowel onwards is matched.
#
# Returns the matches in list context, or one randomly chosen match in
# scalar context.  When $word is unknown or nothing matches: () or "".
sub endsylrhyme {
  my ($word,$variant,$syl) = @_;
  $word = uc($word);
  my $pron = pronounce($word,$variant);
  $pron = $word if $word =~ / /;
  return wantarray() ? () : "" if $pron =~ /^\*\*/;

  # A vowel phoneme is a token that ends in a stress digit.
  my $vowel = qr/\b\w+\d\b/;

  # Drop the consonants in front of the first vowel.  @- and @+ are only
  # read after a successful match; after a failed match they still hold
  # the offsets of some earlier, unrelated match.
  $pron = substr($pron, $-[0]) if $pron =~ $vowel;

  my $syllab = sylpron($pron);
  while (defined($syl) and $syl > 0 and $syl < $syllab) {
    last unless $pron =~ $vowel;          # skip a vowel ...
    my $rest = substr($pron, $+[0]);
    last unless $rest =~ $vowel;          # ... and the consonants up to
    $pron = substr($rest, $-[0]);         # the next one
    $syllab = sylpron($pron);
  }

  # Quote both strings so characters such as "." or "'" are matched
  # literally, and compile each pattern once instead of once per key.
  my $tail_re = qr/\Q$pron\E$/;
  my $self_re = qr/^\Q$word\E(?:\(\d+\))?$/;

  my @resultarray =
    grep { $_ !~ $self_re }
    @reversedict{ grep { $_ =~ $tail_re } keys %reversedict };

  if (@resultarray) {
    return wantarray() ? @resultarray
                       : $resultarray[int(rand(@resultarray))];
  }
  return wantarray() ? () : "";
}

# beginsylrhyme($word, $variant, $syl)
#
# Returns the values of %reversedict whose keys start with the first
# $syl syllables of the pronunciation of $word (up to and including the
# vowel of the last of those syllables).  %reversedict presumably maps
# pronunciation strings to dictionary words -- confirm against
# Lingua::EN::Rhyme::Dictionary.
#
# A $word containing a space is treated as a pronunciation string and
# used directly.  Entries that are $word itself, or "WORD(n)" variants of
# it, are left out.  With $syl undefined everything up to the last vowel
# is matched.
#
# Returns the matches in list context, or one randomly chosen match in
# scalar context.  When $word is unknown or nothing matches: () or "".
sub beginsylrhyme {
  my ($word,$variant,$syl) = @_;
  $word = uc($word);
  my $pron = pronounce($word,$variant);
  $pron = $word if $word =~ / /;
  return wantarray() ? () : "" if $pron =~ /^\*\*/;

  # Work on the reversed string so that trimming from the end of the
  # pronunciation becomes trimming from the front.  In the reversed text
  # a vowel phoneme is a token that starts with its stress digit.
  my $rev   = scalar reverse $pron;
  my $vowel = qr/\b\d\w+\b/;

  # Drop the consonants after the last vowel.  @- and @+ are only read
  # after a successful match; after a failed match they still hold the
  # offsets of some earlier, unrelated match.
  $rev = substr($rev, $-[0]) if $rev =~ $vowel;

  # Count from the pronunciation actually in use, as endsylrhyme does,
  # so that a phonetic transcription passed as $word is trimmed too.
  my $syllab = sylpron($rev);
  while (defined($syl) and $syl > 0 and $syl < $syllab) {
    last unless $rev =~ $vowel;           # skip a vowel ...
    my $rest = substr($rev, $+[0]);
    last unless $rest =~ $vowel;          # ... and the consonants up to
    $rev = substr($rest, $-[0]);          # the next one
    $syllab = sylpron($rev);
  }
  my $head = scalar reverse $rev;

  # Quote both strings so characters such as "." or "'" are matched
  # literally, and compile each pattern once instead of once per key.
  my $head_re = qr/^\Q$head\E/;
  my $self_re = qr/^\Q$word\E(?:\(\d+\))?$/;

  my @resultarray =
    grep { $_ !~ $self_re }
    @reversedict{ grep { $_ =~ $head_re } keys %reversedict };

  if (@resultarray) {
    return wantarray() ? @resultarray
                       : $resultarray[int(rand(@resultarray))];
  }
  return wantarray() ? () : "";
}

=head1 NAME

Lingua::EN::Rhyme - Finds rhymes for English words.

=head1 SYNOPSIS

    use Lingua::EN::Rhyme;
    my $rhyme=endrhyme('orange');
    my @rhymelist=endrhyme('orange');
    $rhyme=beginrhyme('project',2,1); #Pronunciation 2, one syllable only
    my $accentuation=accent('abortionist');
    my $pronunciation=pronounce('project',2);

=head1 DESCRIPTION

To the joy of would-be poets everywhere, this module seeks to ease the
load of finding the perfect rhyme. The dictionary used is the freely
distributable CMU Pronouncing Dictionary, and is contained in the module
Lingua::EN::Rhyme::Dictionary.

=head2 Default Export

C<endrhyme> - You must specify a word, and optionally the number of the
variant desired and the maximum number of syllables to match. Given these
parameters, a list of the "best" matches will be created. If called in
list context, this list is returned, while in scalar context a random
entry from the list is given. You may optionally provide a phonetic
transcription following the CMU style instead of a word. In this case,
the value of the variant is ignored.

C<beginrhyme> - Usage is the same as C<endrhyme>, but matches the
beginning of the words. Here "silver" would be a rhyme for "sylvan", for
instance.

C<visualrhyme> - Looks for words having the same ending letters as the
word provided. You may optionally provide a maximum number of letters to
match. Here you do not specify a variant, because we are basing this on
spelling, not pronunciation.

C<pronounce> - Returns the pronunciation of the word. You may optionally
provide the number of the variant. If the word is not in the dictionary,
the string C<** unknown word **> is returned.

C<variants> - Returns the number of variants in the dictionary for the
word provided.

C<accent> - Returns either a list or a string containing the accentuation
values of the word (and optionally variant) provided. Here, 0 means
unaccented, 1 is primary stress, and 2 is secondary stress.

C<syllables> - Returns the number of syllables in the word (and optionally
variant).

=head2 Optional Exports

The following two routines are used internally by Lingua::EN::Rhyme, but
may be exported for use in the calling program if desired.

C<endsylrhyme> - Here you must specify word, variant, and number of
syllables. Returns word(s) that rhyme in EXACTLY the number of syllables
requested.

C<beginsylrhyme> - The same, for beginning rhymes.

=head1 HISTORY

    Revision 0.01    2001/05/28    Mark Polo
    Initial revision

=head1 COPYRIGHT

Copyright 2001 by Mark Polo

=head1 LICENSE

Permission is hereby granted, free of charge, to any person obtaining a
copy of this software and associated documentation files (the "Software"),
to deal in the Software without restriction, including without limitation
the rights to use, copy, modify, merge, publish, distribute, sublicense,
and/or sell copies of the Software, and to permit persons to whom the
Software is furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included
in all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
THE AUTHOR BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT
OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.

=cut

1;
[download]

In reply to Rhyme generator by mpolo

Are you posting in the right place? Check out Where do I post X? to know for sure.
Posts may use any of the Perl Monks Approved HTML tags. Currently these include the following:
<code> <a> <b> <big> <blockquote> <br /> <dd> <dl> <dt> <em> <font> <h1> <h2> <h3> <h4> <h5> <h6> <hr /> <i> <li> <nbsp> <ol> <p> <small> <strike> <strong> <sub> <sup> <table> <td> <th> <tr> <tt> <u> <ul>
Snippets of code should be wrapped in <code> tags not <pre> tags. In fact, <pre> tags should generally be avoided. If they must be used, extreme care should be taken to ensure that their contents do not have long lines (<70 chars), in order to prevent horizontal scrolling (and possible janitor intervention).
Want more info? How to link or How to display code and escape characters are good places to start.


P is for Practical
	PerlMonks