use strict;
use warnings;
use utf8;

# Words that typically show up in affiliation or postal-address lines.
# The stem "universit" carries an explicit \w* suffix: the group is closed
# by \b, so the bare stem would reject "university" and "universities".
my $re_address_word = qr/\b(?:
    universit\w* | center | centre | institute? | sciences? | college |
    research | avenue | street | philosophy | professor | address |
    department | umass
)\b/ix;

# Words that typically show up in publication or citation notes.
# "volume" and "to appear in" are separate alternatives; under the x flag
# whitespace is ignored, so they must be joined by an explicit "|".
# "editor\w*" also covers "editor" and "editors".
our $re_publication_word = qr/\b(?:
    forthcoming | editor\w* | edited | publish\w* | press | volume |
    to\sappear\sin | draft | reprints? | excerpt | circulation | cite
)\b/ix;

# Anything that disqualifies a line from being a title: an address word,
# a publication word, or (at a word boundary) "thank(s)", a literal "@",
# a four-digit number starting with 1 or 2, or "abstract".
# The "@" is backslash-escaped so it can never be taken for an array.
my $re_notitle = qr/
      $re_address_word
    | $re_publication_word
    | \b(?: thanks? | \@ | [12]\d{3} | abstract )
/ix;

# A title candidate starts with an alphabetic character and contains no
# disqualifying pattern on its first line ("." does not cross newlines).
# The lookahead must not make $re_notitle optional: an optional group
# lets the lookahead body match every string, so the negative assertion
# would reject every input.
our $re_title = qr/^ (?! .* $re_notitle ) \p{IsAlpha} /x;