# For every file named in @aonly: download it, extract the header fields
# (CIK, form type, report date, filing date, company name) and append them
# as one pipe-delimited record to the output file.
foreach $filetoget (@aonly) {
    # $base_url is defined outside this loop; an earlier, commented-out
    # default in this spot was 'http://www.sec.gov/Archives'.
    $fullfile = "$base_url/$filetoget";
    $fonly    = $filetoget;

    # get() is presumably LWP::Simple::get, which returns undef when the
    # download fails -- TODO confirm against the file's imports. Skip the
    # file instead of writing a record that was never actually read.
    my $content = get($fullfile);
    if (!defined $content) {
        warn "Could not retrieve $fullfile, skipping\n";
        next;
    }

    # Start each file from a clean slate so that a header field missing
    # from this document becomes an empty column rather than silently
    # repeating the value parsed from the previous file.
    ($cik, $form_type, $report_date, $file_date, $name) = ('') x 5;

    # The patterns are applied to the whole document: with /m, ^ and $
    # anchor at every line boundary, so each pattern picks up the first
    # matching line and no per-line loop is needed.
    if ($content =~ m/^\s*CENTRAL\s*INDEX\s*KEY:\s*(\d*)/m) {
        $cik = $1;
    }
    if ($content =~ m/^\s*FORM\s*TYPE:\s*(.*$)/m) {
        # Free-text capture: strip trailing blanks / carriage returns.
        $form_type = trim($1);
    }
    if ($content =~ m/^\s*CONFORMED\s*PERIOD\s*OF\s*REPORT:\s*(\d*)/m) {
        $report_date = $1;
    }
    if ($content =~ m/^\s*FILED\s*AS\s*OF\s*DATE:\s*(\d*)/m) {
        $file_date = $1;
    }
    if ($content =~ m/^\s*COMPANY\s*CONFORMED\s*NAME:\s*(.*$)/m) {
        # Free-text capture: strip trailing blanks / carriage returns.
        $name = trim($1);
    }

    # Progress/debug output of the parsed values.
    print "$cik, $form_type, $report_date, $file_date, $name\n";

    # Append the record. NOTE(review): despite its name, $write_dir is
    # opened here as a file path -- confirm that is what the caller sets.
    open my $FH_OUT, '>>', $write_dir
        or die "Can't open file $write_dir: $!";

    # Build the record with join() rather than assigning the global output
    # field separator $, -- the record layout (including the trailing '|')
    # is the same, but later print statements are not affected.
    my $record = join('|', $cik, $form_type, $report_date, $file_date, $name) . "|\n";
    print {$FH_OUT} $record
        or die "Can't write to file $write_dir: $!";

    # Buffered write errors only surface at close, so check it.
    close($FH_OUT)
        or die "Can't close file $write_dir: $!";

    # Not used inside this loop any more; reset kept in case code outside
    # this view still reads it.
    $line_count = 0;

    # Update file counter. NOTE(review): the message says "lines" although
    # $file_count is incremented once per file; text left unchanged.
    ++$file_count;
    print "$file_count lines read from $fullfile\n";
} # end of foreach file to get loop
#end of qtr loop
}
#end of year loop
}

# trim($phrase)
#   Returns a copy of $phrase with leading and trailing whitespace removed.
#   The argument itself is not modified. An undefined argument yields the
#   empty string.
sub trim {
    my $phrase = shift(@_);
    $phrase = '' unless defined $phrase;
    $phrase =~ s/^\s+//;
    $phrase =~ s/\s+$//;
    return "$phrase";
}