#!/usr/bin/perl
# CGI script: for every PDF file in the input directory, extract the text of
# page one and write it to "<name>.txt" in the output directory, reporting
# progress to the browser as HTML.
use strict;
use warnings;

use CGI qw/:cgi-lib/;
use CGI::Carp qw(fatalsToBrowser);
use CGI;
use PDF::Parse;
# The extraction loop calls CAM::PDF and CAM::PDF::PageText directly, so both
# must be loaded explicitly; nothing above pulls them in.
use CAM::PDF;
use CAM::PDF::PageText;

print "Content-type: text/html\n\n";

# Request parameters are parsed but not consulted below; kept as a package
# global in case other code reads %FORM.
our %FORM = Vars();

# NOTE(review): the original read from the absolute '/pdfdocs' but wrote to
# the relative './pdfdocs'. Both paths are preserved here; confirm whether
# they are meant to be the same directory.
my $input_dir  = '/pdfdocs';
my $output_dir = './pdfdocs';

# Snapshot the directory listing before writing anything, so output files
# created during the run can never be picked up as input. Only regular files
# with a .pdf extension are processed ('.', '..', subdirectories and earlier
# .txt output are skipped).
opendir(my $dir_handle, $input_dir)
    or die "Couldn't open directory, $!";
my @pdf_names = sort grep { /\.pdf\z/i && -f "$input_dir/$_" } readdir $dir_handle;
closedir $dir_handle;

PDF_FILE:
for my $pdf_name (@pdf_names) {
    # File names are untrusted text as far as the HTML page is concerned.
    my $shown_name = CGI::escapeHTML($pdf_name);
    print "Extracting: $shown_name...";

    # Open the PDF by its full path; a bare name would be resolved against
    # the current working directory instead of the input directory.
    my $pdf = CAM::PDF->new("$input_dir/$pdf_name");
    if (!$pdf) {
        print "Failed (could not be read as a PDF)<br>\n";
        next PDF_FILE;
    }

    my $page_one_tree = $pdf->getPageContentTree(1);
    if (!$page_one_tree) {
        print "Failed (page 1 could not be parsed)<br>\n";
        next PDF_FILE;
    }

    my $page_text = CAM::PDF::PageText->render($page_one_tree);
    $page_text = '' unless defined $page_text;

    my $output_path = "$output_dir/$pdf_name.txt";
    my $out_handle;
    if (!open($out_handle, '>', $output_path)) {
        print "Failed (cannot write output: " . CGI::escapeHTML("$!") . ")<br>\n";
        next PDF_FILE;
    }
    print {$out_handle} "$page_text\n";

    # Buffered write errors only surface at close, so check it.
    if (!close($out_handle)) {
        print "Failed (error writing output: " . CGI::escapeHTML("$!") . ")<br>\n";
        next PDF_FILE;
    }

    print "Done<br>\n";
}