krmahadevan/PlayWithPDF.java

## PlayWithPDF.java
import java.io.BufferedInputStream;
import java.io.IOException;
import java.net.URISyntaxException;
import java.net.URL;

import org.apache.pdfbox.pdfparser.PDFParser;
import org.apache.pdfbox.util.PDFTextStripper;

/**
 * Small demo that downloads a PDF from a URL and extracts its text with PDFBox.
 */
public class PlayWithPDF {

	/**
	 * Fetches a sample PDF and prints its extracted text to standard output.
	 *
	 * @param args command-line arguments; not used
	 * @throws URISyntaxException kept in the signature for compatibility; nothing
	 *             in this method throws it
	 * @throws IOException if the URL is malformed, or the PDF cannot be
	 *             downloaded or parsed
	 */
	public static void main(String[] args) throws URISyntaxException, IOException {
		URL url = new URL("http://illiad.evms.edu/sample.pdf");
		System.out.println(getTextFromPDF(url));
	}

	/**
	 * Downloads the PDF at the given URL and returns the text extracted from it.
	 *
	 * <p>The network stream and the parsed document are released even when
	 * parsing or text extraction fails. The text is only returned, not printed;
	 * printing is left to the caller so the output is not emitted twice.
	 *
	 * @param url location of the PDF to read
	 * @return the text produced by {@code PDFTextStripper} for the document
	 * @throws IOException if the stream cannot be opened, or the document cannot
	 *             be parsed or stripped
	 */
	public static String getTextFromPDF(URL url) throws IOException {
		BufferedInputStream fileToParse = new BufferedInputStream(url.openStream());
		try {
			PDFParser parser = new PDFParser(fileToParse);
			parser.parse();
			try {
				return new PDFTextStripper().getText(parser.getPDDocument());
			} finally {
				// Release the parsed document even if text extraction throws.
				parser.getPDDocument().close();
			}
		} finally {
			// Closing an already-closed stream has no effect, so this is safe
			// whether or not the parser closed it.
			fileToParse.close();
		}
	}

}
	import java.io.BufferedInputStream;
	import java.io.IOException;
	import java.net.URISyntaxException;
	import java.net.URL;

	import org.apache.pdfbox.pdfparser.PDFParser;
	import org.apache.pdfbox.util.PDFTextStripper;

	/**
	 * Small demo that downloads a PDF from a URL and extracts its text with PDFBox.
	 */
	public class PlayWithPDF {

		/**
		 * Fetches a sample PDF and prints its extracted text to standard output.
		 *
		 * @param args command-line arguments; not used
		 * @throws URISyntaxException kept in the signature for compatibility; nothing
		 *             in this method throws it
		 * @throws IOException if the URL is malformed, or the PDF cannot be
		 *             downloaded or parsed
		 */
		public static void main(String[] args) throws URISyntaxException, IOException {
			URL url = new URL("http://illiad.evms.edu/sample.pdf");
			System.out.println(getTextFromPDF(url));
		}

		/**
		 * Downloads the PDF at the given URL and returns the text extracted from it.
		 *
		 * <p>The network stream and the parsed document are released even when
		 * parsing or text extraction fails. The text is only returned, not printed;
		 * printing is left to the caller so the output is not emitted twice.
		 *
		 * @param url location of the PDF to read
		 * @return the text produced by {@code PDFTextStripper} for the document
		 * @throws IOException if the stream cannot be opened, or the document cannot
		 *             be parsed or stripped
		 */
		public static String getTextFromPDF(URL url) throws IOException {
			BufferedInputStream fileToParse = new BufferedInputStream(url.openStream());
			try {
				PDFParser parser = new PDFParser(fileToParse);
				parser.parse();
				try {
					return new PDFTextStripper().getText(parser.getPDDocument());
				} finally {
					// Release the parsed document even if text extraction throws.
					parser.getPDDocument().close();
				}
			} finally {
				// Closing an already-closed stream has no effect, so this is safe
				// whether or not the parser closed it.
				fileToParse.close();
			}
		}

	}