/** * Parses HTML source using JTidy. * Please download the JTidy jar file from the JTidy website. * @param is - input stream of the HTML source */ private static void parseHtmlByTidy(InputStream is) { Tidy tidy = new Tidy(); // tidy will print whatever it parses to System.out Document doc = tidy.parseDOM(is, System.out); // Try to read