01: /***************************************************************
02: * This file is part of the [fleXive](R) project.
03: *
04: * Copyright (c) 1999-2008
05: * UCS - unique computing solutions gmbh (http://www.ucs.at)
06: * All rights reserved
07: *
08: * The [fleXive](R) project is free software; you can redistribute
09: * it and/or modify it under the terms of the GNU General Public
10: * License as published by the Free Software Foundation;
11: * either version 2 of the License, or (at your option) any
12: * later version.
13: *
14: * The GNU General Public License can be found at
15: * http://www.gnu.org/copyleft/gpl.html.
16: * A copy is found in the textfile GPL.txt and important notices to the
17: * license from the author are found in LICENSE.txt distributed with
18: * these libraries.
19: *
20: * This library is distributed in the hope that it will be useful,
21: * but WITHOUT ANY WARRANTY; without even the implied warranty of
22: * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
23: * GNU General Public License for more details.
24: *
25: * For further information about UCS - unique computing solutions gmbh,
26: * please see the company website: http://www.ucs.at
27: *
28: * For further information about [fleXive](R), please see the
29: * project website: http://www.flexive.org
30: *
31: *
32: * This copyright notice MUST APPEAR in all copies of the file!
33: ***************************************************************/package com.flexive.extractor.htmlExtractor;
34:
35: import java.io.FileInputStream;
36:
37: public class consoleTest {
38:
39: public static void main(String[] args) {
40:
41: FileInputStream input = null;
42: try {
43: input = new FileInputStream(args[0]);
44: HtmlExtractor result = new HtmlExtractor(input, true);
45: System.out.println(result.getText());
46: System.out.println("title:" + result.getTitle());
47: System.out.println("word#:" + result.getWordCount());
48: System.out.println("char#:" + result.getCharacterCount());
49: } catch (Exception exc) {
50: System.err.println("ERROR>>> " + exc.getMessage());
51: exc.printStackTrace();
52: } finally {
53: try {
54: if (input != null)
55: input.close();
56: } catch (Exception exc) {/*nothing*/
57: }
58: }
59: }
60:
61: }
|