Java Doc for plasmaParser.java in » Search-Engine » yacy » de » anomic » plasma » Java Source Code / Java Documentation | Java Source Code and Java Documentation

Java Source Code / Java Documentation
1. 6.0 JDK Core
2. 6.0 JDK Modules
3. 6.0 JDK Modules com.sun
4. 6.0 JDK Modules com.sun.java
5. 6.0 JDK Modules sun
6. 6.0 JDK Platform
7. Ajax
8. Apache Harmony Java SE
9. Aspect oriented
10. Authentication Authorization
11. Blogger System
12. Build
13. Byte Code
14. Cache
15. Chart
16. Chat
17. Code Analyzer
18. Collaboration
19. Content Management System
20. Database Client
21. Database DBMS
22. Database JDBC Connection Pool
23. Database ORM
24. Development
25. EJB Server geronimo
26. EJB Server GlassFish
27. EJB Server JBoss 4.2.1
28. EJB Server resin 3.1.5
29. ERP CRM Financial
30. ESB
31. Forum
32. GIS
33. Graphic Library
34. Groupware
35. HTML Parser
36. IDE
37. IDE Eclipse
38. IDE Netbeans
39. Installer
40. Internationalization Localization
41. Inversion of Control
42. Issue Tracking
43. J2EE
44. JBoss
45. JMS
46. JMX
47. Library
48. Mail Clients
49. Net
50. Parser
51. PDF
52. Portal
53. Profiler
54. Project Management
55. Report
56. RSS RDF
57. Rule Engine
58. Science
59. Scripting
60. Search Engine
61. Security
62. Servlet Container
63. Source Control
64. Swing Library
65. Template Engine
66. Test Coverage
67. Testing
68. UML
69. Web Crawler
70. Web Framework
71. Web Mail
72. Web Server
73. Web Services
74. Web Services apache cxf 2.0.1
75. Web Services AXIS2
76. Wiki Engine
77. Workflow Engines
78. XML
79. XML UI
Java
Java Tutorial
Java Open Source
Jar File Download
Java Articles
Java Products
Java by API
Photoshop Tutorials
Maya Tutorials
Flash Tutorials
3ds-Max Tutorials
Illustrator Tutorials
GIMP Tutorials
C# / C Sharp
C# / CSharp Tutorial
C# / CSharp Open Source
ASP.Net
ASP.NET Tutorial
JavaScript DHTML
JavaScript Tutorial
JavaScript Reference
HTML / CSS
HTML CSS Reference
C / ANSI-C
C Tutorial
C++
C++ Tutorial
Ruby
PHP
Python
Python Tutorial
Python Open Source
SQL Server / T-SQL
SQL Server / T-SQL Tutorial
Oracle PL / SQL
Oracle PL/SQL Tutorial
PostgreSQL
SQL / MySQL
MySQL Tutorial
VB.Net
VB.Net Tutorial
Flash / Flex / ActionScript
VBA / Excel / Access / Word
XML
XML Tutorial
Microsoft Office PowerPoint 2007 Tutorial
Microsoft Office Excel 2007 Tutorial
Microsoft Office Word 2007 Tutorial
Java Source Code / Java Documentation » Search Engine » yacy » de.anomic.plasma 
Source Cross Reference  Class Diagram Java Document (Java Doc) 


java.lang.Object
   de.anomic.plasma.plasmaParser

plasmaParser
final public class plasmaParser (Code)


Field Summary
final public static HashSet<String> PARSER_MODE
    
final public static String PARSER_MODE_CRAWLER
    
final public static String PARSER_MODE_ICAP
    
final public static String PARSER_MODE_IMAGE
    
final public static String PARSER_MODE_PROXY
    
final public static String PARSER_MODE_URLREDIRECTOR
    
final public static HashMap<String, ParserInfo> availableParserList
    
final public static HashSet<String> supportedHTMLFileExt
    
final public static HashSet<String> supportedHTMLMimeTypes
    


Method Summary
public static boolean HTMLParsableMimeTypesContains(String mimeType)
    
static Map<yacyURL, String> allReflinks(Set links)
    
static Map<yacyURL, String> allSubpaths(Set links)
    
public static boolean appsExtContains(String appsExt)
    
public static boolean audioExtContains(String audioExt)
    
public void close()
    
public static List<String> extString2extList(String extString)
    
public HashMap<String, ParserInfo> getAvailableParserList()
    
public static String getFileExt(yacyURL url)
    
public serverLog getLogger()
    
public static String getMediaExtList()
    
public static String getMimeTypeByFileExt(String fileExt)
    
public static HashMap<String, plasmaParserConfig> getParserConfigList()
    
public static String getRealCharsetEncoding(String encoding)
    
public static boolean imageExtContains(String imageExt)
    
public static void initAppsExt(List<String> appsExtList)
    
public static void initAudioExt(List<String> audioExtList)
    
public static void initHTMLParsableMimeTypes(String htmlParsableMimeTypes)
     This function is used to initialize the HTMLParsableMimeTypes List.
public static void initImageExt(List<String> imageExtList)
    
public static void initMediaExt(List<String> mediaExtList)
    
public static void initParseableMimeTypes(String parserMode, String configStr)
    
public static void initSupportedHTMLFileExt(List<String> supportedRealtimeFileExtList)
    
public static void initVideoExt(List<String> videoExtList)
    
public static void main(String[] args)
    
public static Parser makeParser(Object name)
    
public static boolean mediaExtContains(String mediaExt)
    
public static String normalizeMimeType(String mimeType)
    
public plasmaParserDocument parseSource(yacyURL location, String mimeType, String charset, byte[] sourceArray)
    
public plasmaParserDocument parseSource(yacyURL location, String theMimeType, String theDocumentCharset, File sourceFile)
    
public plasmaParserDocument parseSource(yacyURL location, String theMimeType, String theDocumentCharset, long contentLength, InputStream sourceStream)
    
public static String[] setEnabledParserList(String parserMode, Set<String> mimeTypeSet)
    
public static boolean supportedContent(yacyURL url, String mimeType)
    
public static boolean supportedContent(String parserMode, yacyURL url, String mimeType)
    
public static boolean supportedFileExtContains(String fileExt)
    
public static boolean supportedHTMLContent(yacyURL url, String mimeType)
    
public static boolean supportedHTMLFileExtContains(yacyURL url)
    
public static boolean supportedMimeTypesContains(String mimeType)
    
public plasmaParserDocument transformScraper(yacyURL location, String mimeType, String charSet, htmlFilterContentScraper scraper)
    
public static boolean videoExtContains(String videoExt)
    

Field Detail
PARSER_MODE
final public static HashSet<String> PARSER_MODE(Code)



PARSER_MODE_CRAWLER
final public static String PARSER_MODE_CRAWLER(Code)



PARSER_MODE_ICAP
final public static String PARSER_MODE_ICAP(Code)



PARSER_MODE_IMAGE
final public static String PARSER_MODE_IMAGE(Code)



PARSER_MODE_PROXY
final public static String PARSER_MODE_PROXY(Code)



PARSER_MODE_URLREDIRECTOR
final public static String PARSER_MODE_URLREDIRECTOR(Code)



availableParserList
final public static HashMap<String, ParserInfo> availableParserList(Code)
A list containing all installed parsers and the MIME types that they support.
See Also:   plasmaParser.loadAvailableParserList()



supportedHTMLFileExt
final public static HashSet<String> supportedHTMLFileExt(Code)
A list of file extensions and mime types that are supported by the html-parser



supportedHTMLMimeTypes
final public static HashSet<String> supportedHTMLMimeTypes(Code)





Method Detail
HTMLParsableMimeTypesContains
public static boolean HTMLParsableMimeTypesContains(String mimeType)(Code)



allReflinks
static Map<yacyURL, String> allReflinks(Set links)(Code)



allSubpaths
static Map<yacyURL, String> allSubpaths(Set links)(Code)



appsExtContains
public static boolean appsExtContains(String appsExt)(Code)



audioExtContains
public static boolean audioExtContains(String audioExt)(Code)



close
public void close()(Code)



extString2extList
public static List<String> extString2extList(String extString)(Code)



getAvailableParserList
public HashMap<String, ParserInfo> getAvailableParserList()(Code)



getFileExt
public static String getFileExt(yacyURL url)(Code)



getLogger
public serverLog getLogger()(Code)



getMediaExtList
public static String getMediaExtList()(Code)



getMimeTypeByFileExt
public static String getMimeTypeByFileExt(String fileExt)(Code)



getParserConfigList
public static HashMap<String, plasmaParserConfig> getParserConfigList()(Code)



getRealCharsetEncoding
public static String getRealCharsetEncoding(String encoding)(Code)



imageExtContains
public static boolean imageExtContains(String imageExt)(Code)



initAppsExt
public static void initAppsExt(List<String> appsExtList)(Code)



initAudioExt
public static void initAudioExt(List<String> audioExtList)(Code)



initHTMLParsableMimeTypes
public static void initHTMLParsableMimeTypes(String htmlParsableMimeTypes)(Code)
This function initializes the HTMLParsableMimeTypes list, which contains the MIME types that can be parsed in real time by the YaCy HTML parser.
Parameters:
  htmlParsableMimeTypes - a list of mimetypes that can be parsed by the yacy html parser



initImageExt
public static void initImageExt(List<String> imageExtList)(Code)



initMediaExt
public static void initMediaExt(List<String> mediaExtList)(Code)



initParseableMimeTypes
public static void initParseableMimeTypes(String parserMode, String configStr)(Code)



initSupportedHTMLFileExt
public static void initSupportedHTMLFileExt(List<String> supportedRealtimeFileExtList)(Code)



initVideoExt
public static void initVideoExt(List<String> videoExtList)(Code)



main
public static void main(String[] args)(Code)



makeParser
public static Parser makeParser(Object name) throws Exception(Code)



mediaExtContains
public static boolean mediaExtContains(String mediaExt)(Code)



normalizeMimeType
public static String normalizeMimeType(String mimeType)(Code)



parseSource
public plasmaParserDocument parseSource(yacyURL location, String mimeType, String charset, byte[] sourceArray) throws InterruptedException, ParserException(Code)



parseSource
public plasmaParserDocument parseSource(yacyURL location, String theMimeType, String theDocumentCharset, File sourceFile) throws InterruptedException, ParserException(Code)



parseSource
public plasmaParserDocument parseSource(yacyURL location, String theMimeType, String theDocumentCharset, long contentLength, InputStream sourceStream) throws InterruptedException, ParserException(Code)
Parses a resource from an InputStream.
Parameters:
  location - the URL of the resource
  theMimeType - the resource mimetype (null if unknown)
  theDocumentCharset - the charset of the resource (null if unknown)
  contentLength - the content length of the resource (-1 if unknown)
  sourceStream - an InputStream containing the resource body
Returns:
  the parsed plasmaParserDocument document
Throws:
  InterruptedException -
  ParserException -



setEnabledParserList
public static String[] setEnabledParserList(String parserMode, Set<String> mimeTypeSet)(Code)



supportedContent
public static boolean supportedContent(yacyURL url, String mimeType)(Code)



supportedContent
public static boolean supportedContent(String parserMode, yacyURL url, String mimeType)(Code)



supportedFileExtContains
public static boolean supportedFileExtContains(String fileExt)(Code)



supportedHTMLContent
public static boolean supportedHTMLContent(yacyURL url, String mimeType)(Code)



supportedHTMLFileExtContains
public static boolean supportedHTMLFileExtContains(yacyURL url)(Code)



supportedMimeTypesContains
public static boolean supportedMimeTypesContains(String mimeType)(Code)



transformScraper
public plasmaParserDocument transformScraper(yacyURL location, String mimeType, String charSet, htmlFilterContentScraper scraper)(Code)



videoExtContains
public static boolean videoExtContains(String videoExt)(Code)



Methods inherited from java.lang.Object
native protected Object clone() throws CloneNotSupportedException(Code)(Java Doc)
public boolean equals(Object obj)(Code)(Java Doc)
protected void finalize() throws Throwable(Code)(Java Doc)
final native public Class getClass()(Code)(Java Doc)
native public int hashCode()(Code)(Java Doc)
final native public void notify()(Code)(Java Doc)
final native public void notifyAll()(Code)(Java Doc)
public String toString()(Code)(Java Doc)
final native public void wait(long timeout) throws InterruptedException(Code)(Java Doc)
final public void wait(long timeout, int nanos) throws InterruptedException(Code)(Java Doc)
final public void wait() throws InterruptedException(Code)(Java Doc)

www.java2java.com | Contact Us
Copyright 2009 - 12 Demo Source and Support. All rights reserved.
All other trademarks are property of their respective owners.