Nutch的扩展点(extension point)在nutch-extensionpoints/plugin.xml文件中定义:
<plugin id="nutch-extensionpoints"
        name="the nutch core extension points"
        version="2.0.0"
        provider-name="nutch.org">

  <!--
    Central registry of the extension points exposed by the Nutch core.
    Note that a plugin may also declare extension points of its own,
    which makes that plugin extendable in turn.
  -->

  <!-- Indexing -->
  <extension-point id="org.apache.nutch.indexer.IndexingFilter" name="Nutch Indexing Filter"/>

  <!-- Parsing -->
  <extension-point id="org.apache.nutch.parse.Parser" name="Nutch Content Parser"/>
  <extension-point id="org.apache.nutch.parse.HtmlParseFilter" name="HTML Parse Filter"/>

  <!-- Protocol handling -->
  <extension-point id="org.apache.nutch.protocol.Protocol" name="Nutch Protocol"/>

  <!-- URL filtering and normalization -->
  <extension-point id="org.apache.nutch.net.URLFilter" name="Nutch URL Filter"/>
  <extension-point id="org.apache.nutch.net.URLNormalizer" name="Nutch URL Normalizer"/>

  <!-- Scoring -->
  <extension-point id="org.apache.nutch.scoring.ScoringFilter" name="Nutch Scoring"/>

  <!-- Segment merging -->
  <extension-point id="org.apache.nutch.segment.SegmentMergeFilter" name="Nutch Segment Merge Filter"/>

</plugin>
所有的插件开发都应实现相应的接口,并规范配置。