getConf: URLMetaScoringFilter.java: src.plugin.urlmeta.src.java.org.apache.nutch.scoring.urlmeta Diff:16
setConf: FeedParser.java: src.plugin.feed.src.java.org.apache.nutch.parse.feed Diff:12
getConf: IndexingFiltersChecker.java: src.java.org.apache.nutch.indexer Diff:10
getScore: CrawlDatum.java: src.java.org.apache.nutch.crawl Diff:1
getSignature: SignatureFactory.java: src.java.org.apache.nutch.crawl Diff:7
getParserById: ParserFactory.java: src.java.org.apache.nutch.parse Diff:21
fromHexString: StringUtil.java: src.java.org.apache.nutch.util Diff:7
map: CrawlDBScanner.java: src.java.org.apache.nutch.tools Diff:6
setMinorCode: ParseStatus.java: src.java.org.apache.nutch.parse Diff:1
setFetchInterval: CrawlDatum.java: src.java.org.apache.nutch.crawl Diff:1
getConf: TLDScoringFilter.java: src.plugin.tld.src.java.org.apache.nutch.scoring.tld Diff:5
toString: ProtocolStatus.java: src.java.org.apache.nutch.protocol Diff:2
getDocumentMeta: NutchDocument.java: src.java.org.apache.nutch.indexer Diff:8
run: Generator.java: src.java.org.apache.nutch.crawl Diff:34
createWebGraph: WebGraph.java: src.java.org.apache.nutch.scoring.webgraph Diff:17
configure: ParseSegment.java: src.java.org.apache.nutch.parse Diff:1
reduce: DomainStatistics.java: src.java.org.apache.nutch.util.domain Diff:14
removeLockFile: LockUtil.java: src.java.org.apache.nutch.util Diff:1
getNotExportedLibUrls: PluginDescriptor.java: src.java.org.apache.nutch.plugin Diff:7
write: NutchDocument.java: src.java.org.apache.nutch.indexer Diff:7
removeField: NutchDocument.java: src.java.org.apache.nutch.indexer Diff:8
getPluginPath: PluginDescriptor.java: src.java.org.apache.nutch.plugin Diff:6
indexSolr: SolrIndexer.java: src.java.org.apache.nutch.indexer.solr Diff:7
closeReaders: FSUtils.java: src.java.org.apache.nutch.util Diff:3
getConf: LanguageIndexingFilter.java: src.plugin.languageidentifier.src.java.org.apache.nutch.analysis.lang Diff:14
dumpLinks: LinkDumper.java: src.java.org.apache.nutch.scoring.webgraph Diff:5
mapKey: SolrMappingReader.java: src.java.org.apache.nutch.indexer.solr Diff:25
close: LinkDbMerger.java: src.java.org.apache.nutch.crawl Diff:9
unzip: GZIPUtils.java: src.java.org.apache.nutch.util Diff:6
checkOne: URLNormalizerChecker.java: src.java.org.apache.nutch.net Diff:8
setFParsePluginsFile: ParsePluginsReader.java: src.java.org.apache.nutch.parse Diff:10
main: SegmentMerger.java: src.java.org.apache.nutch.segment Diff:73
run: Fetcher.java: src.java.org.apache.nutch.fetcher Diff:14
findDisagreements: EncodingDetector.java: src.java.org.apache.nutch.util Diff:18
parseManifestFile: PluginManifestParser.java: src.java.org.apache.nutch.plugin Diff:5
run: CrawlDBScanner.java: src.java.org.apache.nutch.tools Diff:14
getDependencyCheckedPlugins: PluginRepository.java: src.java.org.apache.nutch.plugin Diff:19
setConf: LanguageIndexingFilter.java: src.plugin.languageidentifier.src.java.org.apache.nutch.analysis.lang Diff:14
close: Fetcher.java: src.java.org.apache.nutch.fetcher Diff:3
map: ParseSegment.java: src.java.org.apache.nutch.parse Diff:29
getFParsePluginsFile: ParsePluginsReader.java: src.java.org.apache.nutch.parse Diff:10
checkOne: URLFilterChecker.java: src.java.org.apache.nutch.net Diff:8
createJobConf: SegmentReader.java: src.java.org.apache.nutch.segment Diff:9
parse: ParsePluginsReader.java: src.java.org.apache.nutch.parse Diff:7
logError: ArcSegmentCreator.java: src.java.org.apache.nutch.tools.arc Diff:47
metadataEquals: CrawlDatum.java: src.java.org.apache.nutch.crawl Diff:6
getResourceString: PluginDescriptor.java: src.java.org.apache.nutch.plugin Diff:8
main: FreeGenerator.java: src.java.org.apache.nutch.tools Diff:5
deflate: DeflateUtils.java: src.java.org.apache.nutch.util Diff:11
write: SolrWriter.java: src.java.org.apache.nutch.indexer.solr Diff:14
map: LinkDbFilter.java: src.java.org.apache.nutch.crawl Diff:14
getStats: SegmentReader.java: src.java.org.apache.nutch.segment Diff:64
dumpUrl: LoopReader.java: src.java.org.apache.nutch.scoring.webgraph Diff:4
main: OldFetcher.java: src.java.org.apache.nutch.fetcher Diff:8
isEmpty: StringUtil.java: src.java.org.apache.nutch.util Diff:8
setConf: DomainStatistics.java: src.java.org.apache.nutch.util.domain Diff:3
load: NGramProfile.java: src.plugin.languageidentifier.src.java.org.apache.nutch.analysis.lang Diff:37
addClue: EncodingDetector.java: src.java.org.apache.nutch.util Diff:5
getAliases: ParsePluginsReader.java: src.java.org.apache.nutch.parse Diff:13
init: LogDebugHandler.java: src.java.org.apache.nutch.tools.proxy Diff:1
finalize: PluginRepository.java: src.java.org.apache.nutch.plugin Diff:27
shotDownActivatedPlugins: PluginRepository.java: src.java.org.apache.nutch.plugin Diff:29
addTopicsFromFile: DmozParser.java: src.java.org.apache.nutch.tools Diff:7
getHost: LinkDb.java: src.java.org.apache.nutch.crawl Diff:8
distributeScoreToOutlink: TLDScoringFilter.java: src.plugin.tld.src.java.org.apache.nutch.scoring.tld Diff:5
configure: URLPartitioner.java: src.java.org.apache.nutch.crawl Diff:4
deleteSubCollection: CollectionManager.java: src.plugin.subcollection.src.java.org.apache.nutch.collection Diff:14
add: NGramProfile.java: src.plugin.languageidentifier.src.java.org.apache.nutch.analysis.lang Diff:2
getExtensionFromAlias: ParserFactory.java: src.java.org.apache.nutch.parse Diff:46
setUUID: NutchConfiguration.java: src.java.org.apache.nutch.util Diff:2
normalize: NGramProfile.java: src.plugin.languageidentifier.src.java.org.apache.nutch.analysis.lang Diff:16
create: NGramProfile.java: src.plugin.languageidentifier.src.java.org.apache.nutch.analysis.lang Diff:39
getDom: DomUtil.java: src.java.org.apache.nutch.util Diff:4
getMetaValues: MetaWrapper.java: src.java.org.apache.nutch.metadata Diff:4
addExportedLibRelative: PluginDescriptor.java: src.java.org.apache.nutch.plugin Diff:6
dumpUrl: NodeReader.java: src.java.org.apache.nutch.scoring.webgraph Diff:8
setWhiteList: Subcollection.java: src.plugin.subcollection.src.java.org.apache.nutch.collection Diff:4
getWeight: NutchDocument.java: src.java.org.apache.nutch.indexer Diff:8
resolveUrls: ResolveUrls.java: src.java.org.apache.nutch.tools Diff:6
getCommonsHttpSolrServer: SolrUtils.java: src.java.org.apache.nutch.indexer.solr Diff:3
filter: URLMetaIndexingFilter.java: src.plugin.urlmeta.src.java.org.apache.nutch.indexer.urlmeta Diff:3
configure: IndexerMapReduce.java: src.java.org.apache.nutch.indexer Diff:3
run: CrawlDbMerger.java: src.java.org.apache.nutch.crawl Diff:9
handle: DelayHandler.java: src.java.org.apache.nutch.tools.proxy Diff:1
identify: LanguageIdentifier.java: src.plugin.languageidentifier.src.java.org.apache.nutch.analysis.lang Diff:23
close: SegmentReader.java: src.java.org.apache.nutch.segment Diff:9
stripTags: FeedParser.java: src.plugin.feed.src.java.org.apache.nutch.parse.feed Diff:34
parseRequires: PluginManifestParser.java: src.java.org.apache.nutch.plugin Diff:10
main: FeedParser.java: src.plugin.feed.src.java.org.apache.nutch.parse.feed Diff:13
getConf: URLMetaIndexingFilter.java: src.plugin.urlmeta.src.java.org.apache.nutch.indexer.urlmeta Diff:3
distributeScoreToOutlinks: URLMetaScoringFilter.java: src.plugin.urlmeta.src.java.org.apache.nutch.scoring.urlmeta Diff:6
filter: CCParseFilter.java: src.plugin.creativecommons.src.java.org.creativecommons.nutch Diff:12
getConf: FeedIndexingFilter.java: src.plugin.feed.src.java.org.apache.nutch.indexer.feed Diff:12
append: SegmentReader.java: src.java.org.apache.nutch.segment Diff:9
parse: ParseUtil.java: src.java.org.apache.nutch.parse Diff:13
getOutlinksJDK5Impl: OutlinkExtractor.java: src.java.org.apache.nutch.parse Diff:2
reduce: ParseSegment.java: src.java.org.apache.nutch.parse Diff:30
getVersion: PluginDescriptor.java: src.java.org.apache.nutch.plugin Diff:8
getExtensions: ExtensionPoint.java: src.java.org.apache.nutch.plugin Diff:2
main: NGramProfile.java: src.plugin.languageidentifier.src.java.org.apache.nutch.analysis.lang Diff:39
getSupportedMimeTypes: ParsePluginList.java: src.java.org.apache.nutch.parse Diff:3
call: ParseCallable.java: src.java.org.apache.nutch.parse Diff:1
main: LinkDumper.java: src.java.org.apache.nutch.scoring.webgraph Diff:5
setPageGoneSchedule: AbstractFetchSchedule.java: src.java.org.apache.nutch.crawl Diff:8
run: Benchmark.java: src.java.org.apache.nutch.tools Diff:7
configure: CrawlDBScanner.java: src.java.org.apache.nutch.tools Diff:2
getModifiedTime: CrawlDatum.java: src.java.org.apache.nutch.crawl Diff:1
setPluginClass: PluginDescriptor.java: src.java.org.apache.nutch.plugin Diff:2
setModifiedTime: CrawlDatum.java: src.java.org.apache.nutch.crawl Diff:1
identify: LanguageIdentifier.java: src.plugin.languageidentifier.src.java.org.apache.nutch.analysis.lang Diff:24
reportStatus: OldFetcher.java: src.java.org.apache.nutch.fetcher Diff:1
configure: SegmentReader.java: src.java.org.apache.nutch.segment Diff:8
skipChildren: NodeWalker.java: src.java.org.apache.nutch.util Diff:1
calculate: TextProfileSignature.java: src.java.org.apache.nutch.crawl Diff:21
close: ScoreUpdater.java: src.java.org.apache.nutch.scoring.webgraph Diff:8
main: WebGraph.java: src.java.org.apache.nutch.scoring.webgraph Diff:17
identify: LanguageIdentifier.java: src.plugin.languageidentifier.src.java.org.apache.nutch.analysis.lang Diff:28
main: NodeDumper.java: src.java.org.apache.nutch.scoring.webgraph Diff:2
addMeta: MetaWrapper.java: src.java.org.apache.nutch.metadata Diff:1
run: SolrDeleteDuplicates.java: src.java.org.apache.nutch.indexer.solr Diff:8
main: ResolveUrls.java: src.java.org.apache.nutch.tools Diff:9
toHexString: StringUtil.java: src.java.org.apache.nutch.util Diff:4
getPartition: URLPartitioner.java: src.java.org.apache.nutch.crawl Diff:16
getRecordWriter: IndexerOutputFormat.java: src.java.org.apache.nutch.indexer Diff:4
checkAll: URLNormalizerChecker.java: src.java.org.apache.nutch.net Diff:9
collectLibs: PluginDescriptor.java: src.java.org.apache.nutch.plugin Diff:5
getProviderName: PluginDescriptor.java: src.java.org.apache.nutch.plugin Diff:8
getBaseHref: HTMLMetaTags.java: src.java.org.apache.nutch.parse Diff:2
run: Loops.java: src.java.org.apache.nutch.scoring.webgraph Diff:8
setAliases: ParsePluginList.java: src.java.org.apache.nutch.parse Diff:1
readFields: NutchDocument.java: src.java.org.apache.nutch.indexer Diff:8
parseExtensionPoints: PluginManifestParser.java: src.java.org.apache.nutch.plugin Diff:17
partitionSegment: Generator.java: src.java.org.apache.nutch.crawl Diff:28
parseDmozFile: DmozParser.java: src.java.org.apache.nutch.tools Diff:4
inject: Injector.java: src.java.org.apache.nutch.crawl Diff:11
main: LanguageIdentifier.java: src.plugin.languageidentifier.src.java.org.apache.nutch.analysis.lang Diff:7
main: EncodingDetector.java: src.java.org.apache.nutch.util Diff:25
identify: LanguageIdentifier.java: src.plugin.languageidentifier.src.java.org.apache.nutch.analysis.lang Diff:14
reduce: ScoreUpdater.java: src.java.org.apache.nutch.scoring.webgraph Diff:8
main: LinkRank.java: src.java.org.apache.nutch.scoring.webgraph Diff:11
readFields: MetaWrapper.java: src.java.org.apache.nutch.metadata Diff:3
run: Crawl.java: src.java.org.apache.nutch.crawl Diff:28
analyze: NGramProfile.java: src.plugin.languageidentifier.src.java.org.apache.nutch.analysis.lang Diff:7
getSeqRecords: SegmentReader.java: src.java.org.apache.nutch.segment Diff:38
filter: SubcollectionIndexingFilter.java: src.plugin.subcollection.src.java.org.apache.nutch.indexer.subcollection Diff:4
getNoCache: HTMLMetaTags.java: src.java.org.apache.nutch.parse Diff:2
getMeta: ParseData.java: src.java.org.apache.nutch.parse Diff:2
handle: LogDebugHandler.java: src.java.org.apache.nutch.tools.proxy Diff:1
save: NGramProfile.java: src.plugin.languageidentifier.src.java.org.apache.nutch.analysis.lang Diff:45
isParsing: OldFetcher.java: src.java.org.apache.nutch.fetcher Diff:1
map: CrawlDbFilter.java: src.java.org.apache.nutch.crawl Diff:5
setDescriptor: Extension.java: src.java.org.apache.nutch.plugin Diff:2
main: AdaptiveFetchSchedule.java: src.java.org.apache.nutch.crawl Diff:11
run: ArcSegmentCreator.java: src.java.org.apache.nutch.tools.arc Diff:55
getSubCollections: CollectionManager.java: src.plugin.subcollection.src.java.org.apache.nutch.collection Diff:24
toString: NGramProfile.java: src.plugin.languageidentifier.src.java.org.apache.nutch.analysis.lang Diff:29
main: SolrIndexer.java: src.java.org.apache.nutch.indexer.solr Diff:14
run: ScoreUpdater.java: src.java.org.apache.nutch.scoring.webgraph Diff:17
map: ScoreUpdater.java: src.java.org.apache.nutch.scoring.webgraph Diff:1
getMimeType: MimeUtil.java: src.java.org.apache.nutch.util Diff:2
getExtensionPoint: PluginRepository.java: src.java.org.apache.nutch.plugin Diff:21
setConf: CCIndexingFilter.java: src.plugin.creativecommons.src.java.org.creativecommons.nutch Diff:2
setConf: IndexingFiltersChecker.java: src.java.org.apache.nutch.indexer Diff:10
filter: Subcollection.java: src.plugin.subcollection.src.java.org.apache.nutch.collection Diff:6
checkConfiguration: Fetcher.java: src.java.org.apache.nutch.fetcher Diff:29
passScoreAfterParsing: URLMetaScoringFilter.java: src.plugin.urlmeta.src.java.org.apache.nutch.scoring.urlmeta Diff:16
updateDbScore: TLDScoringFilter.java: src.plugin.tld.src.java.org.apache.nutch.scoring.tld Diff:5
create: NutchConfiguration.java: src.java.org.apache.nutch.util Diff:2
findLoops: Loops.java: src.java.org.apache.nutch.scoring.webgraph Diff:6
main: ParsePluginsReader.java: src.java.org.apache.nutch.parse Diff:10
update: ScoreUpdater.java: src.java.org.apache.nutch.scoring.webgraph Diff:14
saveDom: DomUtil.java: src.java.org.apache.nutch.util Diff:8
fetch: OldFetcher.java: src.java.org.apache.nutch.fetcher Diff:8
filter: SegmentMergeFilters.java: src.java.org.apache.nutch.segment Diff:1
toLong: HttpDateFormat.java: src.java.org.apache.nutch.net.protocols Diff:2
dump: SegmentReader.java: src.java.org.apache.nutch.segment Diff:9
addToMap: FeedParser.java: src.plugin.feed.src.java.org.apache.nutch.parse.feed Diff:32
mergeMetadata: FeedParser.java: src.plugin.feed.src.java.org.apache.nutch.parse.feed Diff:54
resolveEncodingAlias: EncodingDetector.java: src.java.org.apache.nutch.util Diff:21
reduce: CrawlDbReducer.java: src.java.org.apache.nutch.crawl Diff:87
toDate: HttpDateFormat.java: src.java.org.apache.nutch.net.protocols Diff:1
getExportedLibUrls: PluginDescriptor.java: src.java.org.apache.nutch.plugin Diff:6
passScoreBeforeParsing: TLDScoringFilter.java: src.plugin.tld.src.java.org.apache.nutch.scoring.tld Diff:5
setConf: TLDIndexingFilter.java: src.plugin.tld.src.java.org.apache.nutch.indexer.tld Diff:4
setFetchInterval: CrawlDatum.java: src.java.org.apache.nutch.crawl Diff:1
parse: CollectionManager.java: src.plugin.subcollection.src.java.org.apache.nutch.collection Diff:10
run: LinkDb.java: src.java.org.apache.nutch.crawl Diff:31
setRetriesSinceFetch: CrawlDatum.java: src.java.org.apache.nutch.crawl Diff:1
getDescriptor: Extension.java: src.java.org.apache.nutch.plugin Diff:2
getInlinks: LinkDbReader.java: src.java.org.apache.nutch.crawl Diff:1
main: IndexingFiltersChecker.java: src.java.org.apache.nutch.indexer Diff:10
getRetriesSinceFetch: CrawlDatum.java: src.java.org.apache.nutch.crawl Diff:1
close: IndexerMapReduce.java: src.java.org.apache.nutch.indexer Diff:31
addAttribute: Extension.java: src.java.org.apache.nutch.plugin Diff:2
parseByExtensionId: ParseUtil.java: src.java.org.apache.nutch.parse Diff:22
setClazz: Extension.java: src.java.org.apache.nutch.plugin Diff:2
main: ParserChecker.java: src.java.org.apache.nutch.parse Diff:12
reduce: SolrDeleteDuplicates.java: src.java.org.apache.nutch.indexer.solr Diff:8
close: CrawlDbFilter.java: src.java.org.apache.nutch.crawl Diff:1
setId: Extension.java: src.java.org.apache.nutch.plugin Diff:2
close: OldFetcher.java: src.java.org.apache.nutch.fetcher Diff:1
isStoringContent: Fetcher.java: src.java.org.apache.nutch.fetcher Diff:3
getExtensions: PluginDescriptor.java: src.java.org.apache.nutch.plugin Diff:1
createMergeJob: CrawlDbMerger.java: src.java.org.apache.nutch.crawl Diff:4
getDomainName: URLUtil.java: src.java.org.apache.nutch.util Diff:2
getPluginDescriptor: PluginRepository.java: src.java.org.apache.nutch.plugin Diff:22
lessThan: CrawlDbReducer.java: src.java.org.apache.nutch.crawl Diff:2
setBlackList: Subcollection.java: src.plugin.subcollection.src.java.org.apache.nutch.collection Diff:5
output: ArcSegmentCreator.java: src.java.org.apache.nutch.tools.arc Diff:47
handle: FakeHandler.java: src.java.org.apache.nutch.tools.proxy Diff:13
toString: ParseStatus.java: src.java.org.apache.nutch.parse Diff:1
parseMapping: SolrMappingReader.java: src.java.org.apache.nutch.indexer.solr Diff:21
setConf: URLMetaIndexingFilter.java: src.plugin.urlmeta.src.java.org.apache.nutch.indexer.urlmeta Diff:3
reduce: LinkDbMerger.java: src.java.org.apache.nutch.crawl Diff:9
getPluginList: ParsePluginList.java: src.java.org.apache.nutch.parse Diff:1
dedup: SolrDeleteDuplicates.java: src.java.org.apache.nutch.indexer.solr Diff:7
run: WebGraph.java: src.java.org.apache.nutch.scoring.webgraph Diff:24
getExtensions: ParserFactory.java: src.java.org.apache.nutch.parse Diff:25
runInitializer: LinkRank.java: src.java.org.apache.nutch.scoring.webgraph Diff:4
getDependencyLibs: PluginDescriptor.java: src.java.org.apache.nutch.plugin Diff:5
get: PluginRepository.java: src.java.org.apache.nutch.plugin Diff:2
close: URLPartitioner.java: src.java.org.apache.nutch.crawl Diff:4
initialize: Subcollection.java: src.plugin.subcollection.src.java.org.apache.nutch.collection Diff:4
handle: NotFoundHandler.java: src.java.org.apache.nutch.tools.proxy Diff:4
createMergeJob: LinkDbMerger.java: src.java.org.apache.nutch.crawl Diff:13
getPluginCheckedDependencies: PluginRepository.java: src.java.org.apache.nutch.plugin Diff:13
checkAll: URLFilterChecker.java: src.java.org.apache.nutch.net Diff:9
merge: LinkDbMerger.java: src.java.org.apache.nutch.crawl Diff:12
run: IndexingFiltersChecker.java: src.java.org.apache.nutch.indexer Diff:10
configure: DomainStatistics.java: src.java.org.apache.nutch.util.domain Diff:3
readFields: GenericWritableConfigurable.java: src.java.org.apache.nutch.util Diff:1
elapsedTime: TimingUtil.java: src.java.org.apache.nutch.util Diff:4
getParsers: ParserFactory.java: src.java.org.apache.nutch.parse Diff:13
getInstance: SolrMappingReader.java: src.java.org.apache.nutch.indexer.solr Diff:5
getURLNormalizers: URLNormalizers.java: src.java.org.apache.nutch.net Diff:13
resolveUrls: ResolveUrls.java: src.java.org.apache.nutch.tools Diff:6
getNoIndex: HTMLMetaTags.java: src.java.org.apache.nutch.parse Diff:2
getDependencies: PluginDescriptor.java: src.java.org.apache.nutch.plugin Diff:5
main: ParseText.java: src.java.org.apache.nutch.parse Diff:1
findExtension: ProtocolFactory.java: src.java.org.apache.nutch.protocol Diff:6
getPluginFolder: PluginManifestParser.java: src.java.org.apache.nutch.plugin Diff:7
runCounter: LinkRank.java: src.java.org.apache.nutch.scoring.webgraph Diff:3
getMimeType: MimeUtil.java: src.java.org.apache.nutch.util Diff:1
getRecordReader: ArcInputFormat.java: src.java.org.apache.nutch.tools.arc Diff:2
getNutchIndexWriters: NutchIndexWriterFactory.java: src.java.org.apache.nutch.indexer Diff:1
reduce: CrawlDBScanner.java: src.java.org.apache.nutch.tools Diff:8
addDomainSuffix: DomainSuffixes.java: src.java.org.apache.nutch.util.domain Diff:2
main: URLFilterChecker.java: src.java.org.apache.nutch.net Diff:9
generateSegmentName: Generator.java: src.java.org.apache.nutch.crawl Diff:28
reduce: SegmentMerger.java: src.java.org.apache.nutch.segment Diff:51
addClue: EncodingDetector.java: src.java.org.apache.nutch.util Diff:4
configure: LinkDbFilter.java: src.java.org.apache.nutch.crawl Diff:1
getAliases: ParsePluginList.java: src.java.org.apache.nutch.parse Diff:1
clone: CrawlDatum.java: src.java.org.apache.nutch.crawl Diff:5
getConf: FeedParser.java: src.plugin.feed.src.java.org.apache.nutch.parse.feed Diff:12
getMapRecords: SegmentReader.java: src.java.org.apache.nutch.segment Diff:32
hashCode: CrawlDatum.java: src.java.org.apache.nutch.crawl Diff:5
main: URLNormalizerChecker.java: src.java.org.apache.nutch.net Diff:10
getConf: TLDIndexingFilter.java: src.plugin.tld.src.java.org.apache.nutch.indexer.tld Diff:4
map: IndexerMapReduce.java: src.java.org.apache.nutch.indexer Diff:3
main: DmozParser.java: src.java.org.apache.nutch.tools Diff:17
replace: FSUtils.java: src.java.org.apache.nutch.util Diff:1
map: SegmentMerger.java: src.java.org.apache.nutch.segment Diff:5
main: SegmentReader.java: src.java.org.apache.nutch.segment Diff:68
setFetchSchedule: DefaultFetchSchedule.java: src.java.org.apache.nutch.crawl Diff:5
setMessage: ParseStatus.java: src.java.org.apache.nutch.parse Diff:1
filter: FeedIndexingFilter.java: src.plugin.feed.src.java.org.apache.nutch.indexer.feed Diff:12
createSegments: ArcSegmentCreator.java: src.java.org.apache.nutch.tools.arc Diff:56
setNoFollow: HTMLMetaTags.java: src.java.org.apache.nutch.parse Diff:2
readFields: CrawlDatum.java: src.java.org.apache.nutch.crawl Diff:2
analyze: LinkRank.java: src.java.org.apache.nutch.scoring.webgraph Diff:11
generatorSortValue: TLDScoringFilter.java: src.plugin.tld.src.java.org.apache.nutch.scoring.tld Diff:5
setWeight: NutchDocument.java: src.java.org.apache.nutch.indexer Diff:8
runAnalysis: LinkRank.java: src.java.org.apache.nutch.scoring.webgraph Diff:8
parseXML: PluginManifestParser.java: src.java.org.apache.nutch.plugin Diff:6
configure: CrawlDbFilter.java: src.java.org.apache.nutch.crawl Diff:1
add: NutchDocument.java: src.java.org.apache.nutch.indexer Diff:1
addExtension: ExtensionPoint.java: src.java.org.apache.nutch.plugin Diff:1
setConf: TLDScoringFilter.java: src.plugin.tld.src.java.org.apache.nutch.scoring.tld Diff:5
getAll: CollectionManager.java: src.plugin.subcollection.src.java.org.apache.nutch.collection Diff:25
getPluginCheckedDependencies: PluginRepository.java: src.java.org.apache.nutch.plugin Diff:14
main: Loops.java: src.java.org.apache.nutch.scoring.webgraph Diff:6
update: CrawlDb.java: src.java.org.apache.nutch.crawl Diff:5
run: Injector.java: src.java.org.apache.nutch.crawl Diff:10
getConf: CCParseFilter.java: src.plugin.creativecommons.src.java.org.creativecommons.nutch Diff:12
getUrlContent: LanguageIdentifier.java: src.plugin.languageidentifier.src.java.org.apache.nutch.analysis.lang Diff:15
reportStatus: OldFetcher.java: src.java.org.apache.nutch.fetcher Diff:1
setBaseHref: HTMLMetaTags.java: src.java.org.apache.nutch.parse Diff:2
filter: PluginRepository.java: src.java.org.apache.nutch.plugin Diff:42
getCopyMap: SolrMappingReader.java: src.java.org.apache.nutch.indexer.solr Diff:21
dumpNodes: NodeDumper.java: src.java.org.apache.nutch.scoring.webgraph Diff:2
setConf: FeedIndexingFilter.java: src.plugin.feed.src.java.org.apache.nutch.indexer.feed Diff:12
delete: SolrClean.java: src.java.org.apache.nutch.indexer.solr Diff:1
main: TextProfileSignature.java: src.java.org.apache.nutch.crawl Diff:34
invert: LinkDb.java: src.java.org.apache.nutch.crawl Diff:20
toString: HTMLMetaTags.java: src.java.org.apache.nutch.parse Diff:16
getExtenstionPoints: PluginDescriptor.java: src.java.org.apache.nutch.plugin Diff:4
contains: ProtocolFactory.java: src.java.org.apache.nutch.protocol Diff:7
charToNibble: StringUtil.java: src.java.org.apache.nutch.util Diff:7
getSimilarity: NGramProfile.java: src.plugin.languageidentifier.src.java.org.apache.nutch.analysis.lang Diff:36
hasNext: NodeWalker.java: src.java.org.apache.nutch.util Diff:2
reset: HTMLMetaTags.java: src.java.org.apache.nutch.parse Diff:2
configure: Fetcher.java: src.java.org.apache.nutch.fetcher Diff:3
list: SegmentReader.java: src.java.org.apache.nutch.segment Diff:55
indexerScore: URLMetaScoringFilter.java: src.plugin.urlmeta.src.java.org.apache.nutch.scoring.urlmeta Diff:16
run: LinkDbMerger.java: src.java.org.apache.nutch.crawl Diff:16
setNoCache: HTMLMetaTags.java: src.java.org.apache.nutch.parse Diff:2
distributeScoreToOutlinks: TLDScoringFilter.java: src.plugin.tld.src.java.org.apache.nutch.scoring.tld Diff:5
createParseResult: ParseResult.java: src.java.org.apache.nutch.parse Diff:1
close: CrawlDbReducer.java: src.java.org.apache.nutch.crawl Diff:1
setPluginId: PluginDescriptor.java: src.java.org.apache.nutch.plugin Diff:2
run: ParseSegment.java: src.java.org.apache.nutch.parse Diff:33
configure: CrawlDbReducer.java: src.java.org.apache.nutch.crawl Diff:1
main: NodeReader.java: src.java.org.apache.nutch.scoring.webgraph Diff:12
addUrlFeatures: CCIndexingFilter.java: src.plugin.creativecommons.src.java.org.creativecommons.nutch Diff:1
compareTo: CrawlDatum.java: src.java.org.apache.nutch.crawl Diff:2
installExtensions: PluginRepository.java: src.java.org.apache.nutch.plugin Diff:8
main: Injector.java: src.java.org.apache.nutch.crawl Diff:11
equals: CrawlDatum.java: src.java.org.apache.nutch.crawl Diff:6
getFetchTime: CrawlDatum.java: src.java.org.apache.nutch.crawl Diff:1
findExtensions: URLNormalizers.java: src.java.org.apache.nutch.net Diff:29
main: LinkDbReader.java: src.java.org.apache.nutch.crawl Diff:2
getPluginInstance: PluginRepository.java: src.java.org.apache.nutch.plugin Diff:28
readFields: ParseData.java: src.java.org.apache.nutch.parse Diff:2
addDependency: PluginDescriptor.java: src.java.org.apache.nutch.plugin Diff:6
runAnalysis: LinkRank.java: src.java.org.apache.nutch.scoring.webgraph Diff:8
add: NGramProfile.java: src.plugin.languageidentifier.src.java.org.apache.nutch.analysis.lang Diff:6
merge: CrawlDbMerger.java: src.java.org.apache.nutch.crawl Diff:3
run: Fetcher.java: src.java.org.apache.nutch.fetcher Diff:23
parsePluginFolder: PluginManifestParser.java: src.java.org.apache.nutch.plugin Diff:4
indexerScore: TLDScoringFilter.java: src.plugin.tld.src.java.org.apache.nutch.scoring.tld Diff:5
setMajorCode: ParseStatus.java: src.java.org.apache.nutch.parse Diff:1
configure: SolrDeleteDuplicates.java: src.java.org.apache.nutch.indexer.solr Diff:1
setPageRetrySchedule: AbstractFetchSchedule.java: src.java.org.apache.nutch.crawl Diff:11
getExtensionInstance: Extension.java: src.java.org.apache.nutch.plugin Diff:2
getRecordWriter: FetcherOutputFormat.java: src.java.org.apache.nutch.fetcher Diff:10
filter: HTMLLanguageParser.java: src.plugin.languageidentifier.src.java.org.apache.nutch.analysis.lang Diff:9
getProtocol: ProtocolFactory.java: src.java.org.apache.nutch.protocol Diff:5
setRefreshTime: HTMLMetaTags.java: src.java.org.apache.nutch.parse Diff:2
getGeneralTags: HTMLMetaTags.java: src.java.org.apache.nutch.parse Diff:2
inflateBestEffort: DeflateUtils.java: src.java.org.apache.nutch.util Diff:4
installExtensionPoints: PluginRepository.java: src.java.org.apache.nutch.plugin Diff:5
main: CrawlDb.java: src.java.org.apache.nutch.crawl Diff:10
get: DomainSuffixes.java: src.java.org.apache.nutch.util.domain Diff:2
run: LinkDbReader.java: src.java.org.apache.nutch.crawl Diff:5
clearClues: EncodingDetector.java: src.java.org.apache.nutch.util Diff:4
inflate: DeflateUtils.java: src.java.org.apache.nutch.util Diff:7
getUniqueKey: SolrMappingReader.java: src.java.org.apache.nutch.indexer.solr Diff:21
getNoFollow: HTMLMetaTags.java: src.java.org.apache.nutch.parse Diff:2
getFieldValue: NutchDocument.java: src.java.org.apache.nutch.indexer Diff:6
getExtension: ParserFactory.java: src.java.org.apache.nutch.parse Diff:45
getAttribute: Extension.java: src.java.org.apache.nutch.plugin Diff:1
usage: SegmentReader.java: src.java.org.apache.nutch.segment Diff:68
write: CrawlDatum.java: src.java.org.apache.nutch.crawl Diff:1
getVersion: ParseData.java: src.java.org.apache.nutch.parse Diff:2
main: ParseSegment.java: src.java.org.apache.nutch.parse Diff:34
getRefreshTime: HTMLMetaTags.java: src.java.org.apache.nutch.parse Diff:2
reduce: IndexerMapReduce.java: src.java.org.apache.nutch.indexer Diff:31
getPluginDescriptors: PluginRepository.java: src.java.org.apache.nutch.plugin Diff:20
main: CrawlDBScanner.java: src.java.org.apache.nutch.tools Diff:13
main: SolrDeleteDuplicates.java: src.java.org.apache.nutch.indexer.solr Diff:8
main: LoopReader.java: src.java.org.apache.nutch.scoring.webgraph Diff:8
map: LinkDb.java: src.java.org.apache.nutch.crawl Diff:9
getRecordWriter: ParseOutputFormat.java: src.java.org.apache.nutch.parse Diff:67
main: CrawlDbMerger.java: src.java.org.apache.nutch.crawl Diff:4
setArgs: ParseStatus.java: src.java.org.apache.nutch.parse Diff:1
unzipBestEffort: GZIPUtils.java: src.java.org.apache.nutch.util Diff:3
processDumpJob: LinkDbReader.java: src.java.org.apache.nutch.crawl Diff:2
getCollectionManager: CollectionManager.java: src.plugin.subcollection.src.java.org.apache.nutch.collection Diff:13
getRecordReader: ContentAsTextInputFormat.java: src.java.org.apache.nutch.segment Diff:2
passScoreBeforeParsing: URLMetaScoringFilter.java: src.plugin.urlmeta.src.java.org.apache.nutch.scoring.urlmeta Diff:11
reportStatus: OldFetcher.java: src.java.org.apache.nutch.fetcher Diff:1
setRefreshHref: HTMLMetaTags.java: src.java.org.apache.nutch.parse Diff:2
create: NutchConfiguration.java: src.java.org.apache.nutch.util Diff:1
getFetchInterval: CrawlDatum.java: src.java.org.apache.nutch.crawl Diff:1
getExtensions: URLNormalizers.java: src.java.org.apache.nutch.net Diff:16
getAnchors: Inlinks.java: src.java.org.apache.nutch.crawl Diff:1
configure: LinkDbMerger.java: src.java.org.apache.nutch.crawl Diff:9
iterator: NutchDocument.java: src.java.org.apache.nutch.indexer Diff:8
setConf: CCParseFilter.java: src.plugin.creativecommons.src.java.org.creativecommons.nutch Diff:12
getSubColection: CollectionManager.java: src.plugin.subcollection.src.java.org.apache.nutch.collection Diff:14
map: DomainStatistics.java: src.java.org.apache.nutch.util.domain Diff:11
fetch: Fetcher.java: src.java.org.apache.nutch.fetcher Diff:19
getHttpEquivTags: HTMLMetaTags.java: src.java.org.apache.nutch.parse Diff:2
updateDbScore: URLMetaScoringFilter.java: src.plugin.urlmeta.src.java.org.apache.nutch.scoring.urlmeta Diff:16
checkString: FeedParser.java: src.plugin.feed.src.java.org.apache.nutch.parse.feed Diff:55
getSignature: CrawlDatum.java: src.java.org.apache.nutch.crawl Diff:1
getFieldNames: NutchDocument.java: src.java.org.apache.nutch.indexer Diff:9
run: OldFetcher.java: src.java.org.apache.nutch.fetcher Diff:12
addExtension: PluginDescriptor.java: src.java.org.apache.nutch.plugin Diff:2
generate: Generator.java: src.java.org.apache.nutch.crawl Diff:28
normalize: SpellCheckedMetadata.java: src.java.org.apache.nutch.metadata Diff:2
scan: CrawlDBScanner.java: src.java.org.apache.nutch.tools Diff:13
getOutlinks: OutlinkExtractor.java: src.java.org.apache.nutch.parse Diff:2
addSubCollectionField: SubcollectionIndexingFilter.java: src.plugin.subcollection.src.java.org.apache.nutch.indexer.subcollection Diff:4
isDomainSuffix: DomainSuffixes.java: src.java.org.apache.nutch.util.domain Diff:3
setNoIndex: HTMLMetaTags.java: src.java.org.apache.nutch.parse Diff:2
main: ArcSegmentCreator.java: src.java.org.apache.nutch.tools.arc Diff:56
autoDetectClues: EncodingDetector.java: src.java.org.apache.nutch.util Diff:4
reduce: SegmentReader.java: src.java.org.apache.nutch.segment Diff:5
makeIOException: SolrWriter.java: src.java.org.apache.nutch.indexer.solr Diff:18
close: LinkDbFilter.java: src.java.org.apache.nutch.crawl Diff:1
findExtensions: ParserFactory.java: src.java.org.apache.nutch.parse Diff:24
invert: LinkDb.java: src.java.org.apache.nutch.crawl Diff:11
getFetchSchedule: FetchScheduleFactory.java: src.java.org.apache.nutch.crawl Diff:7
main: ScoreUpdater.java: src.java.org.apache.nutch.scoring.webgraph Diff:14
run: SolrIndexer.java: src.java.org.apache.nutch.indexer.solr Diff:14
stripNonCharCodepoints: SolrUtils.java: src.java.org.apache.nutch.indexer.solr Diff:5
calculate: MD5Signature.java: src.java.org.apache.nutch.crawl Diff:2
main: Fetcher.java: src.java.org.apache.nutch.fetcher Diff:19
map: ArcSegmentCreator.java: src.java.org.apache.nutch.tools.arc Diff:54
getKeyMap: SolrMappingReader.java: src.java.org.apache.nutch.indexer.solr Diff:21
parseLibraries: PluginManifestParser.java: src.java.org.apache.nutch.plugin Diff:13
closeReaders: FSUtils.java: src.java.org.apache.nutch.util Diff:2
getClassLoader: PluginDescriptor.java: src.java.org.apache.nutch.plugin Diff:6
handle: SegmentHandler.java: src.java.org.apache.nutch.tools.proxy Diff:28
setFetchTime: CrawlDatum.java: src.java.org.apache.nutch.crawl Diff:1
getRefresh: HTMLMetaTags.java: src.java.org.apache.nutch.parse Diff:2
run: OldFetcher.java: src.java.org.apache.nutch.fetcher Diff:4
getConf: DomainStatistics.java: src.java.org.apache.nutch.util.domain Diff:3
getUUID: NutchConfiguration.java: src.java.org.apache.nutch.util Diff:3
addExtensionPoint: PluginDescriptor.java: src.java.org.apache.nutch.plugin Diff:3
main: StringUtil.java: src.java.org.apache.nutch.util Diff:9
add: NGramProfile.java: src.plugin.languageidentifier.src.java.org.apache.nutch.analysis.lang Diff:1
addNutchResources: NutchConfiguration.java: src.java.org.apache.nutch.util Diff:2
reportStatus: Fetcher.java: src.java.org.apache.nutch.fetcher Diff:3
setSignature: CrawlDatum.java: src.java.org.apache.nutch.crawl Diff:1
merge: SegmentMerger.java: src.java.org.apache.nutch.segment Diff:62
configure: OldFetcher.java: src.java.org.apache.nutch.fetcher Diff:1
addFields: FeedParser.java: src.plugin.feed.src.java.org.apache.nutch.parse.feed Diff:51
doFilter: LogDebugHandler.java: src.java.org.apache.nutch.tools.proxy Diff:1
setScore: CrawlDatum.java: src.java.org.apache.nutch.crawl Diff:1
normalize: URLNormalizers.java: src.java.org.apache.nutch.net Diff:29
toString: CrawlDatum.java: src.java.org.apache.nutch.crawl Diff:5
getSorted: NGramProfile.java: src.plugin.languageidentifier.src.java.org.apache.nutch.analysis.lang Diff:18
match: ParserFactory.java: src.java.org.apache.nutch.parse Diff:44
run: SolrClean.java: src.java.org.apache.nutch.indexer.solr Diff:1
init: CollectionManager.java: src.plugin.subcollection.src.java.org.apache.nutch.collection Diff:6
main: LinkDbMerger.java: src.java.org.apache.nutch.crawl Diff:13
addFeature: CCIndexingFilter.java: src.plugin.creativecommons.src.java.org.creativecommons.nutch Diff:2
getId: Extension.java: src.java.org.apache.nutch.plugin Diff:1
getOutlinksJakartaRegexpImpl: OutlinkExtractor.java: src.java.org.apache.nutch.parse Diff:2
main: Generator.java: src.java.org.apache.nutch.crawl Diff:28
createJob: CrawlDb.java: src.java.org.apache.nutch.crawl Diff:7
initMRJob: IndexerMapReduce.java: src.java.org.apache.nutch.indexer Diff:31
init: LinkDbReader.java: src.java.org.apache.nutch.crawl Diff:2
createJob: LinkDb.java: src.java.org.apache.nutch.crawl Diff:22
isParsing: Fetcher.java: src.java.org.apache.nutch.fetcher Diff:3
runAnalysis: LinkRank.java: src.java.org.apache.nutch.scoring.webgraph Diff:8
addNotExportedLibRelative: PluginDescriptor.java: src.java.org.apache.nutch.plugin Diff:6
main: LinkDb.java: src.java.org.apache.nutch.crawl Diff:25
getConf: CCIndexingFilter.java: src.plugin.creativecommons.src.java.org.creativecommons.nutch Diff:2
setFetchSchedule: AdaptiveFetchSchedule.java: src.java.org.apache.nutch.crawl Diff:4
getMeta: MetaWrapper.java: src.java.org.apache.nutch.metadata Diff:3
getClazz: Extension.java: src.java.org.apache.nutch.plugin Diff:1
close: ParseSegment.java: src.java.org.apache.nutch.parse Diff:1
createSeeds: Benchmark.java: src.java.org.apache.nutch.tools Diff:3
setPluginList: ParsePluginList.java: src.java.org.apache.nutch.parse Diff:2
close: SolrWriter.java: src.java.org.apache.nutch.indexer.solr Diff:18
run: NodeDumper.java: src.java.org.apache.nutch.scoring.webgraph Diff:9
install: CrawlDb.java: src.java.org.apache.nutch.crawl Diff:10
addClassToConf: NutchIndexWriterFactory.java: src.java.org.apache.nutch.indexer Diff:5
filter: CCIndexingFilter.java: src.plugin.creativecommons.src.java.org.creativecommons.nutch Diff:2
resolveUrls: ResolveUrls.java: src.java.org.apache.nutch.tools Diff:6
forceRefetch: AbstractFetchSchedule.java: src.java.org.apache.nutch.crawl Diff:25
injectedScore: URLMetaScoringFilter.java: src.plugin.urlmeta.src.java.org.apache.nutch.scoring.urlmeta Diff:16
main: SolrClean.java: src.java.org.apache.nutch.indexer.solr Diff:1
filter: TLDIndexingFilter.java: src.plugin.tld.src.java.org.apache.nutch.indexer.tld Diff:4
open: SolrWriter.java: src.java.org.apache.nutch.indexer.solr Diff:2
guessEncoding: EncodingDetector.java: src.java.org.apache.nutch.util Diff:3
getStatusName: CrawlDatum.java: src.java.org.apache.nutch.crawl Diff:1
setConf: URLMetaScoringFilter.java: src.plugin.urlmeta.src.java.org.apache.nutch.scoring.urlmeta Diff:16
close: SolrDeleteDuplicates.java: src.java.org.apache.nutch.indexer.solr Diff:1
parsePlugin: PluginManifestParser.java: src.java.org.apache.nutch.plugin Diff:8
rightPad: StringUtil.java: src.java.org.apache.nutch.util Diff:2
parseCharacterEncoding: EncodingDetector.java: src.java.org.apache.nutch.util Diff:21
main: PluginRepository.java: src.java.org.apache.nutch.plugin Diff:47
getField: NutchDocument.java: src.java.org.apache.nutch.indexer Diff:7
getConf: HTMLLanguageParser.java: src.plugin.languageidentifier.src.java.org.apache.nutch.analysis.lang Diff:12
run: DomainStatistics.java: src.java.org.apache.nutch.util.domain Diff:3
setRefresh: HTMLMetaTags.java: src.java.org.apache.nutch.parse Diff:2
benchmark: Benchmark.java: src.java.org.apache.nutch.tools Diff:35
dedup: SolrDeleteDuplicates.java: src.java.org.apache.nutch.indexer.solr Diff:8
runParser: ParseUtil.java: src.java.org.apache.nutch.parse Diff:24
getRefreshHref: HTMLMetaTags.java: src.java.org.apache.nutch.parse Diff:2
write: MetaWrapper.java: src.java.org.apache.nutch.metadata Diff:2
generatorSortValue: URLMetaScoringFilter.java: src.plugin.urlmeta.src.java.org.apache.nutch.scoring.urlmeta Diff:16
getParse: FeedParser.java: src.plugin.feed.src.java.org.apache.nutch.parse.feed Diff:11
close: LinkRank.java: src.java.org.apache.nutch.scoring.webgraph Diff:8
getTargetPoint: Extension.java: src.java.org.apache.nutch.plugin Diff:2
toHexString: StringUtil.java: src.java.org.apache.nutch.util Diff:9
hasCopy: SolrMappingReader.java: src.java.org.apache.nutch.indexer.solr Diff:23
getExtension: ParserFactory.java: src.java.org.apache.nutch.parse Diff:43
run: LinkDumper.java: src.java.org.apache.nutch.scoring.webgraph Diff:7
shouldFetch: AbstractFetchSchedule.java: src.java.org.apache.nutch.crawl Diff:18
isSuccess: ParseResult.java: src.java.org.apache.nutch.parse Diff:1
get: SegmentReader.java: src.java.org.apache.nutch.segment Diff:29
getDomainName: URLUtil.java: src.java.org.apache.nutch.util Diff:1
save: CollectionManager.java: src.plugin.subcollection.src.java.org.apache.nutch.collection Diff:35
initialScore: TLDScoringFilter.java: src.plugin.tld.src.java.org.apache.nutch.scoring.tld Diff:5
isStoringContent: OldFetcher.java: src.java.org.apache.nutch.fetcher Diff:1
getLanguageFromMetadata: HTMLLanguageParser.java: src.plugin.languageidentifier.src.java.org.apache.nutch.analysis.lang Diff:12
setMetaData: CrawlDatum.java: src.java.org.apache.nutch.crawl Diff:1
setConf: HTMLLanguageParser.java: src.plugin.languageidentifier.src.java.org.apache.nutch.analysis.lang Diff:12
initialScore: URLMetaScoringFilter.java: src.plugin.urlmeta.src.java.org.apache.nutch.scoring.urlmeta Diff:16
setFetchSchedule: AbstractFetchSchedule.java: src.java.org.apache.nutch.crawl Diff:4
parse: ParseSegment.java: src.java.org.apache.nutch.parse Diff:34
install: LinkDb.java: src.java.org.apache.nutch.crawl Diff:25
parseList: Subcollection.java: src.plugin.subcollection.src.java.org.apache.nutch.collection Diff:6
filter: LanguageIndexingFilter.java: src.plugin.languageidentifier.src.java.org.apache.nutch.analysis.lang Diff:14
createSubCollection: CollectionManager.java: src.plugin.subcollection.src.java.org.apache.nutch.collection Diff:17
getInstance: SolrMappingReader.java: src.java.org.apache.nutch.indexer.solr Diff:5
forName: MimeUtil.java: src.java.org.apache.nutch.util Diff:2
mapCopyKey: SolrMappingReader.java: src.java.org.apache.nutch.indexer.solr Diff:27
run: CrawlDb.java: src.java.org.apache.nutch.crawl Diff:21
runInverter: LinkRank.java: src.java.org.apache.nutch.scoring.webgraph Diff:5
passScoreAfterParsing: TLDScoringFilter.java: src.plugin.tld.src.java.org.apache.nutch.scoring.tld Diff:5
injectedScore: TLDScoringFilter.java: src.plugin.tld.src.java.org.apache.nutch.scoring.tld Diff:5
main: DomainStatistics.java: src.java.org.apache.nutch.util.domain Diff:14
run: FreeGenerator.java: src.java.org.apache.nutch.tools Diff:5
readFields: FetcherOutput.java: src.java.org.apache.nutch.fetcher Diff:3
zip: GZIPUtils.java: src.java.org.apache.nutch.util Diff:11
autoResolveContentType: MimeUtil.java: src.java.org.apache.nutch.util Diff:3
setStatus: CrawlDatum.java: src.java.org.apache.nutch.crawl Diff:1
parseExtension: PluginManifestParser.java: src.java.org.apache.nutch.plugin Diff:25
displayStatus: PluginRepository.java: src.java.org.apache.nutch.plugin Diff:36
calculateLastFetchTime: AbstractFetchSchedule.java: src.java.org.apache.nutch.crawl Diff:13
initializeSchedule: AbstractFetchSchedule.java: src.java.org.apache.nutch.crawl Diff:3
run: LinkRank.java: src.java.org.apache.nutch.scoring.webgraph Diff:13
setMeta: MetaWrapper.java: src.java.org.apache.nutch.metadata Diff:2
matchExtensions: ParserFactory.java: src.java.org.apache.nutch.parse Diff:37
add: NGramProfile.java: src.plugin.languageidentifier.src.java.org.apache.nutch.analysis.lang Diff:3
leftPad: StringUtil.java: src.java.org.apache.nutch.util Diff:5
main: ParseData.java: src.java.org.apache.nutch.parse Diff:2
set: CrawlDatum.java: src.java.org.apache.nutch.crawl Diff:1
