diff --git a/src/main/java/org/commoncrawl/stormcrawler/news/CrawlTopology.java b/src/main/java/org/commoncrawl/stormcrawler/news/CrawlTopology.java index 6897c83..153c25a 100644 --- a/src/main/java/org/commoncrawl/stormcrawler/news/CrawlTopology.java +++ b/src/main/java/org/commoncrawl/stormcrawler/news/CrawlTopology.java @@ -122,7 +122,7 @@ protected WARCHdfsBolt getWarcBolt(String filePrefix) { fileNameFormat.withPrefix(filePrefix); Map fields = new LinkedHashMap<>(); - fields.put("software:", "StormCrawler 1.17 https://stormcrawler.net/"); + fields.put("software", "StormCrawler 1.17 https://stormcrawler.net/"); fields.put("description", "News crawl for Common Crawl"); String userAgent = AbstractHttpProtocol.getAgentString(getConf()); fields.put("http-header-user-agent", userAgent);