Skip to content

Commit

Permalink
Fix duplicate colon in warcinfo header
Browse files (browse the repository at this point in the history)
  • Loading branch information
sebastian-nagel committed Oct 29, 2021
1 parent 2c62b3c commit fb1c64d
Showing 1 changed file with 1 addition and 1 deletion.
Original file line number | Diff line number | Diff line change
Expand Up @@ -122,7 +122,7 @@ protected WARCHdfsBolt getWarcBolt(String filePrefix) {
fileNameFormat.withPrefix(filePrefix);

Map<String, String> fields = new LinkedHashMap<>();
- fields.put("software:", "StormCrawler 1.17 https://stormcrawler.net/");
+ fields.put("software", "StormCrawler 1.17 https://stormcrawler.net/");
fields.put("description", "News crawl for Common Crawl");
String userAgent = AbstractHttpProtocol.getAgentString(getConf());
fields.put("http-header-user-agent", userAgent);
Expand Down

0 comments on commit fb1c64d

Please sign in to comment.