/** * */ public KeyMakerUrlCanonicalizer() { this.surtForm = true; keyMaker = new WaybackURLKeyMaker(true); }
public String canonicalize(String url, boolean surt) throws UnsupportedEncodingException, URISyntaxException { if ((canonicalizer == null) || (url == null) || url.isEmpty()) { return url; } url = java.net.URLDecoder.decode(url, "UTF-8"); if (surt) { return url; } int slashIndex = url.indexOf('/'); // If true, assume this is already a SURT and skip if ((slashIndex > 0) && url.charAt(slashIndex - 1) == ')') { return url; } return canonicalizer.makeKey(url); }
WaybackURLKeyMaker keymaker = new WaybackURLKeyMaker(true); next = keymaker.makeKey(next); } catch (Exception e) { continue;
WaybackURLKeyMaker keymaker = new WaybackURLKeyMaker(true); next = keymaker.makeKey(next); } catch (Exception e) { continue;
/**
 * Creates a canonicalizer whose key maker is built with the given flag.
 *
 * @param surtForm stored in the {@code surtForm} field and passed through to
 *                 the {@code WaybackURLKeyMaker} constructor
 */
public KeyMakerUrlCanonicalizer(boolean surtForm) {
    this.keyMaker = new WaybackURLKeyMaker(surtForm);
    this.surtForm = surtForm;
}
WaybackURLKeyMaker keymaker = new WaybackURLKeyMaker(true); next = keymaker.makeKey(next); } catch (Exception e) { continue;
public String canonicalize(String url, boolean surt) throws UnsupportedEncodingException, URISyntaxException { if ((canonicalizer == null) || (url == null) || url.isEmpty()) { return url; } url = java.net.URLDecoder.decode(url, "UTF-8"); if (surt) { return url; } int slashIndex = url.indexOf('/'); // If true, assume this is already a SURT and skip if ((slashIndex > 0) && url.charAt(slashIndex - 1) == ')') { return url; } return canonicalizer.makeKey(url); }
// Replace key with whatever applyCustomRules returns for it
// (applyCustomRules is defined outside this view).
key = applyCustomRules(key);
/**
 * Creates a canonicalizer whose key maker is built with the given flag.
 *
 * @param surtForm stored in the {@code surtForm} field and passed through to
 *                 the {@code WaybackURLKeyMaker} constructor
 */
public KeyMakerUrlCanonicalizer(boolean surtForm) {
    this.keyMaker = new WaybackURLKeyMaker(surtForm);
    this.surtForm = surtForm;
}
/**
 * Creates an output that writes to the given writer, delegating to the
 * two-argument constructor with a default-constructed {@code WaybackURLKeyMaker}.
 *
 * @param out the writer handed on to the two-argument constructor
 */
public RealCDXExtractorOutput(PrintWriter out) {
    this(out, new WaybackURLKeyMaker());
}
// SimpleJSONPathSpec gzFooterLengthSpec = new SimpleJSONPathSpec("Container.Gzip-Metadata.Footer-Length");
/** * */ public KeyMakerUrlCanonicalizer() { this.surtForm = true; keyMaker = new WaybackURLKeyMaker(true); }
/**
 * Creates an output that writes to the given writer, delegating to the
 * two-argument constructor with a default-constructed {@code WaybackURLKeyMaker}.
 *
 * @param out the writer handed on to the two-argument constructor
 */
public RealCDXExtractorOutput(PrintWriter out) {
    this(out, new WaybackURLKeyMaker());
}
// SimpleJSONPathSpec gzFooterLengthSpec = new SimpleJSONPathSpec("Container.Gzip-Metadata.Footer-Length");
/**
 * Creates an output that writes to the given writer, delegating to the
 * two-argument constructor with a default-constructed {@code WaybackURLKeyMaker}.
 *
 * @param out the writer handed on to the two-argument constructor
 */
public RealCDXExtractorOutput(PrintWriter out) {
    this(out, new WaybackURLKeyMaker());
}
// SimpleJSONPathSpec gzFooterLengthSpec = new SimpleJSONPathSpec("Container.Gzip-Metadata.Footer-Length");
/**
 * Completes initialization once the configurable properties are in place.
 *
 * <p>Falls back to an {@code AllAccessAuth} when no {@code authChecker} was
 * supplied, then builds the {@code canonicalizer} and the
 * {@code urlSurtRangeComputer}, both from the current {@code surtMode}.
 *
 * @throws Exception declared by the overridden method
 */
@Override
public void afterPropertiesSet() throws Exception {
    // Default auth checker when none was configured.
    if (authChecker == null) {
        authChecker = new AllAccessAuth();
    }

    // Both helpers are built from the same surtMode value.
    canonicalizer = new WaybackURLKeyMaker(surtMode);
    urlSurtRangeComputer = new UrlSurtRangeComputer(surtMode);
}
/**
 * Completes initialization once the configurable properties are in place.
 *
 * <p>Falls back to an {@code AllAccessAuth} when no {@code authChecker} was
 * supplied, then builds the {@code canonicalizer} and the
 * {@code urlSurtRangeComputer}, both from the current {@code surtMode}.
 *
 * @throws Exception declared by the overridden method
 */
@Override
public void afterPropertiesSet() throws Exception {
    // Default auth checker when none was configured.
    if (authChecker == null) {
        authChecker = new AllAccessAuth();
    }

    // Both helpers are built from the same surtMode value.
    canonicalizer = new WaybackURLKeyMaker(surtMode);
    urlSurtRangeComputer = new UrlSurtRangeComputer(surtMode);
}
// Build the CDX output from the result of makePrintWriter(os) and a key maker
// constructed with false (presumably non-SURT keys; confirm against WaybackURLKeyMaker).
out = new RealCDXExtractorOutput(makePrintWriter(os), new WaybackURLKeyMaker(false));
// Build the CDX output from the result of makePrintWriter(os) and a key maker
// constructed with false (presumably non-SURT keys; confirm against WaybackURLKeyMaker).
out = new RealCDXExtractorOutput(makePrintWriter(os), new WaybackURLKeyMaker(false));
// Build the CDX output from the result of makePrintWriter(os) and a key maker
// constructed with false (presumably non-SURT keys; confirm against WaybackURLKeyMaker).
out = new RealCDXExtractorOutput(makePrintWriter(os), new WaybackURLKeyMaker(false));