/**
 * Wraps {@code input} in a {@link URILocalnameFilter} and passes
 * {@code maxLength} to its {@code setMaxLength} method before returning it.
 *
 * @param input the token stream to wrap
 * @return the newly created and configured filter
 */
@Override
public TokenStream create(final TokenStream input) {
  final URILocalnameFilter localnameFilter = new URILocalnameFilter(input);
  localnameFilter.setMaxLength(maxLength);
  return localnameFilter;
}
/**
 * Builds the filter on top of {@code input} and obtains, through
 * {@code addAttribute}, the node, position and position-increment
 * attributes stored in this filter's fields.
 *
 * @param input the token stream to wrap
 */
public PositionAttributeFilter(final TokenStream input) {
  super(input);
  // Registration order is kept as-is: node, position, position increment.
  nodeAtt = addAttribute(NodeAttribute.class);
  posAtt = addAttribute(PositionAttribute.class);
  posIncrAtt = addAttribute(PositionIncrementAttribute.class);
}
/** * Converts characters above ASCII to their ASCII equivalents. For example, * accents are removed from accented characters. * @param input The string to fold * @param length The number of characters in the input string */ public void foldToASCII(final char[] input, final int length) { // Worst-case length required: final int maxSizeNeeded = 4 * length; this.growBuffer(output, maxSizeNeeded); outputPos = foldToASCII(input, 0, output, 0, length); }
/**
 * Wraps {@code input} in a new {@link SirenPayloadFilter}.
 *
 * @param input the token stream to wrap
 * @return the newly created filter
 */
@Override
public TokenStream create(final TokenStream input) {
  final TokenStream payloadFilter = new SirenPayloadFilter(input);
  return payloadFilter;
}
/**
 * Wraps {@code input} in a new {@link PositionAttributeFilter}.
 *
 * @param input the token stream to wrap
 * @return the newly created filter
 */
@Override
public TokenStream create(final TokenStream input) {
  final TokenStream positionFilter = new PositionAttributeFilter(input);
  return positionFilter;
}
/**
 * Wraps {@code input} in a new {@link URINormalisationFilter}.
 *
 * @param input the token stream to wrap
 * @return the newly created filter
 */
@Override
public TokenStream create(final TokenStream input) {
  final TokenStream normalisationFilter = new URINormalisationFilter(input);
  return normalisationFilter;
}
/**
 * Wraps {@code input} in a new {@link URIDecodingFilter}, passing
 * {@code DEFAULT_ENCODING} as the second constructor argument.
 *
 * @param input the token stream to wrap
 * @return the newly created filter
 */
@Override
public TokenStream create(final TokenStream input) {
  final TokenStream decodingFilter =
      new URIDecodingFilter(input, DEFAULT_ENCODING);
  return decodingFilter;
}
/**
 * Wraps {@code input} in a new {@link ASCIIFoldingExpansionFilter}.
 *
 * @param input the token stream to wrap
 * @return the newly created filter, exposed with its concrete type
 */
@Override
public ASCIIFoldingExpansionFilter create(final TokenStream input) {
  final ASCIIFoldingExpansionFilter foldingFilter =
      new ASCIIFoldingExpansionFilter(input);
  return foldingFilter;
}
/**
 * Wraps {@code input} in a new {@link MailtoFilter}.
 *
 * @param input the token stream to wrap
 * @return the newly created filter
 */
@Override
public TokenStream create(final TokenStream input) {
  final TokenStream mailtoFilter = new MailtoFilter(input);
  return mailtoFilter;
}
/**
 * Wraps {@code input} in a new {@link URITrailingSlashFilter}.
 *
 * @param input the token stream to wrap
 * @return the newly created filter
 */
@Override
public TokenStream create(final TokenStream input) {
  final TokenStream trailingSlashFilter = new URITrailingSlashFilter(input);
  return trailingSlashFilter;
}
/**
 * Tells whether {@code c} is a break point: either {@code isDelim(c)} or
 * {@code isUppercase(c)} holds.
 *
 * @param c the character (as an int) to test
 * @return {@code true} if {@code c} is a delimiter or is uppercase
 */
protected boolean isBreakPoint(final int c) {
  if (isDelim(c)) {
    return true;
  }
  // Only consulted when c is not a delimiter.
  return isUppercase(c);
}
/**
 * Reports whether {@code c} counts as a break point, i.e. whether
 * {@code isDelim} or, failing that, {@code isUppercase} accepts it.
 *
 * @param c the character (as an int) to test
 * @return {@code true} when either check succeeds
 */
protected boolean isBreakPoint(final int c) {
  final boolean delimiter = isDelim(c);
  // isUppercase is evaluated only if the delimiter check failed.
  return delimiter || isUppercase(c);
}
/**
 * Convenience overload: forwards to the six-argument
 * {@code assertURLDecodedTo} with {@code "UTF-8"} as the second argument
 * and {@code null} for the last two arguments.
 *
 * @param t the tokenizer handed to the six-argument overload
 * @param uri the URI string handed to the six-argument overload
 * @param expectedStems the expected stems handed to the six-argument overload
 * @throws IOException if the delegate throws it
 */
private void assertURLDecodedTo(final Tokenizer t,
                                final String uri,
                                final String[] expectedStems)
    throws IOException {
  final String utf8 = "UTF-8";
  assertURLDecodedTo(t, utf8, uri, expectedStems, null, null);
}
/**
 * Convenience overload: forwards to the four-argument
 * {@code assertURLDecodedTo}, passing {@code null} as the fourth argument.
 *
 * @param t the tokenizer handed to the four-argument overload
 * @param uri the URI string handed to the four-argument overload
 * @param expectedStems the expected stems handed to the four-argument overload
 * @throws IOException if the delegate throws it
 */
private void assertURLDecodedTo(final Tokenizer t,
                                final String uri,
                                final String[] expectedStems)
    throws IOException {
  assertURLDecodedTo(t, uri, expectedStems, null);
}
/**
 * Builds the filter on top of {@code input} and obtains, through
 * {@code addAttribute}, the payload, node and position attributes stored
 * in this filter's fields.
 *
 * @param input the token stream to wrap
 */
public SirenPayloadFilter(final TokenStream input) {
  super(input);
  // Registration order is kept as-is: payload, node, position.
  payloadAtt = addAttribute(PayloadAttribute.class);
  nodeAtt = addAttribute(NodeAttribute.class);
  posAtt = addAttribute(PositionAttribute.class);
}
/**
 * Builds the filter on top of {@code in} and obtains the
 * {@link CharTermAttribute} through {@code addAttribute}.
 *
 * @param in the token stream to wrap
 */
public URITrailingSlashFilter(final TokenStream in) {
  super(in);
  termAtt = addAttribute(CharTermAttribute.class);
}
/**
 * Convenience overload: forwards to the five-argument
 * {@code assertNormalisesTo}, passing {@code null} as the fifth argument.
 *
 * @param t the tokenizer handed to the five-argument overload
 * @param input the input string handed to the five-argument overload
 * @param expectedImages the expected images handed to the five-argument overload
 * @param expectedTypes the expected types handed to the five-argument overload
 * @throws Exception if the delegate throws
 */
public void assertNormalisesTo(final Tokenizer t,
                               final String input,
                               final String[] expectedImages,
                               final String[] expectedTypes)
    throws Exception {
  assertNormalisesTo(t, input, expectedImages, expectedTypes, null);
}
/**
 * Convenience overload: forwards to the six-argument
 * {@code assertURLDecodedTo}, passing {@code null} for the last two
 * arguments.
 *
 * @param t the tokenizer handed to the six-argument overload
 * @param encoding the encoding name handed to the six-argument overload
 * @param uri the URI string handed to the six-argument overload
 * @param expectedStems the expected stems handed to the six-argument overload
 * @throws IOException if the delegate throws it
 */
private void assertURLDecodedTo(final Tokenizer t,
                                final String encoding,
                                final String uri,
                                final String[] expectedStems)
    throws IOException {
  assertURLDecodedTo(t, encoding, uri, expectedStems, null, null);
}
/**
 * Convenience overload: forwards to the five-argument
 * {@code assertURLDecodedTo}, passing {@code null} as the fifth argument.
 *
 * @param t the tokenizer handed to the five-argument overload
 * @param uri the URI string handed to the five-argument overload
 * @param expectedStems the expected stems handed to the five-argument overload
 * @param expectedTypes the expected types handed to the five-argument overload
 * @throws IOException if the delegate throws it
 */
private void assertURLDecodedTo(final Tokenizer t,
                                final String uri,
                                final String[] expectedStems,
                                final String[] expectedTypes)
    throws IOException {
  assertURLDecodedTo(t, uri, expectedStems, expectedTypes, null);
}
/**
 * Convenience overload: forwards to the six-argument
 * {@code assertURLDecodedTo} with {@code "UTF-8"} as the second argument.
 *
 * @param t the tokenizer handed to the six-argument overload
 * @param uri the URI string handed to the six-argument overload
 * @param expectedStems the expected stems handed to the six-argument overload
 * @param expectedTypes the expected types handed to the six-argument overload
 * @param expectedPosIncr the expected position increments handed to the
 *        six-argument overload
 * @throws IOException if the delegate throws it
 */
private void assertURLDecodedTo(final Tokenizer t,
                                final String uri,
                                final String[] expectedStems,
                                final String[] expectedTypes,
                                final int[] expectedPosIncr)
    throws IOException {
  final String utf8 = "UTF-8";
  assertURLDecodedTo(t, utf8, uri, expectedStems, expectedTypes,
      expectedPosIncr);
}