org.apache.lucene.util.BytesRef.getUTF8SortedAsUnicodeComparator java code examples

/**
 * Creates a new sorted wrapper around {@code source} by delegating to the
 * two-argument constructor with the comparator returned by
 * {@link BytesRef#getUTF8SortedAsUnicodeComparator()}.
 *
 * @param source the iterator to wrap
 * @throws IOException declared by this constructor; presumably propagated
 *         from the delegated constructor (its body is not visible here)
 */
public SortedInputIterator(InputIterator source) throws IOException {
 this(source, BytesRef.getUTF8SortedAsUnicodeComparator());
}

/**
 * Orders this bucket relative to {@code other} by comparing their term bytes
 * with the comparator from {@link BytesRef#getUTF8SortedAsUnicodeComparator()}.
 *
 * @param other the bucket to compare against; it is cast to {@code Bucket},
 *              so any other implementation fails with a ClassCastException
 * @return the comparator's result for (this term, other term)
 */
@Override
int compareTerm(Terms.Bucket other) {
  final Bucket that = (Bucket) other;
  return BytesRef.getUTF8SortedAsUnicodeComparator().compare(termBytes, that.termBytes);
}

/**
 * Orders this bucket relative to {@code other} by comparing their term bytes
 * with the comparator from {@link BytesRef#getUTF8SortedAsUnicodeComparator()}.
 *
 * @param other the bucket to compare against; it is cast to
 *              {@code ComputedSignificantStringTermsBucket}, so any other
 *              implementation fails with a ClassCastException
 * @return the comparator's result for (this term, other term)
 */
@Override
int compareTerm(final SignificantTerms.Bucket other) {
  final ComputedSignificantStringTermsBucket that = (ComputedSignificantStringTermsBucket) other;
  return BytesRef.getUTF8SortedAsUnicodeComparator().compare(termBytes, that.termBytes);
}

/**
 * Compares the term bytes of this bucket with those of {@code other}, using
 * the comparator from {@link BytesRef#getUTF8SortedAsUnicodeComparator()}.
 *
 * @param other the bucket to compare against; must be a {@code Bucket},
 *              otherwise the cast below throws a ClassCastException
 * @return the comparator's result for (this term, other term)
 */
@Override
int compareTerm(SignificantTerms.Bucket other) {
  final Bucket that = (Bucket) other;
  return BytesRef.getUTF8SortedAsUnicodeComparator().compare(termBytes, that.termBytes);
}

/**
 * Compares the term bytes of this bucket with those of {@code other}, using
 * the comparator from {@link BytesRef#getUTF8SortedAsUnicodeComparator()}.
 *
 * @param other the bucket to compare against; must be a
 *              {@code ComputedSignificantStringTermsBucket}, otherwise the
 *              cast below throws a ClassCastException
 * @return the comparator's result for (this term, other term)
 */
@Override
int compareTerm(final SignificantTerms.Bucket other) {
  final ComputedSignificantStringTermsBucket that = (ComputedSignificantStringTermsBucket) other;
  return BytesRef.getUTF8SortedAsUnicodeComparator().compare(termBytes, that.termBytes);
}

/**
 * Sorts {@code bytesHash} with the comparator from
 * {@link BytesRef#getUTF8SortedAsUnicodeComparator()}, records the result in
 * {@code sortedTermIDs}, and returns it.
 *
 * @return the array produced by the sort (the same array now held in
 *         {@code sortedTermIDs})
 */
public int[] sortPostings() {
 // The assignment expression yields the freshly stored array.
 return sortedTermIDs = bytesHash.sort(BytesRef.getUTF8SortedAsUnicodeComparator());
}

/**
 * Creates an {@link FSTCompletion} with default options: {@code DEFAULT_BUCKETS}
 * buckets (documented as 10), exact match promoted to first position and an
 * {@link InMemorySorter} with a comparator obtained from
 * {@link BytesRef#getUTF8SortedAsUnicodeComparator()}.
 *
 * <p>Delegates to the three-argument constructor, passing
 * {@link Integer#MAX_VALUE} as the third argument; the meaning of that
 * argument is defined by the delegated constructor, which is not shown here.
 */
public FSTCompletionBuilder() {
 this(DEFAULT_BUCKETS, new InMemorySorter(BytesRef.getUTF8SortedAsUnicodeComparator()), Integer.MAX_VALUE);
}

/**
 * Stores the constructor arguments and computes {@code ords} by sorting
 * {@code terms} with the comparator from
 * {@link BytesRef#getUTF8SortedAsUnicodeComparator()}.
 *
 * @param field                     stored in {@code this.field}
 * @param multipleValuesPerDocument stored in {@code this.multipleValuesPerDocument}
 * @param terms                     the term hash; kept and sorted to produce {@code ords}
 * @param scores                    stored in {@code this.scores}
 * @param originalQuery             stored as both {@code originalQuery} and
 *                                  {@code unwrittenOriginalQuery}
 */
TermsIncludingScoreQuery(String field, boolean multipleValuesPerDocument, BytesRefHash terms, float[] scores, Query originalQuery) {
 // Plain pass-through state.
 this.field = field;
 this.multipleValuesPerDocument = multipleValuesPerDocument;
 this.scores = scores;

 // The term hash and the ordering derived from it.
 this.terms = terms;
 this.ords = terms.sort(BytesRef.getUTF8SortedAsUnicodeComparator());

 // Both query references start out pointing at the same instance.
 this.unwrittenOriginalQuery = originalQuery;
 this.originalQuery = originalQuery;
}

/**
 * Creates an {@link FSTCompletion} with default options: {@code DEFAULT_BUCKETS}
 * buckets (documented as 10), exact match promoted to first position and an
 * {@link InMemorySorter} with a comparator obtained from
 * {@link BytesRef#getUTF8SortedAsUnicodeComparator()}.
 *
 * <p>This is a convenience constructor: it forwards to the three-argument
 * constructor with {@link Integer#MAX_VALUE} as the last argument. What that
 * last argument controls is not visible in this snippet.
 */
public FSTCompletionBuilder() {
 this(DEFAULT_BUCKETS, new InMemorySorter(BytesRef.getUTF8SortedAsUnicodeComparator()), Integer.MAX_VALUE);
}

public DocValuesTermsQuery(String field, Collection<BytesRef> terms) {
 this.field = Objects.requireNonNull(field);
 Objects.requireNonNull(terms, "Collection of terms must not be null");
 this.terms = terms.toArray(new BytesRef[terms.size()]);
 ArrayUtil.timSort(this.terms, BytesRef.getUTF8SortedAsUnicodeComparator());
}

/**
 * Creates a terms query over {@code field}.
 *
 * @param field     the field that should contain the given terms; passed to
 *                  the superclass constructor
 * @param fromQuery stored in {@code this.fromQuery}
 * @param terms     the terms that matching documents should have. This
 *                  constructor sorts them itself with the comparator from
 *                  {@link BytesRef#getUTF8SortedAsUnicodeComparator()} and
 *                  keeps the result in {@code ords}.
 */
TermsQuery(String field, Query fromQuery, BytesRefHash terms) {
 super(field);
 // Keep the hash and its sort order together; fromQuery is independent.
 this.terms = terms;
 ords = terms.sort(BytesRef.getUTF8SortedAsUnicodeComparator());
 this.fromQuery = fromQuery;
}

/**
 * Sorts {@code bytesHash} using the comparator from
 * {@link BytesRef#getUTF8SortedAsUnicodeComparator()} and stores the
 * resulting array in {@code sortedTermIDs}.
 *
 * @return the array that was just stored in {@code sortedTermIDs}
 */
public int[] sortPostings() {
 // Store and return in one step; the assignment evaluates to the new array.
 return sortedTermIDs = bytesHash.sort(BytesRef.getUTF8SortedAsUnicodeComparator());
}

/**
 * Lazily sorts the hashed terms with the comparator from
 * {@link BytesRef#getUTF8SortedAsUnicodeComparator()}. The sort runs only
 * while {@code sortedTerms} is still {@code null}; once it has been set,
 * further calls return immediately.
 *
 * <p>Design note carried over from the original documentation: sorting is
 * deferred because it is often not needed at all, and hashing + sort +
 * binary search was judged faster and smaller than a TreeMap-based
 * alternative.
 */
public void sortTerms() {
 if (sortedTerms != null) {
  return; // already sorted
 }
 sortedTerms = terms.sort(BytesRef.getUTF8SortedAsUnicodeComparator());
}

/**
 * Opens a term enumeration starting at {@code new Term(field, "")} and
 * selects the comparator for iteration.
 *
 * <p>{@code comp} is set to the comparator from
 * {@link BytesRef#getUTF8SortedAsUnicodeComparator()} when the enumeration's
 * current term belongs to {@code field}; otherwise (no current term, or a
 * term of a different field) it is set to {@code null}.
 *
 * @throws IOException declared by this constructor; presumably raised by
 *         {@code reader.terms(...)} (not visible here)
 */
TermIterator() throws IOException {
 termsEnum = reader.terms(new Term(field, ""));
 final Term term = termsEnum.term();
 final String termField = (term == null) ? null : term.field();
 // Compare field names by value. The identity check is kept as a fast path,
 // but correctness no longer depends on both strings being interned.
 final boolean onRequestedField = term != null
   && (termField == field || (termField != null && termField.equals(field)));
 comp = onRequestedField ? BytesRef.getUTF8SortedAsUnicodeComparator() : null;
}

/**
 * Binary-searches the sorted terms for {@code text} and stores the search
 * result in {@code termUpto}.
 *
 * @param text the term to look up
 * @return {@code true} if the search result is non-negative, i.e. the term
 *         was found
 */
@Override
public boolean seekExact(BytesRef text) {
 final int lastIndex = info.terms.size() - 1;
 termUpto = binarySearch(text, br, 0, lastIndex, info.terms, info.sortedTerms,
   BytesRef.getUTF8SortedAsUnicodeComparator());
 // A negative result means "not found".
 return !(termUpto < 0);
}

/**
 * Opens a term enumeration starting at {@code new Term(field, "")}, computes
 * the minimum document count from {@code thresh}, and selects the comparator
 * for iteration.
 *
 * <p>{@code minNumDocs} is {@code thresh * reader.numDocs()} truncated to an
 * int. {@code comp} is set to the comparator from
 * {@link BytesRef#getUTF8SortedAsUnicodeComparator()} when the enumeration's
 * current term belongs to {@code field}; otherwise (no current term, or a
 * term of a different field) it is set to {@code null}.
 *
 * @throws IOException declared by this constructor; presumably raised by the
 *         reader calls (not visible here)
 */
HighFrequencyIterator() throws IOException {
 termsEnum = reader.terms(new Term(field, ""));
 minNumDocs = (int)(thresh * (float)reader.numDocs());
 final Term term = termsEnum.term();
 final String termField = (term == null) ? null : term.field();
 // Compare field names by value. The identity check is kept as a fast path,
 // but correctness no longer depends on both strings being interned.
 final boolean onRequestedField = term != null
   && (termField == field || (termField != null && termField.equals(field)));
 comp = onRequestedField ? BytesRef.getUTF8SortedAsUnicodeComparator() : null;
}

SeekingTermSetTermsEnum(TermsEnum tenum, BytesRefHash terms, int[] ords) {
 super(tenum);
 this.terms = terms;
 this.ords = ords;
 comparator = BytesRef.getUTF8SortedAsUnicodeComparator();
 lastElement = terms.size() - 1;
 lastTerm = terms.get(ords[lastElement], new BytesRef());
 seekTerm = terms.get(ords[upto], spare);
}

/**
 * Seeks to {@code text} or, when it is absent, to the next term after it.
 *
 * <p>The binary search result is stored in {@code termUpto}. A negative
 * result is decoded as {@code -result - 1} to obtain the successor position.
 *
 * @param text the term to seek to
 * @return {@link SeekStatus#FOUND} when the term exists,
 *         {@link SeekStatus#END} when the successor position is past the
 *         last term, otherwise {@link SeekStatus#NOT_FOUND} after loading
 *         the successor term into {@code br}
 */
@Override
public SeekStatus seekCeil(BytesRef text) {
 final int lastIndex = info.terms.size() - 1;
 termUpto = binarySearch(text, br, 0, lastIndex, info.terms, info.sortedTerms,
   BytesRef.getUTF8SortedAsUnicodeComparator());
 if (termUpto >= 0) {
  return SeekStatus.FOUND;
 }

 // Not found: decode the successor position.
 termUpto = -termUpto - 1;
 if (termUpto >= info.terms.size()) {
  return SeekStatus.END;
 }
 info.terms.get(info.sortedTerms[termUpto], br);
 return SeekStatus.NOT_FOUND;
}

SeekingTermSetTermsEnum(TermsEnum tenum, BytesRefTermsSet termsSet) {
 super(tenum);
 this.terms = termsSet.getBytesRefHash();
 this.ords = this.terms.sort(BytesRef.getUTF8SortedAsUnicodeComparator());
 lastElement = terms.size() - 1;
 lastTerm = terms.get(ords[lastElement], new BytesRef());
 seekTerm = terms.get(ords[upto], spare);
}

/**
 * Builds a {@link StemmerOverrideMap} to be used with the
 * {@link StemmerOverrideFilter}.
 *
 * <p>The keys in {@code hash} are sorted with the comparator from
 * {@link BytesRef#getUTF8SortedAsUnicodeComparator()} and added to an FST
 * builder in that order. Each key is paired with the entry of
 * {@code outputValues} that has the same id.
 *
 * @return a {@link StemmerOverrideMap} wrapping the finished FST and the
 *         {@code ignoreCase} setting
 * @throws IOException if an {@link IOException} occurs
 */
public StemmerOverrideMap build() throws IOException {
 final ByteSequenceOutputs fstOutputs = ByteSequenceOutputs.getSingleton();
 final org.apache.lucene.util.fst.Builder<BytesRef> fstBuilder =
   new org.apache.lucene.util.fst.Builder<>(FST.INPUT_TYPE.BYTE4, fstOutputs);
 final int[] sortedIds = hash.sort(BytesRef.getUTF8SortedAsUnicodeComparator());
 final IntsRefBuilder keyInts = new IntsRefBuilder();
 // Only the first hash.size() slots of sortedIds are iterated.
 final int entryCount = hash.size();
 final BytesRef scratch = new BytesRef();

 int position = 0;
 while (position < entryCount) {
  final int id = sortedIds[position];
  keyInts.copyUTF8Bytes(hash.get(id, scratch));
  fstBuilder.add(keyInts.get(), new BytesRef(outputValues.get(id)));
  position++;
 }
 return new StemmerOverrideMap(fstBuilder.finish(), ignoreCase);
}

Popular methods of BytesRef

<init>
This instance will directly reference bytes w/o making a copy. bytes should not be null.
utf8ToString
Interprets stored bytes as UTF8 bytes, returning the resulting string
deepCopyOf
Creates a new BytesRef that points to a copy of the bytes from other. The returned BytesRef will have
compareTo
Unsigned byte order comparison
equals
hashCode
Calculates the hash code as required by TermsHash during indexing. This is currently implemented as
bytesEquals
Expert: compares the bytes against another BytesRef, returning true if the bytes are equal.
toString
Returns hex encoded bytes, eg [0x6c 0x75 0x63 0x65 0x6e 0x65]
clone
Returns a shallow clone of this instance (the underlying bytes are not copied and will be shared by b
copyBytes
isValid
Performs internal consistency checks. Always returns true (or throws IllegalStateException)
append

Popular in Java

Creating JSON documents from java classes using gson
getApplicationContext (Context)
setContentView (Activity)
getResourceAsStream (ClassLoader)
HttpServer (com.sun.net.httpserver)
This class implements a simple HTTP server. A HttpServer is bound to an IP address and port number a
FileWriter (java.io)
A specialized Writer that writes to a file in the file system. All write requests made by calling me
IOException (java.io)
Signals a general, I/O-related error. Error details may be specified when calling the constructor, a
Executors (java.util.concurrent)
Factory and utility methods for Executor, ExecutorService, ScheduledExecutorService, ThreadFactory,
Modifier (javassist)
The Modifier class provides static methods and constants to decode class and member access modifiers
BoxLayout (javax.swing)
Top Sublime Text plugins

How to use getUTF8SortedAsUnicodeComparator method in org.apache.lucene.util.BytesRef

Best Java code snippets using org.apache.lucene.util.BytesRef.getUTF8SortedAsUnicodeComparator (Showing top 20 results out of 315)

How to use
getUTF8SortedAsUnicodeComparator
method
in
org.apache.lucene.util.BytesRef