mirror of
https://github.com/MarginaliaSearch/MarginaliaSearch.git
synced 2025-10-05 21:22:39 +02:00
(refac) Clean up index code
This commit is contained in:
@@ -3,11 +3,11 @@ package nu.marginalia.index;
|
||||
import com.google.inject.Guice;
|
||||
import com.google.inject.Inject;
|
||||
import nu.marginalia.IndexLocations;
|
||||
import nu.marginalia.index.forward.ForwardIndexFileNames;
|
||||
import nu.marginalia.index.config.ForwardIndexFileNames;
|
||||
import nu.marginalia.index.forward.construction.ForwardIndexConverter;
|
||||
import nu.marginalia.index.journal.IndexJournal;
|
||||
import nu.marginalia.index.reverse.ReverseIndexFullFileNames;
|
||||
import nu.marginalia.index.reverse.ReverseIndexPrioFileNames;
|
||||
import nu.marginalia.index.config.ReverseIndexFullFileNames;
|
||||
import nu.marginalia.index.config.ReverseIndexPrioFileNames;
|
||||
import nu.marginalia.index.reverse.construction.full.FullIndexConstructor;
|
||||
import nu.marginalia.index.reverse.construction.prio.PrioIndexConstructor;
|
||||
import nu.marginalia.index.searchset.DomainRankings;
|
||||
|
@@ -3,12 +3,12 @@ package nu.marginalia.index;
|
||||
import com.google.inject.Inject;
|
||||
import com.google.inject.Singleton;
|
||||
import nu.marginalia.IndexLocations;
|
||||
import nu.marginalia.index.forward.ForwardIndexFileNames;
|
||||
import nu.marginalia.index.config.ForwardIndexFileNames;
|
||||
import nu.marginalia.index.config.ReverseIndexFullFileNames;
|
||||
import nu.marginalia.index.config.ReverseIndexPrioFileNames;
|
||||
import nu.marginalia.index.forward.ForwardIndexReader;
|
||||
import nu.marginalia.index.reverse.FullReverseIndexReader;
|
||||
import nu.marginalia.index.reverse.PrioReverseIndexReader;
|
||||
import nu.marginalia.index.reverse.ReverseIndexFullFileNames;
|
||||
import nu.marginalia.index.reverse.ReverseIndexPrioFileNames;
|
||||
import nu.marginalia.index.reverse.positions.PositionsFileReader;
|
||||
import nu.marginalia.storage.FileStorageService;
|
||||
|
||||
|
@@ -1,4 +1,4 @@
|
||||
package nu.marginalia.index.forward;
|
||||
package nu.marginalia.index.config;
|
||||
|
||||
import java.nio.file.Path;
|
||||
|
@@ -1,4 +1,4 @@
|
||||
package nu.marginalia.index.forward;
|
||||
package nu.marginalia.index.config;
|
||||
|
||||
public class ForwardIndexParameters {
|
||||
public static final int ENTRY_SIZE = 3;
|
@@ -1,4 +1,4 @@
|
||||
package nu.marginalia.index.reverse;
|
||||
package nu.marginalia.index.config;
|
||||
|
||||
import java.nio.file.Path;
|
||||
|
@@ -1,4 +1,4 @@
|
||||
package nu.marginalia.index.reverse;
|
||||
package nu.marginalia.index.config;
|
||||
|
||||
import nu.marginalia.btree.model.BTreeBlockSize;
|
||||
import nu.marginalia.btree.model.BTreeContext;
|
@@ -1,4 +1,4 @@
|
||||
package nu.marginalia.index.reverse;
|
||||
package nu.marginalia.index.config;
|
||||
|
||||
import java.nio.file.Path;
|
||||
|
@@ -18,7 +18,7 @@ import java.nio.file.Files;
|
||||
import java.nio.file.Path;
|
||||
import java.util.concurrent.TimeoutException;
|
||||
|
||||
import static nu.marginalia.index.forward.ForwardIndexParameters.*;
|
||||
import static nu.marginalia.index.config.ForwardIndexParameters.*;
|
||||
|
||||
/** Reads the forward index.
|
||||
* <p/>
|
||||
|
@@ -3,7 +3,7 @@ package nu.marginalia.index.forward.construction;
|
||||
import it.unimi.dsi.fastutil.longs.Long2IntOpenHashMap;
|
||||
import nu.marginalia.array.LongArray;
|
||||
import nu.marginalia.array.LongArrayFactory;
|
||||
import nu.marginalia.index.forward.ForwardIndexParameters;
|
||||
import nu.marginalia.index.config.ForwardIndexParameters;
|
||||
import nu.marginalia.index.forward.spans.IndexSpansWriter;
|
||||
import nu.marginalia.index.journal.IndexJournal;
|
||||
import nu.marginalia.index.searchset.DomainRankings;
|
||||
|
@@ -11,6 +11,8 @@ public class SpansCodec {
|
||||
public static int FOOTER_SIZE = 8;
|
||||
|
||||
public enum SpansCodecVersion {
|
||||
@Deprecated
|
||||
DEPRECATED_1, // This must not be removed, the ordinal is used to encode the version
|
||||
PLAIN
|
||||
}
|
||||
|
||||
|
@@ -5,6 +5,7 @@ import nu.marginalia.array.LongArrayFactory;
|
||||
import nu.marginalia.array.pool.BufferPool;
|
||||
import nu.marginalia.btree.BTreeReader;
|
||||
import nu.marginalia.ffi.LinuxSystemCalls;
|
||||
import nu.marginalia.index.config.ReverseIndexParameters;
|
||||
import nu.marginalia.index.model.CombinedDocIdList;
|
||||
import nu.marginalia.index.model.TermMetadataList;
|
||||
import nu.marginalia.index.reverse.positions.PositionsFileReader;
|
||||
|
@@ -61,6 +61,7 @@ public class PrioIndexEntrySource implements EntrySource {
|
||||
var outputBuffer = buffer.asByteBuffer().order(ByteOrder.LITTLE_ENDIAN);
|
||||
outputBuffer.clear();
|
||||
|
||||
// FYI: The encoding end of this compression algorithm is at PrioDocIdsTransformer
|
||||
while (outputBuffer.hasRemaining() && readItems++ < numItems) {
|
||||
int rank;
|
||||
int domainId;
|
||||
|
@@ -4,6 +4,7 @@ import nu.marginalia.array.LongArray;
|
||||
import nu.marginalia.array.LongArrayFactory;
|
||||
import nu.marginalia.btree.BTreeReader;
|
||||
import nu.marginalia.ffi.LinuxSystemCalls;
|
||||
import nu.marginalia.index.config.ReverseIndexParameters;
|
||||
import nu.marginalia.index.reverse.query.EmptyEntrySource;
|
||||
import nu.marginalia.index.reverse.query.EntrySource;
|
||||
import org.slf4j.Logger;
|
||||
|
@@ -3,11 +3,11 @@ package nu.marginalia.index.reverse.construction.full;
|
||||
import nu.marginalia.array.LongArray;
|
||||
import nu.marginalia.array.LongArrayFactory;
|
||||
import nu.marginalia.btree.BTreeWriter;
|
||||
import nu.marginalia.index.reverse.ReverseIndexParameters;
|
||||
import nu.marginalia.index.config.ReverseIndexParameters;
|
||||
import nu.marginalia.index.journal.IndexJournalPage;
|
||||
import nu.marginalia.index.reverse.construction.CountToOffsetTransformer;
|
||||
import nu.marginalia.index.reverse.construction.DocIdRewriter;
|
||||
import nu.marginalia.index.reverse.construction.PositionsFileConstructor;
|
||||
import nu.marginalia.index.journal.IndexJournalPage;
|
||||
import org.slf4j.Logger;
|
||||
import org.slf4j.LoggerFactory;
|
||||
|
||||
|
@@ -3,10 +3,10 @@ package nu.marginalia.index.reverse.construction.prio;
|
||||
import nu.marginalia.array.LongArray;
|
||||
import nu.marginalia.array.LongArrayFactory;
|
||||
import nu.marginalia.btree.BTreeWriter;
|
||||
import nu.marginalia.index.reverse.ReverseIndexParameters;
|
||||
import nu.marginalia.index.config.ReverseIndexParameters;
|
||||
import nu.marginalia.index.journal.IndexJournalPage;
|
||||
import nu.marginalia.index.reverse.construction.CountToOffsetTransformer;
|
||||
import nu.marginalia.index.reverse.construction.DocIdRewriter;
|
||||
import nu.marginalia.index.journal.IndexJournalPage;
|
||||
import org.slf4j.Logger;
|
||||
import org.slf4j.LoggerFactory;
|
||||
|
||||
|
@@ -6,11 +6,11 @@ import it.unimi.dsi.fastutil.ints.IntList;
|
||||
import nu.marginalia.IndexLocations;
|
||||
import nu.marginalia.array.page.LongQueryBuffer;
|
||||
import nu.marginalia.hash.MurmurHash3_128;
|
||||
import nu.marginalia.index.forward.ForwardIndexFileNames;
|
||||
import nu.marginalia.index.config.ForwardIndexFileNames;
|
||||
import nu.marginalia.index.config.ReverseIndexFullFileNames;
|
||||
import nu.marginalia.index.forward.construction.ForwardIndexConverter;
|
||||
import nu.marginalia.index.journal.IndexJournal;
|
||||
import nu.marginalia.index.journal.IndexJournalSlopWriter;
|
||||
import nu.marginalia.index.reverse.ReverseIndexFullFileNames;
|
||||
import nu.marginalia.index.reverse.construction.DocIdRewriter;
|
||||
import nu.marginalia.index.reverse.construction.full.FullIndexConstructor;
|
||||
import nu.marginalia.index.reverse.query.IndexSearchBudget;
|
||||
|
@@ -7,12 +7,12 @@ import nu.marginalia.api.searchquery.RpcDecoratedResultItem;
|
||||
import nu.marginalia.api.searchquery.RpcQueryLimits;
|
||||
import nu.marginalia.api.searchquery.model.query.*;
|
||||
import nu.marginalia.api.searchquery.model.results.PrototypeRankingParameters;
|
||||
import nu.marginalia.index.forward.ForwardIndexFileNames;
|
||||
import nu.marginalia.index.config.ForwardIndexFileNames;
|
||||
import nu.marginalia.index.config.ReverseIndexFullFileNames;
|
||||
import nu.marginalia.index.config.ReverseIndexPrioFileNames;
|
||||
import nu.marginalia.index.forward.construction.ForwardIndexConverter;
|
||||
import nu.marginalia.index.journal.IndexJournal;
|
||||
import nu.marginalia.index.journal.IndexJournalSlopWriter;
|
||||
import nu.marginalia.index.reverse.ReverseIndexFullFileNames;
|
||||
import nu.marginalia.index.reverse.ReverseIndexPrioFileNames;
|
||||
import nu.marginalia.index.reverse.construction.DocIdRewriter;
|
||||
import nu.marginalia.index.reverse.construction.full.FullIndexConstructor;
|
||||
import nu.marginalia.index.reverse.construction.prio.PrioIndexConstructor;
|
||||
|
@@ -8,12 +8,12 @@ import nu.marginalia.api.searchquery.RpcQueryLimits;
|
||||
import nu.marginalia.api.searchquery.model.query.*;
|
||||
import nu.marginalia.api.searchquery.model.results.PrototypeRankingParameters;
|
||||
import nu.marginalia.hash.MurmurHash3_128;
|
||||
import nu.marginalia.index.forward.ForwardIndexFileNames;
|
||||
import nu.marginalia.index.config.ForwardIndexFileNames;
|
||||
import nu.marginalia.index.forward.construction.ForwardIndexConverter;
|
||||
import nu.marginalia.index.journal.IndexJournal;
|
||||
import nu.marginalia.index.journal.IndexJournalSlopWriter;
|
||||
import nu.marginalia.index.reverse.ReverseIndexFullFileNames;
|
||||
import nu.marginalia.index.reverse.ReverseIndexPrioFileNames;
|
||||
import nu.marginalia.index.config.ReverseIndexFullFileNames;
|
||||
import nu.marginalia.index.config.ReverseIndexPrioFileNames;
|
||||
import nu.marginalia.index.reverse.construction.DocIdRewriter;
|
||||
import nu.marginalia.index.reverse.construction.full.FullIndexConstructor;
|
||||
import nu.marginalia.index.reverse.construction.prio.PrioIndexConstructor;
|
||||
|
@@ -16,13 +16,13 @@ import nu.marginalia.crawl.fetcher.warc.WarcRecorder;
|
||||
import nu.marginalia.functions.searchquery.QueryFactory;
|
||||
import nu.marginalia.index.IndexQueryExecution;
|
||||
import nu.marginalia.index.StatefulIndex;
|
||||
import nu.marginalia.index.forward.ForwardIndexFileNames;
|
||||
import nu.marginalia.index.config.ForwardIndexFileNames;
|
||||
import nu.marginalia.index.config.ReverseIndexFullFileNames;
|
||||
import nu.marginalia.index.config.ReverseIndexPrioFileNames;
|
||||
import nu.marginalia.index.forward.construction.ForwardIndexConverter;
|
||||
import nu.marginalia.index.journal.IndexJournal;
|
||||
import nu.marginalia.index.model.SearchContext;
|
||||
import nu.marginalia.index.results.IndexResultRankingService;
|
||||
import nu.marginalia.index.reverse.ReverseIndexFullFileNames;
|
||||
import nu.marginalia.index.reverse.ReverseIndexPrioFileNames;
|
||||
import nu.marginalia.index.reverse.construction.full.FullIndexConstructor;
|
||||
import nu.marginalia.index.reverse.construction.prio.PrioIndexConstructor;
|
||||
import nu.marginalia.index.searchset.DomainRankings;
|
||||
|
Reference in New Issue
Block a user