# from colbert.indexing.codecs.residual import ResidualCodec
import colbert.indexing.codecs.residual_embeddings as residual_embeddings
from colbert.search.strided_tensor import StridedTensor
class ResidualEmbeddingsStrided:
def __init__(self, codec, embeddings, doclens):
self.codec = codec
self.codes = embeddings.codes
self.residuals = embeddings.residuals
self.use_gpu = self.codec.use_gpu
self.codes_strided = StridedTensor(self.codes, doclens, use_gpu=self.use_gpu)
self.residuals_strided = StridedTensor(self.residuals, doclens, use_gpu=self.use_gpu)
def lookup_pids(self, passage_ids, out_device='cuda'):
codes_packed, codes_lengths = self.codes_strided.lookup(passage_ids)#.as_packed_tensor()
residuals_packed, _ = self.residuals_strided.lookup(passage_ids)#.as_packed_tensor()
embeddings_packed = self.codec.decompress(residual_embeddings.ResidualEmbeddings(codes_packed, residuals_packed))
return embeddings_packed, codes_lengths
def lookup_codes(self, passage_ids):
return self.codes_strided.lookup(passage_ids)#.as_packed_tensor()