From a4c7f853b3c9156bd714a3e28a5ed02f48b84e5d Mon Sep 17 00:00:00 2001 From: Siddhant Chaudhary Date: Wed, 24 Jul 2024 13:19:52 +0530 Subject: [PATCH] Fixing the indexing code to include the `QueryTokenizer` in the `Checkpoint`. --- src/indexing.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/indexing.jl b/src/indexing.jl index 0bcb30a..617e165 100644 --- a/src/indexing.jl +++ b/src/indexing.jl @@ -17,7 +17,7 @@ function index(indexer::Indexer) # loading the models @info "Loading ColBERT layers from HuggingFace." base_colbert = BaseColBERT(checkpoint, config) - checkPoint = Checkpoint(base_colbert, DocTokenizer(base_colbert.tokenizer, config), config) + checkPoint = Checkpoint(base_colbert, DocTokenizer(base_colbert.tokenizer, config), QueryTokenizer(base_colbert.tokenizer, config), config) # creating the encoder, saver and indexer encoder = CollectionEncoder(config, checkPoint)