Skip to content
This repository has been archived by the owner on Jan 2, 2025. It is now read-only.

Commit

Permalink
Split files by token in proc, on a new thread (#615)
Browse files Browse the repository at this point in the history
* Split files by token in proc, on a new thread

* Optimize `split_line_set_by_tokens`, fix large proc requests
  • Loading branch information
calyptobai authored Jun 9, 2023
1 parent b9563ab commit 752b335
Showing 1 changed file with 27 additions and 16 deletions.
43 changes: 27 additions & 16 deletions server/bleep/src/webserver/answer.rs
Original file line number Diff line number Diff line change
Expand Up @@ -576,6 +576,8 @@ impl Conversation {
let repo_ref = &self.repo_ref;
let chunks = stream::iter(paths)
.map(|path| async move {
tracing::debug!(?path, "reading file");

let lines = ctx
.app
.indexes
Expand All @@ -589,20 +591,24 @@ impl Conversation {
.map(|(i, line)| format!("{} {line}", i + 1))
.collect::<Vec<_>>();

Result::<_>::Ok((lines, path))
})
// Buffer file loading to load multiple paths at once
.buffered(10)
.and_then(|(lines, path): (Vec<String>, String)| async move {
const MAX_TOKENS: usize = 3400;
const LINE_OVERLAP: usize = 3;

let bpe = tiktoken_rs::get_bpe_from_model("gpt-3.5-turbo")?;
let iter = split_line_set_by_tokens(lines, bpe, MAX_TOKENS, LINE_OVERLAP)
.map(move |lines| Result::<_>::Ok((lines, path.clone())));

Ok(futures::stream::iter(iter))
let iter = tokio::task::spawn_blocking(|| {
split_line_set_by_tokens(lines, bpe, MAX_TOKENS, LINE_OVERLAP)
.collect::<Vec<_>>()
})
.await
.context("failed to split by token")?
.into_iter()
.map(move |lines| Result::<_>::Ok((lines, path.clone())));

Result::<_>::Ok(futures::stream::iter(iter))
})
// Buffer file loading to load multiple paths at once
.buffered(10)
.try_flatten()
.map(|result| async {
let (lines, path) = result?;
Expand All @@ -621,6 +627,8 @@ impl Conversation {
let contents = lines.join("\n");
let prompt = prompts::file_explanation(question, &path, &contents);

tracing::debug!(?path, "calling chat API on file");

let json = ctx
.llm_gateway
.chat(&[llm_gateway::api::Message::system(&prompt)])
Expand Down Expand Up @@ -1127,6 +1135,11 @@ fn split_line_set_by_tokens(
max_tokens: usize,
line_overlap: usize,
) -> impl Iterator<Item = Vec<String>> {
let line_tokens = lines
.iter()
.map(|line| bpe.encode_ordinary(line).len())
.collect::<Vec<_>>();

let mut start = 0usize;

std::iter::from_fn(move || {
Expand All @@ -1138,14 +1151,12 @@ fn split_line_set_by_tokens(

let mut subset = Vec::new();

loop {
if start >= lines.len() {
break;
}

let text = subset.join("\n");

if limit_tokens(&text, bpe.clone(), max_tokens).len() < text.len() {
while start < lines.len() {
if line_tokens[start - subset.len()..start]
.iter()
.sum::<usize>()
> max_tokens
{
subset.pop();
start -= 1;
break;
Expand Down

0 comments on commit 752b335

Please sign in to comment.