mirror of
https://github.com/TabbyML/tabby
synced 2024-11-22 00:08:06 +00:00
chore(index): skip web documents if body is empty (#2831)
* chore(index): skip web documents if body is empty * Update .changes/unreleased/Fixed and Improvements-20240811-124728.yaml
This commit is contained in:
parent
4d3f889c92
commit
6c60ca4a17
@@ -0,0 +1,3 @@
|
||||
kind: Fixed and Improvements
|
||||
body: Skip web documents if body is empty
|
||||
time: 2024-08-11T12:47:28.678694-07:00
|
@@ -47,15 +47,18 @@ impl DocIndexer {
|
||||
};
|
||||
|
||||
stream! {
|
||||
let is_document_empty = document.body.trim().is_empty();
|
||||
let (id, s) = self.builder.build(document).await;
|
||||
self.indexer.delete(&id);
|
||||
for await doc in s.buffer_unordered(std::cmp::max(std::thread::available_parallelism().unwrap().get() * 2, 32)) {
|
||||
if let Ok(Some(doc)) = doc {
|
||||
self.indexer.add(doc).await;
|
||||
|
||||
if !is_document_empty {
|
||||
for await doc in s.buffer_unordered(std::cmp::max(std::thread::available_parallelism().unwrap().get() * 2, 32)) {
|
||||
if let Ok(Some(doc)) = doc {
|
||||
self.indexer.add(doc).await;
|
||||
}
|
||||
}
|
||||
}
|
||||
}.count().await;
|
||||
|
||||
true
|
||||
}
|
||||
|
||||
|
Loading…
Reference in New Issue
Block a user