mirror of
https://forgejo.ellis.link/continuwuation/continuwuity.git
synced 2025-06-27 21:34:50 +02:00
65 lines
2.3 KiB
Rust
65 lines
2.3 KiB
Rust
use ruma::RoomId;
|
|
|
|
use crate::{database::KeyValueDatabase, service, services, utils, Result};
|
|
|
|
type SearchPdusResult<'a> = Result<Option<(Box<dyn Iterator<Item = Vec<u8>> + 'a>, Vec<String>)>>;
|
|
|
|
impl service::rooms::search::Data for KeyValueDatabase {
|
|
fn index_pdu(&self, shortroomid: u64, pdu_id: &[u8], message_body: &str) -> Result<()> {
|
|
let mut batch = message_body
|
|
.split_terminator(|c: char| !c.is_alphanumeric())
|
|
.filter(|s| !s.is_empty())
|
|
.filter(|word| word.len() <= 50)
|
|
.map(str::to_lowercase)
|
|
.map(|word| {
|
|
let mut key = shortroomid.to_be_bytes().to_vec();
|
|
key.extend_from_slice(word.as_bytes());
|
|
key.push(0xff);
|
|
key.extend_from_slice(pdu_id); // TODO: currently we save the room id a second time here
|
|
(key, Vec::new())
|
|
});
|
|
|
|
self.tokenids.insert_batch(&mut batch)
|
|
}
|
|
|
|
fn search_pdus<'a>(&'a self, room_id: &RoomId, search_string: &str) -> SearchPdusResult<'a> {
|
|
let prefix = services()
|
|
.rooms
|
|
.short
|
|
.get_shortroomid(room_id)?
|
|
.expect("room exists")
|
|
.to_be_bytes()
|
|
.to_vec();
|
|
|
|
let words: Vec<_> = search_string
|
|
.split_terminator(|c: char| !c.is_alphanumeric())
|
|
.filter(|s| !s.is_empty())
|
|
.map(str::to_lowercase)
|
|
.collect();
|
|
|
|
let iterators = words.clone().into_iter().map(move |word| {
|
|
let mut prefix2 = prefix.clone();
|
|
prefix2.extend_from_slice(word.as_bytes());
|
|
prefix2.push(0xff);
|
|
let prefix3 = prefix2.clone();
|
|
|
|
let mut last_possible_id = prefix2.clone();
|
|
last_possible_id.extend_from_slice(&u64::MAX.to_be_bytes());
|
|
|
|
self.tokenids
|
|
.iter_from(&last_possible_id, true) // Newest pdus first
|
|
.take_while(move |(k, _)| k.starts_with(&prefix2))
|
|
.map(move |(key, _)| key[prefix3.len()..].to_vec())
|
|
});
|
|
|
|
let common_elements = match utils::common_elements(iterators, |a, b| {
|
|
// We compare b with a because we reversed the iterator earlier
|
|
b.cmp(a)
|
|
}) {
|
|
Some(it) => it,
|
|
None => return Ok(None),
|
|
};
|
|
|
|
Ok(Some((Box::new(common_elements), words)))
|
|
}
|
|
}
|