mirror of
https://github.com/chatmail/core.git
synced 2026-04-17 13:36:30 +03:00
875 lines
28 KiB
Rust
875 lines
28 KiB
Rust
//! Some tools and enhancements to the used libraries, there should be
|
|
//! no references to Context and other "larger" entities here.
|
|
|
|
#![allow(missing_docs)]
|
|
|
|
use std::borrow::Cow;
|
|
use std::io::{Cursor, Write};
|
|
use std::mem;
|
|
use std::ops::{AddAssign, Deref};
|
|
use std::path::{Path, PathBuf};
|
|
use std::str::from_utf8;
|
|
// If a time value doesn't need to be sent to another host, saved to the db or otherwise used across
|
|
// program restarts, a monotonically nondecreasing clock (`Instant`) should be used. But as
|
|
// `Instant` may use `libc::clock_gettime(CLOCK_MONOTONIC)`, e.g. on Android, and does not advance
|
|
// while being in deep sleep mode, we use `SystemTime` instead, but add an alias for it to document
|
|
// why `Instant` isn't used in those places. Also this can help to switch to another clock impl if
|
|
// we find any. Another reason is that `Instant` may reintroduce panics in the future versions:
|
|
// https://doc.rust-lang.org/1.87.0/std/time/struct.Instant.html#method.elapsed.
|
|
use std::time::Duration;
|
|
pub use std::time::SystemTime as Time;
|
|
#[cfg(not(test))]
|
|
pub use std::time::SystemTime;
|
|
|
|
use anyhow::{Context as _, Result, bail, ensure};
|
|
use base64::Engine as _;
|
|
use chrono::{Local, NaiveDateTime, NaiveTime, TimeZone};
|
|
use deltachat_contact_tools::EmailAddress;
|
|
#[cfg(test)]
|
|
pub use deltachat_time::SystemTimeTools as SystemTime;
|
|
use futures::TryStreamExt;
|
|
use mailparse::MailHeaderMap;
|
|
use mailparse::dateparse;
|
|
use mailparse::headers::Headers;
|
|
use num_traits::PrimInt;
|
|
use tokio::{fs, io};
|
|
use url::Url;
|
|
use uuid::Uuid;
|
|
|
|
use crate::chat::{add_device_msg, add_device_msg_with_importance};
|
|
use crate::config::Config;
|
|
use crate::constants::{self, DC_ELLIPSIS, DC_OUTDATED_WARNING_DAYS};
|
|
use crate::context::Context;
|
|
use crate::events::EventType;
|
|
use crate::log::warn;
|
|
use crate::message::{Message, Viewtype};
|
|
use crate::stock_str;
|
|
|
|
/// Shortens a string to a specified length and adds "[...]" to the
|
|
/// end of the shortened string.
|
|
pub(crate) fn truncate(buf: &str, approx_chars: usize) -> Cow<'_, str> {
|
|
let count = buf.chars().count();
|
|
if count <= approx_chars + DC_ELLIPSIS.len() {
|
|
return Cow::Borrowed(buf);
|
|
}
|
|
let end_pos = buf
|
|
.char_indices()
|
|
.nth(approx_chars)
|
|
.map(|(n, _)| n)
|
|
.unwrap_or_default();
|
|
|
|
if let Some(index) = buf.get(..end_pos).and_then(|s| s.rfind([' ', '\n'])) {
|
|
Cow::Owned(format!(
|
|
"{}{}",
|
|
&buf.get(..=index).unwrap_or_default(),
|
|
DC_ELLIPSIS
|
|
))
|
|
} else {
|
|
Cow::Owned(format!(
|
|
"{}{}",
|
|
&buf.get(..end_pos).unwrap_or_default(),
|
|
DC_ELLIPSIS
|
|
))
|
|
}
|
|
}
|
|
|
|
/// Shortens a string to a specified line count and adds "[...]" to the
|
|
/// end of the shortened string.
|
|
///
|
|
/// returns tuple with the String and a boolean whether is was truncated
|
|
pub(crate) fn truncate_by_lines(
|
|
buf: String,
|
|
max_lines: usize,
|
|
max_line_len: usize,
|
|
) -> (String, bool) {
|
|
let mut lines = 0;
|
|
let mut line_chars = 0;
|
|
let mut break_point: Option<usize> = None;
|
|
|
|
for (index, char) in buf.char_indices() {
|
|
if char == '\n' {
|
|
line_chars = 0;
|
|
lines += 1;
|
|
} else {
|
|
line_chars += 1;
|
|
if line_chars > max_line_len {
|
|
line_chars = 1;
|
|
lines += 1;
|
|
}
|
|
}
|
|
if lines == max_lines {
|
|
break_point = Some(index);
|
|
break;
|
|
}
|
|
}
|
|
|
|
if let Some(end_pos) = break_point {
|
|
// Text has too many lines and needs to be truncated.
|
|
let text = {
|
|
if let Some(buffer) = buf.get(..end_pos) {
|
|
if let Some(index) = buffer.rfind([' ', '\n']) {
|
|
buf.get(..=index)
|
|
} else {
|
|
buf.get(..end_pos)
|
|
}
|
|
} else {
|
|
None
|
|
}
|
|
};
|
|
|
|
if let Some(truncated_text) = text {
|
|
(format!("{truncated_text}{DC_ELLIPSIS}"), true)
|
|
} else {
|
|
// In case of indexing/slicing error, we return an error
|
|
// message as a preview and add HTML version. This should
|
|
// never happen.
|
|
let error_text = "[Truncation of the message failed, this is a bug in the Delta Chat core. Please report it.\nYou can still open the full text to view the original message.]";
|
|
(error_text.to_string(), true)
|
|
}
|
|
} else {
|
|
// text is unchanged
|
|
(buf, false)
|
|
}
|
|
}
|
|
|
|
/// Shortens a message text if necessary according to the configuration. Adds "[...]" to the end of
|
|
/// the shortened text.
|
|
///
|
|
/// Returns the resulting text and a bool telling whether a truncation was done.
|
|
pub(crate) async fn truncate_msg_text(context: &Context, text: String) -> Result<(String, bool)> {
|
|
if context.get_config_bool(Config::Bot).await? {
|
|
return Ok((text, false));
|
|
}
|
|
// Truncate text if it has too many lines
|
|
Ok(truncate_by_lines(
|
|
text,
|
|
constants::DC_DESIRED_TEXT_LINES,
|
|
constants::DC_DESIRED_TEXT_LINE_LEN,
|
|
))
|
|
}
|
|
|
|
/* ******************************************************************************
|
|
* date/time tools
|
|
******************************************************************************/
|
|
|
|
/// Converts Unix time in seconds to a local timestamp string.
|
|
pub fn timestamp_to_str(wanted: i64) -> String {
|
|
if let Some(ts) = Local.timestamp_opt(wanted, 0).single() {
|
|
ts.format("%Y.%m.%d %H:%M:%S").to_string()
|
|
} else {
|
|
// Out of range number of seconds.
|
|
"??.??.?? ??:??:??".to_string()
|
|
}
|
|
}
|
|
|
|
/// Converts duration to string representation suitable for logs.
|
|
pub fn duration_to_str(duration: Duration) -> String {
|
|
let secs = duration.as_secs();
|
|
let h = secs / 3600;
|
|
let m = (secs % 3600) / 60;
|
|
let s = (secs % 3600) % 60;
|
|
format!("{h}h {m}m {s}s")
|
|
}
|
|
|
|
pub(crate) fn gm2local_offset() -> i64 {
|
|
/* returns the offset that must be _added_ to an UTC/GMT-time to create the localtime.
|
|
the function may return negative values. */
|
|
let lt = Local::now();
|
|
i64::from(lt.offset().local_minus_utc())
|
|
}
|
|
|
|
/// Returns the current smeared timestamp,
|
|
///
|
|
/// The returned timestamp MAY NOT be unique and MUST NOT go to "Date" header.
|
|
pub(crate) fn smeared_time(context: &Context) -> i64 {
|
|
let now = time();
|
|
let ts = context.smeared_timestamp.current();
|
|
std::cmp::max(ts, now)
|
|
}
|
|
|
|
/// Returns a timestamp that is guaranteed to be unique.
|
|
pub(crate) fn create_smeared_timestamp(context: &Context) -> i64 {
|
|
let now = time();
|
|
context.smeared_timestamp.create(now)
|
|
}
|
|
|
|
// creates `count` timestamps that are guaranteed to be unique.
|
|
// the first created timestamps is returned directly,
|
|
// get the other timestamps just by adding 1..count-1
|
|
pub(crate) fn create_smeared_timestamps(context: &Context, count: usize) -> i64 {
|
|
let now = time();
|
|
context.smeared_timestamp.create_n(now, count as i64)
|
|
}
|
|
|
|
/// Returns the last release timestamp as a unix timestamp compatible for comparison with time() and
|
|
/// database times.
|
|
pub fn get_release_timestamp() -> i64 {
|
|
NaiveDateTime::new(
|
|
*crate::release::DATE,
|
|
NaiveTime::from_hms_opt(0, 0, 0).unwrap(),
|
|
)
|
|
.and_utc()
|
|
.timestamp_millis()
|
|
/ 1_000
|
|
}
|
|
|
|
// if the system time is not plausible, once a day, add a device message.
|
|
// for testing we're using time() as that is also used for message timestamps.
|
|
// moreover, add a warning if the app is outdated.
|
|
pub(crate) async fn maybe_add_time_based_warnings(context: &Context) {
|
|
if !maybe_warn_on_bad_time(context, time(), get_release_timestamp()).await {
|
|
maybe_warn_on_outdated(context, time(), get_release_timestamp()).await;
|
|
}
|
|
}
|
|
|
|
async fn maybe_warn_on_bad_time(context: &Context, now: i64, known_past_timestamp: i64) -> bool {
|
|
if now < known_past_timestamp {
|
|
let mut msg = Message::new(Viewtype::Text);
|
|
msg.text = stock_str::bad_time_msg_body(
|
|
context,
|
|
&Local.timestamp_opt(now, 0).single().map_or_else(
|
|
|| "YY-MM-DD hh:mm:ss".to_string(),
|
|
|ts| ts.format("%Y-%m-%d %H:%M:%S").to_string(),
|
|
),
|
|
)
|
|
.await;
|
|
if let Some(timestamp) = chrono::DateTime::<chrono::Utc>::from_timestamp(now, 0) {
|
|
add_device_msg_with_importance(
|
|
context,
|
|
Some(
|
|
format!(
|
|
"bad-time-warning-{}",
|
|
timestamp.format("%Y-%m-%d") // repeat every day
|
|
)
|
|
.as_str(),
|
|
),
|
|
Some(&mut msg),
|
|
true,
|
|
)
|
|
.await
|
|
.ok();
|
|
} else {
|
|
warn!(context, "Can't convert current timestamp");
|
|
}
|
|
return true;
|
|
}
|
|
false
|
|
}
|
|
|
|
async fn maybe_warn_on_outdated(context: &Context, now: i64, approx_compile_time: i64) {
|
|
if now > approx_compile_time + DC_OUTDATED_WARNING_DAYS * 24 * 60 * 60 {
|
|
let mut msg = Message::new_text(stock_str::update_reminder_msg_body(context).await);
|
|
if let Some(timestamp) = chrono::DateTime::<chrono::Utc>::from_timestamp(now, 0) {
|
|
add_device_msg(
|
|
context,
|
|
Some(
|
|
format!(
|
|
"outdated-warning-{}",
|
|
timestamp.format("%Y-%m") // repeat every month
|
|
)
|
|
.as_str(),
|
|
),
|
|
Some(&mut msg),
|
|
)
|
|
.await
|
|
.ok();
|
|
}
|
|
}
|
|
}
|
|
|
|
/// Generate an unique ID.
|
|
///
|
|
/// The generated ID should be short but unique:
|
|
/// - short, because it used in Chat-Group-ID headers and in QR codes
|
|
/// - unique as two IDs generated on two devices should not be the same
|
|
///
|
|
/// IDs generated by this function have 144 bits of entropy
|
|
/// and are returned as 24 Base64 characters, each containing 6 bits of entropy.
|
|
/// 144 is chosen because it is sufficiently secure
|
|
/// (larger than AES-128 keys used for message encryption)
|
|
/// and divides both by 8 (byte size) and 6 (number of bits in a single Base64 character).
|
|
pub(crate) fn create_id() -> String {
|
|
// Generate 144 random bits.
|
|
let mut arr = [0u8; 18];
|
|
rand::fill(&mut arr[..]);
|
|
|
|
base64::engine::general_purpose::URL_SAFE.encode(arr)
|
|
}
|
|
|
|
/// Generate a shared secret for a broadcast channel, consisting of 43 characters.
|
|
///
|
|
/// The string generated by this function has 258 bits of entropy
|
|
/// and is returned as 43 Base64 characters, each containing 6 bits of entropy.
|
|
/// 258 is chosen because we may switch to AES-256 keys in the future,
|
|
/// and so that the shared secret definitely won't be the weak spot.
|
|
pub(crate) fn create_broadcast_secret() -> String {
|
|
// ThreadRng implements CryptoRng trait and is supposed to be cryptographically secure.
|
|
// Generate 264 random bits.
|
|
let mut arr = [0u8; 33];
|
|
rand::fill(&mut arr[..]);
|
|
|
|
let mut res = base64::engine::general_purpose::URL_SAFE.encode(arr);
|
|
res.truncate(43);
|
|
res
|
|
}
|
|
|
|
/// Returns true if given string is a valid ID.
|
|
///
|
|
/// All IDs generated with `create_id()` should be considered valid.
|
|
pub(crate) fn validate_id(s: &str) -> bool {
|
|
let alphabet = base64::alphabet::URL_SAFE.as_str();
|
|
s.chars().all(|c| alphabet.contains(c)) && s.len() > 10 && s.len() <= 32
|
|
}
|
|
|
|
pub(crate) fn validate_broadcast_secret(s: &str) -> bool {
|
|
let alphabet = base64::alphabet::URL_SAFE.as_str();
|
|
s.chars().all(|c| alphabet.contains(c)) && s.len() >= 43 && s.len() <= 100
|
|
}
|
|
|
|
/// Function generates a Message-ID that can be used for a new outgoing message.
|
|
/// - this function is called for all outgoing messages.
|
|
/// - the message ID should be globally unique
|
|
/// - do not add a counter or any private data as this leaks information unnecessarily
|
|
pub(crate) fn create_outgoing_rfc724_mid() -> String {
|
|
// We use UUID similarly to iCloud web mail client
|
|
// because it seems their spam filter does not like Message-IDs
|
|
// without hyphens.
|
|
//
|
|
// However, we use `localhost` instead of the real domain to avoid
|
|
// leaking the domain when resent by otherwise anonymizing
|
|
// From-rewriting mailing lists and forwarders.
|
|
let uuid = Uuid::new_v4();
|
|
format!("{uuid}@localhost")
|
|
}
|
|
|
|
// the returned suffix is lower-case
|
|
pub fn get_filesuffix_lc(path_filename: &str) -> Option<String> {
|
|
Path::new(path_filename)
|
|
.extension()
|
|
.map(|p| p.to_string_lossy().to_lowercase())
|
|
}
|
|
|
|
/// Returns the `(width, height)` of the given image buffer.
|
|
pub fn get_filemeta(buf: &[u8]) -> Result<(u32, u32)> {
|
|
let image = image::ImageReader::new(Cursor::new(buf)).with_guessed_format()?;
|
|
let dimensions = image.into_dimensions()?;
|
|
Ok(dimensions)
|
|
}
|
|
|
|
/// Expand paths relative to $BLOBDIR into absolute paths.
|
|
///
|
|
/// If `path` starts with "$BLOBDIR", replaces it with the blobdir path.
|
|
/// Otherwise, returns path as is.
|
|
pub(crate) fn get_abs_path(context: &Context, path: &Path) -> PathBuf {
|
|
if let Ok(p) = path.strip_prefix("$BLOBDIR") {
|
|
context.get_blobdir().join(p)
|
|
} else {
|
|
path.into()
|
|
}
|
|
}
|
|
|
|
pub(crate) async fn get_filebytes(context: &Context, path: &Path) -> Result<u64> {
|
|
let path_abs = get_abs_path(context, path);
|
|
let meta = fs::metadata(&path_abs).await?;
|
|
Ok(meta.len())
|
|
}
|
|
|
|
pub(crate) async fn delete_file(context: &Context, path: &Path) -> Result<()> {
|
|
let path_abs = get_abs_path(context, path);
|
|
if !path_abs.exists() {
|
|
bail!("path {} does not exist", path_abs.display());
|
|
}
|
|
if !path_abs.is_file() {
|
|
warn!(context, "refusing to delete non-file {}.", path.display());
|
|
bail!("not a file: \"{}\"", path.display());
|
|
}
|
|
|
|
let dpath = format!("{}", path.to_string_lossy());
|
|
fs::remove_file(path_abs)
|
|
.await
|
|
.with_context(|| format!("cannot delete {dpath:?}"))?;
|
|
context.emit_event(EventType::DeletedBlobFile(dpath));
|
|
Ok(())
|
|
}
|
|
|
|
/// Create a safe name based on a messy input string.
|
|
///
|
|
/// The safe name will be a valid filename on Unix and Windows and
|
|
/// not contain any path separators. The input can contain path
|
|
/// segments separated by either Unix or Windows path separators,
|
|
/// the rightmost non-empty segment will be used as name,
|
|
/// sanitised for special characters.
|
|
pub(crate) fn sanitize_filename(mut name: &str) -> String {
|
|
for part in name.rsplit('/') {
|
|
if !part.is_empty() {
|
|
name = part;
|
|
break;
|
|
}
|
|
}
|
|
for part in name.rsplit('\\') {
|
|
if !part.is_empty() {
|
|
name = part;
|
|
break;
|
|
}
|
|
}
|
|
|
|
let opts = sanitize_filename::Options {
|
|
truncate: true,
|
|
windows: true,
|
|
replacement: "",
|
|
};
|
|
let name = sanitize_filename::sanitize_with_options(name, opts);
|
|
|
|
if name.starts_with('.') || name.is_empty() {
|
|
format!("file{name}")
|
|
} else {
|
|
name
|
|
}
|
|
}
|
|
|
|
/// A guard which will remove the path when dropped.
|
|
///
|
|
/// It implements [`Deref`] so it can be used as a `&Path`.
|
|
#[derive(Debug)]
|
|
pub(crate) struct TempPathGuard {
|
|
path: PathBuf,
|
|
}
|
|
|
|
impl TempPathGuard {
|
|
pub(crate) fn new(path: PathBuf) -> Self {
|
|
Self { path }
|
|
}
|
|
}
|
|
|
|
impl Drop for TempPathGuard {
|
|
fn drop(&mut self) {
|
|
let path = self.path.clone();
|
|
std::fs::remove_file(path).ok();
|
|
}
|
|
}
|
|
|
|
impl Deref for TempPathGuard {
|
|
type Target = Path;
|
|
|
|
fn deref(&self) -> &Self::Target {
|
|
&self.path
|
|
}
|
|
}
|
|
|
|
impl AsRef<Path> for TempPathGuard {
|
|
fn as_ref(&self) -> &Path {
|
|
self
|
|
}
|
|
}
|
|
|
|
pub(crate) async fn create_folder(context: &Context, path: &Path) -> Result<(), io::Error> {
|
|
let path_abs = get_abs_path(context, path);
|
|
if !path_abs.exists() {
|
|
match fs::create_dir_all(path_abs).await {
|
|
Ok(_) => Ok(()),
|
|
Err(err) => {
|
|
warn!(
|
|
context,
|
|
"Cannot create directory \"{}\": {}",
|
|
path.display(),
|
|
err
|
|
);
|
|
Err(err)
|
|
}
|
|
}
|
|
} else {
|
|
Ok(())
|
|
}
|
|
}
|
|
|
|
/// Write a the given content to provided file path.
|
|
pub(crate) async fn write_file(
|
|
context: &Context,
|
|
path: &Path,
|
|
buf: &[u8],
|
|
) -> Result<(), io::Error> {
|
|
let path_abs = get_abs_path(context, path);
|
|
fs::write(&path_abs, buf).await.map_err(|err| {
|
|
warn!(
|
|
context,
|
|
"Cannot write {} bytes to \"{}\": {}",
|
|
buf.len(),
|
|
path.display(),
|
|
err
|
|
);
|
|
err
|
|
})
|
|
}
|
|
|
|
/// Reads the file and returns its context as a byte vector.
|
|
pub async fn read_file(context: &Context, path: &Path) -> Result<Vec<u8>> {
|
|
let path_abs = get_abs_path(context, path);
|
|
|
|
match fs::read(&path_abs).await {
|
|
Ok(bytes) => Ok(bytes),
|
|
Err(err) => {
|
|
warn!(
|
|
context,
|
|
"Cannot read \"{}\" or file is empty: {}",
|
|
path.display(),
|
|
err
|
|
);
|
|
Err(err.into())
|
|
}
|
|
}
|
|
}
|
|
|
|
pub async fn open_file(context: &Context, path: &Path) -> Result<fs::File> {
|
|
let path_abs = get_abs_path(context, path);
|
|
|
|
match fs::File::open(&path_abs).await {
|
|
Ok(bytes) => Ok(bytes),
|
|
Err(err) => {
|
|
warn!(
|
|
context,
|
|
"Cannot read \"{}\" or file is empty: {}",
|
|
path.display(),
|
|
err
|
|
);
|
|
Err(err.into())
|
|
}
|
|
}
|
|
}
|
|
|
|
pub fn open_file_std(context: &Context, path: impl AsRef<Path>) -> Result<std::fs::File> {
|
|
let path_abs = get_abs_path(context, path.as_ref());
|
|
|
|
match std::fs::File::open(path_abs) {
|
|
Ok(bytes) => Ok(bytes),
|
|
Err(err) => {
|
|
warn!(
|
|
context,
|
|
"Cannot read \"{}\" or file is empty: {}",
|
|
path.as_ref().display(),
|
|
err
|
|
);
|
|
Err(err.into())
|
|
}
|
|
}
|
|
}
|
|
|
|
/// Reads directory and returns a vector of directory entries.
|
|
pub async fn read_dir(path: &Path) -> Result<Vec<fs::DirEntry>> {
|
|
let res = tokio_stream::wrappers::ReadDirStream::new(fs::read_dir(path).await?)
|
|
.try_collect()
|
|
.await?;
|
|
Ok(res)
|
|
}
|
|
|
|
pub(crate) fn time() -> i64 {
|
|
SystemTime::now()
|
|
.duration_since(SystemTime::UNIX_EPOCH)
|
|
.unwrap_or_default()
|
|
.as_secs() as i64
|
|
}
|
|
|
|
pub(crate) fn time_elapsed(time: &Time) -> Duration {
|
|
time.elapsed().unwrap_or_default()
|
|
}
|
|
|
|
/// Struct containing all mailto information
|
|
#[derive(Debug, Default, Eq, PartialEq)]
|
|
pub struct MailTo {
|
|
pub to: Vec<EmailAddress>,
|
|
pub subject: Option<String>,
|
|
pub body: Option<String>,
|
|
}
|
|
|
|
/// Parse mailto urls
|
|
pub fn parse_mailto(mailto_url: &str) -> Option<MailTo> {
|
|
if let Ok(url) = Url::parse(mailto_url) {
|
|
if url.scheme() == "mailto" {
|
|
let mut mailto: MailTo = Default::default();
|
|
// Extract the email address
|
|
url.path().split(',').for_each(|email| {
|
|
if let Ok(email) = EmailAddress::new(email) {
|
|
mailto.to.push(email);
|
|
}
|
|
});
|
|
|
|
// Extract query parameters
|
|
for (key, value) in url.query_pairs() {
|
|
if key == "subject" {
|
|
mailto.subject = Some(value.to_string());
|
|
} else if key == "body" {
|
|
mailto.body = Some(value.to_string());
|
|
}
|
|
}
|
|
Some(mailto)
|
|
} else {
|
|
None
|
|
}
|
|
} else {
|
|
None
|
|
}
|
|
}
|
|
|
|
pub(crate) trait IsNoneOrEmpty<T> {
|
|
/// Returns true if an Option does not contain a string
|
|
/// or contains an empty string.
|
|
fn is_none_or_empty(&self) -> bool;
|
|
}
|
|
impl<T> IsNoneOrEmpty<T> for Option<T>
|
|
where
|
|
T: AsRef<str>,
|
|
{
|
|
fn is_none_or_empty(&self) -> bool {
|
|
!matches!(self, Some(s) if !s.as_ref().is_empty())
|
|
}
|
|
}
|
|
|
|
pub(crate) trait ToOption<T> {
|
|
fn to_option(self) -> Option<T>;
|
|
}
|
|
impl<'a> ToOption<&'a str> for &'a String {
|
|
fn to_option(self) -> Option<&'a str> {
|
|
if self.is_empty() { None } else { Some(self) }
|
|
}
|
|
}
|
|
impl ToOption<String> for u16 {
|
|
fn to_option(self) -> Option<String> {
|
|
if self == 0 {
|
|
None
|
|
} else {
|
|
Some(self.to_string())
|
|
}
|
|
}
|
|
}
|
|
impl ToOption<String> for Option<i32> {
|
|
fn to_option(self) -> Option<String> {
|
|
match self {
|
|
None | Some(0) => None,
|
|
Some(v) => Some(v.to_string()),
|
|
}
|
|
}
|
|
}
|
|
|
|
pub fn remove_subject_prefix(last_subject: &str) -> String {
|
|
let subject_start = if last_subject.starts_with("Chat:") {
|
|
0
|
|
} else {
|
|
// "Antw:" is the longest abbreviation in
|
|
// <https://en.wikipedia.org/wiki/List_of_email_subject_abbreviations#Abbreviations_in_other_languages>,
|
|
// so look at the first _5_ characters:
|
|
match last_subject.chars().take(5).position(|c| c == ':') {
|
|
Some(prefix_end) => prefix_end + 1,
|
|
None => 0,
|
|
}
|
|
};
|
|
last_subject
|
|
.chars()
|
|
.skip(subject_start)
|
|
.collect::<String>()
|
|
.trim()
|
|
.to_string()
|
|
}
|
|
|
|
// Types and methods to create hop-info for message-info
|
|
|
|
fn extract_address_from_receive_header<'a>(header: &'a str, start: &str) -> Option<&'a str> {
|
|
let header_len = header.len();
|
|
header.find(start).and_then(|mut begin| {
|
|
begin += start.len();
|
|
let end = header
|
|
.get(begin..)?
|
|
.find(|c: char| c.is_whitespace())
|
|
.unwrap_or(header_len);
|
|
header.get(begin..begin + end)
|
|
})
|
|
}
|
|
|
|
pub(crate) fn parse_receive_header(header: &str) -> String {
|
|
let header = header.replace(&['\r', '\n'][..], "");
|
|
let mut hop_info = String::from("Hop: ");
|
|
|
|
if let Some(from) = extract_address_from_receive_header(&header, "from ") {
|
|
hop_info += &format!("From: {}; ", from.trim());
|
|
}
|
|
|
|
if let Some(by) = extract_address_from_receive_header(&header, "by ") {
|
|
hop_info += &format!("By: {}; ", by.trim());
|
|
}
|
|
|
|
if let Ok(date) = dateparse(&header) {
|
|
// In tests, use the UTC timezone so that the test is reproducible
|
|
#[cfg(test)]
|
|
let date_obj = chrono::Utc.timestamp_opt(date, 0).single();
|
|
#[cfg(not(test))]
|
|
let date_obj = Local.timestamp_opt(date, 0).single();
|
|
|
|
hop_info += &format!(
|
|
"Date: {}",
|
|
date_obj.map_or_else(|| "?".to_string(), |x| x.to_rfc2822())
|
|
);
|
|
};
|
|
|
|
hop_info
|
|
}
|
|
|
|
/// parses "receive"-headers
|
|
pub(crate) fn parse_receive_headers(headers: &Headers) -> String {
|
|
headers
|
|
.get_all_headers("Received")
|
|
.iter()
|
|
.rev()
|
|
.filter_map(|header_map_item| from_utf8(header_map_item.get_value_raw()).ok())
|
|
.map(parse_receive_header)
|
|
.collect::<Vec<_>>()
|
|
.join("\n")
|
|
}
|
|
|
|
/// If `collection` contains exactly one element, return this element.
|
|
/// Otherwise, return None.
|
|
pub(crate) fn single_value<T>(collection: impl IntoIterator<Item = T>) -> Option<T> {
|
|
let mut iter = collection.into_iter();
|
|
if let Some(value) = iter.next()
|
|
&& iter.next().is_none()
|
|
{
|
|
return Some(value);
|
|
}
|
|
None
|
|
}
|
|
|
|
/// Compressor/decompressor buffer size.
|
|
const BROTLI_BUFSZ: usize = 4096;
|
|
|
|
/// Compresses `buf` to `Vec` using `brotli`.
|
|
/// Note that it handles an empty `buf` as a special value that remains empty after compression,
|
|
/// otherwise brotli would add its metadata to it which is not nice because this function is used
|
|
/// for compression of strings stored in the db and empty strings are common there. This approach is
|
|
/// not strictly correct because nowhere in the brotli documentation is said that an empty buffer
|
|
/// can't be a result of compression of some input, but i think this will never break.
|
|
pub(crate) fn buf_compress(buf: &[u8]) -> Result<Vec<u8>> {
|
|
if buf.is_empty() {
|
|
return Ok(Vec::new());
|
|
}
|
|
// level 4 is 2x faster than level 6 (and 54x faster than 10, for comparison).
|
|
// with the adaptiveness, we aim to not slow down processing
|
|
// single large files too much, esp. on low-budget devices.
|
|
// in tests (see #4129), this makes a difference, without compressing much worse.
|
|
let q: u32 = if buf.len() > 1_000_000 { 4 } else { 6 };
|
|
let lgwin: u32 = 22; // log2(LZ77 window size), it's the default for brotli CLI tool.
|
|
let mut compressor = brotli::CompressorWriter::new(Vec::new(), BROTLI_BUFSZ, q, lgwin);
|
|
compressor.write_all(buf)?;
|
|
Ok(compressor.into_inner())
|
|
}
|
|
|
|
/// Decompresses `buf` to `Vec` using `brotli`.
|
|
/// See `buf_compress()` for why we don't pass an empty buffer to brotli decompressor.
|
|
pub(crate) fn buf_decompress(buf: &[u8]) -> Result<Vec<u8>> {
|
|
if buf.is_empty() {
|
|
return Ok(Vec::new());
|
|
}
|
|
let mut decompressor = brotli::DecompressorWriter::new(Vec::new(), BROTLI_BUFSZ);
|
|
decompressor.write_all(buf)?;
|
|
decompressor.flush()?;
|
|
Ok(mem::take(decompressor.get_mut()))
|
|
}
|
|
|
|
/// Returns the given `&str` if already lowercased to avoid allocation, otherwise lowercases it.
|
|
pub(crate) fn to_lowercase(s: &str) -> Cow<'_, str> {
|
|
match s.chars().all(char::is_lowercase) {
|
|
true => Cow::Borrowed(s),
|
|
false => Cow::Owned(s.to_lowercase()),
|
|
}
|
|
}
|
|
|
|
/// Returns text for storing in special db columns to make case-insensitive search possible for
|
|
/// non-ASCII messages, chat and contact names.
|
|
pub(crate) fn normalize_text(text: &str) -> Option<String> {
|
|
if text.is_ascii() {
|
|
return None;
|
|
};
|
|
Some(text.to_lowercase()).filter(|t| t != text)
|
|
}
|
|
|
|
/// Increments `*t` and checks that it equals to `expected` after that.
|
|
pub(crate) fn inc_and_check<T: PrimInt + AddAssign + std::fmt::Debug>(
|
|
t: &mut T,
|
|
expected: T,
|
|
) -> Result<()> {
|
|
*t += T::one();
|
|
ensure!(*t == expected, "Incremented value != {expected:?}");
|
|
Ok(())
|
|
}
|
|
|
|
/// Converts usize to u64 without using `as`.
|
|
///
|
|
/// This is needed for example to convert in-memory buffer sizes
|
|
/// to u64 type used for counting all the bytes written.
|
|
///
|
|
/// On 32-bit systems it is possible to have files
|
|
/// larger than 4 GiB or write more than 4 GiB to network connection,
|
|
/// in which case we need a 64-bit total counter,
|
|
/// but use 32-bit usize for buffer sizes.
|
|
///
|
|
/// This can only break if usize has more than 64 bits
|
|
/// and this is not the case as of 2025 and is
|
|
/// unlikely to change for general purpose computers.
|
|
/// See <https://github.com/rust-lang/rust/issues/30495>
|
|
/// and <https://users.rust-lang.org/t/cant-convert-usize-to-u64/6243>
|
|
/// and <https://github.com/rust-lang/rust/issues/106050>.
|
|
pub(crate) fn usize_to_u64(v: usize) -> u64 {
|
|
u64::try_from(v).unwrap_or(u64::MAX)
|
|
}
|
|
|
|
/// Returns early with an error if a condition is not satisfied.
|
|
/// In non-optimized builds, panics instead if so.
|
|
#[macro_export]
|
|
macro_rules! ensure_and_debug_assert {
|
|
($cond:expr, $($arg:tt)*) => {
|
|
let cond_val = $cond;
|
|
debug_assert!(cond_val, $($arg)*);
|
|
anyhow::ensure!(cond_val, $($arg)*);
|
|
};
|
|
}
|
|
|
|
/// Returns early with an error on two expressions inequality.
|
|
/// In non-optimized builds, panics instead if so.
|
|
#[macro_export]
|
|
macro_rules! ensure_and_debug_assert_eq {
|
|
($left:expr, $right:expr, $($arg:tt)*) => {
|
|
match (&$left, &$right) {
|
|
(left_val, right_val) => {
|
|
debug_assert_eq!(left_val, right_val, $($arg)*);
|
|
anyhow::ensure!(left_val == right_val, $($arg)*);
|
|
}
|
|
}
|
|
};
|
|
}
|
|
|
|
/// Returns early with an error on two expressions equality.
|
|
/// In non-optimized builds, panics instead if so.
|
|
#[macro_export]
|
|
macro_rules! ensure_and_debug_assert_ne {
|
|
($left:expr, $right:expr, $($arg:tt)*) => {
|
|
match (&$left, &$right) {
|
|
(left_val, right_val) => {
|
|
debug_assert_ne!(left_val, right_val, $($arg)*);
|
|
anyhow::ensure!(left_val != right_val, $($arg)*);
|
|
}
|
|
}
|
|
};
|
|
}
|
|
|
|
/// Logs a warning if a condition is not satisfied.
|
|
/// In non-optimized builds, panics also if so.
|
|
#[macro_export]
|
|
macro_rules! logged_debug_assert {
|
|
($ctx:expr, $cond:expr, $($arg:tt)*) => {
|
|
let cond_val = $cond;
|
|
if !cond_val {
|
|
warn!($ctx, $($arg)*);
|
|
}
|
|
debug_assert!(cond_val, $($arg)*);
|
|
};
|
|
}
|
|
|
|
#[cfg(test)]
|
|
mod tools_tests;
|