Clean up wgettext

Because wgettext stores strings forever, we can simply leak them onto the heap;
this cleans up some call sites and type signatures.
This commit is contained in:
ridiculousfish
2024-01-07 14:44:40 -08:00
parent 9aa5a97530
commit 1914c3a513
3 changed files with 50 additions and 44 deletions

View File

@@ -1,5 +1,4 @@
use std::{ use std::{
borrow::Cow,
cmp::Ordering, cmp::Ordering,
collections::{BTreeMap, HashMap, HashSet}, collections::{BTreeMap, HashMap, HashSet},
mem, mem,
@@ -14,7 +13,6 @@
use bitflags::bitflags; use bitflags::bitflags;
use once_cell::sync::Lazy; use once_cell::sync::Lazy;
use printf_compat::sprintf; use printf_compat::sprintf;
use widestring::U32CString;
use crate::{ use crate::{
abbrs::with_abbrs, abbrs::with_abbrs,
@@ -49,7 +47,7 @@
StringFuzzyMatch, StringFuzzyMatch,
}, },
wildcard::{wildcard_complete, wildcard_has, wildcard_match}, wildcard::{wildcard_complete, wildcard_has, wildcard_match},
wutil::{gettext::wgettext_impl_do_not_use_directly, wgettext, wrealpath}, wutil::{gettext::wgettext_str, wgettext, wrealpath},
}; };
// Completion description strings, mostly for different types of files, such as sockets, block // Completion description strings, mostly for different types of files, such as sockets, block
@@ -75,11 +73,7 @@ fn C_(s: &wstr) -> &'static wstr {
if s.is_empty() { if s.is_empty() {
L!("") L!("")
} else { } else {
wgettext_impl_do_not_use_directly(Cow::Owned( wgettext_str(s)
U32CString::from_ustr(s)
.expect("translation string without NUL bytes")
.into_vec_with_nul(),
))
} }
} }

View File

@@ -13,7 +13,7 @@
use crate::parser::Parser; use crate::parser::Parser;
use crate::parser_keywords::parser_keywords_is_reserved; use crate::parser_keywords::parser_keywords_is_reserved;
use crate::wchar::prelude::*; use crate::wchar::prelude::*;
use crate::wutil::{dir_iter::DirIter, gettext::wgettext_expr, sprintf}; use crate::wutil::{dir_iter::DirIter, gettext::wgettext_str, sprintf};
use once_cell::sync::Lazy; use once_cell::sync::Lazy;
use std::collections::{HashMap, HashSet}; use std::collections::{HashMap, HashSet};
use std::sync::{Arc, Mutex}; use std::sync::{Arc, Mutex};
@@ -347,7 +347,7 @@ pub fn localized_description(&self) -> &'static wstr {
if self.description.is_empty() { if self.description.is_empty() {
L!("") L!("")
} else { } else {
wgettext_expr!(&self.description) wgettext_str(&self.description)
} }
} }

View File

@@ -1,18 +1,14 @@
use std::borrow::Cow;
use std::collections::hash_map::Entry;
use std::collections::HashMap; use std::collections::HashMap;
use std::ffi::CString; use std::ffi::CString;
use std::pin::Pin;
use std::sync::Mutex; use std::sync::Mutex;
use crate::common::{charptr2wcstring, wcs2zstring}; use crate::common::{charptr2wcstring, truncate_at_nul, wcs2zstring};
use crate::fish::PACKAGE_NAME; use crate::fish::PACKAGE_NAME;
#[cfg(test)] #[cfg(test)]
use crate::tests::prelude::*; use crate::tests::prelude::*;
use crate::wchar::prelude::*; use crate::wchar::prelude::*;
use errno::{errno, set_errno}; use errno::{errno, set_errno};
use once_cell::sync::{Lazy, OnceCell}; use once_cell::sync::{Lazy, OnceCell};
use widestring::U32CString;
#[cfg(feature = "gettext")] #[cfg(feature = "gettext")]
mod internal { mod internal {
@@ -63,68 +59,84 @@ fn wgettext_init_if_necessary() {
INIT.get_or_init(wgettext_really_init); INIT.get_or_init(wgettext_really_init);
} }
/// A type that can be either a static or local string.
enum MaybeStatic<'a> {
Static(&'static wstr),
Local(&'a wstr),
}
/// Implementation detail for wgettext!. /// Implementation detail for wgettext!.
/// Wide character wrapper around the gettext function. For historic reasons, unlike the real /// Wide character wrapper around the gettext function. For historic reasons, unlike the real
/// gettext function, wgettext takes care of setting the correct domain, etc. using the textdomain /// gettext function, wgettext takes care of setting the correct domain, etc. using the textdomain
/// and bindtextdomain functions. This should probably be moved out of wgettext, so that wgettext /// and bindtextdomain functions. This should probably be moved out of wgettext, so that wgettext
/// will be nothing more than a wrapper around gettext, like all other functions in this file. /// will be nothing more than a wrapper around gettext, like all other functions in this file.
pub fn wgettext_impl_do_not_use_directly(text: Cow<'static, [u32]>) -> &'static wstr { fn wgettext_impl(text: MaybeStatic) -> &'static wstr {
assert_eq!(text.last(), Some(&0), "should be nul-terminated");
// Preserve errno across this since this is often used in printing error messages. // Preserve errno across this since this is often used in printing error messages.
let err = errno(); let err = errno();
wgettext_init_if_necessary(); wgettext_init_if_necessary();
#[allow(clippy::type_complexity)]
static WGETTEXT_MAP: Lazy<Mutex<HashMap<Cow<'static, [u32]>, Pin<Box<WString>>>>> = let key = match text {
MaybeStatic::Static(s) => s,
MaybeStatic::Local(s) => s,
};
debug_assert!(
truncate_at_nul(key).len() == key.len(),
"key should not contain NUL"
);
// Note that because entries are immortal, we simply leak non-static keys, and all values.
static WGETTEXT_MAP: Lazy<Mutex<HashMap<&'static wstr, &'static wstr>>> =
Lazy::new(|| Mutex::new(HashMap::new())); Lazy::new(|| Mutex::new(HashMap::new()));
let mut wmap = WGETTEXT_MAP.lock().unwrap(); let mut wmap = WGETTEXT_MAP.lock().unwrap();
let v = match wmap.entry(text) { let res = match wmap.get(key) {
Entry::Occupied(v) => Pin::get_ref(Pin::as_ref(v.get())) as *const WString, Some(v) => *v,
Entry::Vacant(v) => { None => {
let key = wstr::from_slice(v.key()).unwrap();
let mbs_in = wcs2zstring(key); let mbs_in = wcs2zstring(key);
let out = fish_gettext(&mbs_in); let out = fish_gettext(&mbs_in);
let out = charptr2wcstring(out); let out = charptr2wcstring(out);
let res = Pin::new(Box::new(out)); // Leak the value into the heap.
let value = v.insert(res); let value: &'static wstr = Box::leak(out.into_boxed_utfstr());
Pin::get_ref(Pin::as_ref(value)) as *const WString
// Get a static key, perhaps leaking it into the heap as well.
let key: &'static wstr = match text {
MaybeStatic::Static(s) => s,
MaybeStatic::Local(s) => wstr::from_char_slice(Box::leak(s.as_char_slice().into())),
};
wmap.insert(key, value);
value
} }
}; };
set_errno(err); set_errno(err);
// The returned string is stored in the map. res
// TODO: If we want to shrink the map, this would be a problem. }
unsafe { v.as_ref().unwrap() }.as_utfstr()
/// Get a (possibly translated) string from a literal.
/// Note this assumes that the string does not contain interior NUL characters -
/// this is checked in debug mode.
pub fn wgettext_static_str(s: &'static wstr) -> &'static wstr {
wgettext_impl(MaybeStatic::Static(s))
} }
/// Get a (possibly translated) string from a non-literal. /// Get a (possibly translated) string from a non-literal.
/// This truncates at the first NUL character.
pub fn wgettext_str(s: &wstr) -> &'static wstr { pub fn wgettext_str(s: &wstr) -> &'static wstr {
let cstr: U32CString = U32CString::from_chars_truncate(s.as_char_slice()); wgettext_impl(MaybeStatic::Local(truncate_at_nul(s)))
wgettext_impl_do_not_use_directly(Cow::Owned(cstr.into_vec_with_nul()))
} }
/// Get a (possibly translated) string from a string literal. /// Get a (possibly translated) string from a string literal.
/// This returns a &'static wstr. /// This returns a &'static wstr.
macro_rules! wgettext { macro_rules! wgettext {
($string:expr) => { ($string:expr) => {
crate::wutil::gettext::wgettext_impl_do_not_use_directly(std::borrow::Cow::Borrowed( crate::wutil::gettext::wgettext_static_str(widestring::utf32str!($string))
widestring::u32cstr!($string).as_slice_with_nul(),
))
}; };
} }
pub(crate) use wgettext; pub(crate) use wgettext;
/// Like wgettext, but for non-literals.
macro_rules! wgettext_expr {
($string:expr) => {
crate::wutil::gettext::wgettext_impl_do_not_use_directly(std::borrow::Cow::Owned(
widestring::U32CString::from_ustr_truncate($string).into_vec_with_nul(),
))
};
}
pub(crate) use wgettext_expr;
/// Like wgettext, but applies a sprintf format string. /// Like wgettext, but applies a sprintf format string.
/// The result is a WString. /// The result is a WString.
macro_rules! wgettext_fmt { macro_rules! wgettext_fmt {