1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
use once_cell::sync::Lazy;
use rand::{distributions::Alphanumeric, thread_rng, Rng};
use regex::Regex;

/// Lazily compiled pattern describing the language tag shape accepted by
/// [`is_ietf_language_code_like`].
///
/// The whole input must consist of, joined by hyphens:
/// - a language subtag of two or three lowercase ASCII letters,
/// - an optional script subtag of one uppercase followed by three lowercase ASCII letters,
/// - a region subtag of exactly two uppercase ASCII letters.
static IETF_LANGUAGE_CODE_REGEX: Lazy<Regex> = Lazy::new(|| {
    const PATTERN: &str = r"^[a-z]{2,3}(-[A-Z][a-z]{3})?-[A-Z]{2}$";

    // The pattern is a compile-time constant, so a failure here is a programming error.
    Regex::new(PATTERN).expect("Invalid IETF language code regex.")
});

/// Generates a random string of exactly `length` characters.
///
/// Every character is sampled from [`Alphanumeric`], i.e. the ASCII letters `a-z`, `A-Z` and
/// the digits `0-9`. A `length` of zero yields an empty string.
pub fn generate_random_string(length: usize) -> String {
    let rng = thread_rng();
    let sampled_bytes = rng.sample_iter(Alphanumeric).take(length);

    // `Alphanumeric` yields ASCII bytes, so each one converts losslessly into a `char`.
    sampled_bytes.map(char::from).collect()
}

/// Generates a random string of exactly `length` characters that is easy to read aloud or
/// copy by hand.
///
/// Only lowercase ASCII letters and digits are used, and the look-alike characters `l`, `1`,
/// `o` and `0` are never produced. A `length` of zero yields an empty string.
pub fn generate_easily_writable_random_string(length: usize) -> String {
    let is_easily_writable = |byte: &u8| {
        let lowercase_or_digit = byte.is_ascii_lowercase() || byte.is_ascii_digit();
        // Characters that might be confused with each other are excluded.
        let ambiguous = matches!(*byte, b'l' | b'1' | b'o' | b'0');
        lowercase_or_digit && !ambiguous
    };

    // Unsuitable samples are discarded *before* `take`, so the result always has `length`
    // characters.
    let rng = thread_rng();
    rng.sample_iter(Alphanumeric)
        .filter(is_easily_writable)
        .take(length)
        .map(char::from)
        .collect()
}

/// Checks whether the string is shaped like an IETF language code whose subtags are separated
/// with hyphens.
///
/// The accepted shape is a two- or three-letter lowercase language subtag, an optional
/// four-letter title-case script subtag, and a two-letter uppercase region subtag, e.g.
/// `en-US` or `in-Cans-CA`. Underscore-separated input such as `en_US`, a bare language such
/// as `en`, and wrongly cased subtags such as `in-cans-ca` are all rejected.
///
/// Only the shape is checked; the subtags are not looked up in any registry.
pub fn is_ietf_language_code_like(string: &str) -> bool {
    IETF_LANGUAGE_CODE_REGEX.is_match(string)
}

#[cfg(test)]
mod test {
    use super::*;

    /// Exercises `is_ietf_language_code_like` against tables of rejected and accepted inputs,
    /// reporting the offending input when an expectation fails.
    #[test]
    fn ietf_language_code_validation_works() {
        // Invalid scenarios
        let rejected = [
            // Empty input and a language subtag without a region.
            "",
            "en",
            // Underscore is not an accepted separator.
            "en_us",
            "en_US",
            // Wrongly cased script and/or region subtags.
            "in-cans",
            "in-cans-ca",
            "in-CANS-CA",
            "en-us",
            // Language subtag must be lowercase and two or three letters long.
            "EN-US",
            "engl-US",
            // Region subtag must be exactly two letters.
            "en-USA",
            // A script subtag alone does not replace the mandatory region.
            "en-Latn",
        ];
        for code in rejected.iter().copied() {
            assert!(
                !is_ietf_language_code_like(code),
                "{:?} should be rejected",
                code
            );
        }

        // Valid scenarios
        let accepted = [
            "en-US",
            "in-Cans-CA",
            // Three-letter language subtag.
            "fil-PH",
            // Three-letter language subtag combined with a script subtag.
            "yue-Hant-HK",
        ];
        for code in accepted.iter().copied() {
            assert!(
                is_ietf_language_code_like(code),
                "{:?} should be accepted",
                code
            );
        }
    }
}