You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
134 lines
4.5 KiB
134 lines
4.5 KiB
use assert_matches::assert_matches;
|
|
use unicode_normalization::char::is_combining_mark;
|
|
|
|
/// https://github.com/servo/rust-url/issues/373
|
|
#[test]
|
|
fn test_punycode_prefix_with_length_check() {
|
|
let config = idna::Config::default()
|
|
.verify_dns_length(true)
|
|
.check_hyphens(true)
|
|
.use_std3_ascii_rules(true);
|
|
|
|
assert!(config.to_ascii("xn--").is_err());
|
|
assert!(config.to_ascii("xn---").is_err());
|
|
assert!(config.to_ascii("xn-----").is_err());
|
|
assert!(config.to_ascii("xn--.").is_err());
|
|
assert!(config.to_ascii("xn--...").is_err());
|
|
assert!(config.to_ascii(".xn--").is_err());
|
|
assert!(config.to_ascii("...xn--").is_err());
|
|
assert!(config.to_ascii("xn--.xn--").is_err());
|
|
assert!(config.to_ascii("xn--.example.org").is_err());
|
|
}
|
|
|
|
/// https://github.com/servo/rust-url/issues/373
|
|
#[test]
|
|
fn test_punycode_prefix_without_length_check() {
|
|
let config = idna::Config::default()
|
|
.verify_dns_length(false)
|
|
.check_hyphens(true)
|
|
.use_std3_ascii_rules(true);
|
|
|
|
assert_eq!(config.to_ascii("xn--").unwrap(), "");
|
|
assert!(config.to_ascii("xn---").is_err());
|
|
assert!(config.to_ascii("xn-----").is_err());
|
|
assert_eq!(config.to_ascii("xn--.").unwrap(), ".");
|
|
assert_eq!(config.to_ascii("xn--...").unwrap(), "...");
|
|
assert_eq!(config.to_ascii(".xn--").unwrap(), ".");
|
|
assert_eq!(config.to_ascii("...xn--").unwrap(), "...");
|
|
assert_eq!(config.to_ascii("xn--.xn--").unwrap(), ".");
|
|
assert_eq!(config.to_ascii("xn--.example.org").unwrap(), ".example.org");
|
|
}
|
|
|
|
// http://www.unicode.org/reports/tr46/#Table_Example_Processing
|
|
#[test]
|
|
fn test_examples() {
|
|
let mut codec = idna::Idna::default();
|
|
let mut out = String::new();
|
|
|
|
assert_matches!(codec.to_unicode("Bloß.de", &mut out), Ok(()));
|
|
assert_eq!(out, "bloß.de");
|
|
|
|
out.clear();
|
|
assert_matches!(codec.to_unicode("xn--blo-7ka.de", &mut out), Ok(()));
|
|
assert_eq!(out, "bloß.de");
|
|
|
|
out.clear();
|
|
assert_matches!(codec.to_unicode("u\u{308}.com", &mut out), Ok(()));
|
|
assert_eq!(out, "ü.com");
|
|
|
|
out.clear();
|
|
assert_matches!(codec.to_unicode("xn--tda.com", &mut out), Ok(()));
|
|
assert_eq!(out, "ü.com");
|
|
|
|
out.clear();
|
|
assert_matches!(codec.to_unicode("xn--u-ccb.com", &mut out), Err(_));
|
|
|
|
out.clear();
|
|
assert_matches!(codec.to_unicode("a⒈com", &mut out), Err(_));
|
|
|
|
out.clear();
|
|
assert_matches!(codec.to_unicode("xn--a-ecp.ru", &mut out), Err(_));
|
|
|
|
out.clear();
|
|
assert_matches!(codec.to_unicode("xn--0.pt", &mut out), Err(_));
|
|
|
|
out.clear();
|
|
assert_matches!(codec.to_unicode("日本語。JP", &mut out), Ok(()));
|
|
assert_eq!(out, "日本語.jp");
|
|
|
|
out.clear();
|
|
assert_matches!(codec.to_unicode("☕.us", &mut out), Ok(()));
|
|
assert_eq!(out, "☕.us");
|
|
}
|
|
|
|
#[test]
|
|
fn test_v5() {
|
|
let config = idna::Config::default()
|
|
.verify_dns_length(true)
|
|
.use_std3_ascii_rules(true);
|
|
|
|
// IdnaTest:784 蔏。𑰺
|
|
assert!(is_combining_mark('\u{11C3A}'));
|
|
assert!(config.to_ascii("\u{11C3A}").is_err());
|
|
assert!(config.to_ascii("\u{850f}.\u{11C3A}").is_err());
|
|
assert!(config.to_ascii("\u{850f}\u{ff61}\u{11C3A}").is_err());
|
|
}
|
|
|
|
#[test]
|
|
fn test_v8_bidi_rules() {
|
|
let config = idna::Config::default()
|
|
.verify_dns_length(true)
|
|
.use_std3_ascii_rules(true);
|
|
|
|
assert_eq!(config.to_ascii("abc").unwrap(), "abc");
|
|
assert_eq!(config.to_ascii("123").unwrap(), "123");
|
|
assert_eq!(config.to_ascii("אבּג").unwrap(), "xn--kdb3bdf");
|
|
assert_eq!(config.to_ascii("ابج").unwrap(), "xn--mgbcm");
|
|
assert_eq!(config.to_ascii("abc.ابج").unwrap(), "abc.xn--mgbcm");
|
|
assert_eq!(config.to_ascii("אבּג.ابج").unwrap(), "xn--kdb3bdf.xn--mgbcm");
|
|
|
|
// Bidi domain names cannot start with digits
|
|
assert!(config.to_ascii("0a.\u{05D0}").is_err());
|
|
assert!(config.to_ascii("0à.\u{05D0}").is_err());
|
|
|
|
// Bidi chars may be punycode-encoded
|
|
assert!(config.to_ascii("xn--0ca24w").is_err());
|
|
}
|
|
|
|
#[test]
|
|
fn emoji_domains() {
|
|
// HOT BEVERAGE is allowed here...
|
|
let config = idna::Config::default()
|
|
.verify_dns_length(true)
|
|
.use_std3_ascii_rules(true);
|
|
assert_eq!(config.to_ascii("☕.com").unwrap(), "xn--53h.com");
|
|
|
|
// ... but not here
|
|
let config = idna::Config::default()
|
|
.verify_dns_length(true)
|
|
.use_std3_ascii_rules(true)
|
|
.use_idna_2008_rules(true);
|
|
let error = format!("{:?}", config.to_ascii("☕.com").unwrap_err());
|
|
assert!(error.contains("disallowed_in_idna_2008"));
|
|
}
|