2024-01-01 14:58:21 -05:00
|
|
|
// Copyright 2018-2024 the Deno authors. All rights reserved. MIT license.
|
2023-02-20 18:47:42 +01:00
|
|
|
|
2023-09-14 08:29:44 +02:00
|
|
|
use deno_core::op2;
|
2023-02-20 18:47:42 +01:00
|
|
|
|
2024-03-11 15:49:43 -07:00
|
|
|
use std::borrow::Cow;
|
|
|
|
|
|
|
|
// map_domain, to_ascii and to_unicode are based on the punycode implementation in node.js
|
|
|
|
// https://github.com/nodejs/node/blob/73025c4dec042e344eeea7912ed39f7b7c4a3991/lib/punycode.js
|
|
|
|
|
|
|
|
/// Prefix marking a punycode-encoded label: `to_ascii` prepends it to every
/// label it encodes and `to_unicode` only decodes labels that start with it.
const PUNY_PREFIX: &str = "xn--";
|
|
|
|
|
2024-10-24 10:45:17 -07:00
|
|
|
#[derive(Debug, thiserror::Error)]
|
|
|
|
pub enum IdnaError {
|
|
|
|
#[error("Invalid input")]
|
|
|
|
InvalidInput,
|
|
|
|
#[error("Input would take more than 63 characters to encode")]
|
|
|
|
InputTooLong,
|
|
|
|
#[error("Illegal input >= 0x80 (not a basic code point)")]
|
|
|
|
IllegalInput,
|
2024-03-11 15:49:43 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
/// map a domain by mapping each label with the given function
|
2024-10-24 10:45:17 -07:00
|
|
|
fn map_domain(
|
2024-03-11 15:49:43 -07:00
|
|
|
domain: &str,
|
2024-10-24 10:45:17 -07:00
|
|
|
f: impl Fn(&str) -> Result<Cow<'_, str>, IdnaError>,
|
|
|
|
) -> Result<String, IdnaError> {
|
2024-03-11 15:49:43 -07:00
|
|
|
let mut result = String::with_capacity(domain.len());
|
|
|
|
let mut domain = domain;
|
|
|
|
|
|
|
|
// if it's an email, leave the local part as is
|
|
|
|
let mut parts = domain.split('@');
|
|
|
|
if let (Some(local), Some(remaining)) = (parts.next(), parts.next()) {
|
|
|
|
result.push_str(local);
|
|
|
|
result.push('@');
|
|
|
|
domain = remaining;
|
|
|
|
}
|
|
|
|
|
|
|
|
// split into labels and map each one
|
|
|
|
for (i, label) in domain.split('.').enumerate() {
|
|
|
|
if i > 0 {
|
|
|
|
result.push('.');
|
|
|
|
}
|
|
|
|
result.push_str(&f(label)?);
|
|
|
|
}
|
|
|
|
Ok(result)
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Maps a unicode domain to ascii by punycode encoding each label
|
|
|
|
///
|
|
|
|
/// Note this is not IDNA2003 or IDNA2008 compliant, rather it matches node.js's punycode implementation
|
2024-10-24 10:45:17 -07:00
|
|
|
fn to_ascii(input: &str) -> Result<String, IdnaError> {
|
2024-03-11 15:49:43 -07:00
|
|
|
if input.is_ascii() {
|
|
|
|
return Ok(input.into());
|
|
|
|
}
|
|
|
|
|
|
|
|
let mut result = String::with_capacity(input.len()); // at least as long as input
|
|
|
|
|
|
|
|
let rest = map_domain(input, |label| {
|
|
|
|
if label.is_ascii() {
|
|
|
|
Ok(label.into())
|
|
|
|
} else {
|
|
|
|
idna::punycode::encode_str(label)
|
|
|
|
.map(|encoded| [PUNY_PREFIX, &encoded].join("").into()) // add the prefix
|
2024-10-24 10:45:17 -07:00
|
|
|
.ok_or(IdnaError::InputTooLong) // only error possible per the docs
|
2024-03-11 15:49:43 -07:00
|
|
|
}
|
|
|
|
})?;
|
|
|
|
|
|
|
|
result.push_str(&rest);
|
|
|
|
Ok(result)
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Maps an ascii domain to unicode by punycode decoding each label
|
|
|
|
///
|
|
|
|
/// Note this is not IDNA2003 or IDNA2008 compliant, rather it matches node.js's punycode implementation
|
2024-10-24 10:45:17 -07:00
|
|
|
fn to_unicode(input: &str) -> Result<String, IdnaError> {
|
2024-03-11 15:49:43 -07:00
|
|
|
map_domain(input, |s| {
|
|
|
|
if let Some(puny) = s.strip_prefix(PUNY_PREFIX) {
|
|
|
|
// it's a punycode encoded label
|
|
|
|
Ok(
|
|
|
|
idna::punycode::decode_to_string(&puny.to_lowercase())
|
2024-10-24 10:45:17 -07:00
|
|
|
.ok_or(IdnaError::InvalidInput)?
|
2024-03-11 15:49:43 -07:00
|
|
|
.into(),
|
|
|
|
)
|
|
|
|
} else {
|
|
|
|
Ok(s.into())
|
|
|
|
}
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Converts a domain to unicode with behavior that is
|
|
|
|
/// compatible with the `punycode` module in node.js
|
|
|
|
#[op2]
|
|
|
|
#[string]
|
|
|
|
pub fn op_node_idna_punycode_to_ascii(
|
|
|
|
#[string] domain: String,
|
2024-10-24 10:45:17 -07:00
|
|
|
) -> Result<String, IdnaError> {
|
2024-03-11 15:49:43 -07:00
|
|
|
to_ascii(&domain)
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Converts a domain to ASCII with behavior that is
|
|
|
|
/// compatible with the `punycode` module in node.js
|
|
|
|
#[op2]
|
|
|
|
#[string]
|
|
|
|
pub fn op_node_idna_punycode_to_unicode(
|
|
|
|
#[string] domain: String,
|
2024-10-24 10:45:17 -07:00
|
|
|
) -> Result<String, IdnaError> {
|
2024-03-11 15:49:43 -07:00
|
|
|
to_unicode(&domain)
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Converts a domain to ASCII as per the IDNA spec
|
|
|
|
/// (specifically UTS #46)
|
2023-09-14 08:29:44 +02:00
|
|
|
#[op2]
|
|
|
|
#[string]
|
2023-02-20 18:47:42 +01:00
|
|
|
pub fn op_node_idna_domain_to_ascii(
|
2023-09-14 08:29:44 +02:00
|
|
|
#[string] domain: String,
|
2024-10-24 10:45:17 -07:00
|
|
|
) -> Result<String, idna::Errors> {
|
|
|
|
idna::domain_to_ascii(&domain)
|
2023-02-20 18:47:42 +01:00
|
|
|
}
|
|
|
|
|
2024-03-11 15:49:43 -07:00
|
|
|
/// Converts a domain to Unicode as per the IDNA spec
|
|
|
|
/// (specifically UTS #46)
|
2023-09-14 08:29:44 +02:00
|
|
|
#[op2]
|
|
|
|
#[string]
|
|
|
|
pub fn op_node_idna_domain_to_unicode(#[string] domain: String) -> String {
|
2023-02-20 18:47:42 +01:00
|
|
|
idna::domain_to_unicode(&domain).0
|
|
|
|
}
|
|
|
|
|
2023-09-14 08:29:44 +02:00
|
|
|
#[op2]
|
|
|
|
#[string]
|
2024-03-11 15:49:43 -07:00
|
|
|
pub fn op_node_idna_punycode_decode(
|
|
|
|
#[string] domain: String,
|
2024-10-24 10:45:17 -07:00
|
|
|
) -> Result<String, IdnaError> {
|
2024-03-11 15:49:43 -07:00
|
|
|
if domain.is_empty() {
|
|
|
|
return Ok(domain);
|
|
|
|
}
|
|
|
|
|
|
|
|
// all code points before the last delimiter must be basic
|
|
|
|
// see https://github.com/nodejs/node/blob/73025c4dec042e344eeea7912ed39f7b7c4a3991/lib/punycode.js#L215-L227
|
|
|
|
let last_dash = domain.len()
|
|
|
|
- 1
|
|
|
|
- domain
|
|
|
|
.bytes()
|
|
|
|
.rev()
|
|
|
|
.position(|b| b == b'-')
|
|
|
|
.unwrap_or(domain.len() - 1);
|
|
|
|
|
|
|
|
if !domain[..last_dash].is_ascii() {
|
2024-10-24 10:45:17 -07:00
|
|
|
return Err(IdnaError::IllegalInput);
|
2024-03-11 15:49:43 -07:00
|
|
|
}
|
|
|
|
|
2024-10-24 10:45:17 -07:00
|
|
|
idna::punycode::decode_to_string(&domain).ok_or(IdnaError::InvalidInput)
|
2023-02-20 18:47:42 +01:00
|
|
|
}
|
|
|
|
|
2023-09-14 08:29:44 +02:00
|
|
|
#[op2]
|
|
|
|
#[string]
|
|
|
|
pub fn op_node_idna_punycode_encode(#[string] domain: String) -> String {
|
2023-02-20 18:47:42 +01:00
|
|
|
idna::punycode::encode_str(&domain).unwrap_or_default()
|
|
|
|
}
|