// Copyright 2018-2024 the Deno authors. All rights reserved. MIT license. use std::borrow::Cow; use std::ops::Range; use std::sync::Arc; use base64::prelude::BASE64_STANDARD; use base64::Engine; use deno_core::ModuleSourceCode; static SOURCE_MAP_PREFIX: &[u8] = b"//# sourceMappingURL=data:application/json;base64,"; pub fn from_utf8_lossy_owned(bytes: Vec) -> String { match String::from_utf8_lossy(&bytes) { Cow::Owned(code) => code, // SAFETY: `String::from_utf8_lossy` guarantees that the result is valid // UTF-8 if `Cow::Borrowed` is returned. Cow::Borrowed(_) => unsafe { String::from_utf8_unchecked(bytes) }, } } pub fn source_map_from_code(code: &[u8]) -> Option> { let range = find_source_map_range(code)?; let source_map_range = &code[range]; let input = source_map_range.split_at(SOURCE_MAP_PREFIX.len()).1; let decoded_map = BASE64_STANDARD.decode(input).ok()?; Some(decoded_map) } /// Truncate the source code before the source map. pub fn code_without_source_map(code: ModuleSourceCode) -> ModuleSourceCode { use deno_core::ModuleCodeBytes; match code { ModuleSourceCode::String(mut code) => { if let Some(range) = find_source_map_range(code.as_bytes()) { code.truncate(range.start); } ModuleSourceCode::String(code) } ModuleSourceCode::Bytes(code) => { if let Some(range) = find_source_map_range(code.as_bytes()) { let source_map_index = range.start; ModuleSourceCode::Bytes(match code { ModuleCodeBytes::Static(bytes) => { ModuleCodeBytes::Static(&bytes[..source_map_index]) } ModuleCodeBytes::Boxed(bytes) => { // todo(dsherret): should be possible without cloning ModuleCodeBytes::Boxed( bytes[..source_map_index].to_vec().into_boxed_slice(), ) } ModuleCodeBytes::Arc(bytes) => ModuleCodeBytes::Boxed( bytes[..source_map_index].to_vec().into_boxed_slice(), ), }) } else { ModuleSourceCode::Bytes(code) } } } } fn find_source_map_range(code: &[u8]) -> Option> { fn last_non_blank_line_range(code: &[u8]) -> Option> { let mut hit_non_whitespace = false; let mut range_end = code.len(); for i in (0..code.len()).rev() { match code[i] { b' ' | b'\t' => { if !hit_non_whitespace { range_end = i; } } b'\n' | b'\r' => { if hit_non_whitespace { return Some(i + 1..range_end); } range_end = i; } _ => { hit_non_whitespace = true; } } } None } let range = last_non_blank_line_range(code)?; if code[range.start..range.end].starts_with(SOURCE_MAP_PREFIX) { Some(range) } else { None } } /// Converts an `Arc` to an `Arc<[u8]>`. #[allow(dead_code)] pub fn arc_str_to_bytes(arc_str: Arc) -> Arc<[u8]> { let raw = Arc::into_raw(arc_str); // SAFETY: This is safe because they have the same memory layout. unsafe { Arc::from_raw(raw as *const [u8]) } } /// Converts an `Arc` to an `Arc` if able. #[allow(dead_code)] pub fn arc_u8_to_arc_str( arc_u8: Arc<[u8]>, ) -> Result, std::str::Utf8Error> { // Check that the string is valid UTF-8. std::str::from_utf8(&arc_u8)?; // SAFETY: the string is valid UTF-8, and the layout Arc<[u8]> is the same as // Arc. This is proven by the From> impl for Arc<[u8]> from the // standard library. Ok(unsafe { std::mem::transmute::, std::sync::Arc>(arc_u8) }) } #[cfg(test)] mod tests { use std::sync::Arc; use deno_core::ModuleCodeBytes; use deno_core::ModuleCodeString; use super::*; #[test] fn test_source_map_from_code() { let to_string = |bytes: Vec| -> String { String::from_utf8(bytes).unwrap() }; assert_eq!( source_map_from_code( b"test\n//# sourceMappingURL=data:application/json;base64,dGVzdGluZ3Rlc3Rpbmc=", ).map(to_string), Some("testingtesting".to_string()) ); assert_eq!( source_map_from_code( b"test\n//# sourceMappingURL=data:application/json;base64,dGVzdGluZ3Rlc3Rpbmc=\n \n", ).map(to_string), Some("testingtesting".to_string()) ); assert_eq!( source_map_from_code( b"test\n//# sourceMappingURL=data:application/json;base64,dGVzdGluZ3Rlc3Rpbmc=\n test\n", ), None ); assert_eq!( source_map_from_code( b"\"use strict\"; throw new Error(\"Hello world!\"); //# sourceMappingURL=data:application/json;base64,{", ), None ); } #[test] fn test_source_without_source_map() { run_test("", ""); run_test("\n", "\n"); run_test("\r\n", "\r\n"); run_test("a", "a"); run_test("a\n", "a\n"); run_test("a\r\n", "a\r\n"); run_test("a\r\nb", "a\r\nb"); run_test("a\nb\n", "a\nb\n"); run_test("a\r\nb\r\n", "a\r\nb\r\n"); run_test( "test\n//# sourceMappingURL=data:application/json;base64,test", "test\n", ); run_test( "test\r\n//# sourceMappingURL=data:application/json;base64,test", "test\r\n", ); run_test( "\n//# sourceMappingURL=data:application/json;base64,test", "\n", ); run_test( "test\n//# sourceMappingURL=data:application/json;base64,test\n\n", "test\n", ); run_test( "test\n//# sourceMappingURL=data:application/json;base64,test\n \n ", "test\n", ); fn run_test(input: &'static str, output: &'static str) { let forms = [ ModuleSourceCode::String(ModuleCodeString::from_static(input)), ModuleSourceCode::String({ let text: Arc = input.into(); text.into() }), ModuleSourceCode::String({ let text: String = input.into(); text.into() }), ModuleSourceCode::Bytes(ModuleCodeBytes::Static(input.as_bytes())), ModuleSourceCode::Bytes(ModuleCodeBytes::Boxed( input.as_bytes().to_vec().into_boxed_slice(), )), ModuleSourceCode::Bytes(ModuleCodeBytes::Arc( input.as_bytes().to_vec().into(), )), ]; for form in forms { let result = code_without_source_map(form); let bytes = result.as_bytes(); assert_eq!(bytes, output.as_bytes()); } } } }