2024-10-24 15:48:48 -04:00
|
|
|
// Copyright 2018-2024 the Deno authors. All rights reserved. MIT license.
|
|
|
|
|
|
|
|
use std::borrow::Cow;
|
2024-12-16 19:20:53 -05:00
|
|
|
use std::cell::Cell;
|
2024-10-24 15:48:48 -04:00
|
|
|
use std::collections::BTreeMap;
|
|
|
|
use std::collections::HashMap;
|
|
|
|
use std::io::Write;
|
|
|
|
|
2024-12-20 16:14:37 -05:00
|
|
|
use capacity_builder::BytesAppendable;
|
2024-12-19 12:53:52 -05:00
|
|
|
use deno_ast::swc::common::source_map;
|
2024-10-24 15:48:48 -04:00
|
|
|
use deno_ast::MediaType;
|
|
|
|
use deno_core::anyhow::bail;
|
|
|
|
use deno_core::anyhow::Context;
|
|
|
|
use deno_core::error::AnyError;
|
|
|
|
use deno_core::serde_json;
|
|
|
|
use deno_core::url::Url;
|
|
|
|
use deno_core::FastString;
|
|
|
|
use deno_core::ModuleSourceCode;
|
|
|
|
use deno_core::ModuleType;
|
|
|
|
use deno_npm::resolution::SerializedNpmResolutionSnapshot;
|
|
|
|
use deno_npm::resolution::SerializedNpmResolutionSnapshotPackage;
|
|
|
|
use deno_npm::resolution::ValidSerializedNpmResolutionSnapshot;
|
|
|
|
use deno_npm::NpmPackageId;
|
|
|
|
use deno_semver::package::PackageReq;
|
2024-12-20 16:14:37 -05:00
|
|
|
use deno_semver::StackString;
|
2024-12-19 12:53:52 -05:00
|
|
|
use indexmap::IndexMap;
|
2024-10-24 15:48:48 -04:00
|
|
|
|
|
|
|
use crate::standalone::virtual_fs::VirtualDirectory;
|
|
|
|
|
|
|
|
use super::binary::Metadata;
|
2024-12-12 13:07:35 -05:00
|
|
|
use super::virtual_fs::BuiltVfs;
|
2024-10-24 15:48:48 -04:00
|
|
|
use super::virtual_fs::VfsBuilder;
|
2024-12-19 12:53:52 -05:00
|
|
|
use super::virtual_fs::VirtualDirectoryEntries;
|
2024-10-24 15:48:48 -04:00
|
|
|
|
|
|
|
/// Marker written at both the start and the end of the serialized data
/// section; the deserializer checks for it at each end.
const MAGIC_BYTES: &[u8; 8] = b"d3n0l4nd";
|
|
|
|
|
|
|
|
/// Binary format:
|
|
|
|
/// * d3n0l4nd
|
|
|
|
/// * <metadata_len><metadata>
|
|
|
|
/// * <npm_snapshot_len><npm_snapshot>
|
2024-12-19 12:53:52 -05:00
|
|
|
/// * <remote_modules>
|
2024-10-24 15:48:48 -04:00
|
|
|
/// * <vfs_headers_len><vfs_headers>
|
|
|
|
/// * <vfs_file_data_len><vfs_file_data>
|
2024-12-19 12:53:52 -05:00
|
|
|
/// * <source_map_data>
|
2024-10-24 15:48:48 -04:00
|
|
|
/// * d3n0l4nd
|
|
|
|
pub fn serialize_binary_data_section(
|
|
|
|
metadata: &Metadata,
|
|
|
|
npm_snapshot: Option<SerializedNpmResolutionSnapshot>,
|
|
|
|
remote_modules: &RemoteModulesStoreBuilder,
|
2024-12-19 12:53:52 -05:00
|
|
|
source_map_store: &SourceMapStore,
|
2024-12-12 13:07:35 -05:00
|
|
|
vfs: &BuiltVfs,
|
2024-10-24 15:48:48 -04:00
|
|
|
) -> Result<Vec<u8>, AnyError> {
|
2024-12-16 19:20:53 -05:00
|
|
|
let metadata = serde_json::to_string(metadata)?;
|
|
|
|
let npm_snapshot =
|
|
|
|
npm_snapshot.map(serialize_npm_snapshot).unwrap_or_default();
|
2024-12-19 12:53:52 -05:00
|
|
|
let serialized_vfs = serde_json::to_string(&vfs.entries)?;
|
2024-12-16 19:20:53 -05:00
|
|
|
|
|
|
|
let bytes = capacity_builder::BytesBuilder::build(|builder| {
|
|
|
|
builder.append(MAGIC_BYTES);
|
|
|
|
// 1. Metadata
|
|
|
|
{
|
|
|
|
builder.append_le(metadata.len() as u64);
|
|
|
|
builder.append(&metadata);
|
|
|
|
}
|
|
|
|
// 2. Npm snapshot
|
|
|
|
{
|
|
|
|
builder.append_le(npm_snapshot.len() as u64);
|
|
|
|
builder.append(&npm_snapshot);
|
|
|
|
}
|
|
|
|
// 3. Remote modules
|
|
|
|
{
|
|
|
|
remote_modules.write(builder);
|
|
|
|
}
|
|
|
|
// 4. VFS
|
|
|
|
{
|
|
|
|
builder.append_le(serialized_vfs.len() as u64);
|
|
|
|
builder.append(&serialized_vfs);
|
|
|
|
let vfs_bytes_len = vfs.files.iter().map(|f| f.len() as u64).sum::<u64>();
|
|
|
|
builder.append_le(vfs_bytes_len);
|
|
|
|
for file in &vfs.files {
|
|
|
|
builder.append(file);
|
|
|
|
}
|
2024-10-24 15:48:48 -04:00
|
|
|
}
|
2024-12-19 12:53:52 -05:00
|
|
|
// 5. Source maps
|
|
|
|
{
|
|
|
|
builder.append_le(source_map_store.data.len() as u32);
|
|
|
|
for (specifier, source_map) in &source_map_store.data {
|
|
|
|
builder.append_le(specifier.len() as u32);
|
|
|
|
builder.append(specifier);
|
|
|
|
builder.append_le(source_map.len() as u32);
|
2024-12-20 12:43:03 -05:00
|
|
|
builder.append(source_map.as_ref());
|
2024-12-19 12:53:52 -05:00
|
|
|
}
|
|
|
|
}
|
2024-10-24 15:48:48 -04:00
|
|
|
|
2024-12-16 19:20:53 -05:00
|
|
|
// write the magic bytes at the end so we can use it
|
|
|
|
// to make sure we've deserialized correctly
|
|
|
|
builder.append(MAGIC_BYTES);
|
|
|
|
})?;
|
2024-10-24 15:48:48 -04:00
|
|
|
|
|
|
|
Ok(bytes)
|
|
|
|
}
|
|
|
|
|
|
|
|
pub struct DeserializedDataSection {
|
|
|
|
pub metadata: Metadata,
|
|
|
|
pub npm_snapshot: Option<ValidSerializedNpmResolutionSnapshot>,
|
|
|
|
pub remote_modules: RemoteModulesStore,
|
2024-12-19 12:53:52 -05:00
|
|
|
pub source_maps: SourceMapStore,
|
|
|
|
pub vfs_root_entries: VirtualDirectoryEntries,
|
2024-10-24 15:48:48 -04:00
|
|
|
pub vfs_files_data: &'static [u8],
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn deserialize_binary_data_section(
|
|
|
|
data: &'static [u8],
|
|
|
|
) -> Result<Option<DeserializedDataSection>, AnyError> {
|
|
|
|
fn read_magic_bytes(input: &[u8]) -> Result<(&[u8], bool), AnyError> {
|
|
|
|
if input.len() < MAGIC_BYTES.len() {
|
|
|
|
bail!("Unexpected end of data. Could not find magic bytes.");
|
|
|
|
}
|
|
|
|
let (magic_bytes, input) = input.split_at(MAGIC_BYTES.len());
|
|
|
|
if magic_bytes != MAGIC_BYTES {
|
|
|
|
return Ok((input, false));
|
|
|
|
}
|
|
|
|
Ok((input, true))
|
|
|
|
}
|
|
|
|
|
2024-12-19 12:53:52 -05:00
|
|
|
#[allow(clippy::type_complexity)]
|
|
|
|
fn read_source_map_entry(
|
|
|
|
input: &[u8],
|
2024-12-20 12:43:03 -05:00
|
|
|
) -> Result<(&[u8], (Cow<str>, &[u8])), AnyError> {
|
2024-12-19 12:53:52 -05:00
|
|
|
let (input, specifier) = read_string_lossy(input)?;
|
2024-12-20 12:43:03 -05:00
|
|
|
let (input, source_map) = read_bytes_with_u32_len(input)?;
|
2024-12-19 12:53:52 -05:00
|
|
|
Ok((input, (specifier, source_map)))
|
|
|
|
}
|
|
|
|
|
2024-10-24 15:48:48 -04:00
|
|
|
let (input, found) = read_magic_bytes(data)?;
|
|
|
|
if !found {
|
|
|
|
return Ok(None);
|
|
|
|
}
|
|
|
|
|
|
|
|
// 1. Metadata
|
2024-12-19 12:53:52 -05:00
|
|
|
let (input, data) =
|
|
|
|
read_bytes_with_u64_len(input).context("reading metadata")?;
|
2024-10-24 15:48:48 -04:00
|
|
|
let metadata: Metadata =
|
|
|
|
serde_json::from_slice(data).context("deserializing metadata")?;
|
|
|
|
// 2. Npm snapshot
|
|
|
|
let (input, data) =
|
2024-12-19 12:53:52 -05:00
|
|
|
read_bytes_with_u64_len(input).context("reading npm snapshot")?;
|
2024-10-24 15:48:48 -04:00
|
|
|
let npm_snapshot = if data.is_empty() {
|
|
|
|
None
|
|
|
|
} else {
|
|
|
|
Some(deserialize_npm_snapshot(data).context("deserializing npm snapshot")?)
|
|
|
|
};
|
|
|
|
// 3. Remote modules
|
2024-12-19 12:53:52 -05:00
|
|
|
let (input, remote_modules) =
|
|
|
|
RemoteModulesStore::build(input).context("deserializing remote modules")?;
|
2024-10-24 15:48:48 -04:00
|
|
|
// 4. VFS
|
2024-12-19 12:53:52 -05:00
|
|
|
let (input, data) = read_bytes_with_u64_len(input).context("vfs")?;
|
|
|
|
let vfs_root_entries: VirtualDirectoryEntries =
|
2024-10-24 15:48:48 -04:00
|
|
|
serde_json::from_slice(data).context("deserializing vfs data")?;
|
|
|
|
let (input, vfs_files_data) =
|
2024-12-19 12:53:52 -05:00
|
|
|
read_bytes_with_u64_len(input).context("reading vfs files data")?;
|
|
|
|
// 5. Source maps
|
|
|
|
let (mut input, source_map_data_len) = read_u32_as_usize(input)?;
|
|
|
|
let mut source_maps = SourceMapStore::with_capacity(source_map_data_len);
|
|
|
|
for _ in 0..source_map_data_len {
|
|
|
|
let (current_input, (specifier, source_map)) =
|
|
|
|
read_source_map_entry(input)?;
|
|
|
|
input = current_input;
|
2024-12-20 12:43:03 -05:00
|
|
|
source_maps.add(specifier, Cow::Borrowed(source_map));
|
2024-12-19 12:53:52 -05:00
|
|
|
}
|
2024-10-24 15:48:48 -04:00
|
|
|
|
|
|
|
// finally ensure we read the magic bytes at the end
|
|
|
|
let (_input, found) = read_magic_bytes(input)?;
|
|
|
|
if !found {
|
|
|
|
bail!("Could not find magic bytes at the end of the data.");
|
|
|
|
}
|
|
|
|
|
|
|
|
Ok(Some(DeserializedDataSection {
|
|
|
|
metadata,
|
|
|
|
npm_snapshot,
|
|
|
|
remote_modules,
|
2024-12-19 12:53:52 -05:00
|
|
|
source_maps,
|
|
|
|
vfs_root_entries,
|
2024-10-24 15:48:48 -04:00
|
|
|
vfs_files_data,
|
|
|
|
}))
|
|
|
|
}
|
|
|
|
|
|
|
|
#[derive(Default)]
|
|
|
|
pub struct RemoteModulesStoreBuilder {
|
|
|
|
specifiers: Vec<(String, u64)>,
|
2024-12-19 12:53:52 -05:00
|
|
|
data: Vec<(MediaType, Vec<u8>, Option<Vec<u8>>)>,
|
2024-10-24 15:48:48 -04:00
|
|
|
data_byte_len: u64,
|
|
|
|
redirects: Vec<(String, String)>,
|
|
|
|
redirects_len: u64,
|
|
|
|
}
|
|
|
|
|
|
|
|
impl RemoteModulesStoreBuilder {
|
2024-12-19 12:53:52 -05:00
|
|
|
pub fn add(
|
|
|
|
&mut self,
|
|
|
|
specifier: &Url,
|
|
|
|
media_type: MediaType,
|
|
|
|
data: Vec<u8>,
|
|
|
|
maybe_transpiled: Option<Vec<u8>>,
|
|
|
|
) {
|
2024-10-28 09:31:58 -04:00
|
|
|
log::debug!("Adding '{}' ({})", specifier, media_type);
|
2024-10-24 15:48:48 -04:00
|
|
|
let specifier = specifier.to_string();
|
|
|
|
self.specifiers.push((specifier, self.data_byte_len));
|
2024-12-19 12:53:52 -05:00
|
|
|
let maybe_transpiled_len = match &maybe_transpiled {
|
|
|
|
// data length (4 bytes), data
|
|
|
|
Some(data) => 4 + data.len() as u64,
|
|
|
|
None => 0,
|
|
|
|
};
|
|
|
|
// media type (1 byte), data length (4 bytes), data, has transpiled (1 byte), transpiled length
|
|
|
|
self.data_byte_len += 1 + 4 + data.len() as u64 + 1 + maybe_transpiled_len;
|
|
|
|
self.data.push((media_type, data, maybe_transpiled));
|
2024-10-24 15:48:48 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
pub fn add_redirects(&mut self, redirects: &BTreeMap<Url, Url>) {
|
|
|
|
self.redirects.reserve(redirects.len());
|
|
|
|
for (from, to) in redirects {
|
2024-10-28 09:31:58 -04:00
|
|
|
log::debug!("Adding redirect '{}' -> '{}'", from, to);
|
2024-10-24 15:48:48 -04:00
|
|
|
let from = from.to_string();
|
|
|
|
let to = to.to_string();
|
|
|
|
self.redirects_len += (4 + from.len() + 4 + to.len()) as u64;
|
|
|
|
self.redirects.push((from, to));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-12-20 16:14:37 -05:00
|
|
|
fn write<'a, TBytes: capacity_builder::BytesType>(
|
|
|
|
&'a self,
|
|
|
|
builder: &mut capacity_builder::BytesBuilder<'a, TBytes>,
|
|
|
|
) {
|
2024-12-16 19:20:53 -05:00
|
|
|
builder.append_le(self.specifiers.len() as u32);
|
|
|
|
builder.append_le(self.redirects.len() as u32);
|
2024-10-24 15:48:48 -04:00
|
|
|
for (specifier, offset) in &self.specifiers {
|
2024-12-16 19:20:53 -05:00
|
|
|
builder.append_le(specifier.len() as u32);
|
2024-12-19 12:53:52 -05:00
|
|
|
builder.append(specifier);
|
2024-12-16 19:20:53 -05:00
|
|
|
builder.append_le(*offset);
|
2024-10-24 15:48:48 -04:00
|
|
|
}
|
|
|
|
for (from, to) in &self.redirects {
|
2024-12-16 19:20:53 -05:00
|
|
|
builder.append_le(from.len() as u32);
|
|
|
|
builder.append(from);
|
|
|
|
builder.append_le(to.len() as u32);
|
|
|
|
builder.append(to);
|
2024-10-24 15:48:48 -04:00
|
|
|
}
|
2024-12-19 12:53:52 -05:00
|
|
|
builder.append_le(
|
|
|
|
self
|
|
|
|
.data
|
|
|
|
.iter()
|
|
|
|
.map(|(_, data, maybe_transpiled)| {
|
|
|
|
1 + 4
|
|
|
|
+ (data.len() as u64)
|
|
|
|
+ 1
|
|
|
|
+ match maybe_transpiled {
|
|
|
|
Some(transpiled) => 4 + (transpiled.len() as u64),
|
|
|
|
None => 0,
|
|
|
|
}
|
|
|
|
})
|
|
|
|
.sum::<u64>(),
|
|
|
|
);
|
|
|
|
for (media_type, data, maybe_transpiled) in &self.data {
|
2024-12-16 19:20:53 -05:00
|
|
|
builder.append(serialize_media_type(*media_type));
|
2024-12-19 12:53:52 -05:00
|
|
|
builder.append_le(data.len() as u32);
|
2024-12-16 19:20:53 -05:00
|
|
|
builder.append(data);
|
2024-12-19 12:53:52 -05:00
|
|
|
if let Some(transpiled) = maybe_transpiled {
|
|
|
|
builder.append(1);
|
|
|
|
builder.append_le(transpiled.len() as u32);
|
|
|
|
builder.append(transpiled);
|
|
|
|
} else {
|
|
|
|
builder.append(0);
|
|
|
|
}
|
2024-10-24 15:48:48 -04:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-11-01 12:27:00 -04:00
|
|
|
/// Source of an embedded module, either as static text or as raw bytes.
pub enum DenoCompileModuleSource {
  /// Text borrowed for the lifetime of the program.
  String(&'static str),
  /// Raw bytes, either borrowed or owned.
  Bytes(Cow<'static, [u8]>),
}
|
|
|
|
|
2024-11-01 12:27:00 -04:00
|
|
|
impl DenoCompileModuleSource {
|
|
|
|
pub fn into_for_v8(self) -> ModuleSourceCode {
|
2024-10-24 15:48:48 -04:00
|
|
|
fn into_bytes(data: Cow<'static, [u8]>) -> ModuleSourceCode {
|
|
|
|
ModuleSourceCode::Bytes(match data {
|
|
|
|
Cow::Borrowed(d) => d.into(),
|
|
|
|
Cow::Owned(d) => d.into_boxed_slice().into(),
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
2024-11-01 12:27:00 -04:00
|
|
|
match self {
|
2024-10-24 15:48:48 -04:00
|
|
|
// todo(https://github.com/denoland/deno_core/pull/943): store whether
|
|
|
|
// the string is ascii or not ahead of time so we can avoid the is_ascii()
|
|
|
|
// check in FastString::from_static
|
2024-11-01 12:27:00 -04:00
|
|
|
Self::String(s) => ModuleSourceCode::String(FastString::from_static(s)),
|
|
|
|
Self::Bytes(b) => into_bytes(b),
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-12-19 12:53:52 -05:00
|
|
|
pub struct SourceMapStore {
|
2024-12-20 12:43:03 -05:00
|
|
|
data: IndexMap<Cow<'static, str>, Cow<'static, [u8]>>,
|
2024-12-19 12:53:52 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
impl SourceMapStore {
|
|
|
|
pub fn with_capacity(capacity: usize) -> Self {
|
|
|
|
Self {
|
|
|
|
data: IndexMap::with_capacity(capacity),
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn add(
|
|
|
|
&mut self,
|
|
|
|
specifier: Cow<'static, str>,
|
2024-12-20 12:43:03 -05:00
|
|
|
source_map: Cow<'static, [u8]>,
|
2024-12-19 12:53:52 -05:00
|
|
|
) {
|
|
|
|
self.data.insert(specifier, source_map);
|
|
|
|
}
|
|
|
|
|
2024-12-20 12:43:03 -05:00
|
|
|
pub fn get(&self, specifier: &str) -> Option<&[u8]> {
|
|
|
|
self.data.get(specifier).map(|v| v.as_ref())
|
2024-12-19 12:53:52 -05:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-11-01 12:27:00 -04:00
|
|
|
pub struct DenoCompileModuleData<'a> {
|
|
|
|
pub specifier: &'a Url,
|
|
|
|
pub media_type: MediaType,
|
|
|
|
pub data: Cow<'static, [u8]>,
|
|
|
|
}
|
|
|
|
|
|
|
|
impl<'a> DenoCompileModuleData<'a> {
|
|
|
|
pub fn into_parts(self) -> (&'a Url, ModuleType, DenoCompileModuleSource) {
|
|
|
|
fn into_string_unsafe(data: Cow<'static, [u8]>) -> DenoCompileModuleSource {
|
2024-10-24 15:48:48 -04:00
|
|
|
match data {
|
2024-11-01 12:27:00 -04:00
|
|
|
Cow::Borrowed(d) => DenoCompileModuleSource::String(
|
2024-10-24 15:48:48 -04:00
|
|
|
// SAFETY: we know this is a valid utf8 string
|
2024-11-01 12:27:00 -04:00
|
|
|
unsafe { std::str::from_utf8_unchecked(d) },
|
2024-10-24 15:48:48 -04:00
|
|
|
),
|
2024-11-01 12:27:00 -04:00
|
|
|
Cow::Owned(d) => DenoCompileModuleSource::Bytes(Cow::Owned(d)),
|
2024-10-24 15:48:48 -04:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
let (media_type, source) = match self.media_type {
|
|
|
|
MediaType::JavaScript
|
|
|
|
| MediaType::Jsx
|
|
|
|
| MediaType::Mjs
|
|
|
|
| MediaType::Cjs
|
|
|
|
| MediaType::TypeScript
|
|
|
|
| MediaType::Mts
|
|
|
|
| MediaType::Cts
|
|
|
|
| MediaType::Dts
|
|
|
|
| MediaType::Dmts
|
|
|
|
| MediaType::Dcts
|
|
|
|
| MediaType::Tsx => {
|
|
|
|
(ModuleType::JavaScript, into_string_unsafe(self.data))
|
|
|
|
}
|
|
|
|
MediaType::Json => (ModuleType::Json, into_string_unsafe(self.data)),
|
2024-11-01 12:27:00 -04:00
|
|
|
MediaType::Wasm => {
|
|
|
|
(ModuleType::Wasm, DenoCompileModuleSource::Bytes(self.data))
|
2024-10-24 15:48:48 -04:00
|
|
|
}
|
2024-11-01 12:27:00 -04:00
|
|
|
// just assume javascript if we made it here
|
|
|
|
MediaType::Css | MediaType::SourceMap | MediaType::Unknown => (
|
|
|
|
ModuleType::JavaScript,
|
|
|
|
DenoCompileModuleSource::Bytes(self.data),
|
|
|
|
),
|
2024-10-24 15:48:48 -04:00
|
|
|
};
|
|
|
|
(self.specifier, media_type, source)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-12-19 12:53:52 -05:00
|
|
|
pub struct RemoteModuleEntry<'a> {
|
|
|
|
pub specifier: &'a Url,
|
|
|
|
pub media_type: MediaType,
|
|
|
|
pub data: Cow<'static, [u8]>,
|
|
|
|
pub transpiled_data: Option<Cow<'static, [u8]>>,
|
|
|
|
}
|
|
|
|
|
2024-10-24 15:48:48 -04:00
|
|
|
enum RemoteModulesStoreSpecifierValue {
|
|
|
|
Data(usize),
|
|
|
|
Redirect(Url),
|
|
|
|
}
|
|
|
|
|
|
|
|
pub struct RemoteModulesStore {
|
|
|
|
specifiers: HashMap<Url, RemoteModulesStoreSpecifierValue>,
|
|
|
|
files_data: &'static [u8],
|
|
|
|
}
|
|
|
|
|
|
|
|
impl RemoteModulesStore {
|
2024-12-19 12:53:52 -05:00
|
|
|
fn build(input: &'static [u8]) -> Result<(&'static [u8], Self), AnyError> {
|
2024-10-24 15:48:48 -04:00
|
|
|
fn read_specifier(input: &[u8]) -> Result<(&[u8], (Url, u64)), AnyError> {
|
|
|
|
let (input, specifier) = read_string_lossy(input)?;
|
|
|
|
let specifier = Url::parse(&specifier)?;
|
|
|
|
let (input, offset) = read_u64(input)?;
|
|
|
|
Ok((input, (specifier, offset)))
|
|
|
|
}
|
|
|
|
|
|
|
|
fn read_redirect(input: &[u8]) -> Result<(&[u8], (Url, Url)), AnyError> {
|
|
|
|
let (input, from) = read_string_lossy(input)?;
|
|
|
|
let from = Url::parse(&from)?;
|
|
|
|
let (input, to) = read_string_lossy(input)?;
|
|
|
|
let to = Url::parse(&to)?;
|
|
|
|
Ok((input, (from, to)))
|
|
|
|
}
|
|
|
|
|
|
|
|
fn read_headers(
|
|
|
|
input: &[u8],
|
|
|
|
) -> Result<(&[u8], HashMap<Url, RemoteModulesStoreSpecifierValue>), AnyError>
|
|
|
|
{
|
|
|
|
let (input, specifiers_len) = read_u32_as_usize(input)?;
|
|
|
|
let (mut input, redirects_len) = read_u32_as_usize(input)?;
|
|
|
|
let mut specifiers =
|
|
|
|
HashMap::with_capacity(specifiers_len + redirects_len);
|
|
|
|
for _ in 0..specifiers_len {
|
|
|
|
let (current_input, (specifier, offset)) =
|
|
|
|
read_specifier(input).context("reading specifier")?;
|
|
|
|
input = current_input;
|
|
|
|
specifiers.insert(
|
|
|
|
specifier,
|
|
|
|
RemoteModulesStoreSpecifierValue::Data(offset as usize),
|
|
|
|
);
|
|
|
|
}
|
|
|
|
|
|
|
|
for _ in 0..redirects_len {
|
|
|
|
let (current_input, (from, to)) = read_redirect(input)?;
|
|
|
|
input = current_input;
|
|
|
|
specifiers.insert(from, RemoteModulesStoreSpecifierValue::Redirect(to));
|
|
|
|
}
|
|
|
|
|
|
|
|
Ok((input, specifiers))
|
|
|
|
}
|
|
|
|
|
2024-12-19 12:53:52 -05:00
|
|
|
let (input, specifiers) = read_headers(input)?;
|
|
|
|
let (input, files_data) = read_bytes_with_u64_len(input)?;
|
2024-10-24 15:48:48 -04:00
|
|
|
|
2024-12-19 12:53:52 -05:00
|
|
|
Ok((
|
|
|
|
input,
|
|
|
|
Self {
|
|
|
|
specifiers,
|
|
|
|
files_data,
|
|
|
|
},
|
|
|
|
))
|
2024-10-24 15:48:48 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
pub fn resolve_specifier<'a>(
|
|
|
|
&'a self,
|
|
|
|
specifier: &'a Url,
|
|
|
|
) -> Result<Option<&'a Url>, AnyError> {
|
|
|
|
let mut count = 0;
|
|
|
|
let mut current = specifier;
|
|
|
|
loop {
|
|
|
|
if count > 10 {
|
|
|
|
bail!("Too many redirects resolving '{}'", specifier);
|
|
|
|
}
|
|
|
|
match self.specifiers.get(current) {
|
|
|
|
Some(RemoteModulesStoreSpecifierValue::Redirect(to)) => {
|
|
|
|
current = to;
|
|
|
|
count += 1;
|
|
|
|
}
|
|
|
|
Some(RemoteModulesStoreSpecifierValue::Data(_)) => {
|
|
|
|
return Ok(Some(current));
|
|
|
|
}
|
|
|
|
None => {
|
|
|
|
return Ok(None);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn read<'a>(
|
|
|
|
&'a self,
|
2024-10-28 09:31:58 -04:00
|
|
|
original_specifier: &'a Url,
|
2024-12-19 12:53:52 -05:00
|
|
|
) -> Result<Option<RemoteModuleEntry<'a>>, AnyError> {
|
2024-10-24 15:48:48 -04:00
|
|
|
let mut count = 0;
|
2024-10-28 09:31:58 -04:00
|
|
|
let mut specifier = original_specifier;
|
2024-10-24 15:48:48 -04:00
|
|
|
loop {
|
|
|
|
if count > 10 {
|
2024-10-28 09:31:58 -04:00
|
|
|
bail!("Too many redirects resolving '{}'", original_specifier);
|
2024-10-24 15:48:48 -04:00
|
|
|
}
|
2024-10-28 09:31:58 -04:00
|
|
|
match self.specifiers.get(specifier) {
|
2024-10-24 15:48:48 -04:00
|
|
|
Some(RemoteModulesStoreSpecifierValue::Redirect(to)) => {
|
2024-10-28 09:31:58 -04:00
|
|
|
specifier = to;
|
2024-10-24 15:48:48 -04:00
|
|
|
count += 1;
|
|
|
|
}
|
|
|
|
Some(RemoteModulesStoreSpecifierValue::Data(offset)) => {
|
|
|
|
let input = &self.files_data[*offset..];
|
|
|
|
let (input, media_type_byte) = read_bytes(input, 1)?;
|
|
|
|
let media_type = deserialize_media_type(media_type_byte[0])?;
|
2024-12-19 12:53:52 -05:00
|
|
|
let (input, data) = read_bytes_with_u32_len(input)?;
|
|
|
|
check_has_len(input, 1)?;
|
|
|
|
let (input, has_transpiled) = (&input[1..], input[0]);
|
|
|
|
let (_, transpiled_data) = match has_transpiled {
|
|
|
|
0 => (input, None),
|
|
|
|
1 => {
|
|
|
|
let (input, data) = read_bytes_with_u32_len(input)?;
|
|
|
|
(input, Some(data))
|
|
|
|
}
|
|
|
|
value => bail!(
|
|
|
|
"Invalid transpiled data flag: {}. Compiled data is corrupt.",
|
|
|
|
value
|
|
|
|
),
|
|
|
|
};
|
|
|
|
return Ok(Some(RemoteModuleEntry {
|
2024-10-24 15:48:48 -04:00
|
|
|
specifier,
|
|
|
|
media_type,
|
|
|
|
data: Cow::Borrowed(data),
|
2024-12-19 12:53:52 -05:00
|
|
|
transpiled_data: transpiled_data.map(Cow::Borrowed),
|
2024-10-24 15:48:48 -04:00
|
|
|
}));
|
|
|
|
}
|
|
|
|
None => {
|
|
|
|
return Ok(None);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
fn serialize_npm_snapshot(
|
|
|
|
mut snapshot: SerializedNpmResolutionSnapshot,
|
|
|
|
) -> Vec<u8> {
|
|
|
|
fn append_string(bytes: &mut Vec<u8>, string: &str) {
|
|
|
|
let len = string.len() as u32;
|
|
|
|
bytes.extend_from_slice(&len.to_le_bytes());
|
|
|
|
bytes.extend_from_slice(string.as_bytes());
|
|
|
|
}
|
|
|
|
|
|
|
|
snapshot.packages.sort_by(|a, b| a.id.cmp(&b.id)); // determinism
|
|
|
|
let ids_to_stored_ids = snapshot
|
|
|
|
.packages
|
|
|
|
.iter()
|
|
|
|
.enumerate()
|
|
|
|
.map(|(i, pkg)| (&pkg.id, i as u32))
|
|
|
|
.collect::<HashMap<_, _>>();
|
|
|
|
|
|
|
|
let mut root_packages: Vec<_> = snapshot.root_packages.iter().collect();
|
|
|
|
root_packages.sort();
|
|
|
|
let mut bytes = Vec::new();
|
|
|
|
|
|
|
|
bytes.extend_from_slice(&(snapshot.packages.len() as u32).to_le_bytes());
|
|
|
|
for pkg in &snapshot.packages {
|
|
|
|
append_string(&mut bytes, &pkg.id.as_serialized());
|
|
|
|
}
|
|
|
|
|
|
|
|
bytes.extend_from_slice(&(root_packages.len() as u32).to_le_bytes());
|
|
|
|
for (req, id) in root_packages {
|
|
|
|
append_string(&mut bytes, &req.to_string());
|
|
|
|
let id = ids_to_stored_ids.get(&id).unwrap();
|
|
|
|
bytes.extend_from_slice(&id.to_le_bytes());
|
|
|
|
}
|
|
|
|
|
|
|
|
for pkg in &snapshot.packages {
|
|
|
|
let deps_len = pkg.dependencies.len() as u32;
|
|
|
|
bytes.extend_from_slice(&deps_len.to_le_bytes());
|
|
|
|
let mut deps: Vec<_> = pkg.dependencies.iter().collect();
|
|
|
|
deps.sort();
|
|
|
|
for (req, id) in deps {
|
|
|
|
append_string(&mut bytes, req);
|
|
|
|
let id = ids_to_stored_ids.get(&id).unwrap();
|
|
|
|
bytes.extend_from_slice(&id.to_le_bytes());
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
bytes
|
|
|
|
}
|
|
|
|
|
|
|
|
fn deserialize_npm_snapshot(
|
|
|
|
input: &[u8],
|
|
|
|
) -> Result<ValidSerializedNpmResolutionSnapshot, AnyError> {
|
|
|
|
fn parse_id(input: &[u8]) -> Result<(&[u8], NpmPackageId), AnyError> {
|
|
|
|
let (input, id) = read_string_lossy(input)?;
|
|
|
|
let id = NpmPackageId::from_serialized(&id)?;
|
|
|
|
Ok((input, id))
|
|
|
|
}
|
|
|
|
|
|
|
|
#[allow(clippy::needless_lifetimes)] // clippy bug
|
|
|
|
fn parse_root_package<'a>(
|
|
|
|
id_to_npm_id: &'a impl Fn(usize) -> Result<NpmPackageId, AnyError>,
|
|
|
|
) -> impl Fn(&[u8]) -> Result<(&[u8], (PackageReq, NpmPackageId)), AnyError> + 'a
|
|
|
|
{
|
|
|
|
|input| {
|
|
|
|
let (input, req) = read_string_lossy(input)?;
|
|
|
|
let req = PackageReq::from_str(&req)?;
|
|
|
|
let (input, id) = read_u32_as_usize(input)?;
|
|
|
|
Ok((input, (req, id_to_npm_id(id)?)))
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
#[allow(clippy::needless_lifetimes)] // clippy bug
|
|
|
|
fn parse_package_dep<'a>(
|
|
|
|
id_to_npm_id: &'a impl Fn(usize) -> Result<NpmPackageId, AnyError>,
|
2024-12-20 16:14:37 -05:00
|
|
|
) -> impl Fn(&[u8]) -> Result<(&[u8], (StackString, NpmPackageId)), AnyError> + 'a
|
2024-10-24 15:48:48 -04:00
|
|
|
{
|
|
|
|
|input| {
|
|
|
|
let (input, req) = read_string_lossy(input)?;
|
|
|
|
let (input, id) = read_u32_as_usize(input)?;
|
2024-12-20 16:14:37 -05:00
|
|
|
let req = StackString::from_cow(req);
|
|
|
|
Ok((input, (req, id_to_npm_id(id)?)))
|
2024-10-24 15:48:48 -04:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
fn parse_package<'a>(
|
|
|
|
input: &'a [u8],
|
|
|
|
id: NpmPackageId,
|
|
|
|
id_to_npm_id: &impl Fn(usize) -> Result<NpmPackageId, AnyError>,
|
|
|
|
) -> Result<(&'a [u8], SerializedNpmResolutionSnapshotPackage), AnyError> {
|
|
|
|
let (input, deps_len) = read_u32_as_usize(input)?;
|
|
|
|
let (input, dependencies) =
|
|
|
|
parse_hashmap_n_times(input, deps_len, parse_package_dep(id_to_npm_id))?;
|
|
|
|
Ok((
|
|
|
|
input,
|
|
|
|
SerializedNpmResolutionSnapshotPackage {
|
|
|
|
id,
|
|
|
|
system: Default::default(),
|
|
|
|
dist: Default::default(),
|
|
|
|
dependencies,
|
|
|
|
optional_dependencies: Default::default(),
|
|
|
|
bin: None,
|
|
|
|
scripts: Default::default(),
|
|
|
|
deprecated: Default::default(),
|
|
|
|
},
|
|
|
|
))
|
|
|
|
}
|
|
|
|
|
|
|
|
let (input, packages_len) = read_u32_as_usize(input)?;
|
|
|
|
|
|
|
|
// get a hashmap of all the npm package ids to their serialized ids
|
|
|
|
let (input, data_ids_to_npm_ids) =
|
|
|
|
parse_vec_n_times(input, packages_len, parse_id)
|
|
|
|
.context("deserializing id")?;
|
|
|
|
let data_id_to_npm_id = |id: usize| {
|
|
|
|
data_ids_to_npm_ids
|
|
|
|
.get(id)
|
|
|
|
.cloned()
|
|
|
|
.ok_or_else(|| deno_core::anyhow::anyhow!("Invalid npm package id"))
|
|
|
|
};
|
|
|
|
|
|
|
|
let (input, root_packages_len) = read_u32_as_usize(input)?;
|
|
|
|
let (input, root_packages) = parse_hashmap_n_times(
|
|
|
|
input,
|
|
|
|
root_packages_len,
|
|
|
|
parse_root_package(&data_id_to_npm_id),
|
|
|
|
)
|
|
|
|
.context("deserializing root package")?;
|
|
|
|
let (input, packages) =
|
|
|
|
parse_vec_n_times_with_index(input, packages_len, |input, index| {
|
|
|
|
parse_package(input, data_id_to_npm_id(index)?, &data_id_to_npm_id)
|
|
|
|
})
|
|
|
|
.context("deserializing package")?;
|
|
|
|
|
|
|
|
if !input.is_empty() {
|
|
|
|
bail!("Unexpected data left over");
|
|
|
|
}
|
|
|
|
|
|
|
|
Ok(
|
|
|
|
SerializedNpmResolutionSnapshot {
|
|
|
|
packages,
|
|
|
|
root_packages,
|
|
|
|
}
|
|
|
|
// this is ok because we have already verified that all the
|
|
|
|
// identifiers found in the snapshot are valid via the
|
|
|
|
// npm package id -> npm package id mapping
|
|
|
|
.into_valid_unsafe(),
|
|
|
|
)
|
|
|
|
}
|
|
|
|
|
|
|
|
fn serialize_media_type(media_type: MediaType) -> u8 {
|
|
|
|
match media_type {
|
|
|
|
MediaType::JavaScript => 0,
|
|
|
|
MediaType::Jsx => 1,
|
|
|
|
MediaType::Mjs => 2,
|
|
|
|
MediaType::Cjs => 3,
|
|
|
|
MediaType::TypeScript => 4,
|
|
|
|
MediaType::Mts => 5,
|
|
|
|
MediaType::Cts => 6,
|
|
|
|
MediaType::Dts => 7,
|
|
|
|
MediaType::Dmts => 8,
|
|
|
|
MediaType::Dcts => 9,
|
|
|
|
MediaType::Tsx => 10,
|
|
|
|
MediaType::Json => 11,
|
|
|
|
MediaType::Wasm => 12,
|
2024-11-01 12:27:00 -04:00
|
|
|
MediaType::Css => 13,
|
2024-10-24 15:48:48 -04:00
|
|
|
MediaType::SourceMap => 14,
|
|
|
|
MediaType::Unknown => 15,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
fn deserialize_media_type(value: u8) -> Result<MediaType, AnyError> {
|
|
|
|
match value {
|
|
|
|
0 => Ok(MediaType::JavaScript),
|
|
|
|
1 => Ok(MediaType::Jsx),
|
|
|
|
2 => Ok(MediaType::Mjs),
|
|
|
|
3 => Ok(MediaType::Cjs),
|
|
|
|
4 => Ok(MediaType::TypeScript),
|
|
|
|
5 => Ok(MediaType::Mts),
|
|
|
|
6 => Ok(MediaType::Cts),
|
|
|
|
7 => Ok(MediaType::Dts),
|
|
|
|
8 => Ok(MediaType::Dmts),
|
|
|
|
9 => Ok(MediaType::Dcts),
|
|
|
|
10 => Ok(MediaType::Tsx),
|
|
|
|
11 => Ok(MediaType::Json),
|
|
|
|
12 => Ok(MediaType::Wasm),
|
2024-11-01 12:27:00 -04:00
|
|
|
13 => Ok(MediaType::Css),
|
2024-10-24 15:48:48 -04:00
|
|
|
14 => Ok(MediaType::SourceMap),
|
|
|
|
15 => Ok(MediaType::Unknown),
|
|
|
|
_ => bail!("Unknown media type value: {}", value),
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
fn parse_hashmap_n_times<TKey: std::cmp::Eq + std::hash::Hash, TValue>(
|
|
|
|
mut input: &[u8],
|
|
|
|
times: usize,
|
|
|
|
parse: impl Fn(&[u8]) -> Result<(&[u8], (TKey, TValue)), AnyError>,
|
|
|
|
) -> Result<(&[u8], HashMap<TKey, TValue>), AnyError> {
|
|
|
|
let mut results = HashMap::with_capacity(times);
|
|
|
|
for _ in 0..times {
|
|
|
|
let result = parse(input);
|
|
|
|
let (new_input, (key, value)) = result?;
|
|
|
|
results.insert(key, value);
|
|
|
|
input = new_input;
|
|
|
|
}
|
|
|
|
Ok((input, results))
|
|
|
|
}
|
|
|
|
|
|
|
|
fn parse_vec_n_times<TResult>(
|
|
|
|
input: &[u8],
|
|
|
|
times: usize,
|
|
|
|
parse: impl Fn(&[u8]) -> Result<(&[u8], TResult), AnyError>,
|
|
|
|
) -> Result<(&[u8], Vec<TResult>), AnyError> {
|
|
|
|
parse_vec_n_times_with_index(input, times, |input, _index| parse(input))
|
|
|
|
}
|
|
|
|
|
|
|
|
fn parse_vec_n_times_with_index<TResult>(
|
|
|
|
mut input: &[u8],
|
|
|
|
times: usize,
|
|
|
|
parse: impl Fn(&[u8], usize) -> Result<(&[u8], TResult), AnyError>,
|
|
|
|
) -> Result<(&[u8], Vec<TResult>), AnyError> {
|
|
|
|
let mut results = Vec::with_capacity(times);
|
|
|
|
for i in 0..times {
|
|
|
|
let result = parse(input, i);
|
|
|
|
let (new_input, result) = result?;
|
|
|
|
results.push(result);
|
|
|
|
input = new_input;
|
|
|
|
}
|
|
|
|
Ok((input, results))
|
|
|
|
}
|
|
|
|
|
2024-12-19 12:53:52 -05:00
|
|
|
fn read_bytes_with_u64_len(input: &[u8]) -> Result<(&[u8], &[u8]), AnyError> {
|
|
|
|
let (input, len) = read_u64(input)?;
|
|
|
|
let (input, data) = read_bytes(input, len as usize)?;
|
|
|
|
Ok((input, data))
|
|
|
|
}
|
|
|
|
|
|
|
|
fn read_bytes_with_u32_len(input: &[u8]) -> Result<(&[u8], &[u8]), AnyError> {
|
|
|
|
let (input, len) = read_u32_as_usize(input)?;
|
|
|
|
let (input, data) = read_bytes(input, len)?;
|
|
|
|
Ok((input, data))
|
|
|
|
}
|
|
|
|
|
2024-10-24 15:48:48 -04:00
|
|
|
fn read_bytes(input: &[u8], len: usize) -> Result<(&[u8], &[u8]), AnyError> {
|
2024-12-19 12:53:52 -05:00
|
|
|
check_has_len(input, len)?;
|
2024-10-24 15:48:48 -04:00
|
|
|
let (len_bytes, input) = input.split_at(len);
|
|
|
|
Ok((input, len_bytes))
|
|
|
|
}
|
|
|
|
|
2024-12-19 12:53:52 -05:00
|
|
|
#[inline(always)]
|
|
|
|
fn check_has_len(input: &[u8], len: usize) -> Result<(), AnyError> {
|
|
|
|
if input.len() < len {
|
|
|
|
bail!("Unexpected end of data.");
|
|
|
|
}
|
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
|
2024-10-24 15:48:48 -04:00
|
|
|
fn read_string_lossy(input: &[u8]) -> Result<(&[u8], Cow<str>), AnyError> {
|
2024-12-20 12:43:03 -05:00
|
|
|
let (input, data_bytes) = read_bytes_with_u32_len(input)?;
|
2024-10-24 15:48:48 -04:00
|
|
|
Ok((input, String::from_utf8_lossy(data_bytes)))
|
|
|
|
}
|
|
|
|
|
|
|
|
fn read_u32_as_usize(input: &[u8]) -> Result<(&[u8], usize), AnyError> {
|
|
|
|
let (input, len_bytes) = read_bytes(input, 4)?;
|
|
|
|
let len = u32::from_le_bytes(len_bytes.try_into()?);
|
|
|
|
Ok((input, len as usize))
|
|
|
|
}
|
|
|
|
|
|
|
|
fn read_u64(input: &[u8]) -> Result<(&[u8], u64), AnyError> {
|
|
|
|
let (input, len_bytes) = read_bytes(input, 8)?;
|
|
|
|
let len = u64::from_le_bytes(len_bytes.try_into()?);
|
|
|
|
Ok((input, len))
|
|
|
|
}
|