2024-12-31 14:12:39 -05:00
|
|
|
// Copyright 2018-2025 the Deno authors. MIT license.
|
2021-10-10 17:26:22 -04:00
|
|
|
|
2024-12-31 12:13:39 -05:00
|
|
|
use std::collections::HashMap;
|
|
|
|
use std::path::PathBuf;
|
|
|
|
use std::sync::Arc;
|
2021-10-10 17:26:22 -04:00
|
|
|
|
2023-09-07 09:09:16 -04:00
|
|
|
use deno_ast::MediaType;
|
2024-12-16 18:39:40 -05:00
|
|
|
use deno_cache_dir::file_fetcher::CacheSetting;
|
|
|
|
use deno_cache_dir::file_fetcher::FetchNoFollowErrorKind;
|
|
|
|
use deno_cache_dir::file_fetcher::FileOrRedirect;
|
|
|
|
use deno_core::error::AnyError;
|
2023-02-22 17:21:05 -05:00
|
|
|
use deno_core::futures;
|
2021-10-10 17:26:22 -04:00
|
|
|
use deno_core::futures::FutureExt;
|
|
|
|
use deno_core::ModuleSpecifier;
|
|
|
|
use deno_graph::source::CacheInfo;
|
|
|
|
use deno_graph::source::LoadFuture;
|
|
|
|
use deno_graph::source::LoadResponse;
|
|
|
|
use deno_graph::source::Loader;
|
2024-09-25 21:50:54 -04:00
|
|
|
use deno_runtime::deno_permissions::PermissionsContainer;
|
2024-11-01 12:27:00 -04:00
|
|
|
use node_resolver::InNpmPackageChecker;
|
2024-12-31 12:13:39 -05:00
|
|
|
|
|
|
|
use crate::args::jsr_url;
|
|
|
|
use crate::file_fetcher::CliFetchNoFollowErrorKind;
|
|
|
|
use crate::file_fetcher::CliFileFetcher;
|
|
|
|
use crate::file_fetcher::FetchNoFollowOptions;
|
|
|
|
use crate::file_fetcher::FetchPermissionsOptionRef;
|
|
|
|
use crate::sys::CliSys;
|
2021-10-10 17:26:22 -04:00
|
|
|
|
feat(core): initialize SQLite off-main-thread (#18401)
This gets SQLite off the flamegraph and reduces initialization time by
somewhere between 0.2ms and 0.5ms. In addition, I took the opportunity
to move all the cache management code to a single place and reduce
duplication. While the PR has a net gain of lines, much of that is just
being a bit more deliberate with how we're recovering from errors.
The existing caches had various policies for dealing with cache
corruption, so I've unified them and tried to isolate the decisions we
make for recovery in a single place (see `open_connection` in
`CacheDB`). The policy I chose was:
1. Retry twice to open on-disk caches
2. If that fails, try to delete the file and recreate it on-disk
3. If we fail to delete the file or re-create a new cache, use a
fallback strategy that can be chosen per-cache: InMemory (temporary
cache for the process run), BlackHole (ignore writes, return empty
reads), or Error (fail on every operation).
The caches all use the same general code now, and share the cache
failure recovery policy.
In addition, it cleans up a TODO in the `NodeAnalysisCache`.
2023-03-27 18:01:52 -04:00
|
|
|
mod cache_db;
|
|
|
|
mod caches;
|
2022-07-12 18:58:39 -04:00
|
|
|
mod check;
|
2024-04-17 10:19:55 -04:00
|
|
|
mod code_cache;
|
2022-07-12 18:58:39 -04:00
|
|
|
mod common;
|
2022-11-25 19:04:30 -05:00
|
|
|
mod deno_dir;
|
2022-07-12 18:58:39 -04:00
|
|
|
mod disk_cache;
|
|
|
|
mod emit;
|
2024-02-20 16:29:57 -05:00
|
|
|
mod fast_check;
|
2022-07-12 18:58:39 -04:00
|
|
|
mod incremental;
|
2023-10-25 18:13:22 -04:00
|
|
|
mod module_info;
|
2022-10-01 06:15:56 -04:00
|
|
|
mod node;
|
2022-08-22 12:14:59 -04:00
|
|
|
mod parsed_source;
|
2022-07-12 18:58:39 -04:00
|
|
|
|
2024-05-29 14:38:18 -04:00
|
|
|
pub use cache_db::CacheDBHash;
|
feat(core): initialize SQLite off-main-thread (#18401)
This gets SQLite off the flamegraph and reduces initialization time by
somewhere between 0.2ms and 0.5ms. In addition, I took the opportunity
to move all the cache management code to a single place and reduce
duplication. While the PR has a net gain of lines, much of that is just
being a bit more deliberate with how we're recovering from errors.
The existing caches had various policies for dealing with cache
corruption, so I've unified them and tried to isolate the decisions we
make for recovery in a single place (see `open_connection` in
`CacheDB`). The policy I chose was:
1. Retry twice to open on-disk caches
2. If that fails, try to delete the file and recreate it on-disk
3. If we fail to delete the file or re-create a new cache, use a
fallback strategy that can be chosen per-cache: InMemory (temporary
cache for the process run), BlackHole (ignore writes, return empty
reads), or Error (fail on every operation).
The caches all use the same general code now, and share the cache
failure recovery policy.
In addition, it cleans up a TODO in the `NodeAnalysisCache`.
2023-03-27 18:01:52 -04:00
|
|
|
pub use caches::Caches;
|
2022-07-12 18:58:39 -04:00
|
|
|
pub use check::TypeCheckCache;
|
2024-04-17 10:19:55 -04:00
|
|
|
pub use code_cache::CodeCache;
|
2022-07-19 11:58:18 -04:00
|
|
|
pub use common::FastInsecureHasher;
|
2024-12-31 12:13:39 -05:00
|
|
|
/// Permissions used to save a file in the disk caches.
|
|
|
|
pub use deno_cache_dir::CACHE_PERM;
|
2022-11-25 19:04:30 -05:00
|
|
|
pub use deno_dir::DenoDir;
|
2023-05-25 14:27:45 -04:00
|
|
|
pub use deno_dir::DenoDirProvider;
|
2022-07-12 18:58:39 -04:00
|
|
|
pub use disk_cache::DiskCache;
|
|
|
|
pub use emit::EmitCache;
|
2024-02-20 16:29:57 -05:00
|
|
|
pub use fast_check::FastCheckCache;
|
2022-07-12 18:58:39 -04:00
|
|
|
pub use incremental::IncrementalCache;
|
2023-10-25 18:13:22 -04:00
|
|
|
pub use module_info::ModuleInfoCache;
|
2022-10-01 06:15:56 -04:00
|
|
|
pub use node::NodeAnalysisCache;
|
2024-02-06 15:57:10 -05:00
|
|
|
pub use parsed_source::LazyGraphSourceParser;
|
2022-08-22 12:14:59 -04:00
|
|
|
pub use parsed_source::ParsedSourceCache;
|
2022-07-12 18:58:39 -04:00
|
|
|
|
2024-12-31 11:29:07 -05:00
|
|
|
pub type GlobalHttpCache = deno_cache_dir::GlobalHttpCache<CliSys>;
|
|
|
|
pub type LocalHttpCache = deno_cache_dir::LocalHttpCache<CliSys>;
|
|
|
|
pub type LocalLspHttpCache = deno_cache_dir::LocalLspHttpCache<CliSys>;
|
2023-08-08 10:23:02 -04:00
|
|
|
pub use deno_cache_dir::HttpCache;
|
|
|
|
|
2024-09-25 21:50:54 -04:00
|
|
|
pub struct FetchCacherOptions {
|
|
|
|
pub file_header_overrides: HashMap<ModuleSpecifier, HashMap<String, String>>,
|
|
|
|
pub permissions: PermissionsContainer,
|
|
|
|
/// If we're publishing for `deno publish`.
|
|
|
|
pub is_deno_publish: bool,
|
|
|
|
}
|
|
|
|
|
2021-10-10 17:26:22 -04:00
|
|
|
/// A "wrapper" for the FileFetcher and DiskCache for the Deno CLI that provides
|
|
|
|
/// a concise interface to the DENO_DIR when building module graphs.
|
2022-03-23 09:54:22 -04:00
|
|
|
pub struct FetchCacher {
|
2024-09-18 15:15:13 -04:00
|
|
|
pub file_header_overrides: HashMap<ModuleSpecifier, HashMap<String, String>>,
|
2024-12-16 18:39:40 -05:00
|
|
|
file_fetcher: Arc<CliFileFetcher>,
|
2023-08-01 20:49:09 -04:00
|
|
|
global_http_cache: Arc<GlobalHttpCache>,
|
2024-11-01 12:27:00 -04:00
|
|
|
in_npm_pkg_checker: Arc<dyn InNpmPackageChecker>,
|
2023-10-25 18:13:22 -04:00
|
|
|
module_info_cache: Arc<ModuleInfoCache>,
|
2024-09-25 21:50:54 -04:00
|
|
|
permissions: PermissionsContainer,
|
2024-12-31 11:29:07 -05:00
|
|
|
sys: CliSys,
|
2024-09-25 21:50:54 -04:00
|
|
|
is_deno_publish: bool,
|
2024-10-14 20:48:39 -04:00
|
|
|
cache_info_enabled: bool,
|
2021-10-10 17:26:22 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
impl FetchCacher {
|
|
|
|
pub fn new(
|
2024-12-16 18:39:40 -05:00
|
|
|
file_fetcher: Arc<CliFileFetcher>,
|
2023-08-01 20:49:09 -04:00
|
|
|
global_http_cache: Arc<GlobalHttpCache>,
|
2024-11-01 12:27:00 -04:00
|
|
|
in_npm_pkg_checker: Arc<dyn InNpmPackageChecker>,
|
2023-10-25 18:13:22 -04:00
|
|
|
module_info_cache: Arc<ModuleInfoCache>,
|
2024-12-31 11:29:07 -05:00
|
|
|
sys: CliSys,
|
2024-09-25 21:50:54 -04:00
|
|
|
options: FetchCacherOptions,
|
2021-10-10 17:26:22 -04:00
|
|
|
) -> Self {
|
|
|
|
Self {
|
|
|
|
file_fetcher,
|
2023-08-01 20:49:09 -04:00
|
|
|
global_http_cache,
|
2024-11-01 12:27:00 -04:00
|
|
|
in_npm_pkg_checker,
|
2023-10-25 18:13:22 -04:00
|
|
|
module_info_cache,
|
2024-12-30 12:38:20 -05:00
|
|
|
sys,
|
2024-09-25 21:50:54 -04:00
|
|
|
file_header_overrides: options.file_header_overrides,
|
|
|
|
permissions: options.permissions,
|
|
|
|
is_deno_publish: options.is_deno_publish,
|
2023-02-08 19:45:04 -05:00
|
|
|
cache_info_enabled: false,
|
2021-10-10 17:26:22 -04:00
|
|
|
}
|
|
|
|
}
|
2023-02-08 19:45:04 -05:00
|
|
|
|
|
|
|
/// The cache information takes a bit of time to fetch and it's
|
|
|
|
/// not always necessary. It should only be enabled for deno info.
|
|
|
|
pub fn enable_loading_cache_info(&mut self) {
|
|
|
|
self.cache_info_enabled = true;
|
|
|
|
}
|
2023-08-01 20:49:09 -04:00
|
|
|
|
2024-09-05 10:22:13 -04:00
|
|
|
/// Only use this for `deno info`.
|
2023-08-01 20:49:09 -04:00
|
|
|
fn get_local_path(&self, specifier: &ModuleSpecifier) -> Option<PathBuf> {
|
|
|
|
// TODO(@kitsonk) fix when deno_graph does not query cache for synthetic
|
|
|
|
// modules
|
|
|
|
if specifier.scheme() == "flags" {
|
|
|
|
None
|
|
|
|
} else if specifier.scheme() == "file" {
|
|
|
|
specifier.to_file_path().ok()
|
|
|
|
} else {
|
|
|
|
#[allow(deprecated)]
|
|
|
|
self
|
|
|
|
.global_http_cache
|
|
|
|
.get_global_cache_filepath(specifier)
|
|
|
|
.ok()
|
|
|
|
}
|
|
|
|
}
|
2021-10-10 17:26:22 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
impl Loader for FetchCacher {
|
|
|
|
fn get_cache_info(&self, specifier: &ModuleSpecifier) -> Option<CacheInfo> {
|
2023-02-08 19:45:04 -05:00
|
|
|
if !self.cache_info_enabled {
|
|
|
|
return None;
|
|
|
|
}
|
|
|
|
|
2023-07-08 16:06:45 -04:00
|
|
|
#[allow(deprecated)]
|
2023-08-01 20:49:09 -04:00
|
|
|
let local = self.get_local_path(specifier)?;
|
2021-10-10 17:26:22 -04:00
|
|
|
if local.is_file() {
|
2024-09-05 10:22:13 -04:00
|
|
|
Some(CacheInfo { local: Some(local) })
|
2021-10-10 17:26:22 -04:00
|
|
|
} else {
|
|
|
|
None
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
fn load(
|
2024-04-18 20:51:16 -04:00
|
|
|
&self,
|
2021-10-10 17:26:22 -04:00
|
|
|
specifier: &ModuleSpecifier,
|
2024-02-15 14:49:35 -05:00
|
|
|
options: deno_graph::source::LoadOptions,
|
2021-10-10 17:26:22 -04:00
|
|
|
) -> LoadFuture {
|
2023-09-07 09:09:16 -04:00
|
|
|
use deno_graph::source::CacheSetting as LoaderCacheSetting;
|
|
|
|
|
2024-11-01 12:27:00 -04:00
|
|
|
if specifier.scheme() == "file"
|
|
|
|
&& specifier.path().contains("/node_modules/")
|
|
|
|
{
|
|
|
|
// The specifier might be in a completely different symlinked tree than
|
|
|
|
// what the node_modules url is in (ex. `/my-project-1/node_modules`
|
|
|
|
// symlinked to `/my-project-2/node_modules`), so first we checked if the path
|
|
|
|
// is in a node_modules dir to avoid needlessly canonicalizing, then now compare
|
|
|
|
// against the canonicalized specifier.
|
2024-12-30 12:38:20 -05:00
|
|
|
let specifier = node_resolver::resolve_specifier_into_node_modules(
|
|
|
|
&self.sys, specifier,
|
2024-11-01 12:27:00 -04:00
|
|
|
);
|
|
|
|
if self.in_npm_pkg_checker.in_npm_package(&specifier) {
|
2023-10-25 14:39:00 -04:00
|
|
|
return Box::pin(futures::future::ready(Ok(Some(
|
2024-11-01 12:27:00 -04:00
|
|
|
LoadResponse::External { specifier },
|
2023-10-25 14:39:00 -04:00
|
|
|
))));
|
2023-02-22 17:21:05 -05:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-09-25 21:50:54 -04:00
|
|
|
if self.is_deno_publish
|
|
|
|
&& matches!(specifier.scheme(), "http" | "https")
|
|
|
|
&& !specifier.as_str().starts_with(jsr_url().as_str())
|
|
|
|
{
|
|
|
|
// mark non-JSR remote modules as external so we don't need --allow-import
|
|
|
|
// permissions as these will error out later when publishing
|
|
|
|
return Box::pin(futures::future::ready(Ok(Some(
|
|
|
|
LoadResponse::External {
|
|
|
|
specifier: specifier.clone(),
|
|
|
|
},
|
|
|
|
))));
|
|
|
|
}
|
|
|
|
|
2021-10-10 17:26:22 -04:00
|
|
|
let file_fetcher = self.file_fetcher.clone();
|
2023-03-22 10:15:53 -04:00
|
|
|
let file_header_overrides = self.file_header_overrides.clone();
|
2023-09-07 09:09:16 -04:00
|
|
|
let permissions = self.permissions.clone();
|
2023-02-22 14:15:25 -05:00
|
|
|
let specifier = specifier.clone();
|
2024-09-25 21:50:54 -04:00
|
|
|
let is_statically_analyzable = !options.was_dynamic_root;
|
2021-10-10 17:26:22 -04:00
|
|
|
|
|
|
|
async move {
|
2024-02-15 14:49:35 -05:00
|
|
|
let maybe_cache_setting = match options.cache_setting {
|
2023-09-07 09:09:16 -04:00
|
|
|
LoaderCacheSetting::Use => None,
|
|
|
|
LoaderCacheSetting::Reload => {
|
|
|
|
if matches!(file_fetcher.cache_setting(), CacheSetting::Only) {
|
|
|
|
return Err(deno_core::anyhow::anyhow!(
|
2024-05-28 14:58:43 -04:00
|
|
|
"Could not resolve version constraint using only cached data. Try running again without --cached-only"
|
2023-09-07 09:09:16 -04:00
|
|
|
));
|
|
|
|
}
|
|
|
|
Some(CacheSetting::ReloadAll)
|
|
|
|
}
|
|
|
|
LoaderCacheSetting::Only => Some(CacheSetting::Only),
|
|
|
|
};
|
2022-01-13 11:58:00 -05:00
|
|
|
file_fetcher
|
2024-12-16 18:39:40 -05:00
|
|
|
.fetch_no_follow(
|
|
|
|
&specifier,
|
|
|
|
FetchPermissionsOptionRef::Restricted(&permissions,
|
|
|
|
if is_statically_analyzable {
|
|
|
|
deno_runtime::deno_permissions::CheckSpecifierKind::Static
|
|
|
|
} else {
|
|
|
|
deno_runtime::deno_permissions::CheckSpecifierKind::Dynamic
|
|
|
|
}),
|
|
|
|
FetchNoFollowOptions {
|
|
|
|
maybe_auth: None,
|
|
|
|
maybe_accept: None,
|
|
|
|
maybe_cache_setting: maybe_cache_setting.as_ref(),
|
2024-04-18 21:43:28 -04:00
|
|
|
maybe_checksum: options.maybe_checksum.as_ref(),
|
2023-09-07 09:09:16 -04:00
|
|
|
})
|
2021-10-10 17:26:22 -04:00
|
|
|
.await
|
2024-04-18 21:43:28 -04:00
|
|
|
.map(|file_or_redirect| {
|
|
|
|
match file_or_redirect {
|
|
|
|
FileOrRedirect::File(file) => {
|
|
|
|
let maybe_headers =
|
|
|
|
match (file.maybe_headers, file_header_overrides.get(&specifier)) {
|
|
|
|
(Some(headers), Some(overrides)) => {
|
|
|
|
Some(headers.into_iter().chain(overrides.clone()).collect())
|
|
|
|
}
|
|
|
|
(Some(headers), None) => Some(headers),
|
|
|
|
(None, Some(overrides)) => Some(overrides.clone()),
|
|
|
|
(None, None) => None,
|
|
|
|
};
|
|
|
|
Ok(Some(LoadResponse::Module {
|
2024-12-16 18:39:40 -05:00
|
|
|
specifier: file.url,
|
2024-04-18 21:43:28 -04:00
|
|
|
maybe_headers,
|
|
|
|
content: file.source,
|
|
|
|
}))
|
|
|
|
},
|
|
|
|
FileOrRedirect::Redirect(redirect_specifier) => {
|
|
|
|
Ok(Some(LoadResponse::Redirect {
|
|
|
|
specifier: redirect_specifier,
|
|
|
|
}))
|
|
|
|
},
|
|
|
|
}
|
2023-03-15 17:46:36 -04:00
|
|
|
})
|
|
|
|
.unwrap_or_else(|err| {
|
2024-12-16 18:39:40 -05:00
|
|
|
let err = err.into_kind();
|
|
|
|
match err {
|
|
|
|
CliFetchNoFollowErrorKind::FetchNoFollow(err) => {
|
|
|
|
let err = err.into_kind();
|
|
|
|
match err {
|
|
|
|
FetchNoFollowErrorKind::NotFound(_) => Ok(None),
|
|
|
|
FetchNoFollowErrorKind::UrlToFilePath { .. } |
|
|
|
|
FetchNoFollowErrorKind::ReadingBlobUrl { .. } |
|
|
|
|
FetchNoFollowErrorKind::ReadingFile { .. } |
|
|
|
|
FetchNoFollowErrorKind::FetchingRemote { .. } |
|
|
|
|
FetchNoFollowErrorKind::ClientError { .. } |
|
|
|
|
FetchNoFollowErrorKind::NoRemote { .. } |
|
|
|
|
FetchNoFollowErrorKind::DataUrlDecode { .. } |
|
|
|
|
FetchNoFollowErrorKind::RedirectResolution { .. } |
|
|
|
|
FetchNoFollowErrorKind::CacheRead { .. } |
|
|
|
|
FetchNoFollowErrorKind::CacheSave { .. } |
|
|
|
|
FetchNoFollowErrorKind::UnsupportedScheme { .. } |
|
|
|
|
FetchNoFollowErrorKind::RedirectHeaderParse { .. } |
|
|
|
|
FetchNoFollowErrorKind::InvalidHeader { .. } => Err(AnyError::from(err)),
|
|
|
|
FetchNoFollowErrorKind::NotCached { .. } => {
|
|
|
|
if options.cache_setting == LoaderCacheSetting::Only {
|
|
|
|
Ok(None)
|
|
|
|
} else {
|
|
|
|
Err(AnyError::from(err))
|
|
|
|
}
|
|
|
|
},
|
|
|
|
FetchNoFollowErrorKind::ChecksumIntegrity(err) => {
|
|
|
|
// convert to the equivalent deno_graph error so that it
|
|
|
|
// enhances it if this is passed to deno_graph
|
|
|
|
Err(
|
|
|
|
deno_graph::source::ChecksumIntegrityError {
|
|
|
|
actual: err.actual,
|
|
|
|
expected: err.expected,
|
|
|
|
}
|
|
|
|
.into(),
|
|
|
|
)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
},
|
|
|
|
CliFetchNoFollowErrorKind::PermissionCheck(permission_check_error) => Err(AnyError::from(permission_check_error)),
|
2023-09-18 10:46:44 -04:00
|
|
|
}
|
2023-03-15 17:46:36 -04:00
|
|
|
})
|
2021-10-10 17:26:22 -04:00
|
|
|
}
|
2024-06-03 17:17:08 -04:00
|
|
|
.boxed_local()
|
2021-10-10 17:26:22 -04:00
|
|
|
}
|
2023-09-07 09:09:16 -04:00
|
|
|
|
|
|
|
fn cache_module_info(
|
2024-04-18 20:51:16 -04:00
|
|
|
&self,
|
2023-09-07 09:09:16 -04:00
|
|
|
specifier: &ModuleSpecifier,
|
2024-09-05 10:22:13 -04:00
|
|
|
media_type: MediaType,
|
2024-01-31 22:15:22 -05:00
|
|
|
source: &Arc<[u8]>,
|
2023-09-07 09:09:16 -04:00
|
|
|
module_info: &deno_graph::ModuleInfo,
|
|
|
|
) {
|
2024-04-29 14:09:58 -04:00
|
|
|
log::debug!("Caching module info for {}", specifier);
|
2025-01-06 18:56:36 -05:00
|
|
|
let source_hash = CacheDBHash::from_hashable(source);
|
2023-10-25 18:13:22 -04:00
|
|
|
let result = self.module_info_cache.set_module_info(
|
2023-09-07 09:09:16 -04:00
|
|
|
specifier,
|
2024-09-05 10:22:13 -04:00
|
|
|
media_type,
|
2024-05-29 14:38:18 -04:00
|
|
|
source_hash,
|
2023-09-07 09:09:16 -04:00
|
|
|
module_info,
|
|
|
|
);
|
|
|
|
if let Err(err) = result {
|
|
|
|
log::debug!(
|
|
|
|
"Error saving module cache info for {}. {:#}",
|
|
|
|
specifier,
|
|
|
|
err
|
|
|
|
);
|
|
|
|
}
|
|
|
|
}
|
2021-10-10 17:26:22 -04:00
|
|
|
}
|