summaryrefslogtreecommitdiff
path: root/core/modules/mod.rs
diff options
context:
space:
mode:
Diffstat (limited to 'core/modules/mod.rs')
-rw-r--r--core/modules/mod.rs689
1 files changed, 689 insertions, 0 deletions
diff --git a/core/modules/mod.rs b/core/modules/mod.rs
new file mode 100644
index 000000000..83f10bc72
--- /dev/null
+++ b/core/modules/mod.rs
@@ -0,0 +1,689 @@
+// Copyright 2018-2023 the Deno authors. All rights reserved. MIT license.
+use crate::error::generic_error;
+use crate::fast_string::FastString;
+use crate::module_specifier::ModuleSpecifier;
+use crate::resolve_url;
+use anyhow::Error;
+use futures::future::FutureExt;
+use futures::stream::FuturesUnordered;
+use futures::stream::Stream;
+use futures::stream::TryStreamExt;
+use log::debug;
+use serde::Deserialize;
+use serde::Serialize;
+use std::cell::RefCell;
+use std::collections::HashMap;
+use std::collections::HashSet;
+use std::collections::VecDeque;
+use std::future::Future;
+use std::pin::Pin;
+use std::rc::Rc;
+use std::task::Context;
+use std::task::Poll;
+
+mod loaders;
+mod map;
+
+#[cfg(test)]
+mod tests;
+
+pub(crate) use loaders::ExtModuleLoader;
+pub use loaders::ExtModuleLoaderCb;
+pub use loaders::FsModuleLoader;
+pub use loaders::ModuleLoader;
+pub use loaders::NoopModuleLoader;
+pub(crate) use map::ModuleMap;
+#[cfg(test)]
+pub(crate) use map::SymbolicModule;
+
+pub type ModuleId = usize;
+pub(crate) type ModuleLoadId = i32;
+pub type ModuleCode = FastString;
+pub type ModuleName = FastString;
+
+const SUPPORTED_TYPE_ASSERTIONS: &[&str] = &["json"];
+
+/// Throws V8 exception if assertions are invalid
+pub(crate) fn validate_import_assertions(
+ scope: &mut v8::HandleScope,
+ assertions: &HashMap<String, String>,
+) {
+ for (key, value) in assertions {
+ if key == "type" && !SUPPORTED_TYPE_ASSERTIONS.contains(&value.as_str()) {
+ let message = v8::String::new(
+ scope,
+ &format!("\"{value}\" is not a valid module type."),
+ )
+ .unwrap();
+ let exception = v8::Exception::type_error(scope, message);
+ scope.throw_exception(exception);
+ return;
+ }
+ }
+}
+
+#[derive(Debug)]
+pub(crate) enum ImportAssertionsKind {
+ StaticImport,
+ DynamicImport,
+}
+
+pub(crate) fn parse_import_assertions(
+ scope: &mut v8::HandleScope,
+ import_assertions: v8::Local<v8::FixedArray>,
+ kind: ImportAssertionsKind,
+) -> HashMap<String, String> {
+ let mut assertions: HashMap<String, String> = HashMap::default();
+
+ let assertions_per_line = match kind {
+ // For static imports, assertions are triples of (keyword, value and source offset)
+ // Also used in `module_resolve_callback`.
+ ImportAssertionsKind::StaticImport => 3,
+ // For dynamic imports, assertions are tuples of (keyword, value)
+ ImportAssertionsKind::DynamicImport => 2,
+ };
+ assert_eq!(import_assertions.length() % assertions_per_line, 0);
+ let no_of_assertions = import_assertions.length() / assertions_per_line;
+
+ for i in 0..no_of_assertions {
+ let assert_key = import_assertions
+ .get(scope, assertions_per_line * i)
+ .unwrap();
+ let assert_key_val = v8::Local::<v8::Value>::try_from(assert_key).unwrap();
+ let assert_value = import_assertions
+ .get(scope, (assertions_per_line * i) + 1)
+ .unwrap();
+ let assert_value_val =
+ v8::Local::<v8::Value>::try_from(assert_value).unwrap();
+ assertions.insert(
+ assert_key_val.to_rust_string_lossy(scope),
+ assert_value_val.to_rust_string_lossy(scope),
+ );
+ }
+
+ assertions
+}
+
+pub(crate) fn get_asserted_module_type_from_assertions(
+ assertions: &HashMap<String, String>,
+) -> AssertedModuleType {
+ assertions
+ .get("type")
+ .map(|ty| {
+ if ty == "json" {
+ AssertedModuleType::Json
+ } else {
+ AssertedModuleType::JavaScriptOrWasm
+ }
+ })
+ .unwrap_or(AssertedModuleType::JavaScriptOrWasm)
+}
+
+/// A type of module to be executed.
+///
+/// For non-`JavaScript` modules, this value doesn't tell
+/// how to interpret the module; it is only used to validate
+/// the module against an import assertion (if one is present
+/// in the import statement).
+#[derive(Clone, Copy, Debug, Eq, Hash, PartialEq, Serialize, Deserialize)]
+#[repr(u32)]
+pub enum ModuleType {
+ JavaScript,
+ Json,
+}
+
+impl std::fmt::Display for ModuleType {
+ fn fmt(&self, f: &mut std::fmt::Formatter) -> std::fmt::Result {
+ match self {
+ Self::JavaScript => write!(f, "JavaScript"),
+ Self::Json => write!(f, "JSON"),
+ }
+ }
+}
+
+/// EsModule source code that will be loaded into V8.
+///
+/// Users can implement `Into<ModuleInfo>` for different file types that
+/// can be transpiled to valid EsModule.
+///
+/// Found module URL might be different from specified URL
+/// used for loading due to redirections (like HTTP 303).
+/// Eg. Both "`https://example.com/a.ts`" and
+/// "`https://example.com/b.ts`" may point to "`https://example.com/c.ts`"
+/// By keeping track of specified and found URL we can alias modules and avoid
+/// recompiling the same code 3 times.
+// TODO(bartlomieju): I have a strong opinion we should store all redirects
+// that happened; not only first and final target. It would simplify a lot
+// of things throughout the codebase otherwise we may end up requesting
+// intermediate redirects from file loader.
+// NOTE: This should _not_ be made #[derive(Clone)] unless we take some precautions to avoid excessive string copying.
+#[derive(Debug)]
+pub struct ModuleSource {
+ pub code: ModuleCode,
+ pub module_type: ModuleType,
+ module_url_specified: ModuleName,
+ /// If the module was found somewhere other than the specified address, this will be [`Some`].
+ module_url_found: Option<ModuleName>,
+}
+
+impl ModuleSource {
+ /// Create a [`ModuleSource`] without a redirect.
+ pub fn new(
+ module_type: impl Into<ModuleType>,
+ code: ModuleCode,
+ specifier: &ModuleSpecifier,
+ ) -> Self {
+ let module_url_specified = specifier.as_ref().to_owned().into();
+ Self {
+ code,
+ module_type: module_type.into(),
+ module_url_specified,
+ module_url_found: None,
+ }
+ }
+
+ /// Create a [`ModuleSource`] with a potential redirect. If the `specifier_found` parameter is the same as the
+ /// specifier, the code behaves the same was as `ModuleSource::new`.
+ pub fn new_with_redirect(
+ module_type: impl Into<ModuleType>,
+ code: ModuleCode,
+ specifier: &ModuleSpecifier,
+ specifier_found: &ModuleSpecifier,
+ ) -> Self {
+ let module_url_found = if specifier == specifier_found {
+ None
+ } else {
+ Some(specifier_found.as_ref().to_owned().into())
+ };
+ let module_url_specified = specifier.as_ref().to_owned().into();
+ Self {
+ code,
+ module_type: module_type.into(),
+ module_url_specified,
+ module_url_found,
+ }
+ }
+
+ #[cfg(test)]
+ pub fn for_test(code: &'static str, file: impl AsRef<str>) -> Self {
+ Self {
+ code: ModuleCode::from_static(code),
+ module_type: ModuleType::JavaScript,
+ module_url_specified: file.as_ref().to_owned().into(),
+ module_url_found: None,
+ }
+ }
+
+ /// If the `found` parameter is the same as the `specified` parameter, the code behaves the same was as `ModuleSource::for_test`.
+ #[cfg(test)]
+ pub fn for_test_with_redirect(
+ code: &'static str,
+ specified: impl AsRef<str>,
+ found: impl AsRef<str>,
+ ) -> Self {
+ let specified = specified.as_ref().to_string();
+ let found = found.as_ref().to_string();
+ let found = if found == specified {
+ None
+ } else {
+ Some(found.into())
+ };
+ Self {
+ code: ModuleCode::from_static(code),
+ module_type: ModuleType::JavaScript,
+ module_url_specified: specified.into(),
+ module_url_found: found,
+ }
+ }
+}
+
+pub(crate) type PrepareLoadFuture =
+ dyn Future<Output = (ModuleLoadId, Result<RecursiveModuleLoad, Error>)>;
+pub type ModuleSourceFuture = dyn Future<Output = Result<ModuleSource, Error>>;
+
+type ModuleLoadFuture =
+ dyn Future<Output = Result<(ModuleRequest, ModuleSource), Error>>;
+
+#[derive(Debug, PartialEq, Eq)]
+pub enum ResolutionKind {
+ /// This kind is used in only one situation: when a module is loaded via
+ /// `JsRuntime::load_main_module` and is the top-level module, ie. the one
+ /// passed as an argument to `JsRuntime::load_main_module`.
+ MainModule,
+ /// This kind is returned for all other modules during module load, that are
+ /// static imports.
+ Import,
+ /// This kind is returned for all modules that are loaded as a result of a
+ /// call to `import()` API (ie. top-level module as well as all its
+ /// dependencies, and any other `import()` calls from that load).
+ DynamicImport,
+}
+
+/// Describes the entrypoint of a recursive module load.
+#[derive(Debug)]
+enum LoadInit {
+ /// Main module specifier.
+ Main(String),
+ /// Module specifier for side module.
+ Side(String),
+ /// Dynamic import specifier with referrer and expected
+ /// module type (which is determined by import assertion).
+ DynamicImport(String, String, AssertedModuleType),
+}
+
+#[derive(Debug, Eq, PartialEq)]
+pub enum LoadState {
+ Init,
+ LoadingRoot,
+ LoadingImports,
+ Done,
+}
+
+/// This future is used to implement parallel async module loading.
+pub(crate) struct RecursiveModuleLoad {
+ pub id: ModuleLoadId,
+ pub root_module_id: Option<ModuleId>,
+ init: LoadInit,
+ root_asserted_module_type: Option<AssertedModuleType>,
+ root_module_type: Option<ModuleType>,
+ state: LoadState,
+ module_map_rc: Rc<RefCell<ModuleMap>>,
+ pending: FuturesUnordered<Pin<Box<ModuleLoadFuture>>>,
+ visited: HashSet<ModuleRequest>,
+ // The loader is copied from `module_map_rc`, but its reference is cloned
+ // ahead of time to avoid already-borrowed errors.
+ loader: Rc<dyn ModuleLoader>,
+}
+
+impl RecursiveModuleLoad {
+ /// Starts a new asynchronous load of the module graph for given specifier.
+ ///
+ /// The module corresponding for the given `specifier` will be marked as
+ // "the main module" (`import.meta.main` will return `true` for this module).
+ fn main(specifier: &str, module_map_rc: Rc<RefCell<ModuleMap>>) -> Self {
+ Self::new(LoadInit::Main(specifier.to_string()), module_map_rc)
+ }
+
+ /// Starts a new asynchronous load of the module graph for given specifier.
+ fn side(specifier: &str, module_map_rc: Rc<RefCell<ModuleMap>>) -> Self {
+ Self::new(LoadInit::Side(specifier.to_string()), module_map_rc)
+ }
+
+ /// Starts a new asynchronous load of the module graph for given specifier
+ /// that was imported using `import()`.
+ fn dynamic_import(
+ specifier: &str,
+ referrer: &str,
+ asserted_module_type: AssertedModuleType,
+ module_map_rc: Rc<RefCell<ModuleMap>>,
+ ) -> Self {
+ Self::new(
+ LoadInit::DynamicImport(
+ specifier.to_string(),
+ referrer.to_string(),
+ asserted_module_type,
+ ),
+ module_map_rc,
+ )
+ }
+
+ fn new(init: LoadInit, module_map_rc: Rc<RefCell<ModuleMap>>) -> Self {
+ let id = {
+ let mut module_map = module_map_rc.borrow_mut();
+ let id = module_map.next_load_id;
+ module_map.next_load_id += 1;
+ id
+ };
+ let loader = module_map_rc.borrow().loader.clone();
+ let asserted_module_type = match init {
+ LoadInit::DynamicImport(_, _, module_type) => module_type,
+ _ => AssertedModuleType::JavaScriptOrWasm,
+ };
+ let mut load = Self {
+ id,
+ root_module_id: None,
+ root_asserted_module_type: None,
+ root_module_type: None,
+ init,
+ state: LoadState::Init,
+ module_map_rc: module_map_rc.clone(),
+ loader,
+ pending: FuturesUnordered::new(),
+ visited: HashSet::new(),
+ };
+ // FIXME(bartlomieju): this seems fishy
+ // Ignore the error here, let it be hit in `Stream::poll_next()`.
+ if let Ok(root_specifier) = load.resolve_root() {
+ if let Some(module_id) = module_map_rc
+ .borrow()
+ .get_id(root_specifier, asserted_module_type)
+ {
+ load.root_module_id = Some(module_id);
+ load.root_asserted_module_type = Some(asserted_module_type);
+ load.root_module_type = Some(
+ module_map_rc
+ .borrow()
+ .get_info_by_id(module_id)
+ .unwrap()
+ .module_type,
+ );
+ }
+ }
+ load
+ }
+
+ fn resolve_root(&self) -> Result<ModuleSpecifier, Error> {
+ match self.init {
+ LoadInit::Main(ref specifier) => {
+ self
+ .loader
+ .resolve(specifier, ".", ResolutionKind::MainModule)
+ }
+ LoadInit::Side(ref specifier) => {
+ self.loader.resolve(specifier, ".", ResolutionKind::Import)
+ }
+ LoadInit::DynamicImport(ref specifier, ref referrer, _) => self
+ .loader
+ .resolve(specifier, referrer, ResolutionKind::DynamicImport),
+ }
+ }
+
+ async fn prepare(&self) -> Result<(), Error> {
+ let (module_specifier, maybe_referrer) = match self.init {
+ LoadInit::Main(ref specifier) => {
+ let spec =
+ self
+ .loader
+ .resolve(specifier, ".", ResolutionKind::MainModule)?;
+ (spec, None)
+ }
+ LoadInit::Side(ref specifier) => {
+ let spec =
+ self
+ .loader
+ .resolve(specifier, ".", ResolutionKind::Import)?;
+ (spec, None)
+ }
+ LoadInit::DynamicImport(ref specifier, ref referrer, _) => {
+ let spec = self.loader.resolve(
+ specifier,
+ referrer,
+ ResolutionKind::DynamicImport,
+ )?;
+ (spec, Some(referrer.to_string()))
+ }
+ };
+
+ self
+ .loader
+ .prepare_load(&module_specifier, maybe_referrer, self.is_dynamic_import())
+ .await
+ }
+
+ fn is_currently_loading_main_module(&self) -> bool {
+ !self.is_dynamic_import()
+ && matches!(self.init, LoadInit::Main(..))
+ && self.state == LoadState::LoadingRoot
+ }
+
+ fn is_dynamic_import(&self) -> bool {
+ matches!(self.init, LoadInit::DynamicImport(..))
+ }
+
+ pub(crate) fn register_and_recurse(
+ &mut self,
+ scope: &mut v8::HandleScope,
+ module_request: &ModuleRequest,
+ module_source: ModuleSource,
+ ) -> Result<(), ModuleError> {
+ let expected_asserted_module_type = module_source.module_type.into();
+ let module_url_found = module_source.module_url_found;
+ let module_url_specified = module_source.module_url_specified;
+
+ if module_request.asserted_module_type != expected_asserted_module_type {
+ return Err(ModuleError::Other(generic_error(format!(
+ "Expected a \"{}\" module but loaded a \"{}\" module.",
+ module_request.asserted_module_type, module_source.module_type,
+ ))));
+ }
+
+ // Register the module in the module map unless it's already there. If the
+ // specified URL and the "true" URL are different, register the alias.
+ let module_url_found = if let Some(module_url_found) = module_url_found {
+ let (module_url_found1, module_url_found2) =
+ module_url_found.into_cheap_copy();
+ self.module_map_rc.borrow_mut().alias(
+ module_url_specified,
+ expected_asserted_module_type,
+ module_url_found1,
+ );
+ module_url_found2
+ } else {
+ module_url_specified
+ };
+
+ let maybe_module_id = self
+ .module_map_rc
+ .borrow()
+ .get_id(&module_url_found, expected_asserted_module_type);
+ let module_id = match maybe_module_id {
+ Some(id) => {
+ debug!(
+ "Already-registered module fetched again: {:?}",
+ module_url_found
+ );
+ id
+ }
+ None => match module_source.module_type {
+ ModuleType::JavaScript => {
+ self.module_map_rc.borrow_mut().new_es_module(
+ scope,
+ self.is_currently_loading_main_module(),
+ module_url_found,
+ module_source.code,
+ self.is_dynamic_import(),
+ )?
+ }
+ ModuleType::Json => self.module_map_rc.borrow_mut().new_json_module(
+ scope,
+ module_url_found,
+ module_source.code,
+ )?,
+ },
+ };
+
+ // Recurse the module's imports. There are two cases for each import:
+ // 1. If the module is not in the module map, start a new load for it in
+ // `self.pending`. The result of that load should eventually be passed to
+ // this function for recursion.
+ // 2. If the module is already in the module map, queue it up to be
+ // recursed synchronously here.
+ // This robustly ensures that the whole graph is in the module map before
+ // `LoadState::Done` is set.
+ let mut already_registered = VecDeque::new();
+ already_registered.push_back((module_id, module_request.clone()));
+ self.visited.insert(module_request.clone());
+ while let Some((module_id, module_request)) = already_registered.pop_front()
+ {
+ let referrer = ModuleSpecifier::parse(&module_request.specifier).unwrap();
+ let imports = self
+ .module_map_rc
+ .borrow()
+ .get_requested_modules(module_id)
+ .unwrap()
+ .clone();
+ for module_request in imports {
+ if !self.visited.contains(&module_request) {
+ if let Some(module_id) = self.module_map_rc.borrow().get_id(
+ module_request.specifier.as_str(),
+ module_request.asserted_module_type,
+ ) {
+ already_registered.push_back((module_id, module_request.clone()));
+ } else {
+ let request = module_request.clone();
+ let specifier =
+ ModuleSpecifier::parse(&module_request.specifier).unwrap();
+ let referrer = referrer.clone();
+ let loader = self.loader.clone();
+ let is_dynamic_import = self.is_dynamic_import();
+ let fut = async move {
+ let load_result = loader
+ .load(&specifier, Some(&referrer), is_dynamic_import)
+ .await;
+ load_result.map(|s| (request, s))
+ };
+ self.pending.push(fut.boxed_local());
+ }
+ self.visited.insert(module_request);
+ }
+ }
+ }
+
+ // Update `self.state` however applicable.
+ if self.state == LoadState::LoadingRoot {
+ self.root_module_id = Some(module_id);
+ self.root_asserted_module_type = Some(module_source.module_type.into());
+ self.state = LoadState::LoadingImports;
+ }
+ if self.pending.is_empty() {
+ self.state = LoadState::Done;
+ }
+
+ Ok(())
+ }
+}
+
+impl Stream for RecursiveModuleLoad {
+ type Item = Result<(ModuleRequest, ModuleSource), Error>;
+
+ fn poll_next(
+ self: Pin<&mut Self>,
+ cx: &mut Context,
+ ) -> Poll<Option<Self::Item>> {
+ let inner = self.get_mut();
+ // IMPORTANT: Do not borrow `inner.module_map_rc` here. It may not be
+ // available.
+ match inner.state {
+ LoadState::Init => {
+ let module_specifier = match inner.resolve_root() {
+ Ok(url) => url,
+ Err(error) => return Poll::Ready(Some(Err(error))),
+ };
+ let load_fut = if let Some(_module_id) = inner.root_module_id {
+ // FIXME(bartlomieju): this is very bad
+ // The root module is already in the module map.
+ // TODO(nayeemrmn): In this case we would ideally skip to
+ // `LoadState::LoadingImports` and synchronously recurse the imports
+ // like the bottom of `RecursiveModuleLoad::register_and_recurse()`.
+ // But the module map cannot be borrowed here. Instead fake a load
+ // event so it gets passed to that function and recursed eventually.
+ let asserted_module_type = inner.root_asserted_module_type.unwrap();
+ let module_type = inner.root_module_type.unwrap();
+ let module_request = ModuleRequest {
+ specifier: module_specifier.to_string(),
+ asserted_module_type,
+ };
+ // The code will be discarded, since this module is already in the
+ // module map.
+ let module_source = ModuleSource::new(
+ module_type,
+ Default::default(),
+ &module_specifier,
+ );
+ futures::future::ok((module_request, module_source)).boxed()
+ } else {
+ let maybe_referrer = match inner.init {
+ LoadInit::DynamicImport(_, ref referrer, _) => {
+ resolve_url(referrer).ok()
+ }
+ _ => None,
+ };
+ let asserted_module_type = match inner.init {
+ LoadInit::DynamicImport(_, _, module_type) => module_type,
+ _ => AssertedModuleType::JavaScriptOrWasm,
+ };
+ let module_request = ModuleRequest {
+ specifier: module_specifier.to_string(),
+ asserted_module_type,
+ };
+ let loader = inner.loader.clone();
+ let is_dynamic_import = inner.is_dynamic_import();
+ async move {
+ let result = loader
+ .load(
+ &module_specifier,
+ maybe_referrer.as_ref(),
+ is_dynamic_import,
+ )
+ .await;
+ result.map(|s| (module_request, s))
+ }
+ .boxed_local()
+ };
+ inner.pending.push(load_fut);
+ inner.state = LoadState::LoadingRoot;
+ inner.try_poll_next_unpin(cx)
+ }
+ LoadState::LoadingRoot | LoadState::LoadingImports => {
+ match inner.pending.try_poll_next_unpin(cx)? {
+ Poll::Ready(None) => unreachable!(),
+ Poll::Ready(Some(info)) => Poll::Ready(Some(Ok(info))),
+ Poll::Pending => Poll::Pending,
+ }
+ }
+ LoadState::Done => Poll::Ready(None),
+ }
+ }
+}
+
+#[derive(Clone, Copy, Debug, Eq, Hash, PartialEq, Serialize, Deserialize)]
+#[repr(u32)]
+pub(crate) enum AssertedModuleType {
+ JavaScriptOrWasm,
+ Json,
+}
+
+impl From<ModuleType> for AssertedModuleType {
+ fn from(module_type: ModuleType) -> AssertedModuleType {
+ match module_type {
+ ModuleType::JavaScript => AssertedModuleType::JavaScriptOrWasm,
+ ModuleType::Json => AssertedModuleType::Json,
+ }
+ }
+}
+
+impl std::fmt::Display for AssertedModuleType {
+ fn fmt(&self, f: &mut std::fmt::Formatter) -> std::fmt::Result {
+ match self {
+ Self::JavaScriptOrWasm => write!(f, "JavaScriptOrWasm"),
+ Self::Json => write!(f, "JSON"),
+ }
+ }
+}
+
+/// Describes a request for a module as parsed from the source code.
+/// Usually executable (`JavaScriptOrWasm`) is used, except when an
+/// import assertions explicitly constrains an import to JSON, in
+/// which case this will have a `AssertedModuleType::Json`.
+#[derive(Clone, Debug, Eq, Hash, PartialEq, Serialize, Deserialize)]
+pub(crate) struct ModuleRequest {
+ pub specifier: String,
+ pub asserted_module_type: AssertedModuleType,
+}
+
+#[derive(Debug, PartialEq)]
+pub(crate) struct ModuleInfo {
+ #[allow(unused)]
+ pub id: ModuleId,
+ // Used in "bindings.rs" for "import.meta.main" property value.
+ pub main: bool,
+ pub name: ModuleName,
+ pub requests: Vec<ModuleRequest>,
+ pub module_type: ModuleType,
+}
+
+#[derive(Debug)]
+pub(crate) enum ModuleError {
+ Exception(v8::Global<v8::Value>),
+ Other(Error),
+}