summaryrefslogtreecommitdiff
path: root/runtime/ops/web_worker/sync_fetch.rs
blob: a9a893572d156afd167080480da6d9f9f3044be7 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
// Copyright 2018-2023 the Deno authors. All rights reserved. MIT license.

use crate::web_worker::WebWorkerInternalHandle;
use crate::web_worker::WebWorkerType;
use deno_core::error::type_error;
use deno_core::error::AnyError;
use deno_core::op;
use deno_core::url::Url;
use deno_core::OpState;
use deno_fetch::data_url::DataUrl;
use deno_fetch::reqwest;
use deno_web::BlobStore;
use deno_websocket::DomExceptionNetworkError;
use hyper::body::Bytes;
use serde::Deserialize;
use serde::Serialize;
use tokio::task::JoinHandle;

// TODO(andreubotella) Properly parse the MIME type
/// Extracts a rough "essence" from a MIME type string: everything before the
/// first `;` (i.e. without parameters), with surrounding whitespace trimmed
/// and ASCII letters lowercased.
///
/// No validation is performed; an input without `;` is used in full.
fn mime_type_essence(mime_type: &str) -> String {
  // `split` always yields at least one piece, so the fallback is only there
  // to avoid an `unwrap`.
  mime_type
    .split(';')
    .next()
    .unwrap_or(mime_type)
    .trim()
    .to_ascii_lowercase()
}

/// One fetched classic-worker script, as returned by `op_worker_sync_fetch`.
///
/// (De)serialized with camelCase field names.
#[derive(Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct SyncFetchScript {
  /// Where the script came from: the URL reported by the HTTP response for
  /// `http:`/`https:` scripts, or the requested URL string unchanged for
  /// `data:` and `blob:` scripts.
  url: String,
  /// The script body decoded as UTF-8 with BOM removal.
  script: String,
}

/// Fetches the source text of every URL in `scripts` and blocks the calling
/// thread until all of them have been retrieved.
///
/// The work runs on a freshly spawned OS thread that owns a current-thread
/// tokio runtime; one task is spawned per script and the results are
/// collected in the same order as `scripts`.
///
/// Supported URL schemes are `http`, `https`, `data` and `blob`.
///
/// # Arguments
///
/// * `scripts` - The script URLs to fetch.
/// * `loose_mime_checks` - When `true`, the MIME type check is skipped for
///   `data:` and `blob:` scripts. HTTP(S) responses are always checked.
///   When the check runs, only `application/javascript` and
///   `text/javascript` are accepted.
///
/// # Errors
///
/// Returns the error of the first script (in input order) that failed:
/// an unparsable URL, an unsupported scheme, an HTTP transport or status
/// error, a malformed `data:` URL, an unknown `blob:` URL, a `blob:` URL
/// when no `BlobStore` is available in the op state, or a missing/invalid
/// MIME type.
///
/// # Panics
///
/// Panics if the worker is not a classic worker, or if the fetch thread
/// itself panicked.
#[op]
pub fn op_worker_sync_fetch(
  state: &mut OpState,
  scripts: Vec<String>,
  mut loose_mime_checks: bool,
) -> Result<Vec<SyncFetchScript>, AnyError> {
  let handle = state.borrow::<WebWorkerInternalHandle>().clone();
  assert_eq!(handle.worker_type, WebWorkerType::Classic);

  let client = state.borrow::<reqwest::Client>().clone();

  // The blob store is looked up optimistically: its absence only becomes an
  // error once a script actually uses the `blob:` scheme, so that fetching
  // HTTP(S) or `data:` scripts never fails with a blob-related exception.
  // TODO(andreubotella) In which contexts are blob URLs not supported?
  let blob_store = state.try_borrow::<BlobStore>().cloned();

  // TODO(andreubotella): make the below thread into a resource that can be
  // re-used. This would allow parallel fetching of multiple scripts.

  let thread = std::thread::spawn(move || {
    let runtime = tokio::runtime::Builder::new_current_thread()
      .enable_io()
      .enable_time()
      .build()?;

    let handles: Vec<_> = scripts
      .into_iter()
      .map(|script| -> JoinHandle<Result<SyncFetchScript, AnyError>> {
        let client = client.clone();
        let blob_store = blob_store.clone();
        // `loose_mime_checks` is `Copy`, so every task gets its own copy and
        // the override in the HTTP(S) arm does not leak into other scripts.
        runtime.spawn(async move {
          let script_url = Url::parse(&script)
            .map_err(|_| type_error("Invalid script URL"))?;

          let (body, mime_type, res_url) = match script_url.scheme() {
            "http" | "https" => {
              let resp =
                client.get(script_url).send().await?.error_for_status()?;

              let res_url = resp.url().to_string();

              // TODO(andreubotella) Properly run fetch's "extract a MIME type".
              let mime_type = resp
                .headers()
                .get("Content-Type")
                .and_then(|v| v.to_str().ok())
                .map(mime_type_essence);

              // Always check the MIME type with HTTP(S).
              loose_mime_checks = false;

              let body = resp.bytes().await?;

              (body, mime_type, res_url)
            }
            "data" => {
              let data_url = DataUrl::process(&script)
                .map_err(|e| type_error(format!("{:?}", e)))?;

              let mime_type = {
                let mime = data_url.mime_type();
                format!("{}/{}", mime.type_, mime.subtype)
              };

              let (body, _) = data_url
                .decode_to_vec()
                .map_err(|e| type_error(format!("{:?}", e)))?;

              (Bytes::from(body), Some(mime_type), script)
            }
            "blob" => {
              // Only now does a missing blob store matter.
              let blob_store = blob_store.ok_or_else(|| {
                type_error("Blob URLs are not supported in this context.")
              })?;

              let blob =
                blob_store.get_object_url(script_url).ok_or_else(|| {
                  type_error("Blob for the given URL not found.")
                })?;

              let mime_type = mime_type_essence(&blob.media_type);

              let body = blob.read_all().await?;

              (Bytes::from(body), Some(mime_type), script)
            }
            _ => {
              return Err(type_error(format!(
                "Classic scripts with scheme {}: are not supported in workers.",
                script_url.scheme()
              )))
            }
          };

          if !loose_mime_checks {
            // TODO(andreubotella) Check properly for a Javascript MIME type.
            match mime_type.as_deref() {
              Some("application/javascript" | "text/javascript") => {}
              Some(mime_type) => {
                return Err(
                  DomExceptionNetworkError {
                    msg: format!("Invalid MIME type {:?}.", mime_type),
                  }
                  .into(),
                )
              }
              None => {
                return Err(
                  DomExceptionNetworkError::new("Missing MIME type.").into(),
                )
              }
            }
          }

          let (text, _) = encoding_rs::UTF_8.decode_with_bom_removal(&body);

          Ok(SyncFetchScript {
            url: res_url,
            script: text.into_owned(),
          })
        })
      })
      .collect();

    // Drive the tasks to completion in input order. The first `?` surfaces a
    // task join error, the second the script's own fetch error.
    let mut ret = Vec::with_capacity(handles.len());
    for handle in handles {
      let script = runtime.block_on(handle)??;
      ret.push(script);
    }
    Ok(ret)
  });

  // Blocks the calling thread until the fetch thread finishes; a panic on
  // that thread is propagated as a panic here.
  thread.join().unwrap()
}