Blob.cpp 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379
  1. /*
  2. * Copyright (c) 2022-2023, Kenneth Myhra <kennethmyhra@serenityos.org>
  3. * Copyright (c) 2023, Shannon Booth <shannon@serenityos.org>
  4. *
  5. * SPDX-License-Identifier: BSD-2-Clause
  6. */
  7. #include <AK/GenericLexer.h>
  8. #include <LibJS/Runtime/ArrayBuffer.h>
  9. #include <LibJS/Runtime/Completion.h>
  10. #include <LibJS/Runtime/TypedArray.h>
  11. #include <LibTextCodec/Decoder.h>
  12. #include <LibWeb/Bindings/BlobPrototype.h>
  13. #include <LibWeb/Bindings/ExceptionOrUtils.h>
  14. #include <LibWeb/Bindings/Intrinsics.h>
  15. #include <LibWeb/FileAPI/Blob.h>
  16. #include <LibWeb/HTML/Scripting/TemporaryExecutionContext.h>
  17. #include <LibWeb/Infra/Strings.h>
  18. #include <LibWeb/Streams/AbstractOperations.h>
  19. #include <LibWeb/Streams/ReadableStreamDefaultReader.h>
  20. #include <LibWeb/WebIDL/AbstractOperations.h>
  21. namespace Web::FileAPI {
  22. WebIDL::ExceptionOr<JS::NonnullGCPtr<Blob>> Blob::create(JS::Realm& realm, ByteBuffer byte_buffer, String type)
  23. {
  24. return MUST_OR_THROW_OOM(realm.heap().allocate<Blob>(realm, realm, move(byte_buffer), move(type)));
  25. }
  26. // https://w3c.github.io/FileAPI/#convert-line-endings-to-native
  27. ErrorOr<String> convert_line_endings_to_native(StringView string)
  28. {
  29. // 1. Let native line ending be be the code point U+000A LF.
  30. auto native_line_ending = "\n"sv;
  31. // 2. If the underlying platform’s conventions are to represent newlines as a carriage return and line feed sequence, set native line ending to the code point U+000D CR followed by the code point U+000A LF.
  32. // NOTE: this step is a no-op since LibWeb does not compile on Windows, which is the only platform we know of that that uses a carriage return and line feed sequence for line endings.
  33. // 3. Set result to the empty string.
  34. StringBuilder result;
  35. // 4. Let position be a position variable for s, initially pointing at the start of s.
  36. auto lexer = GenericLexer { string };
  37. // 5. Let token be the result of collecting a sequence of code points that are not equal to U+000A LF or U+000D CR from s given position.
  38. // 6. Append token to result.
  39. TRY(result.try_append(lexer.consume_until(is_any_of("\n\r"sv))));
  40. // 7. While position is not past the end of s:
  41. while (!lexer.is_eof()) {
  42. // 1. If the code point at position within s equals U+000D CR:
  43. if (lexer.peek() == '\r') {
  44. // 1. Append native line ending to result.
  45. TRY(result.try_append(native_line_ending));
  46. // 2. Advance position by 1.
  47. lexer.ignore(1);
  48. // 3. If position is not past the end of s and the code point at position within s equals U+000A LF advance position by 1.
  49. if (!lexer.is_eof() && lexer.peek() == '\n')
  50. lexer.ignore(1);
  51. }
  52. // 2. Otherwise if the code point at position within s equals U+000A LF, advance position by 1 and append native line ending to result.
  53. else if (lexer.peek() == '\n') {
  54. lexer.ignore(1);
  55. TRY(result.try_append(native_line_ending));
  56. }
  57. // 3. Let token be the result of collecting a sequence of code points that are not equal to U+000A LF or U+000D CR from s given position.
  58. // 4. Append token to result.
  59. TRY(result.try_append(lexer.consume_until(is_any_of("\n\r"sv))));
  60. }
  61. // 5. Return result.
  62. return result.to_string();
  63. }
  64. // https://w3c.github.io/FileAPI/#process-blob-parts
  65. ErrorOr<ByteBuffer> process_blob_parts(Vector<BlobPart> const& blob_parts, Optional<BlobPropertyBag> const& options)
  66. {
  67. // 1. Let bytes be an empty sequence of bytes.
  68. ByteBuffer bytes {};
  69. // 2. For each element in parts:
  70. for (auto const& blob_part : blob_parts) {
  71. TRY(blob_part.visit(
  72. // 1. If element is a USVString, run the following sub-steps:
  73. [&](String const& string) -> ErrorOr<void> {
  74. // 1. Let s be element.
  75. auto s = string;
  76. // 2. If the endings member of options is "native", set s to the result of converting line endings to native of element.
  77. if (options.has_value() && options->endings == Bindings::EndingType::Native)
  78. s = TRY(convert_line_endings_to_native(s));
  79. // NOTE: The AK::String is always UTF-8.
  80. // 3. Append the result of UTF-8 encoding s to bytes.
  81. return bytes.try_append(s.bytes());
  82. },
  83. // 2. If element is a BufferSource, get a copy of the bytes held by the buffer source, and append those bytes to bytes.
  84. [&](JS::Handle<JS::Object> const& buffer_source) -> ErrorOr<void> {
  85. auto data_buffer = TRY(WebIDL::get_buffer_source_copy(*buffer_source.cell()));
  86. return bytes.try_append(data_buffer.bytes());
  87. },
  88. // 3. If element is a Blob, append the bytes it represents to bytes.
  89. [&](JS::Handle<Blob> const& blob) -> ErrorOr<void> {
  90. return bytes.try_append(blob->bytes());
  91. }));
  92. }
  93. // 3. Return bytes.
  94. return bytes;
  95. }
  96. bool is_basic_latin(StringView view)
  97. {
  98. for (auto code_point : view) {
  99. if (code_point < 0x0020 || code_point > 0x007E)
  100. return false;
  101. }
  102. return true;
  103. }
  104. Blob::Blob(JS::Realm& realm)
  105. : PlatformObject(realm)
  106. {
  107. }
  108. Blob::Blob(JS::Realm& realm, ByteBuffer byte_buffer, String type)
  109. : PlatformObject(realm)
  110. , m_byte_buffer(move(byte_buffer))
  111. , m_type(move(type))
  112. {
  113. }
  114. Blob::Blob(JS::Realm& realm, ByteBuffer byte_buffer)
  115. : PlatformObject(realm)
  116. , m_byte_buffer(move(byte_buffer))
  117. {
  118. }
  // Defaulted destructor: no custom teardown is performed beyond destroying the members.
  Blob::~Blob() = default;
  120. JS::ThrowCompletionOr<void> Blob::initialize(JS::Realm& realm)
  121. {
  122. MUST_OR_THROW_OOM(Base::initialize(realm));
  123. set_prototype(&Bindings::ensure_web_prototype<Bindings::BlobPrototype>(realm, "Blob"));
  124. return {};
  125. }
  126. // https://w3c.github.io/FileAPI/#ref-for-dom-blob-blob
  127. WebIDL::ExceptionOr<JS::NonnullGCPtr<Blob>> Blob::create(JS::Realm& realm, Optional<Vector<BlobPart>> const& blob_parts, Optional<BlobPropertyBag> const& options)
  128. {
  129. auto& vm = realm.vm();
  130. // 1. If invoked with zero parameters, return a new Blob object consisting of 0 bytes, with size set to 0, and with type set to the empty string.
  131. if (!blob_parts.has_value() && !options.has_value())
  132. return MUST_OR_THROW_OOM(realm.heap().allocate<Blob>(realm, realm));
  133. ByteBuffer byte_buffer {};
  134. // 2. Let bytes be the result of processing blob parts given blobParts and options.
  135. if (blob_parts.has_value()) {
  136. byte_buffer = TRY_OR_THROW_OOM(realm.vm(), process_blob_parts(blob_parts.value(), options));
  137. }
  138. auto type = String {};
  139. // 3. If the type member of the options argument is not the empty string, run the following sub-steps:
  140. if (options.has_value() && !options->type.is_empty()) {
  141. // 1. If the type member is provided and is not the empty string, let t be set to the type dictionary member.
  142. // If t contains any characters outside the range U+0020 to U+007E, then set t to the empty string and return from these substeps.
  143. // NOTE: t is set to empty string at declaration.
  144. if (!options->type.is_empty()) {
  145. if (is_basic_latin(options->type))
  146. type = options->type;
  147. }
  148. // 2. Convert every character in t to ASCII lowercase.
  149. if (!type.is_empty())
  150. type = TRY_OR_THROW_OOM(vm, Infra::to_ascii_lowercase(type));
  151. }
  152. // 4. Return a Blob object referring to bytes as its associated byte sequence, with its size set to the length of bytes, and its type set to the value of t from the substeps above.
  153. return MUST_OR_THROW_OOM(realm.heap().allocate<Blob>(realm, realm, move(byte_buffer), move(type)));
  154. }
  155. WebIDL::ExceptionOr<JS::NonnullGCPtr<Blob>> Blob::construct_impl(JS::Realm& realm, Optional<Vector<BlobPart>> const& blob_parts, Optional<BlobPropertyBag> const& options)
  156. {
  157. return Blob::create(realm, blob_parts, options);
  158. }
  159. // https://w3c.github.io/FileAPI/#dfn-slice
  160. WebIDL::ExceptionOr<JS::NonnullGCPtr<Blob>> Blob::slice(Optional<i64> start, Optional<i64> end, Optional<String> const& content_type)
  161. {
  162. auto& vm = realm().vm();
  163. // 1. The optional start parameter is a value for the start point of a slice() call, and must be treated as a byte-order position, with the zeroth position representing the first byte.
  164. // User agents must process slice() with start normalized according to the following:
  165. i64 relative_start;
  166. if (!start.has_value()) {
  167. // a. If the optional start parameter is not used as a parameter when making this call, let relativeStart be 0.
  168. relative_start = 0;
  169. } else {
  170. auto start_value = start.value();
  171. // b. If start is negative, let relativeStart be max((size + start), 0).
  172. if (start_value < 0) {
  173. relative_start = max((size() + start_value), 0);
  174. }
  175. // c. Else, let relativeStart be min(start, size).
  176. else {
  177. relative_start = min(start_value, size());
  178. }
  179. }
  180. // 2. The optional end parameter is a value for the end point of a slice() call. User agents must process slice() with end normalized according to the following:
  181. i64 relative_end;
  182. if (!end.has_value()) {
  183. // a. If the optional end parameter is not used as a parameter when making this call, let relativeEnd be size.
  184. relative_end = size();
  185. } else {
  186. auto end_value = end.value();
  187. // b. If end is negative, let relativeEnd be max((size + end), 0).
  188. if (end_value < 0) {
  189. relative_end = max((size() + end_value), 0);
  190. }
  191. // c Else, let relativeEnd be min(end, size).
  192. else {
  193. relative_end = min(end_value, size());
  194. }
  195. }
  196. // 3. The optional contentType parameter is used to set the ASCII-encoded string in lower case representing the media type of the Blob.
  197. // User agents must process the slice() with contentType normalized according to the following:
  198. String relative_content_type;
  199. if (!content_type.has_value()) {
  200. // a. If the contentType parameter is not provided, let relativeContentType be set to the empty string.
  201. relative_content_type = String {};
  202. } else {
  203. // b. Else let relativeContentType be set to contentType and run the substeps below:
  204. // 1. If relativeContentType contains any characters outside the range of U+0020 to U+007E, then set relativeContentType to the empty string and return from these substeps.
  205. // NOTE: contentType is set to empty string at declaration.
  206. if (is_basic_latin(content_type.value())) {
  207. // 2. Convert every character in relativeContentType to ASCII lowercase.
  208. relative_content_type = TRY_OR_THROW_OOM(vm, Infra::to_ascii_lowercase(content_type.value()));
  209. }
  210. }
  211. // 4. Let span be max((relativeEnd - relativeStart), 0).
  212. auto span = max((relative_end - relative_start), 0);
  213. // 5. Return a new Blob object S with the following characteristics:
  214. // a. S refers to span consecutive bytes from this, beginning with the byte at byte-order position relativeStart.
  215. // b. S.size = span.
  216. // c. S.type = relativeContentType.
  217. auto byte_buffer = TRY_OR_THROW_OOM(vm, m_byte_buffer.slice(relative_start, span));
  218. return MUST_OR_THROW_OOM(heap().allocate<Blob>(realm(), realm(), move(byte_buffer), move(relative_content_type)));
  219. }
  220. // https://w3c.github.io/FileAPI/#dom-blob-stream
  221. WebIDL::ExceptionOr<JS::NonnullGCPtr<Streams::ReadableStream>> Blob::stream()
  222. {
  223. // The stream() method, when invoked, must return the result of calling get stream on this.
  224. return this->get_stream();
  225. }
  226. // https://w3c.github.io/FileAPI/#blob-get-stream
  227. WebIDL::ExceptionOr<JS::NonnullGCPtr<Streams::ReadableStream>> Blob::get_stream()
  228. {
  229. auto& realm = this->realm();
  230. // 1. Let stream be a new ReadableStream created in blob’s relevant Realm.
  231. auto stream = MUST_OR_THROW_OOM(realm.heap().allocate<Streams::ReadableStream>(realm, realm));
  232. // 2. Set up stream with byte reading support.
  233. TRY(set_up_readable_stream_controller_with_byte_reading_support(stream));
  234. // FIXME: 3. Run the following steps in parallel:
  235. {
  236. // 1. While not all bytes of blob have been read:
  237. // NOTE: for simplicity the chunk is the entire buffer for now.
  238. {
  239. // 1. Let bytes be the byte sequence that results from reading a chunk from blob, or failure if a chunk cannot be read.
  240. auto bytes = m_byte_buffer;
  241. // 2. Queue a global task on the file reading task source given blob’s relevant global object to perform the following steps:
  242. HTML::queue_global_task(HTML::Task::Source::FileReading, realm.global_object(), [stream, bytes = move(bytes)]() {
  243. HTML::TemporaryExecutionContext execution_context { Bindings::host_defined_environment_settings_object(stream->realm()) };
  244. // 1. If bytes is failure, then error stream with a failure reason and abort these steps.
  245. // 2. Let chunk be a new Uint8Array wrapping an ArrayBuffer containing bytes. If creating the ArrayBuffer throws an exception, then error stream with that exception and abort these steps.
  246. auto array_buffer = JS::ArrayBuffer::create(stream->realm(), bytes);
  247. auto chunk = JS::Uint8Array::create(stream->realm(), bytes.size(), *array_buffer);
  248. // 3. Enqueue chunk in stream.
  249. auto maybe_error = Bindings::throw_dom_exception_if_needed(stream->realm().vm(), [&]() {
  250. return readable_stream_enqueue(*stream->controller(), chunk);
  251. });
  252. if (maybe_error.is_error()) {
  253. readable_stream_error(*stream, maybe_error.release_error().value().value());
  254. return;
  255. }
  256. // FIXME: Close the stream now that we have finished enqueuing all chunks to the stream. Without this, ReadableStream.read will never resolve the second time around with 'done' set.
  257. // Nowhere in the spec seems to mention this - but testing against other implementations the stream does appear to be closed after reading all data (closed callback is fired).
  258. // Probably there is a better way of doing this.
  259. readable_stream_close(*stream);
  260. });
  261. }
  262. }
  263. // 4. Return stream.
  264. return stream;
  265. }
  266. // https://w3c.github.io/FileAPI/#dom-blob-text
  267. WebIDL::ExceptionOr<JS::NonnullGCPtr<JS::Promise>> Blob::text()
  268. {
  269. auto& realm = this->realm();
  270. auto& vm = realm.vm();
  271. // 1. Let stream be the result of calling get stream on this.
  272. auto stream = TRY(this->get_stream());
  273. // 2. Let reader be the result of getting a reader from stream. If that threw an exception, return a new promise rejected with that exception.
  274. auto reader_or_exception = acquire_readable_stream_default_reader(*stream);
  275. if (reader_or_exception.is_exception()) {
  276. auto throw_completion = Bindings::dom_exception_to_throw_completion(vm, reader_or_exception.exception());
  277. auto promise_capability = WebIDL::create_rejected_promise(realm, *throw_completion.value());
  278. return JS::NonnullGCPtr { verify_cast<JS::Promise>(*promise_capability->promise().ptr()) };
  279. }
  280. auto reader = reader_or_exception.release_value();
  281. // 3. Let promise be the result of reading all bytes from stream with reader
  282. auto promise = TRY(reader->read_all_bytes_deprecated());
  283. // 4. Return the result of transforming promise by a fulfillment handler that returns the result of running UTF-8 decode on its first argument.
  284. return WebIDL::upon_fulfillment(*promise, [&](auto const& first_argument) -> WebIDL::ExceptionOr<JS::Value> {
  285. auto const& object = first_argument.as_object();
  286. VERIFY(is<JS::ArrayBuffer>(object));
  287. auto const& buffer = static_cast<const JS::ArrayBuffer&>(object).buffer();
  288. auto decoder = TextCodec::decoder_for("UTF-8"sv);
  289. auto utf8_text = TRY_OR_THROW_OOM(vm, TextCodec::convert_input_to_utf8_using_given_decoder_unless_there_is_a_byte_order_mark(*decoder, buffer));
  290. return JS::PrimitiveString::create(vm, move(utf8_text));
  291. });
  292. }
  293. // https://w3c.github.io/FileAPI/#dom-blob-arraybuffer
  294. WebIDL::ExceptionOr<JS::NonnullGCPtr<JS::Promise>> Blob::array_buffer()
  295. {
  296. auto& realm = this->realm();
  297. auto& vm = realm.vm();
  298. // 1. Let stream be the result of calling get stream on this.
  299. auto stream = TRY(this->get_stream());
  300. // 2. Let reader be the result of getting a reader from stream. If that threw an exception, return a new promise rejected with that exception.
  301. auto reader_or_exception = acquire_readable_stream_default_reader(*stream);
  302. if (reader_or_exception.is_exception()) {
  303. auto throw_completion = Bindings::dom_exception_to_throw_completion(vm, reader_or_exception.exception());
  304. auto promise_capability = WebIDL::create_rejected_promise(realm, *throw_completion.value());
  305. return JS::NonnullGCPtr { verify_cast<JS::Promise>(*promise_capability->promise().ptr()) };
  306. }
  307. auto reader = reader_or_exception.release_value();
  308. // 3. Let promise be the result of reading all bytes from stream with reader.
  309. auto promise = TRY(reader->read_all_bytes_deprecated());
  310. // 4. Return the result of transforming promise by a fulfillment handler that returns a new ArrayBuffer whose contents are its first argument.
  311. return WebIDL::upon_fulfillment(*promise, [&](auto const& first_argument) -> WebIDL::ExceptionOr<JS::Value> {
  312. auto const& object = first_argument.as_object();
  313. VERIFY(is<JS::ArrayBuffer>(object));
  314. auto const& buffer = static_cast<const JS::ArrayBuffer&>(object).buffer();
  315. return JS::ArrayBuffer::create(realm, buffer);
  316. });
  317. }
  318. }