HTMLToken.h 3.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104
  1. /*
  2. * Copyright (c) 2020, Andreas Kling <kling@serenityos.org>
  3. * All rights reserved.
  4. *
  5. * Redistribution and use in source and binary forms, with or without
  6. * modification, are permitted provided that the following conditions are met:
  7. *
  8. * 1. Redistributions of source code must retain the above copyright notice, this
  9. * list of conditions and the following disclaimer.
  10. *
  11. * 2. Redistributions in binary form must reproduce the above copyright notice,
  12. * this list of conditions and the following disclaimer in the documentation
  13. * and/or other materials provided with the distribution.
  14. *
  15. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
  16. * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  17. * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
  18. * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
  19. * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  20. * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
  21. * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
  22. * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
  23. * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
  24. * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  25. */
  26. #pragma once
  27. #include <AK/String.h>
  28. #include <AK/StringBuilder.h>
  29. #include <AK/Types.h>
  30. #include <AK/Vector.h>
  31. namespace Web {
  32. class HTMLToken {
  33. friend class HTMLDocumentParser;
  34. friend class HTMLTokenizer;
  35. public:
  36. enum class Type {
  37. DOCTYPE,
  38. StartTag,
  39. EndTag,
  40. Comment,
  41. Character,
  42. EndOfFile,
  43. };
  44. bool is_doctype() const { return m_type == Type::DOCTYPE; }
  45. bool is_start_tag() const { return m_type == Type::StartTag; }
  46. bool is_end_tag() const { return m_type == Type::EndTag; }
  47. bool is_comment() const { return m_type == Type::Comment; }
  48. bool is_character() const { return m_type == Type::Character; }
  49. bool is_end_of_file() const { return m_type == Type::EndOfFile; }
  50. String tag_name() const
  51. {
  52. ASSERT(is_start_tag() || is_end_tag());
  53. return m_tag.tag_name.to_string();
  54. }
  55. bool is_self_closing() const
  56. {
  57. ASSERT(is_start_tag() || is_end_tag());
  58. return m_tag.self_closing;
  59. }
  60. Type type() const { return m_type; }
  61. String to_string() const;
  62. private:
  63. struct AttributeBuilder {
  64. StringBuilder name_builder;
  65. StringBuilder value_builder;
  66. };
  67. Type m_type;
  68. // Type::DOCTYPE
  69. struct {
  70. StringBuilder name;
  71. StringBuilder public_identifier;
  72. StringBuilder system_identifier;
  73. bool force_quirks { false };
  74. } m_doctype;
  75. // Type::StartTag
  76. // Type::EndTag
  77. struct {
  78. StringBuilder tag_name;
  79. bool self_closing { false };
  80. Vector<AttributeBuilder> attributes;
  81. } m_tag;
  82. // Type::Comment
  83. // Type::Character
  84. struct {
  85. StringBuilder data;
  86. } m_comment_or_character;
  87. };
  88. }