ruma_html/html/
matrix.rs

1//! Types to work with HTML elements and attributes [suggested by the Matrix Specification][spec].
2//!
3//! [spec]: https://spec.matrix.org/latest/client-server-api/#mroommessage-msgtypes
4
5use std::collections::BTreeSet;
6
7use html5ever::{namespace_url, ns, tendril::StrTendril, Attribute, QualName};
8use ruma_common::{
9    IdParseError, MatrixToError, MatrixToUri, MatrixUri, MatrixUriError, MxcUri, OwnedMxcUri,
10};
11
12use crate::sanitizer_config::clean::{
13    ALLOWED_SCHEMES_A_HREF_COMPAT, ALLOWED_SCHEMES_A_HREF_STRICT,
14};
15
16const CLASS_LANGUAGE_PREFIX: &str = "language-";
17
18/// The data of a Matrix HTML element.
19///
20/// This is a helper type to work with elements [suggested by the Matrix Specification][spec].
21///
22/// This performs a lossless conversion from [`ElementData`]. Unsupported elements are represented
23/// by [`MatrixElement::Other`] and unsupported attributes are listed in the `attrs` field.
24///
25/// [`ElementData`]: crate::ElementData
26/// [spec]: https://spec.matrix.org/latest/client-server-api/#mroommessage-msgtypes
27#[derive(Debug, Clone)]
28#[allow(clippy::exhaustive_structs)]
29pub struct MatrixElementData {
30    /// The HTML element and its supported data.
31    pub element: MatrixElement,
32
33    /// The unsupported attributes found on the element.
34    pub attrs: BTreeSet<Attribute>,
35}
36
37impl MatrixElementData {
38    /// Parse a `MatrixElementData` from the given qualified name and attributes.
39    #[allow(clippy::mutable_key_type)]
40    pub(super) fn parse(name: &QualName, attrs: &BTreeSet<Attribute>) -> Self {
41        let (element, attrs) = MatrixElement::parse(name, attrs);
42        Self { element, attrs }
43    }
44}
45
46/// A Matrix HTML element.
47///
48/// All the elements [suggested by the Matrix Specification][spec] have a variant. The others are
49/// handled by the fallback `Other` variant.
50///
51/// Suggested attributes are represented as optional fields on the variants structs.
52///
53/// [spec]: https://spec.matrix.org/latest/client-server-api/#mroommessage-msgtypes
54#[derive(Debug, Clone)]
55#[non_exhaustive]
56pub enum MatrixElement {
57    /// [`<del>`], a deleted text element.
58    ///
59    /// [`<del>`]: https://developer.mozilla.org/en-US/docs/Web/HTML/Element/del
60    Del,
61
62    /// [`<h1>-<h6>`], a section heading element.
63    ///
64    /// [`<h1>-<h6>`]: https://developer.mozilla.org/en-US/docs/Web/HTML/Element/Heading_Elements
65    H(HeadingData),
66
67    /// [`<blockquote>`], a block quotation element.
68    ///
69    /// [`<blockquote>`]: https://developer.mozilla.org/en-US/docs/Web/HTML/Element/blockquote
70    Blockquote,
71
72    /// [`<p>`], a paragraph element.
73    ///
74    /// [`<p>`]: https://developer.mozilla.org/en-US/docs/Web/HTML/Element/p
75    P,
76
77    /// [`<a>`], an anchor element.
78    ///
79    /// [`<a>`]: https://developer.mozilla.org/en-US/docs/Web/HTML/Element/a
80    A(AnchorData),
81
82    /// [`<ul>`], an unordered list element.
83    ///
84    /// [`<ul>`]: https://developer.mozilla.org/en-US/docs/Web/HTML/Element/ul
85    Ul,
86
87    /// [`<ol>`], an ordered list element.
88    ///
89    /// [`<ol>`]: https://developer.mozilla.org/en-US/docs/Web/HTML/Element/ol
90    Ol(OrderedListData),
91
92    /// [`<sup>`], a superscript element.
93    ///
94    /// [`<sup>`]: https://developer.mozilla.org/en-US/docs/Web/HTML/Element/sup
95    Sup,
96
97    /// [`<sub>`], a subscript element.
98    ///
99    /// [`<sub>`]: https://developer.mozilla.org/en-US/docs/Web/HTML/Element/sub
100    Sub,
101
102    /// [`<li>`], a list item element.
103    ///
104    /// [`<li>`]: https://developer.mozilla.org/en-US/docs/Web/HTML/Element/li
105    Li,
106
107    /// [`<b>`], a bring attention to element.
108    ///
109    /// [`<b>`]: https://developer.mozilla.org/en-US/docs/Web/HTML/Element/b
110    B,
111
112    /// [`<i>`], an idiomatic text element.
113    ///
114    /// [`<i>`]: https://developer.mozilla.org/en-US/docs/Web/HTML/Element/i
115    I,
116
117    /// [`<u>`], an unarticulated annotation element.
118    ///
119    /// [`<u>`]: https://developer.mozilla.org/en-US/docs/Web/HTML/Element/u
120    U,
121
122    /// [`<strong>`], a strong importance element.
123    ///
124    /// [`<strong>`]: https://developer.mozilla.org/en-US/docs/Web/HTML/Element/strong
125    Strong,
126
127    /// [`<em>`], an emphasis element.
128    ///
129    /// [`<em>`]: https://developer.mozilla.org/en-US/docs/Web/HTML/Element/em
130    Em,
131
132    /// [`<s>`], a strikethrough element.
133    ///
134    /// [`<s>`]: https://developer.mozilla.org/en-US/docs/Web/HTML/Element/s
135    S,
136
137    /// [`<code>`], an inline code element.
138    ///
139    /// [`<code>`]: https://developer.mozilla.org/en-US/docs/Web/HTML/Element/code
140    Code(CodeData),
141
142    /// [`<hr>`], a thematic break element.
143    ///
144    /// [`<hr>`]: https://developer.mozilla.org/en-US/docs/Web/HTML/Element/hr
145    Hr,
146
147    /// [`<br>`], a line break element.
148    ///
149    /// [`<br>`]: https://developer.mozilla.org/en-US/docs/Web/HTML/Element/br
150    Br,
151
152    /// [`<div>`], a content division element.
153    ///
154    /// [`<div>`]: https://developer.mozilla.org/en-US/docs/Web/HTML/Element/div
155    Div(DivData),
156
157    /// [`<table>`], a table element.
158    ///
159    /// [`<table>`]: https://developer.mozilla.org/en-US/docs/Web/HTML/Element/table
160    Table,
161
162    /// [`<thead>`], a table head element.
163    ///
164    /// [`<thead>`]: https://developer.mozilla.org/en-US/docs/Web/HTML/Element/thead
165    Thead,
166
167    /// [`<tbody>`], a table body element.
168    ///
169    /// [`<tbody>`]: https://developer.mozilla.org/en-US/docs/Web/HTML/Element/tbody
170    Tbody,
171
172    /// [`<tr>`], a table row element.
173    ///
174    /// [`<tr>`]: https://developer.mozilla.org/en-US/docs/Web/HTML/Element/tr
175    Tr,
176
177    /// [`<th>`], a table header element.
178    ///
179    /// [`<th>`]: https://developer.mozilla.org/en-US/docs/Web/HTML/Element/th
180    Th,
181
182    /// [`<td>`], a table data cell element.
183    ///
184    /// [`<td>`]: https://developer.mozilla.org/en-US/docs/Web/HTML/Element/td
185    Td,
186
187    /// [`<caption>`], a table caption element.
188    ///
189    /// [`<caption>`]: https://developer.mozilla.org/en-US/docs/Web/HTML/Element/caption
190    Caption,
191
192    /// [`<pre>`], a preformatted text element.
193    ///
194    /// [`<pre>`]: https://developer.mozilla.org/en-US/docs/Web/HTML/Element/pre
195    Pre,
196
197    /// [`<span>`], a content span element.
198    ///
199    /// [`<span>`]: https://developer.mozilla.org/en-US/docs/Web/HTML/Element/span
200    Span(SpanData),
201
202    /// [`<img>`], an image embed element.
203    ///
204    /// [`<img>`]: https://developer.mozilla.org/en-US/docs/Web/HTML/Element/img
205    Img(ImageData),
206
207    /// [`<details>`], a details disclosure element.
208    ///
209    /// [`<details>`]: https://developer.mozilla.org/en-US/docs/Web/HTML/Element/details
210    Details,
211
212    /// [`<summary>`], a disclosure summary element.
213    ///
214    /// [`<summary>`]: https://developer.mozilla.org/en-US/docs/Web/HTML/Element/summary
215    Summary,
216
217    /// [`mx-reply`], a Matrix rich reply fallback element.
218    ///
219    /// [`mx-reply`]: https://spec.matrix.org/latest/client-server-api/#rich-replies
220    MatrixReply,
221
222    /// An HTML element that is not in the suggested list.
223    Other(QualName),
224}
225
226impl MatrixElement {
227    /// Parse a `MatrixElement` from the given qualified name and attributes.
228    ///
229    /// Returns a tuple containing the constructed `Element` and the list of remaining unsupported
230    /// attributes.
231    #[allow(clippy::mutable_key_type)]
232    fn parse(name: &QualName, attrs: &BTreeSet<Attribute>) -> (Self, BTreeSet<Attribute>) {
233        if name.ns != ns!(html) {
234            return (Self::Other(name.clone()), attrs.clone());
235        }
236
237        match name.local.as_bytes() {
238            b"del" => (Self::Del, attrs.clone()),
239            b"h1" => (Self::H(HeadingData::new(1)), attrs.clone()),
240            b"h2" => (Self::H(HeadingData::new(2)), attrs.clone()),
241            b"h3" => (Self::H(HeadingData::new(3)), attrs.clone()),
242            b"h4" => (Self::H(HeadingData::new(4)), attrs.clone()),
243            b"h5" => (Self::H(HeadingData::new(5)), attrs.clone()),
244            b"h6" => (Self::H(HeadingData::new(6)), attrs.clone()),
245            b"blockquote" => (Self::Blockquote, attrs.clone()),
246            b"p" => (Self::P, attrs.clone()),
247            b"a" => {
248                let (data, attrs) = AnchorData::parse(attrs);
249                (Self::A(data), attrs)
250            }
251            b"ul" => (Self::Ul, attrs.clone()),
252            b"ol" => {
253                let (data, attrs) = OrderedListData::parse(attrs);
254                (Self::Ol(data), attrs)
255            }
256            b"sup" => (Self::Sup, attrs.clone()),
257            b"sub" => (Self::Sub, attrs.clone()),
258            b"li" => (Self::Li, attrs.clone()),
259            b"b" => (Self::B, attrs.clone()),
260            b"i" => (Self::I, attrs.clone()),
261            b"u" => (Self::U, attrs.clone()),
262            b"strong" => (Self::Strong, attrs.clone()),
263            b"em" => (Self::Em, attrs.clone()),
264            b"s" => (Self::S, attrs.clone()),
265            b"code" => {
266                let (data, attrs) = CodeData::parse(attrs);
267                (Self::Code(data), attrs)
268            }
269            b"hr" => (Self::Hr, attrs.clone()),
270            b"br" => (Self::Br, attrs.clone()),
271            b"div" => {
272                let (data, attrs) = DivData::parse(attrs);
273                (Self::Div(data), attrs)
274            }
275            b"table" => (Self::Table, attrs.clone()),
276            b"thead" => (Self::Thead, attrs.clone()),
277            b"tbody" => (Self::Tbody, attrs.clone()),
278            b"tr" => (Self::Tr, attrs.clone()),
279            b"th" => (Self::Th, attrs.clone()),
280            b"td" => (Self::Td, attrs.clone()),
281            b"caption" => (Self::Caption, attrs.clone()),
282            b"pre" => (Self::Pre, attrs.clone()),
283            b"span" => {
284                let (data, attrs) = SpanData::parse(attrs);
285                (Self::Span(data), attrs)
286            }
287            b"img" => {
288                let (data, attrs) = ImageData::parse(attrs);
289                (Self::Img(data), attrs)
290            }
291            b"details" => (Self::Details, attrs.clone()),
292            b"summary" => (Self::Summary, attrs.clone()),
293            b"mx-reply" => (Self::MatrixReply, attrs.clone()),
294            _ => (Self::Other(name.clone()), attrs.clone()),
295        }
296    }
297}
298
299/// The supported data of a `<h1>-<h6>` HTML element.
300#[derive(Debug, Clone)]
301#[non_exhaustive]
302pub struct HeadingData {
303    /// The level of the heading.
304    pub level: HeadingLevel,
305}
306
307impl HeadingData {
308    /// Constructs a new `HeadingData` with the given heading level.
309    fn new(level: u8) -> Self {
310        Self { level: HeadingLevel(level) }
311    }
312}
313
314/// The level of a heading element.
315///
316/// The supported levels range from 1 (highest) to 6 (lowest). Other levels cannot construct this
317/// and do not use the [`MatrixElement::H`] variant.
318#[derive(Debug, Clone, Copy, PartialEq, Eq)]
319pub struct HeadingLevel(u8);
320
321impl HeadingLevel {
322    /// The value of the level.
323    ///
324    /// Can only be a value between 1 and 6 included.
325    pub fn value(&self) -> u8 {
326        self.0
327    }
328}
329
330impl PartialEq<u8> for HeadingLevel {
331    fn eq(&self, other: &u8) -> bool {
332        self.0.eq(other)
333    }
334}
335
336/// The supported data of a `<a>` HTML element.
337#[derive(Debug, Clone)]
338#[non_exhaustive]
339pub struct AnchorData {
340    /// Where to display the linked URL.
341    pub target: Option<StrTendril>,
342
343    /// The URL that the hyperlink points to.
344    pub href: Option<AnchorUri>,
345}
346
347impl AnchorData {
348    /// Construct an empty `AnchorData`.
349    fn new() -> Self {
350        Self { target: None, href: None }
351    }
352
353    /// Parse the given attributes to construct a new `AnchorData`.
354    ///
355    /// Returns a tuple containing the constructed data and the remaining unsupported attributes.
356    #[allow(clippy::mutable_key_type)]
357    fn parse(attrs: &BTreeSet<Attribute>) -> (Self, BTreeSet<Attribute>) {
358        let mut data = Self::new();
359        let mut remaining_attrs = BTreeSet::new();
360
361        for attr in attrs {
362            if attr.name.ns != ns!() {
363                remaining_attrs.insert(attr.clone());
364                continue;
365            }
366
367            match attr.name.local.as_bytes() {
368                b"target" => {
369                    data.target = Some(attr.value.clone());
370                }
371                b"href" => {
372                    if let Some(uri) = AnchorUri::parse(&attr.value) {
373                        data.href = Some(uri);
374                    } else {
375                        remaining_attrs.insert(attr.clone());
376                    }
377                }
378                _ => {
379                    remaining_attrs.insert(attr.clone());
380                }
381            }
382        }
383
384        (data, remaining_attrs)
385    }
386}
387
388/// A URI as a value for the `href` attribute of a `<a>` HTML element.
389///
390/// This is a helper type that recognizes `matrix:` and `https://matrix.to` URIs to detect mentions.
391///
392/// If the URI is an invalid Matrix URI or does not use one of the suggested schemes, the `href`
393/// attribute will be in the `attrs` list of [`MatrixElementData`].
394#[derive(Debug, Clone)]
395#[non_exhaustive]
396pub enum AnchorUri {
397    /// A `matrix:` URI.
398    Matrix(MatrixUri),
399    /// A `https://matrix.to` URI.
400    MatrixTo(MatrixToUri),
401    /// An other URL using one of the suggested schemes.
402    ///
403    /// Those schemes are:
404    ///
405    /// * `https`
406    /// * `http`
407    /// * `ftp`
408    /// * `mailto`
409    /// * `magnet`
410    Other(StrTendril),
411}
412
413impl AnchorUri {
414    /// Parse the given string to construct a new `AnchorUri`.
415    fn parse(value: &StrTendril) -> Option<Self> {
416        let s = value.as_ref();
417
418        // Check if it starts with a supported scheme.
419        let mut allowed_schemes =
420            ALLOWED_SCHEMES_A_HREF_STRICT.iter().chain(ALLOWED_SCHEMES_A_HREF_COMPAT.iter());
421        if !allowed_schemes.any(|scheme| s.starts_with(&format!("{scheme}:"))) {
422            return None;
423        }
424
425        match MatrixUri::parse(s) {
426            Ok(uri) => return Some(Self::Matrix(uri)),
427            // It's not a `matrix:` URI, continue.
428            Err(IdParseError::InvalidMatrixUri(MatrixUriError::WrongScheme)) => {}
429            // The URI is invalid.
430            _ => return None,
431        }
432
433        match MatrixToUri::parse(s) {
434            Ok(uri) => return Some(Self::MatrixTo(uri)),
435            // It's not a `https://matrix.to` URI, continue.
436            Err(IdParseError::InvalidMatrixToUri(MatrixToError::WrongBaseUrl)) => {}
437            // The URI is invalid.
438            _ => return None,
439        }
440
441        Some(Self::Other(value.clone()))
442    }
443}
444
445/// The supported data of a `<ol>` HTML element.
446#[derive(Debug, Clone)]
447#[non_exhaustive]
448pub struct OrderedListData {
449    /// An integer to start counting from for the list items.
450    ///
451    /// If parsing the integer from a string fails, the attribute will be in the `attrs` list of
452    /// [`MatrixElementData`].
453    pub start: Option<i64>,
454}
455
456impl OrderedListData {
457    /// Construct an empty `OrderedListData`.
458    fn new() -> Self {
459        Self { start: None }
460    }
461
462    /// Parse the given attributes to construct a new `OrderedListData`.
463    ///
464    /// Returns a tuple containing the constructed data and the remaining unsupported attributes.
465    #[allow(clippy::mutable_key_type)]
466    fn parse(attrs: &BTreeSet<Attribute>) -> (Self, BTreeSet<Attribute>) {
467        let mut data = Self::new();
468        let mut remaining_attrs = BTreeSet::new();
469
470        for attr in attrs {
471            if attr.name.ns != ns!() {
472                remaining_attrs.insert(attr.clone());
473                continue;
474            }
475
476            match attr.name.local.as_bytes() {
477                b"start" => {
478                    if let Ok(start) = attr.value.parse() {
479                        data.start = Some(start);
480                    } else {
481                        remaining_attrs.insert(attr.clone());
482                    }
483                }
484                _ => {
485                    remaining_attrs.insert(attr.clone());
486                }
487            }
488        }
489
490        (data, remaining_attrs)
491    }
492}
493
494/// The supported data of a `<code>` HTML element.
495#[derive(Debug, Clone)]
496#[non_exhaustive]
497pub struct CodeData {
498    /// The language of the code, for syntax highlighting.
499    ///
500    /// This corresponds to the `class` attribute with a value that starts with the
501    /// `language-` prefix. The prefix is stripped from the value.
502    ///
503    /// If there are other classes in the `class` attribute, the whole attribute will be in the
504    /// `attrs` list of [`MatrixElementData`].
505    pub language: Option<StrTendril>,
506}
507
508impl CodeData {
509    /// Construct an empty `CodeData`.
510    fn new() -> Self {
511        Self { language: None }
512    }
513
514    /// Parse the given attributes to construct a new `CodeData`.
515    ///
516    /// Returns a tuple containing the constructed data and the remaining unsupported attributes.
517    #[allow(clippy::mutable_key_type)]
518    fn parse(attrs: &BTreeSet<Attribute>) -> (Self, BTreeSet<Attribute>) {
519        let mut data = Self::new();
520        let mut remaining_attrs = BTreeSet::new();
521
522        for attr in attrs {
523            if attr.name.ns != ns!() {
524                remaining_attrs.insert(attr.clone());
525                continue;
526            }
527
528            match attr.name.local.as_bytes() {
529                b"class" => {
530                    let value_str = attr.value.as_ref();
531
532                    // The attribute could contain several classes separated by spaces, so let's
533                    // find the first class starting with `language-`.
534                    for (match_start, _) in value_str.match_indices(CLASS_LANGUAGE_PREFIX) {
535                        // The class name must either be at the start of the string or preceded by a
536                        // space.
537                        if match_start != 0
538                            && !value_str.as_bytes()[match_start - 1].is_ascii_whitespace()
539                        {
540                            continue;
541                        }
542
543                        let language_start = match_start + CLASS_LANGUAGE_PREFIX.len();
544
545                        let str_end = &value_str[language_start..];
546                        let language_end = str_end
547                            .find(|c: char| c.is_ascii_whitespace())
548                            .map(|pos| language_start + pos)
549                            .unwrap_or(value_str.len());
550
551                        if language_end == language_start {
552                            continue;
553                        }
554
555                        let sub_len = (language_end - language_start) as u32;
556                        data.language = Some(attr.value.subtendril(language_start as u32, sub_len));
557
558                        if match_start != 0 || language_end != value_str.len() {
559                            // There are other classes, keep the whole attribute for the conversion
560                            // to be lossless.
561                            remaining_attrs.insert(attr.clone());
562                        }
563
564                        break;
565                    }
566
567                    if data.language.is_none() {
568                        // We didn't find the class we want, keep the whole attribute.
569                        remaining_attrs.insert(attr.clone());
570                    }
571                }
572                _ => {
573                    remaining_attrs.insert(attr.clone());
574                }
575            }
576        }
577
578        (data, remaining_attrs)
579    }
580}
581
582/// The supported data of a `<span>` HTML element.
583#[derive(Debug, Clone)]
584#[non_exhaustive]
585pub struct SpanData {
586    /// `data-mx-bg-color`, the background color of the text.
587    pub bg_color: Option<StrTendril>,
588
589    /// `data-mx-color`, the foreground color of the text.
590    pub color: Option<StrTendril>,
591
592    /// `data-mx-spoiler`, a Matrix [spoiler message].
593    ///
594    /// The value is the reason of the spoiler. If the string is empty, this is a spoiler
595    /// without a reason.
596    ///
597    /// [spoiler message]: https://spec.matrix.org/latest/client-server-api/#spoiler-messages
598    pub spoiler: Option<StrTendril>,
599
600    /// `data-mx-maths`, an inline Matrix [mathematical message].
601    ///
602    /// The value is the mathematical notation in [LaTeX] format.
603    ///
604    /// If this attribute is present, the content of the span is the fallback representation of the
605    /// mathematical notation.
606    ///
607    /// [mathematical message]: https://spec.matrix.org/latest/client-server-api/#mathematical-messages
608    /// [LaTeX]: https://www.latex-project.org/
609    pub maths: Option<StrTendril>,
610}
611
612impl SpanData {
613    /// Construct an empty `SpanData`.
614    fn new() -> Self {
615        Self { bg_color: None, color: None, spoiler: None, maths: None }
616    }
617
618    /// Parse the given attributes to construct a new `SpanData`.
619    ///
620    /// Returns a tuple containing the constructed data and the remaining unsupported attributes.
621    #[allow(clippy::mutable_key_type)]
622    fn parse(attrs: &BTreeSet<Attribute>) -> (Self, BTreeSet<Attribute>) {
623        let mut data = Self::new();
624        let mut remaining_attrs = BTreeSet::new();
625
626        for attr in attrs {
627            if attr.name.ns != ns!() {
628                remaining_attrs.insert(attr.clone());
629                continue;
630            }
631
632            match attr.name.local.as_bytes() {
633                b"data-mx-bg-color" => {
634                    data.bg_color = Some(attr.value.clone());
635                }
636                b"data-mx-color" => data.color = Some(attr.value.clone()),
637                b"data-mx-spoiler" => {
638                    data.spoiler = Some(attr.value.clone());
639                }
640                b"data-mx-maths" => {
641                    data.maths = Some(attr.value.clone());
642                }
643                _ => {
644                    remaining_attrs.insert(attr.clone());
645                }
646            }
647        }
648
649        (data, remaining_attrs)
650    }
651}
652
653/// The supported data of a `<img>` HTML element.
654#[derive(Debug, Clone)]
655#[non_exhaustive]
656pub struct ImageData {
657    /// The intrinsic width of the image, in pixels.
658    ///
659    /// If parsing the integer from a string fails, the attribute will be in the `attrs` list of
660    /// `MatrixElementData`.
661    pub width: Option<i64>,
662
663    /// The intrinsic height of the image, in pixels.
664    ///
665    /// If parsing the integer from a string fails, the attribute will be in the `attrs` list of
666    /// [`MatrixElementData`].
667    pub height: Option<i64>,
668
669    /// Text that can replace the image.
670    pub alt: Option<StrTendril>,
671
672    ///  Text representing advisory information about the image.
673    pub title: Option<StrTendril>,
674
675    /// The image URL.
676    ///
677    /// It this is not a valid `mxc:` URI, the attribute will be in the `attrs` list of
678    /// [`MatrixElementData`].
679    pub src: Option<OwnedMxcUri>,
680}
681
682impl ImageData {
683    /// Construct an empty `ImageData`.
684    fn new() -> Self {
685        Self { width: None, height: None, alt: None, title: None, src: None }
686    }
687
688    /// Parse the given attributes to construct a new `ImageData`.
689    ///
690    /// Returns a tuple containing the constructed data and the remaining unsupported attributes.
691    #[allow(clippy::mutable_key_type)]
692    fn parse(attrs: &BTreeSet<Attribute>) -> (Self, BTreeSet<Attribute>) {
693        let mut data = Self::new();
694        let mut remaining_attrs = BTreeSet::new();
695
696        for attr in attrs {
697            if attr.name.ns != ns!() {
698                remaining_attrs.insert(attr.clone());
699                continue;
700            }
701
702            match attr.name.local.as_bytes() {
703                b"width" => {
704                    if let Ok(width) = attr.value.parse() {
705                        data.width = Some(width);
706                    } else {
707                        remaining_attrs.insert(attr.clone());
708                    }
709                }
710                b"height" => {
711                    if let Ok(height) = attr.value.parse() {
712                        data.height = Some(height);
713                    } else {
714                        remaining_attrs.insert(attr.clone());
715                    }
716                }
717                b"alt" => data.alt = Some(attr.value.clone()),
718                b"title" => data.title = Some(attr.value.clone()),
719                b"src" => {
720                    let uri = <&MxcUri>::from(attr.value.as_ref());
721                    if uri.validate().is_ok() {
722                        data.src = Some(uri.to_owned());
723                    } else {
724                        remaining_attrs.insert(attr.clone());
725                    }
726                }
727                _ => {
728                    remaining_attrs.insert(attr.clone());
729                }
730            }
731        }
732
733        (data, remaining_attrs)
734    }
735}
736
737/// The supported data of a `<div>` HTML element.
738#[derive(Debug, Clone)]
739#[non_exhaustive]
740pub struct DivData {
741    /// `data-mx-maths`, a Matrix [mathematical message] block.
742    ///
743    /// The value is the mathematical notation in [LaTeX] format.
744    ///
745    /// If this attribute is present, the content of the div is the fallback representation of the
746    /// mathematical notation.
747    ///
748    /// [mathematical message]: https://spec.matrix.org/latest/client-server-api/#mathematical-messages
749    /// [LaTeX]: https://www.latex-project.org/
750    pub maths: Option<StrTendril>,
751}
752
753impl DivData {
754    /// Construct an empty `DivData`.
755    fn new() -> Self {
756        Self { maths: None }
757    }
758
759    /// Parse the given attributes to construct a new `SpanData`.
760    ///
761    /// Returns a tuple containing the constructed data and the remaining unsupported attributes.
762    #[allow(clippy::mutable_key_type)]
763    fn parse(attrs: &BTreeSet<Attribute>) -> (Self, BTreeSet<Attribute>) {
764        let mut data = Self::new();
765        let mut remaining_attrs = BTreeSet::new();
766
767        for attr in attrs {
768            if attr.name.ns != ns!() {
769                remaining_attrs.insert(attr.clone());
770                continue;
771            }
772
773            match attr.name.local.as_bytes() {
774                b"data-mx-maths" => {
775                    data.maths = Some(attr.value.clone());
776                }
777                _ => {
778                    remaining_attrs.insert(attr.clone());
779                }
780            }
781        }
782
783        (data, remaining_attrs)
784    }
785}