Module: SafeImage::SvgMetadata
- Defined in:
- lib/safe_image/svg_metadata.rb
Constant Summary collapse
- MAX_SVG_BYTES =
1 * 1024 * 1024
- MAX_SVG_DEPTH =
64- MAX_SVG_ELEMENTS =
10_000- MAX_SVG_ATTRIBUTES =
50_000- MAX_SVG_DIMENSION =
100_000- MAX_SVG_PIXELS =
100_000_000- LENGTH_PATTERN =
/\A\s*([+]?(?:\d+(?:\.\d+)?|\.\d+))(?:px)?\s*\z/i.freeze
- VIEWBOX_SPLIT =
/[\s,]+/.freeze
Class Method Summary collapse
- .dimensions(path, max_pixels: nil, max_bytes: MAX_SVG_BYTES) ⇒ Object
-
.parse(path, max_bytes: MAX_SVG_BYTES) ⇒ Object
Builds the full REXML tree.
- .parse_length(value) ⇒ Object
- .parse_view_box(value) ⇒ Object
- .probe(path, max_pixels: nil, max_bytes: MAX_SVG_BYTES) ⇒ Object
- .read_svg(path, max_bytes: MAX_SVG_BYTES) ⇒ Object
- .reject_unsafe_xml!(xml) ⇒ Object
- .safe_svg_path(path) ⇒ Object
-
.scan_svg!(xml) ⇒ Object
Streams the document with a pull parser, enforcing the structural caps as events arrive, so a hostile “millions of tiny elements” document is rejected at the cap without ever retaining the multi-million-object DOM that a parse-then-validate approach would build first.
- .validate_dimensions!(width, height, max_pixels: nil) ⇒ Object
Class Method Details
.dimensions(path, max_pixels: nil, max_bytes: MAX_SVG_BYTES) ⇒ Object
34 35 36 37 38 39 40 41 42 43 44 45 46 47 |
# File 'lib/safe_image/svg_metadata.rb', line 34 def dimensions(path, max_pixels: nil, max_bytes: MAX_SVG_BYTES) xml = read_svg(path, max_bytes: max_bytes) _name, attributes = scan_svg!(xml) width = parse_length(attributes["width"]) height = parse_length(attributes["height"]) unless width && height view_box = parse_view_box(attributes["viewBox"]) width ||= view_box&.fetch(2) height ||= view_box&.fetch(3) end validate_dimensions!(width, height, max_pixels: max_pixels) end |
.parse(path, max_bytes: MAX_SVG_BYTES) ⇒ Object
Builds the full REXML tree. Used only by the SVG sanitizer, which needs to walk and rewrite the document; metadata reads go through the DOM-free streaming path above. The streaming validation runs first so a document that breaches the structural caps is rejected before the tree is built.
53 54 55 56 57 58 59 60 61 62 |
# File 'lib/safe_image/svg_metadata.rb', line 53 def parse(path, max_bytes: MAX_SVG_BYTES) xml = read_svg(path, max_bytes: max_bytes) scan_svg!(xml) doc = REXML::Document.new(xml) raise InvalidImageError, "SVG root required" unless doc.root&.name == "svg" doc rescue REXML::ParseException => e raise InvalidImageError, "invalid SVG: #{e.}" end |
.parse_length(value) ⇒ Object
86 87 88 89 90 91 92 93 94 95 96 97 |
# File 'lib/safe_image/svg_metadata.rb', line 86 def parse_length(value) value = value.to_s match = LENGTH_PATTERN.match(value) return nil unless match number = Float(match[1]) return nil unless number.finite? && number.positive? number rescue ArgumentError nil end |
.parse_view_box(value) ⇒ Object
99 100 101 102 103 104 105 106 107 108 109 |
# File 'lib/safe_image/svg_metadata.rb', line 99 def parse_view_box(value) parts = value.to_s.strip.split(VIEWBOX_SPLIT) return nil unless parts.length == 4 numbers = parts.map { |part| Float(part) } return nil unless numbers.all?(&:finite?) && numbers[2].positive? && numbers[3].positive? numbers rescue ArgumentError nil end |
.probe(path, max_pixels: nil, max_bytes: MAX_SVG_BYTES) ⇒ Object
21 22 23 24 25 26 27 28 29 30 31 32 |
# File 'lib/safe_image/svg_metadata.rb', line 21 def probe(path, max_pixels: nil, max_bytes: MAX_SVG_BYTES) started = Process.clock_gettime(Process::CLOCK_MONOTONIC) path = safe_svg_path(path) width, height = dimensions(path, max_pixels: max_pixels, max_bytes: max_bytes) { input_format: "svg", width: width, height: height, frames: 1, duration_ms: (Process.clock_gettime(Process::CLOCK_MONOTONIC) - started) * 1000 } end |
.read_svg(path, max_bytes: MAX_SVG_BYTES) ⇒ Object
64 65 66 67 68 69 70 71 72 73 |
# File 'lib/safe_image/svg_metadata.rb', line 64 def read_svg(path, max_bytes: MAX_SVG_BYTES) path = safe_svg_path(path) size = File.size(path) raise LimitError, "SVG exceeds #{max_bytes} bytes" if size > max_bytes xml = File.binread(path, max_bytes + 1) raise LimitError, "SVG exceeds #{max_bytes} bytes" if xml.bytesize > max_bytes reject_unsafe_xml!(xml) xml end |
.reject_unsafe_xml!(xml) ⇒ Object
81 82 83 84 |
# File 'lib/safe_image/svg_metadata.rb', line 81 def reject_unsafe_xml!(xml) raise InvalidImageError, "doctype is not allowed in SVG" if xml.match?(/<!DOCTYPE/i) raise InvalidImageError, "XML processing instructions are not allowed in SVG" if xml.match?(/<\?(?!xml\s)/i) end |
.safe_svg_path(path) ⇒ Object
75 76 77 78 79 |
# File 'lib/safe_image/svg_metadata.rb', line 75 def safe_svg_path(path) path = PathSafety.ensure_regular_file!(path) raise UnsupportedFormatError, "not an SVG file: #{path}" unless File.extname(path.to_s).downcase == ".svg" path.to_s end |
.scan_svg!(xml) ⇒ Object
Streams the document with a pull parser, enforcing the structural caps as events arrive, so a hostile “millions of tiny elements” document is rejected at the cap without ever retaining the multi-million-object DOM that a parse-then-validate approach would build first. Returns the root element’s name and its attributes hash.
127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 |
# File 'lib/safe_image/svg_metadata.rb', line 127 def scan_svg!(xml) parser = REXML::Parsers::PullParser.new(xml) depth = -1 elements = 0 attributes = 0 root_name = nil root_attributes = nil while parser.has_next? event = parser.pull if event.start_element? depth += 1 raise LimitError, "SVG nesting exceeds #{MAX_SVG_DEPTH}" if depth > MAX_SVG_DEPTH elements += 1 raise LimitError, "SVG has too many elements" if elements > MAX_SVG_ELEMENTS attributes += event[1].size raise LimitError, "SVG has too many attributes" if attributes > MAX_SVG_ATTRIBUTES if root_name.nil? root_name = event[0] root_attributes = event[1] end elsif event.end_element? depth -= 1 end end raise InvalidImageError, "SVG root required" unless root_name == "svg" [root_name, root_attributes] rescue REXML::ParseException => e raise InvalidImageError, "invalid SVG: #{e.}" end |
.validate_dimensions!(width, height, max_pixels: nil) ⇒ Object
111 112 113 114 115 116 117 118 119 120 |
# File 'lib/safe_image/svg_metadata.rb', line 111 def validate_dimensions!(width, height, max_pixels: nil) raise InvalidImageError, "SVG dimensions are missing or invalid" unless width&.positive? && height&.positive? raise LimitError, "SVG dimensions exceed #{MAX_SVG_DIMENSION}px" if width > MAX_SVG_DIMENSION || height > MAX_SVG_DIMENSION pixels = width * height limit = max_pixels || MAX_SVG_PIXELS raise LimitError, "SVG has #{pixels.to_i} pixels, exceeds #{limit}" if pixels > limit [width.ceil, height.ceil] end |