cat-bookmarker/deps/html_entities/lib/html_entities.ex

90 lines
2.1 KiB
Elixir
Raw Normal View History

2024-03-10 18:52:04 +00:00
defmodule HtmlEntities do
  @moduledoc """
  Decode and encode HTML entities in a string.

  ## Examples

  Decoding:

      iex> "Tom &amp; Jerry" |> HtmlEntities.decode
      "Tom & Jerry"
      iex> "&#161;Ay, caramba!" |> HtmlEntities.decode
      "¡Ay, caramba!"
      iex> "&#337; &#x151;" |> HtmlEntities.decode
      "ő ő"

  Encoding:

      iex> "Tom & Jerry" |> HtmlEntities.encode
      "Tom &amp; Jerry"
      iex> "<< KAPOW!! >>" |> HtmlEntities.encode
      "&lt;&lt; KAPOW!! &gt;&gt;"
  """

  # Registering the entity list as an external resource makes the compiler
  # rebuild this module whenever the list file changes.
  @external_resource "lib/html_entities_list.txt"

  @doc """
  Decode HTML entities in a string.

  Handles decimal (`&#337;`) and hexadecimal (`&#x151;` / `&#X151;`) numeric
  references as well as the named entities generated from the entity list.
  Anything that is not a well-formed, known entity is copied to the output
  unchanged, including numeric references that do not denote a valid Unicode
  scalar value.

  ## Examples

      iex> HtmlEntities.decode("&#65;&#x42;")
      "AB"
      iex> HtmlEntities.decode("&#xD800;")
      "&#xD800;"
  """
  @spec decode(String.t()) :: String.t()
  def decode(string) when is_binary(string) do
    decode(string, "")
  end

  # Walks the input byte by byte, appending to `acc`. Every "&" is a candidate
  # entity start; when it does not introduce a valid entity the ampersand is
  # emitted literally and scanning resumes right after it.
  defp decode(<<"&", rest::binary>>, acc) do
    case decode_entity(rest) do
      {character, rest} -> decode(rest, <<acc::binary, character::binary>>)
      :error -> decode(rest, <<acc::binary, ?&>>)
    end
  end

  defp decode(<<head, rest::binary>>, acc) do
    decode(rest, <<acc::binary, head>>)
  end

  defp decode(<<>>, acc) do
    acc
  end

  # `decode_entity/1` receives the text following an "&" and returns either
  # `{utf8_binary, remaining_input}` or `:error`.

  # Hexadecimal numeric reference. HTML allows both "x" and "X" as the marker.
  # The first digit is checked in the guard so that `Integer.parse/2` never
  # sees a leading sign.
  defp decode_entity(<<"#", x, c, rest::binary>>)
       when x in [?x, ?X] and (c in ?0..?9 or c in ?a..?f or c in ?A..?F) do
    decode_numeric(<<c, rest::binary>>, 16)
  end

  # Decimal numeric reference. As above, the leading digit is required so that
  # signed input such as "&#+65;" is rejected instead of being parsed as 65.
  defp decode_entity(<<"#", c, rest::binary>>) when c in ?0..?9 do
    decode_numeric(<<c, rest::binary>>, 10)
  end

  # Named entities: one function clause per entry of the entity list, generated
  # at compile time.
  codes = HtmlEntities.Util.load_entities(@external_resource)

  for {name, _character, codepoint} <- codes do
    defp decode_entity(<<unquote(name), ?;, rest::binary>>) do
      {<<unquote(codepoint)::utf8>>, rest}
    end
  end

  defp decode_entity(_), do: :error

  # Parses `digits` in the given `base`; the number must be terminated by ";"
  # and be a Unicode scalar value (no surrogates, at most U+10FFFF), which is
  # exactly the set of integers a `::utf8` binary segment can encode.
  defp decode_numeric(digits, base) do
    case Integer.parse(digits, base) do
      {number, <<?;, rest::binary>>}
      when number in 0..0xD7FF or number in 0xE000..0x10FFFF ->
        {<<number::utf8>>, rest}

      _ ->
        :error
    end
  end

  @doc """
  Encode HTML entities in a string.

  Only the five characters that are significant in HTML markup are replaced:
  `'`, `"`, `&`, `<` and `>`. All other bytes are copied through unchanged.

  ## Examples

      iex> HtmlEntities.encode("'single' & \\"double\\"")
      "&#39;single&#39; &amp; &quot;double&quot;"
  """
  @spec encode(String.t()) :: String.t()
  def encode(string) when is_binary(string) do
    # Iterating over bytes is safe for UTF-8 input: every replaced character is
    # ASCII, and ASCII byte values never occur inside a multi-byte sequence.
    for <<x <- string>>, into: "" do
      case x do
        ?' -> "&#39;"
        ?" -> "&quot;"
        ?& -> "&amp;"
        ?< -> "&lt;"
        ?> -> "&gt;"
        _ -> <<x>>
      end
    end
  end
end