diff --git a/lib/auto_linker/builder.ex b/lib/auto_linker/builder.ex
index 4ebe85e..22d1758 100644
--- a/lib/auto_linker/builder.ex
+++ b/lib/auto_linker/builder.ex
@@ -112,6 +112,64 @@ defmodule AutoLinker.Builder do
+ # Builds the link for an "@name" mention. The target URL is the value of
+ # `opts[:mention_prefix]` followed by the name without its leading "@".
+ def create_mention_link("@" <> name, _buffer, opts) do
+   url = opts[:mention_prefix] <> name
+   # Collect the attributes in the same order as before: rel, target, class, scheme.
+   attrs =
+     Enum.reduce([:rel, :target, :class, :scheme], [], fn key, acc ->
+       build_attrs(acc, url, opts, key)
+     end)
+   format_mention(attrs, name, opts)
+ end
+ # Builds the link for a hashtag. The target URL is the value of
+ # `opts[:hashtag_prefix]` followed by `tag`.
+ def create_hashtag_link(tag, _buffer, opts) do
+   url = opts[:hashtag_prefix] <> tag
+   # Collect the attributes in the same order as before: rel, target, class, scheme.
+   attrs =
+     Enum.reduce([:rel, :target, :class, :scheme], [], fn key, acc ->
+       build_attrs(acc, url, opts, key)
+     end)
+   format_hashtag(attrs, tag, opts)
+ end
+ # Builds the link for an email address; only the `:class` attribute is collected.
+ def create_email_link(email, opts) do
+   attrs = build_attrs([], email, opts, :class)
+   format_email(attrs, email, opts)
+ end
+ # Builds the link for a non-HTTP URI; only the `:class` attribute is collected.
+ def create_extra_link(uri, opts) do
+   format_extra(build_attrs([], uri, opts, :class), uri, opts)
+ end
+ # Renders a mention as an anchor element whose text is "@" followed by `name`.
+ # `attrs` is the attribute list collected by the caller; it is rendered by
+ # `format_attrs/1` and placed inside the opening tag.
+ # NOTE(review): the anchor markup was missing here (`attrs` was computed but
+ # never used, so the "link" was plain text). The tag layout below is a
+ # reconstruction -- confirm it against the expected strings in the test suite.
+ def format_mention(attrs, name, _opts) do
+   attrs = format_attrs(attrs)
+   "<a #{attrs}>@" <> name <> "</a>"
+ end
+ # Renders a hashtag as an anchor element whose text is "#" followed by `tag`.
+ # `attrs` is the attribute list collected by the caller; it is rendered by
+ # `format_attrs/1` and placed inside the opening tag.
+ # NOTE(review): the anchor markup was missing here (`attrs` was computed but
+ # never used, so the "link" was plain text). The tag layout below is a
+ # reconstruction -- confirm it against the expected strings in the test suite.
+ def format_hashtag(attrs, tag, _opts) do
+   attrs = format_attrs(attrs)
+   "<a #{attrs}>#" <> tag <> "</a>"
+ end
+ # Renders an email address as a `mailto:` anchor whose text is the address.
+ # The caller only collects `:class`, so the href is emitted here.
+ # NOTE(review): the anchor markup was missing here (`attrs` was computed but
+ # never used, so the "link" was plain text). The href form and quoting below
+ # are a reconstruction -- confirm them against the expected strings in the tests.
+ def format_email(attrs, email, _opts) do
+   attrs = format_attrs(attrs)
+   "<a href='mailto:#{email}' #{attrs}>#{email}</a>"
+ end
+ # Renders a non-HTTP URI as an anchor that points at the URI itself.
+ # The caller only collects `:class`, so the href is emitted here.
+ # NOTE(review): the anchor markup was missing here (`attrs` was computed but
+ # never used, so the "link" was plain text). The href form and quoting below
+ # are a reconstruction -- confirm them against the expected strings in the tests.
+ def format_extra(attrs, uri, _opts) do
+   attrs = format_attrs(attrs)
+   "<a href='#{uri}' #{attrs}>#{uri}</a>"
+ end
defp format_attributes(attrs) do
Enum.reduce(attrs, "", fn {name, value}, acc ->
acc <> ~s' #{name}="#{value}"'
diff --git a/lib/auto_linker/parser.ex b/lib/auto_linker/parser.ex
index 1f68733..0fbf86a 100644
--- a/lib/auto_linker/parser.ex
+++ b/lib/auto_linker/parser.ex
@@ -28,19 +28,43 @@ defmodule AutoLinker.Parser do
# @invalid_url ~r/\.\.+/
@invalid_url ~r/(\.\.+)|(^(\d+\.){1,2}\d+$)/
- @match_url ~r{^[\w\.-]+(?:\.[\w\.-]+)+[\w\-\._~:/?#[\]@!\$&'\(\)\*\+,;=.]+$}
- @match_scheme ~r{^(?:http(s)?:\/\/)?[\w.-]+(?:\.[\w\.-]+)+[\w\-\._~:/?#[\]@!\$&'\(\)\*\+,;=.]+$}
+ @match_url ~r{^[\w\.-]+(?:\.[\w\.-]+)+[\w\-\._~%:/?#[\]@!\$&'\(\)\*\+,;=.]+$}
+ @match_scheme ~r{^(?:http(s)?:\/\/)?[\w.-]+(?:\.[\w\.-]+)+[\w\-\._~%:/?#[\]@!\$&'\(\)\*\+,;=.]+$}
@match_phone ~r"((?:x\d{2,7})|(?:(?:\+?1\s?(?:[.-]\s?)?)?(?:\(\s?(?:[2-9]1[02-9]|[2-9][02-8]1|[2-9][02-8][02-9])\s?\)|(?:[2-9]1[02-9]|[2-9][02-8]1|[2-9][02-8][02-9]))\s?(?:[.-]\s?)?)(?:[2-9]1[02-9]|[2-9][02-9]1|[2-9][02-9]{2})\s?(?:[.-]\s?)?(?:[0-9]{4}))"
- @match_hostname ~r{^(?:https?:\/\/)?(?:[^@\n]+@)?(?[^:#~\/\n?]+)}
+ # Extracts the host part of a URL into the named group `host`, which
+ # `is_valid_tld?/2` reads with `capture: [:host]`. The group name was missing,
+ # leaving `(?[`, which is not a valid group.
+ @match_hostname ~r{^(?:https?:\/\/)?(?:[^@\n]+\\w@)?(?<host>[^:#~\/\n?]+)}
@match_ip ~r"^(([0-9]|[1-9][0-9]|1[0-9]{2}|2[0-4][0-9]|25[0-5])\.){3}([0-9]|[1-9][0-9]|1[0-9]{2}|2[0-4][0-9]|25[0-5])$"
- @default_opts ~w(url)a
+ # @user
+ # @user@example.com
+ @match_mention ~r/^@[a-zA-Z0-9.!#$%&'*+\/=?^_`{|}~-]+@?[a-zA-Z0-9_-](?:[a-zA-Z0-9-]{0,61}[a-zA-Z0-9])?(?:\.[a-zA-Z0-9](?:[a-zA-Z0-9-]{0,61}[a-zA-Z0-9])?)*/u
+ # https://www.w3.org/TR/html5/forms.html#valid-e-mail-address
+ @match_email ~r/^[a-zA-Z0-9.!#$%&'*+\/=?^_`{|}~-]+@[a-zA-Z0-9](?:[a-zA-Z0-9-]{0,61}[a-zA-Z0-9])?(?:\.[a-zA-Z0-9](?:[a-zA-Z0-9-]{0,61}[a-zA-Z0-9])?)*$/u
+ # Matches a leading "#" followed by word characters (Unicode-aware via `u`) and
+ # exposes them as the named group `tag`, which `match_hashtag/1` reads with
+ # `capture: [:tag]`. The group name was missing, leaving an invalid `(?\w+)`.
+ @match_hashtag ~r/^\#(?<tag>\w+)/u
+ # URI prefixes that `check_and_link_extra/3` accepts via `String.starts_with?/2`.
+ @prefix_extra ~w(magnet:? dweb:// dat:// gopher:// ipfs:// ipns:// irc:// ircs:// irc6:// mumble:// ssb://)
@tlds "./priv/tlds.txt" |> File.read!() |> String.trim() |> String.split("\n")
+ @default_opts ~w(url)a
def parse(text, opts \\ %{})
def parse(text, list) when is_list(list), do: parse(text, Enum.into(list, %{}))
@@ -75,12 +99,30 @@ defmodule AutoLinker.Parser do
|> do_parse(Map.delete(opts, :phone))
+ # Mention pass: link mentions in `text`, then continue with the remaining
+ # passes after removing `:mention` from the options.
+ defp do_parse(text, %{mention: true} = opts) do
+   linked = do_parse(text, false, opts, {"", "", :parsing}, &check_and_link_mention/3)
+   do_parse(linked, Map.delete(opts, :mention))
+ end
+ # Extra-URI pass: link the non-HTTP URIs in `text`, then continue with the
+ # remaining passes after removing `:extra` from the options.
+ defp do_parse(text, %{extra: true} = opts) do
+   linked = do_parse(text, false, opts, {"", "", :parsing}, &check_and_link_extra/3)
+   do_parse(linked, Map.delete(opts, :extra))
+ end
defp do_parse(text, %{markdown: true} = opts) do
|> Builder.create_markdown_links(opts)
|> do_parse(Map.delete(opts, :markdown))
+ # Email pass: link email addresses in `text`, then continue with the remaining
+ # passes after removing `:email` from the options.
+ defp do_parse(text, %{email: true} = opts) do
+   linked = do_parse(text, false, opts, {"", "", :parsing}, &check_and_link_email/3)
+   do_parse(linked, Map.delete(opts, :email))
+ end
defp do_parse(text, %{url: _} = opts) do
if (exclude = Map.get(opts, :exclude_pattern, false)) && String.starts_with?(text, exclude) do
@@ -90,6 +132,12 @@ defmodule AutoLinker.Parser do
|> do_parse(Map.delete(opts, :url))
+ # Hashtag pass: link hashtags in `text`, then continue with the remaining
+ # passes after removing `:hashtag` from the options.
+ defp do_parse(text, %{hashtag: true} = opts) do
+   linked = do_parse(text, false, opts, {"", "", :parsing}, &check_and_link_hashtag/3)
+   do_parse(linked, Map.delete(opts, :hashtag))
+ end
defp do_parse(text, _), do: text
defp do_parse("", _scheme, _opts, {"", acc, _}, _handler),
@@ -110,8 +158,9 @@ defmodule AutoLinker.Parser do
defp do_parse(">" <> text, scheme, opts, {buffer, acc, {:attrs, level}}, handler),
do: do_parse(text, scheme, opts, {"", acc <> buffer <> ">", {:html, level}}, handler)
- defp do_parse(<> <> text, scheme, opts, {"", acc, {:attrs, level}}, handler),
- do: do_parse(text, scheme, opts, {"", acc <> <>, {:attrs, level}}, handler)
+ # In the `{:attrs, level}` state with an empty buffer: move the next
+ # character of the input straight onto the accumulator and stay in the
+ # same state.
+ # NOTE(review): the binary pattern was missing here (`<> <> text` and
+ # `acc <> <>` do not compile). The one-character match below is a
+ # reconstruction -- confirm the exact segment spec against the repository.
+ defp do_parse(<<char::bytes-size(1)>> <> text, scheme, opts, {"", acc, {:attrs, level}}, handler) do
+   do_parse(text, scheme, opts, {"", acc <> <<char::bytes-size(1)>>, {:attrs, level}}, handler)
+ end
defp do_parse("" <> text, scheme, opts, {buffer, acc, {:html, level}}, handler),
@@ -178,13 +227,43 @@ defmodule AutoLinker.Parser do
|> link_url(buffer, opts)
+ # Links `buffer` as an email address when `is_email?/1` accepts it; otherwise
+ # `link_email/3` hands the buffer back unchanged.
+ def check_and_link_email(buffer, _, opts) do
+   link_email(is_email?(buffer), buffer, opts)
+ end
def check_and_link_phone(buffer, _, opts) do
|> match_phone
|> link_phone(buffer, opts)
- @doc false
+ # Links `buffer` as a mention when `match_mention/1` finds one; otherwise
+ # `link_mention/3` hands the buffer back unchanged.
+ def check_and_link_mention(buffer, _, opts) do
+   link_mention(match_mention(buffer), buffer, opts)
+ end
+ # Links `buffer` as a hashtag when `match_hashtag/1` finds one; otherwise
+ # `link_hashtag/3` hands the buffer back unchanged.
+ def check_and_link_hashtag(buffer, _, opts) do
+   link_hashtag(match_hashtag(buffer), buffer, opts)
+ end
+ # "xmpp:" URIs are linked only when the part after the scheme passes
+ # `is_email?/1`; the whole buffer (scheme included) is what gets linked.
+ def check_and_link_extra("xmpp:" <> handle = buffer, _, opts) do
+   link_extra(is_email?(handle), buffer, opts)
+ end
+ # Any other buffer is linked when it starts with one of the `@prefix_extra` prefixes.
+ def check_and_link_extra(buffer, _, opts) do
+   link_extra(String.starts_with?(buffer, @prefix_extra), buffer, opts)
+ end
+ # @doc false
def is_url?(buffer, true) do
if Regex.match?(@invalid_url, buffer) do
@@ -201,6 +280,14 @@ defmodule AutoLinker.Parser do
+ # Returns false when `buffer` matches `@invalid_url`; otherwise passes the
+ # result of the `@match_email` test on to `is_valid_tld?/2`.
+ def is_email?(buffer) do
+   case Regex.match?(@invalid_url, buffer) do
+     true -> false
+     false -> is_valid_tld?(Regex.match?(@match_email, buffer), buffer)
+   end
+ end
def is_valid_tld?(true, buffer) do
[host] = Regex.run(@match_hostname, buffer, capture: [:host])
@@ -227,6 +314,37 @@ defmodule AutoLinker.Parser do
+ # Returns the text matched by `@match_mention` at the start of `buffer`, or nil
+ # when the run does not yield exactly one element.
+ def match_mention(buffer) do
+   with [mention] <- Regex.run(@match_mention, buffer) do
+     mention
+   else
+     _ -> nil
+   end
+ end
+ # Returns the `tag` capture of `@match_hashtag` for `buffer`, or nil when the
+ # run does not yield exactly one element.
+ def match_hashtag(buffer) do
+   with [hashtag] <- Regex.run(@match_hashtag, buffer, capture: [:tag]) do
+     hashtag
+   else
+     _ -> nil
+   end
+ end
+ # Returns `buffer` untouched when no hashtag was matched (nil); otherwise
+ # delegates to `Builder.create_hashtag_link/3`.
+ def link_hashtag(hashtag, buffer, opts) do
+   case hashtag do
+     nil -> buffer
+     _ -> Builder.create_hashtag_link(hashtag, buffer, opts)
+   end
+ end
+ # Returns `buffer` untouched when no mention was matched (nil).
+ def link_mention(nil, buffer, _), do: buffer
+ # With a `:mention_formatter` in the options, the formatter is called with the
+ # mention and the options, and the first element of the two-element tuple it
+ # returns is used. Without one, `Builder.create_mention_link/3` builds the link.
+ def link_mention(mention, buffer, opts) do
+   case opts do
+     %{mention_formatter: formatter} ->
+       {formatted, _} = formatter.(mention, opts)
+       formatted
+     _ ->
+       Builder.create_mention_link(mention, buffer, opts)
+   end
+ end
def link_phone(nil, buffer, _), do: buffer
def link_phone(list, buffer, opts) do
@@ -239,4 +357,17 @@ defmodule AutoLinker.Parser do
def link_url(_, buffer, _opts), do: buffer
+ @doc false
+ # Builds an email link only when the first argument is exactly `true`; any
+ # other value returns `buffer` unchanged.
+ def link_email(matched, buffer, opts) do
+   if matched == true, do: Builder.create_email_link(buffer, opts), else: buffer
+ end
+ # Builds an extra-URI link only when the first argument is exactly `true`; any
+ # other value returns `buffer` unchanged.
+ def link_extra(matched, buffer, opts) do
+   case matched do
+     true -> Builder.create_extra_link(buffer, opts)
+     _ -> buffer
+   end
+ end
diff --git a/test/auto_linker_test.exs b/test/auto_linker_test.exs
index bddf6dd..880e838 100644
--- a/test/auto_linker_test.exs
+++ b/test/auto_linker_test.exs
@@ -28,6 +28,213 @@ defmodule AutoLinkerTest do
" ab"
+ test "all kinds of links" do # Runs every linker option at once on a single input. NOTE(review): `expected` carries no link markup -- the anchor tags look lost; confirm against the repository.
+ text =
+ "hello @user google.com https://ddg.com 888 888-8888 #tag user@email.com [google.com](http://google.com) irc:///mIRC"
+ expected =
+ "hello @user google.com ddg.com 888 888-8888 #tag user@email.com google.com irc:///mIRC"
+ assert AutoLinker.link(text,
+ phone: true,
+ markdown: true,
+ email: true,
+ mention: true,
+ mention_prefix: "https://example.com/user/",
+ hashtag: true,
+ hashtag_prefix: "https://example.com/tag/",
+ scheme: true,
+ extra: true,
+ class: false,
+ new_window: false,
+ rel: false
+ ) == expected
+ end
+ # Mention linking with `mention: true` and a `:mention_prefix`.
+ # NOTE(review): the `expected` strings carry no link markup -- the anchor tags
+ # look lost; confirm against the repository before relying on these assertions.
+ describe "mentions" do
+   test "simple mentions" do
+     expected =
+       ~s{hello @user and @anotherUser}
+     assert AutoLinker.link("hello @user and @anotherUser",
+              mention: true,
+              mention_prefix: "https://example.com/user/"
+            ) == expected
+   end
+   # Test name fixed: it previously read "metion".
+   test "mention @user@example.com" do
+     text = "hey @user@example.com"
+     expected =
+       "hey @user@example.com"
+     assert AutoLinker.link(text,
+              mention: true,
+              mention_prefix: "https://example.com/user/"
+            ) == expected
+   end
+   test "skip if starts with @@" do
+     text = "hello @@user and @anotherUser"
+     expected =
+       "hello @@user and @anotherUser"
+     assert AutoLinker.link(text,
+              mention: true,
+              mention_prefix: "https://example.com/user/"
+            ) == expected
+   end
+ end
+ describe "hashtag links" do # Hashtag linking with `hashtag: true` and a `:hashtag_prefix`. NOTE(review): the `expected` strings carry no link markup -- the anchor tags look lost; confirm against the repository.
+ test "hashtag" do
+ expected =
+ "one #two three #four"
+ assert AutoLinker.link("one #two three #four",
+ hashtag: true,
+ hashtag_prefix: "https://example.com/tag/"
+ ) == expected
+ end
+ test "do not turn urls with hashes into hashtags" do
+ text = "google.com#test #test google.com/#test #tag"
+ expected =
+ "google.com#test #test google.com/#test #tag"
+ assert AutoLinker.link(text,
+ scheme: true,
+ hashtag: true,
+ class: false,
+ new_window: false,
+ rel: false,
+ hashtag_prefix: "https://example.com/tag/"
+ ) == expected
+ end
+ test "works with non-latin characters" do
+ text = "#漢字 #は #тест #ทดสอบ"
+ expected =
+ "#漢字 #は #тест #ทดสอบ"
+ assert AutoLinker.link(text,
+ scheme: true,
+ class: false,
+ new_window: false,
+ rel: false,
+ hashtag: true,
+ hashtag_prefix: "https://example.com/tag/"
+ ) == expected
+ end
+ end
+ # URL linking with `scheme: true`.
+ # NOTE(review): the `expected` strings carry no link markup -- the anchor tags
+ # look lost; confirm against the repository before relying on these assertions.
+ describe "links" do
+   test "turning urls into links" do
+     text = "Hey, check out http://www.youtube.com/watch?v=8Zg1-TufF%20zY?x=1&y=2#blabla ."
+     expected =
+       "Hey, check out youtube.com/watch?v=8Zg1-TufF%20zY?x=1&y=2#blabla ."
+     assert AutoLinker.link(text, scheme: true) == expected
+     # no scheme
+     text = "Hey, check out www.youtube.com/watch?v=8Zg1-TufF%20zY?x=1&y=2#blabla ."
+     assert AutoLinker.link(text, scheme: true) == expected
+   end
+   test "hostname/@user" do
+     text = "https://example.com/@user"
+     expected =
+       "example.com/@user"
+     assert AutoLinker.link(text, scheme: true) == expected
+     # The port case was asserted twice with identical input and expectation;
+     # the duplicate has been dropped.
+     text = "https://example.com:4000/@user"
+     expected =
+       "example.com:4000/@user"
+     assert AutoLinker.link(text, scheme: true) == expected
+     text = "@username"
+     expected = "@username"
+     assert AutoLinker.link(text, scheme: true) == expected
+     text = "http://www.cs.vu.nl/~ast/intel/"
+     expected =
+       "cs.vu.nl/~ast/intel/"
+     assert AutoLinker.link(text, scheme: true) == expected
+     text = "https://forum.zdoom.org/viewtopic.php?f=44&t=57087"
+     expected =
+       "forum.zdoom.org/viewtopic.php?f=44&t=57087"
+     assert AutoLinker.link(text, scheme: true) == expected
+     text = "https://en.wikipedia.org/wiki/Sophia_(Gnosticism)#Mythos_of_the_soul"
+     expected =
+       "en.wikipedia.org/wiki/Sophia_(Gnosticism)#Mythos_of_the_soul"
+     assert AutoLinker.link(text, scheme: true) == expected
+     text = "https://en.wikipedia.org/wiki/Duff's_device"
+     expected =
+       "en.wikipedia.org/wiki/Duff's_device"
+     assert AutoLinker.link(text, scheme: true) == expected
+   end
+ end
+ describe "non http links" do # Email linking (`email: true`) and non-HTTP URI linking (`extra: true`). NOTE(review): the `expected` strings carry no link markup -- the anchor tags look lost; confirm against the repository.
+ test "xmpp" do
+ text = "xmpp:user@example.com"
+ expected = "xmpp:user@example.com"
+ assert AutoLinker.link(text, extra: true) == expected
+ end
+ test "email" do
+ text = "user@example.com"
+ expected = "user@example.com"
+ assert AutoLinker.link(text, email: true) == expected
+ end
+ test "magnet" do
+ text =
+ "magnet:?xt=urn:btih:a4104a9d2f5615601c429fe8bab8177c47c05c84&dn=ubuntu-"
+ expected =
+ "magnet:?xt=urn:btih:a4104a9d2f5615601c429fe8bab8177c47c05c84&dn=ubuntu-"
+ assert AutoLinker.link(text, extra: true) == expected
+ end
+ test "dweb" do
+ text =
+ "dweb://584faa05d394190ab1a3f0240607f9bf2b7e2bd9968830a11cf77db0cea36a21+v1.0.0/path/to/file.txt"
+ expected =
+ "dweb://584faa05d394190ab1a3f0240607f9bf2b7e2bd9968830a11cf77db0cea36a21+v1.0.0/path/to/file.txt"
+ assert AutoLinker.link(text, extra: true) == expected
+ end
+ end
describe "TLDs" do
test "parse with scheme" do
text = "https://google.com"