lib/bumblebee/text/camembert_tokenizer.ex
defmodule Bumblebee.Text.CamembertTokenizer do
  @moduledoc """
  Tokenizer for Camembert models.
  """

  import Bumblebee.Shared

  # `tokenizer_impl/1` is expected to come from the `Bumblebee.Shared` import
  # above; it is handed the special-token mapping for this tokenizer. Note that
  # several roles intentionally map to the same literal.
  tokenizer_impl(
    special_tokens: %{
      # roles sharing "<s>"
      bos: "<s>",
      cls: "<s>",
      # roles sharing "</s>"
      eos: "</s>",
      sep: "</s>",
      # roles with their own dedicated literal
      unk: "<unk>",
      pad: "<pad>",
      mask: "<mask>"
    }
  )
end