lib/bumblebee/text/bert_tokenizer.ex

defmodule Bumblebee.Text.BertTokenizer do
  @moduledoc """
  Tokenizer for BERT.

  This module defines no functions by hand. Its body consists of a single
  call to `tokenizer_impl` (brought into scope by importing
  `Bumblebee.Shared`), configured with the following special tokens:

    * `:unk` - `"[UNK]"`
    * `:sep` - `"[SEP]"`
    * `:pad` - `"[PAD]"`
    * `:cls` - `"[CLS]"`
    * `:mask` - `"[MASK]"`

  """

  import Bumblebee.Shared

  # The options are passed as a literal keyword list wrapping a literal map.
  # NOTE(review): `tokenizer_impl` is presumably a macro that reads these
  # options at compile time, so keep them literal rather than moving them
  # into a module attribute or variable -- confirm in `Bumblebee.Shared`.
  tokenizer_impl(
    special_tokens: %{
      unk: "[UNK]",
      sep: "[SEP]",
      pad: "[PAD]",
      cls: "[CLS]",
      mask: "[MASK]"
    }
  )
end