# lib/bumblebee/text/whisper_tokenizer.ex
defmodule Bumblebee.Text.WhisperTokenizer do
# Tokenizer module for Whisper. Nothing is defined by hand in this module
# body: apart from the moduledoc and the import, it consists of a single
# `tokenizer_impl` call that is handed the special-token configuration.
@moduledoc """
Whisper tokenizer.
"""
# Unqualified import. `tokenizer_impl` is presumably provided by
# `Bumblebee.Shared` (it is the only import in this module) — confirm
# against that module.
import Bumblebee.Shared
# All four special-token keys (`unk`, `bos`, `eos`, `pad`) are given the
# same literal, "<|endoftext|>".
# NOTE(review): what `tokenizer_impl` generates from these options is not
# visible in this file — check its definition before adding, removing, or
# renaming keys.
tokenizer_impl(
special_tokens: %{
unk: "<|endoftext|>",
bos: "<|endoftext|>",
eos: "<|endoftext|>",
pad: "<|endoftext|>"
}
)
end