Bumblebee STT

elixir/bumblebee_stt.livemd

Lucas Eduardo

@lucasew

playground

Share to X

Share to Bluesky

More notebooks

Bumblebee STT

# Notebook dependencies plus application config, both handed to `Mix.install/2`.
# NOTE(review): `:telegram` is not referenced by any cell visible in this notebook.
Mix.install(
  [
    {:bumblebee, "~> 0.6.0"},
    {:telegram, github: "visciang/telegram", tag: "2.0.0"},
    {:exla, "~> 0.9.1"},
    {:kino_bumblebee, "~> 0.5.1"}
  ],
  config: [
    exla: [
      clients: [
        # Registers an EXLA client named `:cuda` on the CUDA platform.
        # `preallocate: false` presumably stops EXLA from reserving GPU memory
        # up front - confirm against the EXLA client options documentation.
        cuda: [platform: :cuda, preallocate: false]
      ]
    ]
  ]
)

Section

# Make sure the `ffmpeg` executable is available before any audio is transcribed
# (Bumblebee's `{:file, path}` input relies on it - see the Bumblebee docs).
#
# The install is skipped when `ffmpeg` is already on the PATH, so re-evaluating
# this cell does not hit apt again.
if System.find_executable("ffmpeg") do
  :ok
else
  # Match on exit status 0 so a failed update/install stops the notebook here,
  # with apt's output in the error, instead of surfacing later as a confusing
  # transcription failure. stderr is merged so that output is complete.
  {_output, 0} = System.cmd("apt", ["update"], stderr_to_stdout: true)
  {_output, 0} = System.cmd("apt", ["install", "ffmpeg", "-y"], stderr_to_stdout: true)
  :ok
end


# File-upload input widget; the label is Portuguese for "Audio to be transcribed".
# The uploaded file is read further down with `Kino.Input.read(audio_input)`.
audio_input = Kino.Input.file("Audio a ser transcrito")

# Use EXLA as the default Nx backend.
Nx.default_backend(EXLA.Backend)

# Every artifact below is loaded from the same Hugging Face repository.
repo = {:hf, "openai/whisper-medium"}

{:ok, whisper} = Bumblebee.load_model(repo)
{:ok, featurizer} = Bumblebee.load_featurizer(repo)
{:ok, tokenizer} = Bumblebee.load_tokenizer(repo)
{:ok, generation_config} = Bumblebee.load_generation_config(repo)

# Options for the speech-to-text serving.
# NOTE(review): `preallocate: false` is also set on the EXLA `:cuda` client in the
# `Mix.install` config; whether it has any effect as a defn option should be
# confirmed against the EXLA documentation.
serving_opts = [
  defn_options: [compiler: EXLA, preallocate: false],
  language: "pt"
  # chunk_num_seconds: 5
]

# Build the Whisper serving; it is the value this cell evaluates to.
serving =
  Bumblebee.Audio.speech_to_text_whisper(
    whisper,
    featurizer,
    tokenizer,
    generation_config,
    serving_opts
  )
# Resolve the uploaded audio to a path on disk and run it through the serving.
#
# `Kino.Input.read/1` returns `nil` for a file input until something has been
# uploaded. Handle that case explicitly so the failure is an actionable message
# rather than an opaque `MatchError`.
input =
  case Kino.Input.read(audio_input) do
    %{file_ref: file_ref} ->
      file_ref

    nil ->
      raise ArgumentError,
            "no audio file has been uploaded yet; upload one in the file input and re-evaluate this cell"
  end

data = Kino.Input.file_path(input)

# Print the resolved path for debugging.
IO.inspect(data)

# Transcribe the file; the result is the value this cell evaluates to.
Nx.Serving.run(serving, {:file, data})

# Attempt to release VRAM: rebind every model-related variable to nil, then force
# a garbage collection of the current process.
# Known limitation (per the original author): this doesn't work to release VRAM.
{whisper, featurizer, tokenizer, generation_config, serving} = {nil, nil, nil, nil, nil}
:erlang.garbage_collect()

# Evaluates to nil, showing that the rebinding above took effect.
serving

Other notebooks:

Michal Slaski
@michalslaski

livebook_examples

Salary predictions

salary_prediction.livemd

advanced data-science exla axon nx

2022-8-18
Dr. Christian Geuer-Pollmann
@chgeuer

livebook_on_azure

Christian's first LiveBook test

notebook1.livemd

tutorial advanced data-science axon exla nx

2022-8-18
@andyl

elix_util

MNIST

mnist.livemd

tutorial advanced data-science req axon exla nx

2022-8-18
@TomBers

livebookNotes

Trying Nx

NX.livemd

advanced data-science exla axon nx

2022-8-18
piacerex
@piacerex

livebook_trial

Iris classification

iris_knn.livemd

tutorial advanced data-science nx scholar explorer kino_explorer kino_vega_lite scidata exla

2023-8-31
Shozo Fukuda
@shoz-f

tfl_interp

Fast Neural Style Transfer

Candy.livemd

tutorial advanced data-science tfl_interp cimg kino

2024-12-1
@DockYard-Academy

curriculum

Reduce

reduce.livemd

tutorial intermediate jason kino youtube hidden_cell smart_animation visual

2023-1-21

Back