Text generation

text_generation_exla_cuda.livemd

Ryo Wakabayashi

@RyoWakabayashi

elixir-learning

Share to X

Share to Bluesky

More notebooks

Text generation

# Notebook setup: install the dependencies and configure Nx in one step.
Mix.install(
  [
    {:bumblebee, "~> 0.5"},
    # `override: true` makes this Nx requirement win over the Nx requirement
    # declared by the other dependencies.
    # NOTE(review): presumably needed because bumblebee ~> 0.5 asks for an
    # older Nx than 0.9 — confirm the combination is supported.
    {:nx, "~> 0.9", override: true},
    {:exla, "~> 0.9"},
    {:kino, "~> 0.15"}
  ],
  # Environment variables set for the install; they request a CUDA build.
  # NOTE(review): which of the two variables the pinned EXLA/XLA versions
  # actually read should be verified against their documentation.
  system_env: [
    {"XLA_TARGET", "cuda12"},
    {"EXLA_TARGET", "cuda"}
  ],
  # Make EXLA the default Nx backend for tensors created in this notebook.
  config: [nx: [default_backend: EXLA.Backend]]
)

設定

# Directory passed as the `:cache_dir` option of every `{:hf, ...}` repository
# tuple used in this notebook.
cache_dir = "/tmp/bumblebee_cache"

モデルのダウンロード

# Repository reference shared by the three loaders below: the "gpt2"
# repository, with files cached under `cache_dir`.
gpt2_repository = {:hf, "gpt2", cache_dir: cache_dir}

# Load the model, its tokenizer, and its default generation settings.
# Each match raises if the corresponding loader does not return `{:ok, _}`.
{:ok, gpt2} = Bumblebee.load_model(gpt2_repository)

{:ok, tokenizer} = Bumblebee.load_tokenizer(gpt2_repository)

{:ok, loaded_generation_config} = Bumblebee.load_generation_config(gpt2_repository)

# Limit every completion to 10 newly generated tokens.
generation_config =
  Bumblebee.configure(loaded_generation_config, max_new_tokens: 10)

サービスの提供

# Build a text-generation serving from the GPT-2 model, tokenizer, and
# generation config loaded earlier in the notebook.
# NOTE(review): no `:compile` / `:defn_options` are passed here, so the serving
# uses whatever defn compiler is configured globally — confirm that is the
# intended setup for a GPU timing notebook.
serving = Bumblebee.Text.generation(gpt2, tokenizer, generation_config)

補完する文章の準備

# Create a text input labelled "TEXT", pre-filled with a default prompt.
text_input = Kino.Input.text("TEXT", default: "Robots have gained human rights and")

# Read the input's current value; this string is the prompt handed to every
# serving run further down.
text = Kino.Input.read(text_input)

# Complete `text` with the GPT-2 serving and show only the `:results` entry
# of the returned map (`nil` if that key is absent).
gpt2_output = Nx.Serving.run(serving, text)
Map.get(gpt2_output, :results)

時間計測

# Time the serving on the same prompt several times and report the mean.
# `:timer.tc/3` returns `{elapsed_microseconds, result}`, so the value of this
# cell is the average duration of one `Nx.Serving.run/2` call in microseconds.
run_count = 10

1..run_count
|> Enum.map(fn _ ->
  # Only the elapsed time matters here; the generated text is discarded.
  {time, _} = :timer.tc(Nx.Serving, :run, [serving, text])
  time
end)
# The capture must be written `&(... &1 ...)`; the HTML-escaped `&amp;` form
# is not valid Elixir.
|> then(&(Enum.sum(&1) / run_count))

他のモデル

# Builds a text-generation serving for the given Hugging Face repository id.
#
# Loads the model, tokenizer, and generation config from the same repository
# (cached under `cache_dir`), caps generation at 10 new tokens, and returns the
# serving. Raises a match error if any loader does not return `{:ok, _}`.
serve_model = fn repository_id ->
  repository = {:hf, repository_id, cache_dir: cache_dir}

  {:ok, model} = Bumblebee.load_model(repository)
  {:ok, tokenizer} = Bumblebee.load_tokenizer(repository)
  {:ok, base_config} = Bumblebee.load_generation_config(repository)

  limited_config = Bumblebee.configure(base_config, max_new_tokens: 10)

  Bumblebee.Text.generation(model, tokenizer, limited_config)
end

# Build a serving for "gpt2-medium", complete `text` with it, and show only
# the `:results` entry of the returned map.
gpt2_medium_output = Nx.Serving.run(serve_model.("gpt2-medium"), text)
Map.get(gpt2_medium_output, :results)

# Build a serving for "gpt2-large", complete `text` with it, and show only
# the `:results` entry of the returned map.
gpt2_large_output = Nx.Serving.run(serve_model.("gpt2-large"), text)
Map.get(gpt2_large_output, :results)

Other notebooks:

Michal Slaski
@michalslaski

livebook_examples

Salary predictions

salary_prediction.livemd

advanced data-science exla axon nx

2022-8-18
Dr. Christian Geuer-Pollmann
@chgeuer

livebook_on_azure

Christian's first LiveBook test

notebook1.livemd

tutorial advanced data-science axon exla nx

2022-8-18
@andyl

elix_util

MNIST

mnist.livemd

tutorial advanced data-science req axon exla nx

2022-8-18
Yejun Su
@goofansu

ogp

ogp

ogp.livemd

tutorial intermediate ogp kino

2022-8-18
Aurélien Noce
@ushu

elixir-course

C1N2 – Aller un peu plus loin en Elixir

2-aller-plus-loin.livemd

tutorial intermediate kino pythonx kino_pythonx

2025-8-23
Camelo
@josecfreittas

elixir-notebooks

Ecto with schemaless queries

ecto-with-schemaless-queries.livemd

tutorial advanced sql jason ecto_sql postgrex kino

2022-8-18
Nick C
@flowerett

aoc

Day17

day17.livemd

advanced algorithms kino_aoc benchee nimble_parsec libgraph math heap

2023-12-23

Back