
Evision DNN

livebooks/evision/dnn.livemd

This notebook runs YOLOv3 object detection on a sample image using Evision's DNN module, then draws the detected boxes and class labels.

Mix.install([
  {:req, "~> 0.5"},
  {:evision, "~> 0.2"},
  {:kino, "~> 0.14"},
  {:nx, "~> 0.9"}
])

Download model

weights_path = "/tmp/yolov3.weights"
cfg_path = "/tmp/yolov3.cfg"
label_path = "/tmp/label.txt"

"https://pjreddie.com/media/files/yolov3.weights"
|> Req.get!(connect_options: [timeout: 300_000], into: File.stream!(weights_path))

"https://raw.githubusercontent.com/pjreddie/darknet/master/cfg/yolov3.cfg"
|> Req.get!(into: File.stream!(cfg_path))

"https://raw.githubusercontent.com/pjreddie/darknet/master/data/coco.names"
|> Req.get!(into: File.stream!(label_path))
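
The weights file is roughly 240 MB, so the first download can take a while. As a quick sanity check, here is a minimal sketch that confirms each file landed on disk and reports its size; it assumes only the paths defined above:

# Confirm the downloaded files exist and report their sizes in bytes
for path <- [weights_path, cfg_path, label_path] do
  {path, File.stat!(path).size}
end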

Load model

net = Evision.DNN.readNet(weights_path, config: cfg_path, framework: "")
out_names = Evision.DNN.Net.getUnconnectedOutLayersNames(net)
label_list =
  label_path
  |> File.stream!()
  |> Enum.map(&String.trim/1)
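
As a sanity check, out_names should list YOLOv3's three unconnected output layers and label_list the 80 COCO class names. A minimal sketch for inspecting both, using nothing beyond the variables defined above:

# Inspect the output layer names and the number of class labels
IO.inspect(out_names, label: "output layers")
IO.inspect(length(label_list), label: "label count")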

Download image

img_path = "/tmp/dog.jpg"

"https://raw.githubusercontent.com/pjreddie/darknet/master/data/dog.jpg"
|> Req.get!(into: File.stream!(img_path))

Load image

img = Evision.imread(img_path)
{height, width, _} = Evision.Mat.shape(img)
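
To preview the image inside the notebook, one option is to encode the Mat and hand the binary to Kino. This is a sketch under the assumption that Evision.imencode/2 returns the encoded binary directly, which should hold for recent Evision releases:

# Encode the Mat as PNG and render it inline with Kino
png = Evision.imencode(".png", img)
Kino.Image.new(png, :png)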

Detect objects

blob = Evision.DNN.blobFromImage(img, size: {608, 608}, swapRB: true, crop: false)
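
blobFromImage packs the resized image into an NCHW blob, so its shape should be {1, 3, 608, 608}. A quick check using Evision.Mat.shape/1, which is already used above:

# The blob is laid out as {batch, channels, height, width}
Evision.Mat.shape(blob)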

predictions =
  net
  |> Evision.DNN.Net.setInput(
    blob,
    name: "",
    scalefactor: 1 / 255,
    mean: {0, 0, 0}
  )
  |> Evision.DNN.Net.forward(outBlobNames: out_names)
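
forward returns one output blob per YOLO output layer. Each blob has one row per candidate box and 85 columns: 4 box values (center x, center y, width, height), an objectness score, and 80 class scores. A quick sketch for inspecting the shapes:

# Three output blobs, one per detection scale, each shaped {rows, 85}
Enum.map(predictions, &Evision.Mat.shape/1)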

Format predictions

score_threshold = 0.8

formed_predictions =
  predictions
  # Convert each output blob to an Nx tensor
  |> Enum.map(&Evision.Mat.to_nx(&1, Nx.BinaryBackend))
  # Concatenate them into a single tensor
  |> Nx.concatenate()
  # Split into single-row batches
  |> Nx.to_batched(1)
  # Index [4] holds the objectness score, so drop candidates at or below the threshold
  |> Enum.filter(fn t ->
    t[0][4]
    |> Nx.to_number()
    |> Kernel.>(score_threshold)
  end)
  |> Enum.map(fn t ->
    # Indices [5] and onward hold the per-class scores, so take the highest one
    class_score_list = t[0][5..-1//1]
    class_id = class_score_list |> Nx.argmax() |> Nx.to_number()
    class_score = class_score_list[class_id] |> Nx.to_number()
    score = t[0][4] |> Nx.to_number() |> Kernel.*(class_score)

    # Indices [0] to [3] hold the box coordinates
    # Convert from center + size to top-left / bottom-right values
    center_x = t[0][0] |> Nx.to_number()
    center_y = t[0][1] |> Nx.to_number()
    box_width = t[0][2] |> Nx.to_number()
    box_height = t[0][3] |> Nx.to_number()
    min_x = center_x - box_width / 2
    min_y = center_y - box_height / 2
    max_x = center_x + box_width / 2
    max_y = center_y + box_height / 2

    box = {min_x, min_y, max_x, max_y}

    # Store the result in a map
    %{
      box: box,
      score: score,
      class: class_id
    }
  end)
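
To get a feel for the intermediate result, the sketch below counts the candidates that survived the objectness filter and shows a small sample; it uses only formed_predictions from above:

# Count the remaining candidates and peek at the first few maps
IO.inspect(length(formed_predictions), label: "candidates above threshold")
Enum.take(formed_predictions, 3)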

Non-Maximum Suppression

box_list = Enum.map(formed_predictions, & &1.box)
score_list = Enum.map(formed_predictions, & &1.score)

nms_threshold = 0.7

index_list = Evision.DNN.nmsBoxes(box_list, score_list, score_threshold, nms_threshold)
selected_predictions = Enum.map(index_list, &Enum.at(formed_predictions, &1))
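
nmsBoxes returns the indices of the boxes to keep, so selected_predictions holds one entry per final detection. The sketch below pairs each of them with its human-readable label, using only plain Elixir on the variables defined above:

# Show the label and rounded confidence for each detection kept by NMS
Enum.map(selected_predictions, fn prediction ->
  {Enum.at(label_list, prediction.class), Float.round(prediction.score, 3)}
end)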

Draw predictions

selected_predictions
|> Enum.reduce(img, fn prediction, drawed_mat ->
  # Scale the normalized coordinates by the image size
  {min_x, min_y, max_x, max_y} = prediction.box
  left = trunc(min_x * width)
  top = trunc(min_y * height)
  right = trunc(max_x * width)
  bottom = trunc(max_y * height)

  # Look up the label for the predicted class ID
  label = Enum.at(label_list, prediction.class)

  drawed_mat
  # Draw the bounding box
  |> Evision.rectangle(
    {left, top},
    {right, bottom},
    {255, 0, 0},
    thickness: 4
  )
  # Write the label text
  |> Evision.putText(
    label,
    {left + 6, top + 26},
    Evision.Constant.cv_FONT_HERSHEY_SIMPLEX(),
    0.8,
    {0, 0, 255},
    thickness: 2
  )
end)
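
Evaluating the cell above returns the annotated Mat, which recent Evision versions render inline when Kino is available. To also keep a copy on disk, one option is to bind the pipeline's return value to a name and pass it to Evision.imwrite/2; result_img and the output path below are assumptions for illustration:

# `result_img` stands for the Mat returned by the drawing pipeline above
# (for example by prefixing that cell with `result_img =`); the path is arbitrary
Evision.imwrite("/tmp/dog_result.jpg", result_img)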