Skip to content

Commit

Permalink
forgot fill
Browse files: browse the repository at this point in the history
  • Loading branch information
Tristan Konolige committed May 13, 2022
1 parent de4b825 commit bd758eb
Showing 1 changed file with 1 addition and 0 deletions.
1 change: 1 addition & 0 deletions python/tvm/utils/roofline.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -175,6 +175,7 @@ def estimate_peak_fma_flops(
assert random_fill, "Please make sure USE_RANDOM is ON in config.cmake"

a = nd.empty((nthreads, num_vector_registers, vec_width), dtype="float32", device=dev)
random_fill(a)
times = f.time_evaluator(f.entry_name, dev, repeat=100, number=1)(a)
flops = 2 * vec_width * num_vector_registers * nthreads * iters # fma is two flops
flop_s = flops / times.min
Expand Down

0 comments on commit bd758eb

Please sign in to comment.