Skip to content

Commit

Permalink
make dtype selection a function of host and device (#768)
Browse files Browse the repository at this point in the history
* address #651 by making dtype selection a function of host and device

* fix typo

* typo

* typo
  • Loading branch information
mikekgfb authored May 13, 2024
1 parent 262d5de commit 49651ab
Show file tree
Hide file tree
Showing 4 changed files with 10 additions and 5 deletions.
2 changes: 1 addition & 1 deletion .github/workflows/run-readme-pr-mps.yml
Original file line number Diff line number Diff line change
Expand Up @@ -56,7 +56,7 @@ jobs:
conda activate test-quantization-mps-macos
# NS: Remove previous installation of torch first
# as this script does not install anything into conda env
#but rather system dep
#but rather system dep
pip3 uninstall -y torch || true
set -eou pipefail
Expand Down
5 changes: 4 additions & 1 deletion build/builder.py
Original file line number Diff line number Diff line change
Expand Up @@ -120,11 +120,14 @@ def from_args(cls, args): # -> BuilderArgs:

if args.output_pte_path and args.dtype.startswith("fast"):
if args.dtype == "fast":
# As per Kimish, float32 should be faster on ET XNNPACK
# (because fp16 is implemented as upcast to fp32 for several
# operators, and in particular a8w4dq and ET's sdpa+kv)
dtype = torch.float32
else:
dtype = torch.float16
else:
dtype = name_to_dtype(args.dtype)
dtype = name_to_dtype(args.dtype, args.device)

return cls(
checkpoint_dir=checkpoint_dir,
Expand Down
6 changes: 4 additions & 2 deletions build/utils.py
Original file line number Diff line number Diff line change
Expand Up @@ -130,13 +130,15 @@ def get_precision():
### dtype name to torch.dtype mapping ###


def name_to_dtype(name):
def name_to_dtype(name, device):
if (name == "fast") or (name == "fast16"):
# MacOS now supports bfloat16
import platform

if platform.processor() == "arm":
if int(platform.mac_ver()[0].split(".")[0]) < 14:
device=get_device_str(device)
# ARM CPU is faster with float16, MPS with bf16 if supported
if device == "cpu" or int(platform.mac_ver()[0].split(".")[0]) < 14:
return torch.float16
return torch.bfloat16

Expand Down
2 changes: 1 addition & 1 deletion quantize.py
Original file line number Diff line number Diff line change
Expand Up @@ -93,7 +93,7 @@ def __init__(self, model: nn.Module, device="cpu", tokenizer=None, *, dtype):
self.tokenizer = tokenizer

if isinstance(dtype, str):
dtype = name_to_dtype(dtype)
dtype = name_to_dtype(dtype, device)
self.dtype = dtype

def create_quantized_state_dict(self) -> Dict: # "StateDict"
Expand Down

0 comments on commit 49651ab

Please sign in to comment.