facebookresearch · vladkalinichencko · Jan 13, 2024 · Jan 13, 2024 · Jan 13, 2024 · Jan 13, 2024
diff --git a/README.md b/README.md
@@ -50,7 +50,7 @@ $ nougat path/to/directory -o output_directory
 
 ```
 usage: nougat [-h] [--batchsize BATCHSIZE] [--checkpoint CHECKPOINT] [--model MODEL] [--out OUT]
-              [--recompute] [--markdown] [--no-skipping] pdf [pdf ...]
+              [--recompute] [--markdown] [--no-skipping] [--device-index DEVICE_INDEX] pdf [pdf ...]
 
 positional arguments:
   pdf                   PDF(s) to process.

diff --git a/nougat/model.py b/nougat/model.py
@@ -266,7 +266,7 @@ def __init__(
                     ]
                 else:
                     new_bart_state_dict[x] = bart_state_dict[x]
-            self.model.load_state_dict(new_bart_state_dict, strict=False)
+            self.model.load_state_dict(new_bart_state_dict)
 
     def add_special_tokens(self, list_of_tokens: List[str]):
         """

diff --git a/nougat/utils/device.py b/nougat/utils/device.py
@@ -24,15 +24,29 @@ def default_batch_size():
         logging.warning("No GPU found. Conversion on CPU is very slow.")
     return batch_size
 
 
-def move_to_device(model, bf16: bool = True, cuda: bool = True):
-    try:
-        if torch.backends.mps.is_available():
-            return model.to("mps")
-    except AttributeError:
-        pass
-    if bf16:
-        model = model.to(torch.bfloat16)
-    if cuda and torch.cuda.is_available():
-        model = model.to("cuda")
-    return model
+def move_to_device(model, bf16: bool = True, cuda: bool = True, device_index: int = 0):
+    """
+    Move the model to the preferred accelerator and return it.
+
+    Args:
+        model: Object exposing ``.to(...)``; the result of those calls is returned.
+        bf16 (bool): Cast the model to ``torch.bfloat16`` (skipped when MPS is used).
+        cuda (bool): Move the model to a CUDA device when one is available.
+        device_index (int): Index of the CUDA device to use. Unused on MPS or CPU.
+
+    Returns:
+        The model after the applicable ``.to(...)`` calls.
+    """
+    try:
+        # MPS takes priority: return right away, without the bf16 cast or CUDA move.
+        if torch.backends.mps.is_available():
+            return model.to("mps")
+    except AttributeError:
+        # `torch.backends.mps` could not be resolved; fall through to bf16/CUDA.
+        pass
+    if bf16:
+        model = model.to(torch.bfloat16)
+    if cuda and torch.cuda.is_available():
+        model = model.to(f"cuda:{device_index}")
+    return model
diff --git a/predict.py b/predict.py
@@ -82,6 +82,12 @@ def get_args():
         type=str,
         help="Provide page numbers like '1-4,7' for pages 1 through 4 and page 7. Only works for single PDF input.",
     )
+    parser.add_argument(
+        "--device-index",
+        type=int,
+        default=0,
+        help="Index of the preferred GPU device.",
+    )
     parser.add_argument("pdf", nargs="+", type=Path, help="PDF(s) to process.")
     args = parser.parse_args()
     if args.checkpoint is None or not args.checkpoint.exists():
@@ -125,7 +131,7 @@ def get_args():
 def main():
     args = get_args()
     model = NougatModel.from_pretrained(args.checkpoint)
-    model = move_to_device(model, bf16=not args.full_precision, cuda=args.batchsize > 0)
+    model = move_to_device(model, bf16=not args.full_precision, cuda=args.batchsize > 0, device_index=args.device_index)
     if args.batchsize <= 0:
         # set batch size to 1. Need to check if there are benefits for CPU conversion for >1
         args.batchsize = 1