Merge pull request #58 from BBuf/patch-1

Avoid computing model initialization time
pull/65/head
Qinkai 2 years ago committed by GitHub
commit 95041530a0
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

@@ -137,6 +137,7 @@ def main():
if args.quantize:
model = quantize(model, weight_bit_width=8, backend="torch")
model.cuda()
torch.cuda.synchronize()
with open(args.prompt_file, "r") as f:
prompt = f.readlines()

Loading…
Cancel
Save