Update README.md

2026-03-07 22:33:47 +00:00 · 2023-09-14 21:29:06 -05:00
parent 57c2b6eee3
commit 2c4eec6aa8
1 changed files with 2 additions and 1 deletions
--- a/anima_100k/README.md
+++ b/anima_100k/README.md
@@ -184,7 +184,8 @@ inputs['attention_mask'] = inputs['attention_mask'].cuda()

 # Generate
 generate_ids = model.generate(**inputs, max_new_tokens=30,
-                       only_last_logit=True,
+                       only_last_logit=True, # to save memory
+                       use_cache=False, # if you run into OOM, setting use_cache=False can save memory
                       xentropy=True)
 output = tokenizer.batch_decode(generate_ids, 
                                skip_special_tokens=True,