commit 5bfd107 (1 parent: d9054c6)
lightrag/llm.py
@@ -268,7 +268,7 @@ async def hf_model_if_cache(
     ).to("cuda")
     inputs = {k: v.to(hf_model.device) for k, v in input_ids.items()}
     output = hf_model.generate(
-        **input_ids, max_new_tokens=200, num_return_sequences=1, early_stopping=True
+        **input_ids, max_new_tokens=512, num_return_sequences=1, early_stopping=True
     )
     response_text = hf_tokenizer.decode(output[0][len(inputs["input_ids"][0]):], skip_special_tokens=True)
     if hashing_kv is not None:
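
For context, here is a minimal standalone sketch of the generation step this hunk modifies, using the standard transformers API. The model name and prompt below are placeholder assumptions, not taken from the commit; LightRAG wires the real model, tokenizer, and prompt up elsewhere in hf_model_if_cache.

# Minimal sketch of the generation step touched by this commit.
# Assumptions: model_name and input_prompt are placeholders.
from transformers import AutoModelForCausalLM, AutoTokenizer

model_name = "meta-llama/Llama-2-7b-chat-hf"  # hypothetical choice
hf_tokenizer = AutoTokenizer.from_pretrained(model_name)
hf_model = AutoModelForCausalLM.from_pretrained(model_name).to("cuda")

input_prompt = "Summarize the following passage: ..."  # placeholder
input_ids = hf_tokenizer(
    input_prompt, return_tensors="pt", padding=True, truncation=True
).to("cuda")

# The raised cap (512 vs. 200 new tokens) lets longer completions
# finish instead of being truncated mid-sentence.
output = hf_model.generate(
    **input_ids, max_new_tokens=512, num_return_sequences=1, early_stopping=True
)

# Decode only the newly generated tokens, skipping the echoed prompt.
response_text = hf_tokenizer.decode(
    output[0][len(input_ids["input_ids"][0]):], skip_special_tokens=True
)
print(response_text)

Presumably the change trades a little extra latency and VRAM per call for completeness: 200 new tokens is easily exhausted by the long structured outputs these prompts request, while 512 leaves room for them to finish.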