commit 5bfd107 (1 parent: d9054c6)
lightrag/llm.py
@@ -268,7 +268,7 @@ async def hf_model_if_cache(
     ).to("cuda")
     inputs = {k: v.to(hf_model.device) for k, v in input_ids.items()}
     output = hf_model.generate(
-        **input_ids, max_new_tokens=200, num_return_sequences=1, early_stopping=True
+        **input_ids, max_new_tokens=512, num_return_sequences=1, early_stopping=True
     )
     response_text = hf_tokenizer.decode(output[0][len(inputs["input_ids"][0]):], skip_special_tokens=True)
     if hashing_kv is not None:
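
For context, here is a minimal standalone sketch of the generation step this hunk modifies, using the standard transformers API. The model name and prompt below are placeholder assumptions, not taken from the commit; LightRAG wires the real model, tokenizer, and prompt up elsewhere in hf_model_if_cache.

# Minimal sketch of the generation step touched by this commit.
# Assumptions: model_name and input_prompt are placeholders.
from transformers import AutoModelForCausalLM, AutoTokenizer

model_name = "meta-llama/Llama-2-7b-chat-hf"  # hypothetical choice
hf_tokenizer = AutoTokenizer.from_pretrained(model_name)
hf_model = AutoModelForCausalLM.from_pretrained(model_name).to("cuda")

input_prompt = "Summarize the following passage: ..."  # placeholder
input_ids = hf_tokenizer(
    input_prompt, return_tensors="pt", padding=True, truncation=True
).to("cuda")

# The raised cap (512 vs. 200 new tokens) lets longer completions
# finish instead of being truncated mid-sentence.
output = hf_model.generate(
    **input_ids, max_new_tokens=512, num_return_sequences=1, early_stopping=True
)

# Decode only the newly generated tokens, skipping the echoed prompt.
response_text = hf_tokenizer.decode(
    output[0][len(input_ids["input_ids"][0]):], skip_special_tokens=True
)
print(response_text)

Presumably the change trades a little extra latency and VRAM per call for completeness: 200 new tokens is easily exhausted by the long structured outputs these prompts request, while 512 leaves room for them to finish.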