File tree Expand file tree Collapse file tree 1 file changed +13
-2
lines changed Expand file tree Collapse file tree 1 file changed +13
-2
lines changed Original file line number Diff line number Diff line change @@ -275,6 +275,7 @@ def _create_completion(
275
275
repeat_penalty : float = 1.1 ,
276
276
top_k : int = 40 ,
277
277
stream : bool = False ,
278
+ interactive : bool = False ,
278
279
) -> Union [
279
280
Generator [Completion , None , None ],
280
281
Generator [CompletionChunk , None , None ],
@@ -299,13 +300,23 @@ def _create_completion(
299
300
stop_sequences = []
300
301
301
302
finish_reason = None
302
- for token in self .generate (
303
+ if interactive :
304
+ self ._session = self .generate (
305
+ prompt_tokens ,
306
+ top_k = top_k ,
307
+ top_p = top_p ,
308
+ temp = temperature ,
309
+ repeat_penalty = repeat_penalty ,)
310
+ session = self ._session
311
+ else :
312
+ session = self .generate (
303
313
prompt_tokens ,
304
314
top_k = top_k ,
305
315
top_p = top_p ,
306
316
temp = temperature ,
307
317
repeat_penalty = repeat_penalty ,
308
- ):
318
+ )
319
+ for token in session :
309
320
if token == llama_cpp .llama_token_eos ():
310
321
text = self .detokenize (completion_tokens )
311
322
finish_reason = "stop"
You can’t perform that action at this time.
0 commit comments