Skip to content

Commit ce3c09d

Browse files
import proposer from nlp
1 parent e3bc5aa commit ce3c09d

2 files changed

Lines changed: 2 additions & 95 deletions

File tree

llm/server/server/engine/infer.py

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -29,7 +29,7 @@
29 29
from paddlenlp_ops import step_paddle, speculate_step_paddle
30 30
from server.data.processor import DataProcessor
31 31
from server.engine.config import Config
32-
from server.engine.proposers import InferenceWithReferenceProposer
32+
from paddlenlp.experimental.transformers import InferenceWithReferenceProposer
33 33
from server.utils import get_logger
34 34
from task_queue_manager import TaskQueueManager
35 35

@@ -518,6 +518,7 @@ def run(self):
518 518
self.share_inputs['infer_seed'].add_(infer_seed_increment)
519 519
self.share_inputs['infer_seed'][:] %= self.MAX_INFER_SEED
520 520
if self.free_list_len > 0:
521+
logger.info('You got into step CUDA!!!')
521 522
self.step_cuda(seq_lens_this_time)
522 523

523 524

llm/server/server/engine/proposers.py

Lines changed: 0 additions & 94 deletions
This file was deleted.

0 commit comments

Comments
 (0)