Refactor VLM module for minicpm and molmo #2794

Merged 43 commits on Nov 22, 2024
Commits (43):
c40a8ae qwen2-vl (lvhan028, Nov 17, 2024)
e24b303 internvl (lvhan028, Nov 18, 2024)
dcc454b qwen2 (lvhan028, Nov 18, 2024)
8407d57 get image_tokens_per_patch for internvl2 (lvhan028, Nov 18, 2024)
ba1ae5a merge refactor-vl (lvhan028, Nov 18, 2024)
676c23f deepseek-vl (lvhan028, Nov 18, 2024)
e7319c0 cogvlm (lvhan028, Nov 18, 2024)
cc9a4eb glm4v (lvhan028, Nov 18, 2024)
b416a26 update internvl (lvhan028, Nov 18, 2024)
086eed8 internvl_llava (lvhan028, Nov 18, 2024)
da86bbe llava (lvhan028, Nov 19, 2024)
98dde7b glm4v (lvhan028, Nov 19, 2024)
5a06515 upate internvl (lvhan028, Nov 19, 2024)
4daf4e3 cogvlm (lvhan028, Nov 19, 2024)
a45ddf4 deepseek (lvhan028, Nov 19, 2024)
2b8b053 llava_hf (lvhan028, Nov 19, 2024)
9cff378 rollback llava, internvl-llava (lvhan028, Nov 19, 2024)
09ebaf6 Merge branch 'refactor-vl' into refactor-vl-for-tm (lvhan028, Nov 19, 2024)
1132018 refactor qwen (lvhan028, Nov 19, 2024)
32a5433 update internvl (lvhan028, Nov 19, 2024)
61ad4a6 update llava_hf (lvhan028, Nov 19, 2024)
e034874 update qwen2-vl (lvhan028, Nov 19, 2024)
e6c8a1a llava_next (lvhan028, Nov 20, 2024)
a9493eb update llava_next (lvhan028, Nov 20, 2024)
8212da5 update llava (lvhan028, Nov 20, 2024)
1a87001 update llava (lvhan028, Nov 20, 2024)
5f47aa6 update llava (lvhan028, Nov 20, 2024)
d958a1e Merge branch 'refactor-vl' into refactor-vl-for-tm (lvhan028, Nov 20, 2024)
32cd694 qwen2 (lvhan028, Nov 20, 2024)
b9c8581 Merge branch 'refactor-vl' into refactor-vl-for-tm (lvhan028, Nov 20, 2024)
c7e8c53 fix internvl (lvhan028, Nov 20, 2024)
e8eae01 phi3-vision (lvhan028, Nov 20, 2024)
e3a08ca Merge branch 'refactor-vl' into refactor-vl-for-tm (lvhan028, Nov 20, 2024)
36bffac refactor yi-vl (lvhan028, Nov 20, 2024)
8b0f049 refactor mllama (lvhan028, Nov 20, 2024)
13ee140 Merge branch 'refactor-vl' into refactor-vl-for-tm (lvhan028, Nov 20, 2024)
d494e18 molmo (lvhan028, Nov 21, 2024)
6c70392 minicpm 2.5 (lvhan028, Nov 21, 2024)
78ddc76 update minicpm2.6 (lvhan028, Nov 22, 2024)
ddc77a5 update (lvhan028, Nov 22, 2024)
3937904 Merge branch 'refactor-vl' into refactor-vl-for-tm (lvhan028, Nov 22, 2024)
a3e95de fix (lvhan028, Nov 22, 2024)
0823a5c fix molmo (lvhan028, Nov 22, 2024)
lmdeploy/vl/engine.py (16 changes: 14 additions & 2 deletions)

@@ -246,10 +246,10 @@ async def async_infer(self, messages: List[Dict]) -> List[Dict]:
         assert isinstance(messages, List)
         assert all(isinstance(item, Dict) for item in messages)
         for i, message in enumerate(messages):
-            preprocess = message.pop('preprocess', None)
+            preprocess = message['preprocess']
             if preprocess:
                 result = self.model.forward(preprocess)
-                messages[i].update(preprocess=result)
+                messages[i].update(forward=result)
         return messages
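The hunk above changes how vision outputs travel through the message dicts: the preprocess results are no longer popped and overwritten, and the model's forward results are stored under a separate 'forward' key. A minimal sketch of that behavior, using a stub engine and stub model rather than the real lmdeploy classes:

```python
# Illustrative sketch (not lmdeploy code): stub classes showing how the
# refactored async_infer reads 'preprocess' and stores model outputs under
# the separate 'forward' key instead of overwriting 'preprocess'.
import asyncio
from typing import Dict, List


class StubVisionModel:
    def forward(self, inputs):
        # Pretend each preprocessed image yields one feature.
        return [f'feature-of-{x}' for x in inputs]


class StubEngine:
    def __init__(self):
        self.model = StubVisionModel()

    async def async_infer(self, messages: List[Dict]) -> List[Dict]:
        assert isinstance(messages, List)
        assert all(isinstance(item, Dict) for item in messages)
        for i, message in enumerate(messages):
            preprocess = message['preprocess']
            if preprocess:
                result = self.model.forward(preprocess)
                messages[i].update(forward=result)
        return messages


messages = [{'role': 'user', 'preprocess': ['img0', 'img1']}]
out = asyncio.run(StubEngine().async_infer(messages))
print(out[0]['forward'])       # ['feature-of-img0', 'feature-of-img1']
print('preprocess' in out[0])  # True: the key is no longer popped here
```

Keeping 'preprocess' intact while adding 'forward' lets later stages (such as the to_turbomind_aux helper changed below in base.py) consume the forward results by key without the two stages clobbering each other.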

async def wrap_for_pytorch(self, messages: List[Dict], chat_template,
Expand All @@ -275,5 +275,17 @@ async def wrap_for_pytorch(self, messages: List[Dict], chat_template,

async def wrap_for_turbomind(self, messages: List[Dict], chat_template,
tokenizer, sequence_start) -> Dict:
"""
Args:
messages (List[Dict]): a list of message, which is supposed to be
the output of `async_infer`
Returns:
a dict which will be passed to pytorch engine_instance's forward.
The dict is like the following:
Dict(
'prompt': 'the prompt after applying chat template'
'input_ids': [],

"""
return self.model.to_turbomind(messages, chat_template, tokenizer,
sequence_start)
lmdeploy/vl/model/base.py (4 changes: 2 additions & 2 deletions)

@@ -149,8 +149,8 @@ def to_turbomind_aux(cls, messages, prompt, IMAGE_TOKEN, tokenizer,
                         sequence_start):
         # collect image features from messages
         features = [
-            message.pop('preprocess') for message in messages
-            if 'preprocess' in message.keys()
+            message.pop('forward') for message in messages
+            if 'forward' in message.keys()
         ]
         # flatten the list
         features = list(itertools.chain(*features))
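The base.py hunk switches the key that to_turbomind_aux collects from 'preprocess' to 'forward', matching the engine.py change. A standalone sketch of that collect-and-flatten step, with made-up message data in place of real feature tensors:

```python
# Illustrative sketch (not lmdeploy code): gather per-message 'forward'
# results and flatten them into a single feature list, as in the changed
# to_turbomind_aux hunk. The message contents here are made up.
import itertools

messages = [
    {'role': 'user', 'forward': ['feat-a', 'feat-b']},
    {'role': 'assistant'},                    # no vision features
    {'role': 'user', 'forward': ['feat-c']},
]

# collect image features from messages (pop removes the key as it goes)
features = [
    message.pop('forward') for message in messages
    if 'forward' in message.keys()
]
# flatten the list of per-message feature lists into one flat list
features = list(itertools.chain(*features))
print(features)  # ['feat-a', 'feat-b', 'feat-c']
```

Because the comprehension uses pop, each message is consumed exactly once: after this step no message still carries a 'forward' entry, so the features cannot be collected twice.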