forked from phoenix-oss/llama-stack-mirror
		
	Remove request arg from chat completion response processing (#240)
Signed-off-by: Yuan Tang <terrytangyuan@gmail.com>
This commit is contained in:
		
							parent
							
								
									209cd3d35e
								
							
						
					
					
						commit
						80ada04f76
					
				
					 7 changed files with 14 additions and 18 deletions
				
			
		|  | @@ -116,7 +116,7 @@ class _HfAdapter(Inference, ModelsProtocolPrivate): | |||
|         response = OpenAICompatCompletionResponse( | ||||
|             choices=[choice], | ||||
|         ) | ||||
|-        return process_chat_completion_response(request, response, self.formatter) | ||||
|+        return process_chat_completion_response(response, self.formatter) | ||||
| 
 | ||||
|     async def _stream_chat_completion( | ||||
|         self, request: ChatCompletionRequest | ||||
|  | @@ -135,7 +135,7 @@ class _HfAdapter(Inference, ModelsProtocolPrivate): | |||
| 
 | ||||
|         stream = _generate_and_convert_to_openai_compat() | ||||
|         async for chunk in process_chat_completion_stream_response( | ||||
|-            request, stream, self.formatter | ||||
|+            stream, self.formatter | ||||
|         ): | ||||
|             yield chunk | ||||
| 
 | ||||
|  |  | |||
		Loading…
	
	Add table
		Add a link
		
	
		Reference in a new issue