Xiangyu Tian
								
							 
						 | 
						
							
							
								
								
							
							
							
								
							
							
								11550d3f25
								
							
						 | 
						
							
							
								
								LLM: Add length check for IPEX-CPU speculative decoding  (#10529)
							
							
							
							
							
							
							
							Add length check for IPEX-CPU speculative decoding. 
							
						 | 
						
							2024-03-26 17:47:10 +08:00 | 
						
						
							
							
							
								
							
							
						 | 
					
				
					
						
							
								
								
									 
									Guancheng Fu
								
							 
						 | 
						
							
							
								
								
							
							
							
								
							
							
								a3b007f3b1
								
							
						 | 
						
							
							
								
								[Serving] Fix fastchat breaks (#10548)
							
							
							
							
							
							
							
							* fix fastchat
* fix doc 
							
						 | 
						
							2024-03-26 17:03:52 +08:00 | 
						
						
							
							
							
								
							
							
						 | 
					
				
					
						
							
								
								
									 
									Yishuo Wang
								
							 
						 | 
						
							
							
								
								
							
							
							
								
							
							
								69a28d6b4c
								
							
						 | 
						
							
							
								
								fix chatglm (#10540)
							
							
							
							
							
						 | 
						
							2024-03-26 16:01:00 +08:00 | 
						
						
							
							
							
								
							
							
						 | 
					
				
					
						
							
								
								
									 
									binbin Deng
								
							 
						 | 
						
							
							
								
								
							
							
							
								
							
							
								0a3e4e788f
								
							
						 | 
						
							
							
								
								LLM: fix mistral hidden_size setting for deepspeed autotp (#10527)
							
							
							
							
							
						 | 
						
							2024-03-26 10:55:44 +08:00 | 
						
						
							
							
							
								
							
							
						 | 
					
				
					
						
							
								
								
									 
									Xin Qiu
								
							 
						 | 
						
							
							
								
								
							
							
							
								
							
							
								1dd40b429c
								
							
						 | 
						
							
							
								
								enable fp4 fused mlp and qkv (#10531)
							
							
							
							
							
							
							
							* enable fp4 fused mlp and qkv
* update qwen
* update qwen2 
							
						 | 
						
							2024-03-26 08:34:00 +08:00 | 
						
						
							
							
							
								
							
							
						 | 
					
				
					
						
							
								
								
									 
									Wang, Jian4
								
							 
						 | 
						
							
							
								
								
							
							
							
								
							
							
								16b2ef49c6
								
							
						 | 
						
							
							
								
								Update_document by heyang (#30)
							
							
							
							
							
						 | 
						
							2024-03-25 10:06:02 +08:00 | 
						
						
							
							
							
								
							
							
						 | 
					
				
					
						
							
								
								
									 
									Wang, Jian4
								
							 
						 | 
						
							
							
								
								
							
							
							
								
							
							
								a1048ca7f6
								
							
						 | 
						
							
							
								
								Update setup.py and add new actions and add compatible mode (#25)
							
							
							
							
							
							
							
							* update setup.py
* add new action
* add compatible mode 
							
						 | 
						
							2024-03-22 15:44:59 +08:00 | 
						
						
							
							
							
								
							
							
						 | 
					
				
					
						
							
								
								
									 
									Wang, Jian4
								
							 
						 | 
						
							
							
								
								
							
							
							
								
							
							
								9df70d95eb
								
							
						 | 
						
							
							
								
								Refactor bigdl.llm to  ipex_llm (#24)
							
							
							
							
							
							
							
							* Rename bigdl/llm to ipex_llm
* rm python/llm/src/bigdl
* from bigdl.llm to from ipex_llm 
							
						 | 
						
							2024-03-22 15:41:21 +08:00 | 
						
						
							
							
							
								
							
							
						 |