Yuwen Hu 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								643458d8f0 
								
							 
						 
						
							
							
								
								Update GraphRAG QuickStart ( #11995 )  
							
							 
							
							... 
							
							
							
							* Update GraphRAG QuickStart
* Further updates
* Small fixes
* Small fix 
							
						 
						
							2024-09-03 15:52:08 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									binbin Deng 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								01099f08ee 
								
							 
						 
						
							
							
								
								Revert prefill logic of qwen2-7b ( #11992 )  
							
							 
							
							
							
						 
						
							2024-09-03 14:45:01 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Yuwen Hu 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								659d15defc 
								
							 
						 
						
							
							
								
								Fix wrong attention mask and garbage output for inputs_embeds inputs during lookup generation ( #11989 )  
							
							 
							
							... 
							
							
							
							* Fix garbage output for input_embeds inputs during lookup generation
* Fix on sliding windows
* Simplify code 
							
						 
						
							2024-09-02 19:09:12 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									binbin Deng 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								2f3d1bd0ec 
								
							 
						 
						
							
							
								
								hotfix qwen2-7b weight setting ( #11991 )  
							
							 
							
							
							
						 
						
							2024-09-02 18:11:08 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									binbin Deng 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								a40ea7038d 
								
							 
						 
						
							
							
								
								Fix AttributeError of qwen2-1.5B ( #11990 )  
							
							 
							
							
							
						 
						
							2024-09-02 17:55:10 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Yang Wang 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								c48817bd43 
								
							 
						 
						
							
							
								
								Support Qwen2-7b MLP in int4 and transpose_value_cache=True ( #11968 )  
							
							 
							
							
							
						 
						
							2024-09-02 14:37:44 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Jin, Qiao 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								65e281bb29 
								
							 
						 
						
							
							
								
								Add MiniCPM-V cpu example ( #11975 )  
							
							 
							
							... 
							
							
							
							* Add MiniCPM-V cpu example
* fix
* fix
* fix
* fix 
							
						 
						
							2024-09-02 10:17:57 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Ruonan Wang 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								79978e6f36 
								
							 
						 
						
							
							
								
								update npu multimodal readme ( #11979 )  
							
							 
							
							... 
							
							
							
							* update npu readme of multimodal
* small fix
* meet comment 
							
						 
						
							2024-08-30 19:02:06 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Ruonan Wang 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								4811a490ef 
								
							 
						 
						
							
							
								
								small fix ( #11978 )  
							
							 
							
							... 
							
							
							
							* fix
* meet comment 
							
						 
						
							2024-08-30 17:55:15 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Ruonan Wang 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								573c20bae6 
								
							 
						 
						
							
							
								
								fix npu lm_head cpu condition ( #11976 )  
							
							 
							
							... 
							
							
							
							* fix
* fix
* fix
* fix style
* fix style
* fix style 
							
						 
						
							2024-08-30 17:11:26 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Ruonan Wang 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								60aa1a2c0f 
								
							 
						 
						
							
							
								
								Initial NPU support for MiniCPM-V-2_6 ( #11966 )  
							
							 
							
							... 
							
							
							
							* initial pr
* update npu model
* fix
* fix kv cache type
* fix
* small fix
* fix style
* fix model id
* change inter_pp=4
* address comment
* fix
* fix style
* fix
* rebase 
							
						 
						
							2024-08-30 16:34:35 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									SONG Ge 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								158289d205 
								
							 
						 
						
							
							
								
								[NPU] Add initial support for minicpm-llama-v2.5 ( #11962 )  
							
							 
							
							... 
							
							
							
							* add initial support for minicpm-llama-v2.5
* update impl
* add minicpm-llama3-v2.5 example 
							
						 
						
							2024-08-30 16:00:33 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Chu,Youcheng 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								ae7302a654 
								
							 
						 
						
							
							
								
								add gptq option for ppl test ( #11921 )  
							
							 
							
							... 
							
							
							
							* feat:add gptq for ppl
* fix: add an empty line
* fix: add an empty line
* fix: remove an empty line
* Resolve comments
* Resolve comments
* Resolve comments 
							
						 
						
							2024-08-30 13:43:48 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Shaojun Liu 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								1e8c87050f 
								
							 
						 
						
							
							
								
								fix model path ( #11973 )  
							
							 
							
							
							
						 
						
							2024-08-30 13:28:28 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Jinhe 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								e895e1b4c5 
								
							 
						 
						
							
							
								
								modification on llamacpp readme after Ipex-llm latest update ( #11971 )  
							
							 
							
							... 
							
							
							
							* update on readme after ipex-llm update
* update on readme after ipex-llm update
* rebase & delete redundancy
* revise
* add numbers for troubleshooting 
							
						 
						
							2024-08-30 11:36:45 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									binbin Deng 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								cd077881f1 
								
							 
						 
						
							
							
								
								Disable lm head ( #11972 )  
							
							 
							
							
							
						 
						
							2024-08-30 11:05:18 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Wang, Jian4 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								7d103417b8 
								
							 
						 
						
							
							
								
								Fix glm4-9b-chat nan error on vllm 0.3.3 ( #11970 )  
							
							 
							
							... 
							
							
							
							* fix nan value
* update 
							
						 
						
							2024-08-30 09:50:18 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Ch1y0q 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								77b04efcc5 
								
							 
						 
						
							
							
								
								add notes for SYCL_PI_LEVEL_ZERO_USE_IMMEDIATE_COMMANDLISTS ( #11936 )  
							
							 
							
							... 
							
							
							
							* add notes for `SYCL_PI_LEVEL_ZERO_USE_IMMEDIATE_COMMANDLISTS`
* also update other quickstart 
							
						 
						
							2024-08-30 09:26:47 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Yang Wang 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								fbf088f61e 
								
							 
						 
						
							
							
								
								remove obsolete npu code ( #11967 )  
							
							 
							
							
							
						 
						
							2024-08-29 14:16:44 -07:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Yuwen Hu 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								a9e485eb1b 
								
							 
						 
						
							
							
								
								Support MiniCPM-V-2_6 multi-modal benchmarking with latency text streamer ( #11963 )  
							
							 
							
							... 
							
							
							
							* Support MiniCPM-V-2_6 multi-modal benchmarking with latency text streamer
* Style fixes 
							
						 
						
							2024-08-29 19:22:09 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Yuwen Hu 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								2e49e1f8e9 
								
							 
						 
						
							
							
								
								Further fix for MiniCPM-V-2_6 example ( #11965 )  
							
							 
							
							
							
						 
						
							2024-08-29 19:14:13 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Jason Dai 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								431affd0a0 
								
							 
						 
						
							
							
								
								Update README.md ( #11964 )  
							
							 
							
							
							
						 
						
							2024-08-29 18:56:35 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									binbin Deng 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								14b2c8dc32 
								
							 
						 
						
							
							
								
								Update qwen2-7b example script ( #11961 )  
							
							 
							
							
							
						 
						
							2024-08-29 18:25:17 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Yuwen Hu 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								7abe17d6f7 
								
							 
						 
						
							
							
								
								Update MiniCPM-V-2_6 Example ( #11958 )  
							
							 
							
							... 
							
							
							
							* Update example scripts regarding warmup, stream generate, modules to not convert, etc.
* Update readme accordingly
* Fix based on comments
* Small fix
* Remove n_predict 
							
						 
						
							2024-08-29 18:23:48 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Jinhe 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								6fc9340d53 
								
							 
						 
						
							
							
								
								restore ollama webui quickstart ( #11955 )  
							
							 
							
							
							
						 
						
							2024-08-29 17:53:19 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Yina Chen 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								5f7ff76ea5 
								
							 
						 
						
							
							
								
								update troubleshooting ( #11960 )  
							
							 
							
							
							
						 
						
							2024-08-29 17:44:22 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Yina Chen 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								882f4a5ff7 
								
							 
						 
						
							
							
								
								Add lnl npu driver recommend version and enable cpu_lm_head on llama3 ( #11952 )  
							
							 
							
							... 
							
							
							
							* update lnl npu driver version and enable cpu_lm_head on llama3
* update
* fix style
* typo
* address comments
* update
* add qwen2-7b 
							
						 
						
							2024-08-29 15:01:18 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									binbin Deng 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								71f03dcc39 
								
							 
						 
						
							
							
								
								Support qwen2-7b with fused decoderlayer optimization on NPU ( #11912 )  
							
							 
							
							
							
						 
						
							2024-08-29 13:34:20 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Jiao Wang 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								63ac5f64bb 
								
							 
						 
						
							
							
								
								Refactor NPU baichuan multiple-process ( #11945 )  
							
							 
							
							... 
							
							
							
							* update
* add baichuan mp
* clean
* refactor
* merge
* style
* update
* update 
							
						 
						
							2024-08-28 11:33:40 -07:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									SONG Ge 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								5ca7390082 
								
							 
						 
						
							
							
								
								[NPU] Add minicpm-2b support for npu multi-processing ( #11949 )  
							
							 
							
							... 
							
							
							
							* add minicpm-2b support
* update example for minicpm-2b
* add LNL NPU driver requirement in readme 
							
						 
						
							2024-08-28 18:08:49 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Yishuo Wang 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								0fbb10259a 
								
							 
						 
						
							
							
								
								use sdp_causal to reduce internvl2-4b memory usage if set environment variable ( #11953 )  
							
							 
							
							
							
						 
						
							2024-08-28 17:35:05 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Guancheng Fu 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								0a7bd274e2 
								
							 
						 
						
							
							
								
								Add vllm awq loading logic ( #11950 )  
							
							 
							
							... 
							
							
							
							* add vllm awq loading logic
* fix
* refine 
							
						 
						
							2024-08-28 16:46:18 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Yina Chen 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								b38fb67bec 
								
							 
						 
						
							
							
								
								[NPU] lm head to cpu ( #11943 )  
							
							 
							
							... 
							
							
							
							* lm head to cpu
* qwen2
* mv logic and add param to disable cpu_lm_head
* use env and lm_head opt to mp file
* fix
* update
* remove print 
							
						 
						
							2024-08-28 16:34:07 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Jinhe 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								ec67ee7177 
								
							 
						 
						
							
							
								
								added accelerate version specification in open webui quickstart ( #11948 )  
							
							 
							
							
							
						 
						
							2024-08-28 15:02:39 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									hxsz1997 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								e23549f63f 
								
							 
						 
						
							
							
								
								Update llamaindex examples ( #11940 )  
							
							 
							
							... 
							
							
							
							* modify rag.py
* update readme of gpu example
* update llamaindex cpu example and readme
* add llamaindex doc
* update note style
* import before instancing IpexLLMEmbedding
* update index in readme
* update links
* update link
* update related links 
							
						 
						
							2024-08-28 14:03:44 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Shaojun Liu 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								23f51f87f0 
								
							 
						 
						
							
							
								
								update tag to 2.2.0-SNAPSHOT ( #11947 )  
							
							 
							
							
							
						 
						
							2024-08-28 09:20:32 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Ruonan Wang 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								460bc96d32 
								
							 
						 
						
							
							
								
								update version of llama.cpp / ollama ( #11930 )  
							
							 
							
							... 
							
							
							
							* update version
* fix version 
							
						 
						
							2024-08-27 21:21:44 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									binbin Deng 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								bec00e2015 
								
							 
						 
						
							
							
								
								Improve baichuan2 NPU performance ( #11942 )  
							
							 
							
							
							
						 
						
							2024-08-27 18:37:08 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Zijie Li 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								90f692937d 
								
							 
						 
						
							
							
								
								Update npu baichuan2 ( #11939 )  
							
							 
							
							
							
						 
						
							2024-08-27 16:56:26 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									binbin Deng 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								7f7f6c89f5 
								
							 
						 
						
							
							
								
								Quick fix benchmark script ( #11938 )  
							
							 
							
							
							
						 
						
							2024-08-27 15:29:27 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Jiao Wang 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								b4b6ddf73c 
								
							 
						 
						
							
							
								
								NPU Baichuan2 Multi-Process example ( #11928 )  
							
							 
							
							
							
						 
						
							2024-08-27 15:25:49 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									SONG Ge 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								e211a5b076 
								
							 
						 
						
							
							
								
								update minicpm to meet latest refactor ( #11937 )  
							
							 
							
							
							
						 
						
							2024-08-27 15:08:01 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									SONG Ge 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								a81a329a5f 
								
							 
						 
						
							
							
								
								[NPU] Add example for NPU multi-processing minicpm-1b model ( #11935 )  
							
							 
							
							... 
							
							
							
							* add minicpm example 
							
						 
						
							2024-08-27 14:57:46 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									binbin Deng 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								7c8c9a0670 
								
							 
						 
						
							
							
								
								Update benchmark script for NPU ( #11932 )  
							
							 
							
							
							
						 
						
							2024-08-27 14:41:14 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Ch1y0q 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								730d9ec811 
								
							 
						 
						
							
							
								
								Add Qwen2-audio example ( #11835 )  
							
							 
							
							... 
							
							
							
							* add draft for qwen2-audio
* update example for `Qwen2-Audio`
* update
* update
* add warmup 
							
						 
						
							2024-08-27 13:35:24 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Shaojun Liu 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								b11b28e9a9 
								
							 
						 
						
							
							
								
								update CORE_XE_VERSION to 2.6.0 ( #11929 )  
							
							 
							
							
							
						 
						
							2024-08-27 13:10:13 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Yina Chen 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								e246f1e258 
								
							 
						 
						
							
							
								
								update llama3 npu example ( #11933 )  
							
							 
							
							
							
						 
						
							2024-08-27 13:03:18 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									binbin Deng 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								14dddfc0d6 
								
							 
						 
						
							
							
								
								Update NPU example readme ( #11931 )  
							
							 
							
							
							
						 
						
							2024-08-27 12:44:58 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Zijie Li 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								6c3eb1e1e8 
								
							 
						 
						
							
							
								
								refactor from_pretrained API for NPU ( #11927 )  
							
							 
							
							
							
						 
						
							2024-08-27 09:50:30 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Xiangyu Tian 
								
							 
						 
						
							
							
								
								
							
							
							
								
							
							
								7ca557aada 
								
							 
						 
						
							
							
								
								LLM: Fix vLLM CPU convert error ( #11926 )  
							
							 
							
							
							
						 
						
							2024-08-27 09:22:19 +08:00