Yishuo Wang 
								
							 
						 
						
							
							
							
							
								
							
							
								bfd9f88f0d 
								
							 
						 
						
							
							
								
								[LLM] Use fp32 as dtype when batch_size <=8 and qtype is q4_0/q8_0/fp8 ( #9365 )  
							
							 
							
							
							
						 
						
							2023-11-08 09:54:53 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									WeiguangHan 
								
							 
						 
						
							
							
							
							
								
							
							
								84ab614aab 
								
							 
						 
						
							
							
								
								LLM: add more models and skip runtime error ( #9349 )  
							
							 
							
							... 
							
							
							
							* add more models and skip runtime error
* upgrade transformers
* temporarily removed Mistral-7B-v0.1
* temporarily disable the upload of arc perf result 
							
						 
						
							2023-11-08 09:45:53 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Heyang Sun 
								
							 
						 
						
							
							
							
							
								
							
							
								fae6db3ddc 
								
							 
						 
						
							
							
								
								[LLM] refactor cpu low-bit forward logic ( #9366 )  
							
							 
							
							... 
							
							
							
							* [LLM] refactor cpu low-bit forward logic
* fix style
* Update low_bit_linear.py
* Update low_bit_linear.py
* refine 
							
						 
						
							2023-11-07 15:09:16 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Heyang Sun 
								
							 
						 
						
							
							
							
							
								
							
							
								af94058203 
								
							 
						 
						
							
							
								
								[LLM] Support CPU deepspeed distributed inference ( #9259 )  
							
							 
							
							... 
							
							
							
							* [LLM] Support CPU Deepspeed distributed inference
* Update run_deepspeed.py
* Rename
* fix style
* add new codes
* refine
* remove annotated codes
* refine
* Update README.md
* refine doc and example code 
							
						 
						
							2023-11-06 17:56:42 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Jin Qiao 
								
							 
						 
						
							
							
							
							
								
							
							
								f9bf5382ff 
								
							 
						 
						
							
							
								
								Fix: add aquila2 in README ( #9362 )  
							
							 
							
							
							
						 
						
							2023-11-06 16:37:57 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Jin Qiao 
								
							 
						 
						
							
							
							
							
								
							
							
								e6b6afa316 
								
							 
						 
						
							
							
								
								LLM: add aquila2 model example ( #9356 )  
							
							 
							
							
							
						 
						
							2023-11-06 15:47:39 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Xin Qiu 
								
							 
						 
						
							
							
							
							
								
							
							
								1420e45cc0 
								
							 
						 
						
							
							
								
								Chatglm2 rope optimization on xpu ( #9350 )  
							
							 
							
							
							
						 
						
							2023-11-06 13:56:34 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Yining Wang 
								
							 
						 
						
							
							
							
							
								
							
							
								9377b9c5d7 
								
							 
						 
						
							
							
								
								add CodeShell CPU example ( #9345 )  
							
							 
							
							... 
							
							
							
							* add CodeShell CPU example
* fix some problems 
							
						 
						
							2023-11-03 13:15:54 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									ZehuaCao 
								
							 
						 
						
							
							
							
							
								
							
							
								ef83c3302e 
								
							 
						 
						
							
							
								
								Use to test llm-performance on spr-perf ( #9316 )  
							
							 
							
							... 
							
							
							
							* Update llm_performance_tests.yml
* Update llm_performance_tests.yml
* Update action.yml
* Create cpu-perf-test.yaml
* Update action.yml
* Update action.yml
* Update llm_performance_tests.yml
* Update llm_performance_tests.yml
* Update llm_performance_tests.yml
* Update llm_performance_tests.yml
* Update llm_performance_tests.yml
* Update llm_performance_tests.yml
* Update llm_performance_tests.yml
* Update llm_performance_tests.yml
* Update llm_performance_tests.yml
* Update llm_performance_tests.yml
* Update llm_performance_tests.yml 
							
						 
						
							2023-11-03 11:17:16 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Yuwen Hu 
								
							 
						 
						
							
							
							
							
								
							
							
								a0150bb205 
								
							 
						 
						
							
							
								
								[LLM] Move embedding layer to CPU for iGPU inference ( #9343 )  
							
							 
							
							... 
							
							
							
							* Move embedding layer to CPU for iGPU llm inference
* Empty cache after to cpu
* Remove empty cache as it seems to have some negative effect to first token 
							
						 
						
							2023-11-03 11:13:45 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Cheen Hau, 俊豪 
								
							 
						 
						
							
							
							
							
								
							
							
								8f23fb04dc 
								
							 
						 
						
							
							
								
								Add inference test for Whisper model on Arc ( #9330 )  
							
							 
							
							... 
							
							
							
							* Add inference test for Whisper model
* Remove unnecessary inference time measurement 
							
						 
						
							2023-11-03 10:15:52 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Zheng, Yi 
								
							 
						 
						
							
							
							
							
								
							
							
								63411dff75 
								
							 
						 
						
							
							
								
								Add cpu examples of WizardCoder ( #9344 )  
							
							 
							
							... 
							
							
							
							* Add wizardcoder example
* Minor fixes 
							
						 
						
							2023-11-02 20:22:43 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									dingbaorong 
								
							 
						 
						
							
							
							
							
								
							
							
								2e3bfbfe1f 
								
							 
						 
						
							
							
								
								Add internlm_xcomposer cpu examples ( #9337 )  
							
							 
							
							... 
							
							
							
							* add internlm-xcomposer cpu examples
* use chat
* some fixes
* add license
* address shengsheng's comments
* use demo.jpg 
							
						 
						
							2023-11-02 15:50:02 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Jin Qiao 
								
							 
						 
						
							
							
							
							
								
							
							
								97a38958bd 
								
							 
						 
						
							
							
								
								LLM: add CodeLlama CPU and GPU examples ( #9338 )  
							
							 
							
							... 
							
							
							
							* LLM: add codellama CPU pytorch examples
* LLM: add codellama CPU transformers examples
* LLM: add codellama GPU transformers examples
* LLM: add codellama GPU pytorch examples
* LLM: add codellama in readme
* LLM: add LLaVA link 
							
						 
						
							2023-11-02 15:34:25 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Chen, Zhentao 
								
							 
						 
						
							
							
							
							
								
							
							
								d4dffbdb62 
								
							 
						 
						
							
							
								
								Merge harness ( #9319 )  
							
							 
							
							... 
							
							
							
							* add harness patch and llb script
* add readme
* add license
* use patch instead
* update readme
* rename tests to evaluation
* fix typo
* remove nano dependency
* add original harness link
* rename title of usage
* rename BigDLGPULM as BigDLLM
* empty commit to rerun job 
							
						 
						
							2023-11-02 15:14:19 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Zheng, Yi 
								
							 
						 
						
							
							
							
							
								
							
							
								63b2556ce2 
								
							 
						 
						
							
							
								
								Add cpu examples of skywork ( #9340 )  
							
							 
							
							
							
						 
						
							2023-11-02 15:10:45 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									dingbaorong 
								
							 
						 
						
							
							
							
							
								
							
							
								f855a864ef 
								
							 
						 
						
							
							
								
								add llava gpu example ( #9324 )  
							
							 
							
							... 
							
							
							
							* add llava gpu example
* use 7b model
* fix typo
* add in README 
							
						 
						
							2023-11-02 14:48:29 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Ziteng Zhang 
								
							 
						 
						
							
							
							
							
								
							
							
								dd3cf2f153 
								
							 
						 
						
							
							
								
								LLM: Add python 3.10 & 3.11 UT  
							
							 
							
							... 
							
							
							
							LLM: Add python 3.10 & 3.11 UT 
							
						 
						
							2023-11-02 14:09:29 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Wang, Jian4 
								
							 
						 
						
							
							
							
							
								
							
							
								149146004f 
								
							 
						 
						
							
							
								
								LLM: Add qlora finetunning CPU example ( #9275 )  
							
							 
							
							... 
							
							
							
							* add qlora finetunning example
* update readme
* update example
* remove merge.py and update readme 
							
						 
						
							2023-11-02 09:45:42 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									WeiguangHan 
								
							 
						 
						
							
							
							
							
								
							
							
								9722e811be 
								
							 
						 
						
							
							
								
								LLM: add more models to the arc perf test ( #9297 )  
							
							 
							
							... 
							
							
							
							* LLM: add more models to the arc perf test
* remove some old models
* install some dependencies 
							
						 
						
							2023-11-01 16:56:32 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Jin Qiao 
								
							 
						 
						
							
							
							
							
								
							
							
								6a128aee32 
								
							 
						 
						
							
							
								
								LLM: add ui for portable-zip ( #9262 )  
							
							 
							
							
							
						 
						
							2023-11-01 15:36:59 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Jasonzzt 
								
							 
						 
						
							
							
							
							
								
							
							
								cb7ef38e86 
								
							 
						 
						
							
							
								
								rerun  
							
							 
							
							
							
						 
						
							2023-11-01 15:30:34 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Jasonzzt 
								
							 
						 
						
							
							
							
							
								
							
							
								ba148ff3ff 
								
							 
						 
						
							
							
								
								test py311  
							
							 
							
							
							
						 
						
							2023-11-01 14:08:49 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Yishuo Wang 
								
							 
						 
						
							
							
							
							
								
							
							
								726203d778 
								
							 
						 
						
							
							
								
								[LLM] Replace Embedding layer to fix it on CPU ( #9254 )  
							
							 
							
							
							
						 
						
							2023-11-01 13:58:10 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Jasonzzt 
								
							 
						 
						
							
							
							
							
								
							
							
								7c7a7f2ec1 
								
							 
						 
						
							
							
								
								spr & arc ut with python3,9&3.10&3.11  
							
							 
							
							
							
						 
						
							2023-11-01 13:17:13 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Yang Wang 
								
							 
						 
						
							
							
							
							
								
							
							
								e1bc18f8eb 
								
							 
						 
						
							
							
								
								fix import ipex problem ( #9323 )  
							
							 
							
							... 
							
							
							
							* fix import ipex problem
* fix style 
							
						 
						
							2023-10-31 20:31:34 -07:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Cengguang Zhang 
								
							 
						 
						
							
							
							
							
								
							
							
								9f3d4676c6 
								
							 
						 
						
							
							
								
								LLM: Add qwen-vl gpu example ( #9290 )  
							
							 
							
							... 
							
							
							
							* create qwen-vl gpu example.
* add readme.
* fix.
* change input figure and update outputs.
* add qwen-vl pytorch model gpu example.
* fix.
* add readme. 
							
						 
						
							2023-11-01 11:01:39 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Ruonan Wang 
								
							 
						 
						
							
							
							
							
								
							
							
								7e73c354a6 
								
							 
						 
						
							
							
								
								LLM: decoupling bigdl-llm and bigdl-nano ( #9306 )  
							
							 
							
							
							
						 
						
							2023-11-01 11:00:54 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Yina Chen 
								
							 
						 
						
							
							
							
							
								
							
							
								2262ae4d13 
								
							 
						 
						
							
							
								
								Support MoFQ4 on arc ( #9301 )  
							
							 
							
							... 
							
							
							
							* init
* update
* fix style
* fix style
* fix style
* meet comments 
							
						 
						
							2023-11-01 10:59:46 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									binbin Deng 
								
							 
						 
						
							
							
							
							
								
							
							
								8ef8e25178 
								
							 
						 
						
							
							
								
								LLM: improve response speed in multi-turn chat ( #9299 )  
							
							 
							
							... 
							
							
							
							* update
* fix stop word and add chatglm2 support
* remove system prompt 
							
						 
						
							2023-11-01 10:30:44 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Cengguang Zhang 
								
							 
						 
						
							
							
							
							
								
							
							
								d4ab5904ef 
								
							 
						 
						
							
							
								
								LLM: Add python 3.10 llm UT ( #9302 )  
							
							 
							
							... 
							
							
							
							* add py310 test for llm-unit-test.
* add py310 llm-unit-tests
* add llm-cpp-build-py310
* test
* test
* test.
* test
* test
* fix deactivate.
* fix
* fix.
* fix
* test
* test
* test
* add build chatglm for win.
* test.
* fix 
							
						 
						
							2023-11-01 10:15:32 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									WeiguangHan 
								
							 
						 
						
							
							
							
							
								
							
							
								03aa368776 
								
							 
						 
						
							
							
								
								LLM: add the comparison between latest arc perf test and last one ( #9296 )  
							
							 
							
							... 
							
							
							
							* add the comparison between latest test and last one to html
* resolve some comments
* modify some code logics 
							
						 
						
							2023-11-01 09:53:02 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Jin Qiao 
								
							 
						 
						
							
							
							
							
								
							
							
								96f8158fe2 
								
							 
						 
						
							
							
								
								LLM: adjust dolly v2 GPU example README ( #9318 )  
							
							 
							
							
							
						 
						
							2023-11-01 09:50:22 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Jin Qiao 
								
							 
						 
						
							
							
							
							
								
							
							
								c44c6dc43a 
								
							 
						 
						
							
							
								
								LLM: add chatglm3 examples ( #9305 )  
							
							 
							
							
							
						 
						
							2023-11-01 09:50:05 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Xin Qiu 
								
							 
						 
						
							
							
							
							
								
							
							
								06447a3ef6 
								
							 
						 
						
							
							
								
								add malloc and intel openmp to llm deps ( #9322 )  
							
							 
							
							
							
						 
						
							2023-11-01 09:47:45 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Cheen Hau, 俊豪 
								
							 
						 
						
							
							
							
							
								
							
							
								d638b93dfe 
								
							 
						 
						
							
							
								
								Add test script and workflow for qlora fine-tuning ( #9295 )  
							
							 
							
							... 
							
							
							
							* Add test script and workflow for qlora fine-tuning
* Test fix export model
* Download dataset
* Fix export model issue
* Reduce number of training steps
* Rename script
* Correction 
							
						 
						
							2023-11-01 09:39:53 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Ruonan Wang 
								
							 
						 
						
							
							
							
							
								
							
							
								d383ee8efb 
								
							 
						 
						
							
							
								
								LLM: update QLoRA example about accelerate version( #9314 )  
							
							 
							
							
							
						 
						
							2023-10-31 13:54:38 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Cheen Hau, 俊豪 
								
							 
						 
						
							
							
							
							
								
							
							
								cee9eaf542 
								
							 
						 
						
							
							
								
								[LLM] Fix llm arc ut oom ( #9300 )  
							
							 
							
							... 
							
							
							
							* Move model to cpu after testing so that gpu memory is deallocated
* Add code comment
---------
Co-authored-by: sgwhat <ge.song@intel.com> 
							
						 
						
							2023-10-30 14:38:34 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									dingbaorong 
								
							 
						 
						
							
							
							
							
								
							
							
								ee5becdd61 
								
							 
						 
						
							
							
								
								use coco image in Qwen-VL ( #9298 )  
							
							 
							
							... 
							
							
							
							* use coco image
* add output
* address yuwen's comments 
							
						 
						
							2023-10-30 14:32:35 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Yang Wang 
								
							 
						 
						
							
							
							
							
								
							
							
								163d033616 
								
							 
						 
						
							
							
								
								Support qlora in CPU ( #9233 )  
							
							 
							
							... 
							
							
							
							* support qlora in CPU
* revert example
* fix style 
							
						 
						
							2023-10-27 14:01:15 -07:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Yang Wang 
								
							 
						 
						
							
							
							
							
								
							
							
								8838707009 
								
							 
						 
						
							
							
								
								Add deepspeed autotp example readme ( #9289 )  
							
							 
							
							... 
							
							
							
							* Add deepspeed autotp example readme
* change word 
							
						 
						
							2023-10-27 13:04:38 -07:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									dingbaorong 
								
							 
						 
						
							
							
							
							
								
							
							
								f053688cad 
								
							 
						 
						
							
							
								
								add cpu example of LLaVA ( #9269 )  
							
							 
							
							... 
							
							
							
							* add LLaVA cpu example
* Small text updates
* update link
---------
Co-authored-by: Yuwen Hu <yuwen.hu@intel.com> 
							
						 
						
							2023-10-27 18:59:20 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Zheng, Yi 
								
							 
						 
						
							
							
							
							
								
							
							
								7f2ad182fd 
								
							 
						 
						
							
							
								
								Minor Fixes of README ( #9294 )  
							
							 
							
							
							
						 
						
							2023-10-27 18:25:46 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Zheng, Yi 
								
							 
						 
						
							
							
							
							
								
							
							
								1bff54a378 
								
							 
						 
						
							
							
								
								Display demo.jpg n the README.md of HuggingFace Transformers Agent ( #9293 )  
							
							 
							
							... 
							
							
							
							* Display demo.jpg
* remove demo.jpg 
							
						 
						
							2023-10-27 18:00:03 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Zheng, Yi 
								
							 
						 
						
							
							
							
							
								
							
							
								a4a1dec064 
								
							 
						 
						
							
							
								
								Add a cpu example of HuggingFace Transformers Agent (use vicuna-7b-v1.5) ( #9284 )  
							
							 
							
							... 
							
							
							
							* Add examples of HF Agent
* Modify folder structure and add link of demo.jpg
* Fixes of readme
* Merge applications and Applications 
							
						 
						
							2023-10-27 17:14:12 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Guoqiong Song 
								
							 
						 
						
							
							
							
							
								
							
							
								aa319de5e8 
								
							 
						 
						
							
							
								
								Add streaming-llm using llama2 on CPU ( #9265 )  
							
							 
							
							... 
							
							
							
							Enable streaming-llm to let model take infinite inputs, tested on desktop and SPR10 
							
						 
						
							2023-10-27 01:30:39 -07:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Cheen Hau, 俊豪 
								
							 
						 
						
							
							
							
							
								
							
							
								6c9ae420a5 
								
							 
						 
						
							
							
								
								Add regression test for optimize_model on gpu ( #9268 )  
							
							 
							
							... 
							
							
							
							* Add MPT model to transformer API test
* Add regression test for optimize_model on gpu.
---------
Co-authored-by: sgwhat <ge.song@intel.com> 
							
						 
						
							2023-10-27 09:23:19 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Cengguang Zhang 
								
							 
						 
						
							
							
							
							
								
							
							
								44b5fcc190 
								
							 
						 
						
							
							
								
								LLM: fix pretraining_tp argument issue. ( #9281 )  
							
							 
							
							
							
						 
						
							2023-10-26 18:43:58 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									WeiguangHan 
								
							 
						 
						
							
							
							
							
								
							
							
								6b2a32eba2 
								
							 
						 
						
							
							
								
								LLM: add missing function for PyTorch InternLM model ( #9285 )  
							
							 
							
							
							
						 
						
							2023-10-26 18:05:23 +08:00  
						
						
							 
							
							
								 
							 
							
						 
					 
				
					
						
							
								
								
									 
									Yina Chen 
								
							 
						 
						
							
							
							
							
								
							
							
								f879c48f98 
								
							 
						 
						
							
							
								
								fp8 convert use ggml code ( #9277 )  
							
							 
							
							
							
						 
						
							2023-10-26 17:03:29 +08:00