add: output results for various models and datasets
This commit is contained in:
		
							parent
							
								
									a028413832
								
							
						
					
					
						commit
						39516acf9a
					
				
					 3 changed files with 39 additions and 0 deletions
				
			
		
							
								
								
									
										13
									
								
								tests/outputs/results (CoT).CSV
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										13
									
								
								tests/outputs/results (CoT).CSV
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,13 @@ | |||
| ,model name,dataname,expected,human,AI,unsure,invalid | ||||
| 0,Microsoft Phi,LDAG,human,13,14,12,20 | ||||
| 1,Microsoft Phi,HLTC,human,12,11,19,17 | ||||
| 2,Microsoft Phi,LDAG,AI,10,18,14,17 | ||||
| 3,Microsoft Phi,HLTC,AI,14,13,23,9 | ||||
| 4,Gemma 2,LDAG,human,35,24,0,0 | ||||
| 5,Gemma 2,HLTC,human,45,14,0,0 | ||||
| 6,Gemma 2,LDAG,AI,51,8,0,0 | ||||
| 7,Gemma 2,HLTC,AI,42,17,0,0 | ||||
| 8,Tinyllama,LDAG,human,11,4,34,10 | ||||
| 9,Tinyllama,HLTC,human,13,5,30,11 | ||||
| 10,Tinyllama,LDAG,AI,11,5,31,12 | ||||
| 11,Tinyllama,HLTC,AI,11,3,35,10 | ||||
| 
 | 
							
								
								
									
										13
									
								
								tests/outputs/results (Multi-Shot).CSV
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										13
									
								
								tests/outputs/results (Multi-Shot).CSV
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,13 @@ | |||
| ,model name,dataname,expected,human,AI,unsure,invalid | ||||
| 0,Microsoft Phi,LDAG,human,1,10,46,2 | ||||
| 1,Microsoft Phi,HLTC,human,7,6,44,2 | ||||
| 2,Microsoft Phi,LDAG,AI,7,4,43,5 | ||||
| 3,Microsoft Phi,HLTC,AI,4,7,47,1 | ||||
| 4,Gemma 2,LDAG,human,24,35,0,0 | ||||
| 5,Gemma 2,HLTC,human,48,11,0,0 | ||||
| 6,Gemma 2,LDAG,AI,49,10,0,0 | ||||
| 7,Gemma 2,HLTC,AI,48,11,0,0 | ||||
| 8,Tinyllama,LDAG,human,24,5,28,2 | ||||
| 9,Tinyllama,HLTC,human,17,3,36,3 | ||||
| 10,Tinyllama,LDAG,AI,14,3,37,5 | ||||
| 11,Tinyllama,HLTC,AI,17,1,39,2 | ||||
| 
 | 
							
								
								
									
										13
									
								
								tests/outputs/results (classic).CSV
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										13
									
								
								tests/outputs/results (classic).CSV
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,13 @@ | |||
| ,model name,dataname,expected,human,AI,unsure,invalid | ||||
| 0,Microsoft Phi,LDAG,human,3,4,48,4 | ||||
| 1,Microsoft Phi,HLTC,human,7,6,42,4 | ||||
| 2,Microsoft Phi,LDAG,AI,5,9,43,2 | ||||
| 3,Microsoft Phi,HLTC,AI,4,4,49,2 | ||||
| 4,Gemma 2,LDAG,human,38,21,0,0 | ||||
| 5,Gemma 2,HLTC,human,47,12,0,0 | ||||
| 6,Gemma 2,LDAG,AI,51,8,0,0 | ||||
| 7,Gemma 2,HLTC,AI,46,13,0,0 | ||||
| 8,Tinyllama,LDAG,human,13,3,37,6 | ||||
| 9,Tinyllama,HLTC,human,9,3,40,7 | ||||
| 10,Tinyllama,LDAG,AI,8,5,40,6 | ||||
| 11,Tinyllama,HLTC,AI,11,4,37,7 | ||||
| 
 | 
		Loading…
	
	Add table
		Add a link
		
	
		Reference in a new issue