saharNooby
							
						 | 
						
							
							
							
							
							
								
							
							
								935d16f5db
								
							
						 | 
						
							
							
								
								Move library wrapper to separate file, refactor code
							
							
							
							
							
						 | 
						
							2023-04-02 12:24:40 +04:00 | 
						
					
				
					
						
							
							
								 
								saharNooby
							
						 | 
						
							
							
							
							
							
								
							
							
								972e28d48d
								
							
						 | 
						
							
							
								
								Implement INT4 conversion and inference
							
							
							
							
							
						 | 
						
							2023-04-01 19:22:01 +04:00 | 
						
					
				
					
						
							
							
								 
								saharNooby
							
						 | 
						
							
							
							
							
							
								
							
							
								a1e1d34c93
								
							
						 | 
						
							
							
								
								Add Python wrapper for C library
							
							
							
							
							
						 | 
						
							2023-04-01 16:02:22 +04:00 | 
						
					
				
					
						
							
							
								 
								saharNooby
							
						 | 
						
							
							
							
							
							
								
							
							
								7130a89d1f
								
							
						 | 
						
							
							
								
								[FILE FORMAT CHANGED] Reverse dimensions in ggml file (makes it more similar to llama.cpp format)
							
							
							
							
							
						 | 
						
							2023-04-01 14:41:30 +04:00 | 
						
					
				
					
						
							
							
								 
								saharNooby
							
						 | 
						
							
							
							
							
							
								
							
							
								f6d45baec0
								
							
						 | 
						
							
							
								
								Support FP16 inference
							
							
							
							
							
						 | 
						
							2023-04-01 11:53:49 +04:00 | 
						
					
				
					
						
							
							
								 
								saharNooby
							
						 | 
						
							
							
							
							
							
								
							
							
								fe98c94a63
								
							
						 | 
						
							
							
								
								[FILE FORMAT CHANGED] Use ggml_get_rows to get embedding
							
							
							
							
							
						 | 
						
							2023-04-01 11:28:32 +04:00 | 
						
					
				
					
						
							
							
								 
								saharNooby
							
						 | 
						
							
							
							
							
							
								
							
							
								16ec7a5c18
								
							
						 | 
						
							
							
								
								Add fail-fast version of the test
							
							
							
							
							
						 | 
						
							2023-04-01 11:15:15 +04:00 | 
						
					
				
					
						
							
							
								 
								saharNooby
							
						 | 
						
							
							
							
							
							
								
							
							
								0fcb7c64c6
								
							
						 | 
						
							
							
								
								Remove reference implementation code and test against pre-created logits
							
							
							
							
							
						 | 
						
							2023-04-01 11:09:24 +04:00 | 
						
					
				
					
						
							
							
								 
								saharNooby
							
						 | 
						
							
							
							
							
							
								
							
							
								6fe9486cee
								
							
						 | 
						
							
							
								
								Finally, FP32 inference
							
							
							
							
							
						 | 
						
							2023-04-01 10:06:39 +04:00 | 
						
					
				
					
						
							
							
								 
								saharNooby
							
						 | 
						
							
							
							
							
							
								
							
							
								61c6b1a4e0
								
							
						 | 
						
							
							
								
								Add comparison against reference implementation script, implement state & logits saving
							
							
							
							
							
						 | 
						
							2023-03-31 20:23:42 +04:00 | 
						
					
				
					
						
							
							
								 
								saharNooby
							
						 | 
						
							
							
							
							
							
								
							
							
								d00f28581a
								
							
						 | 
						
							
							
								
								Add reference implementation of RWKV RNN
							
							
							
							
							
						 | 
						
							2023-03-31 19:57:16 +04:00 | 
						
					
				
					
						
							
							
								 
								saharNooby
							
						 | 
						
							
							
							
							
							
								
							
							
								fe272dc3d3
								
							
						 | 
						
							
							
								
								Minor changes
							
							
							
							
							
						 | 
						
							2023-03-31 10:24:12 +04:00 | 
						
					
				
					
						
							
							
								 
								saharNooby
							
						 | 
						
							
							
							
							
							
								
							
							
								873cb954d0
								
							
						 | 
						
							
							
								
								Make ln0 work correctly
							
							
							
							
							
						 | 
						
							2023-03-30 20:01:26 +04:00 | 
						
					
				
					
						
							
							
								 
								saharNooby
							
						 | 
						
							
							
							
							
							
								
							
							
								2f51451561
								
							
						 | 
						
							
							
								
								Initial commit
							
							
							
							
							
						 | 
						
							2023-03-30 17:55:30 +04:00 |