MNC-LLM
		
		
				
				·
				 
		
		
		
			AI & ML interests
		
		None yet
		
		
			Organizations
		
		
	
			models
			33
		
	
				MNC-LLM/batch1_epochs4_lr1e-05_paged_adamw_32bit_cosine_length2048_warmup_0.05_max_grad1.0_grad_accu32
				
				
			
			Text Generation
			
• 
		
				7B
			• 
	
				Updated
					
				
				• 
					
					1
				
	
				
				
 
		
	
				MNC-LLM/batch1_epochs1_lr1e-05_paged_adamw_32bit_cosine_length2048_warmup_0.05_max_grad1.0_grad_accu16
				
				
			
			Text Generation
			
• 
		
	
				Updated
					
				
				• 
					
					1
				
	
				
				
 
		
	
				MNC-LLM/Mistral-7B-NWS-u2k-Marcoroni-prompt-found-LaAdMoAl-ep4lr5
				
				
			
			Text Generation
			
• 
		
	
				Updated
					
				
				• 
					
					1
				
	
				
				
 
		
	
				MNC-LLM/Mistral-7B-NWS-u2k-merge-Marcoroni-LaAdMoAl-ep4-lr5
				
				
			
			Text Generation
			
• 
		
	
				Updated
					
				
				• 
					
					1
				
	
				
				
 
		
	
				MNC-LLM/batch1_epochs4_lr1e-05_paged_adamw_32bit_cosine_length2048_warmup_0.05_max_grad1.0_grad_accu16
				
				
			
			Text Generation
			
• 
		
	
				Updated
					
				
				• 
					
					1
				
	
				
				
 
		
	
				MNC-LLM/batch1_epochs2_lr1e-05_paged_adamw_32bit_cosine_length2048_warmup_0.05_max_grad1.0_grad_accu32
				
				
			
		
	
				Updated
					
				
				
				
	
				
				
 
		
	
				MNC-LLM/Mistral-7B-NWS-u2k-merge-Marcoroni
				
				
			
			Text Generation
			
• 
		
	
				Updated
					
				
				• 
					
					1
				
	
				
				
 
		
	
				MNC-LLM/Mistral-7B-LaAdMoAl-merge-Marcoroni
				
				
			
			Text Generation
			
• 
		
	
				Updated
					
				
				• 
					
					1
				
	
				
				
 
		
	
				MNC-LLM/tulu-2-dpo-7B-NWSCot-600-ep4lr5
				
				
			
			Text Generation
			
• 
		
	
				Updated
					
				
				• 
					
					3
				
	
				
				
 
		
	
				MNC-LLM/Tulu-2-DPO-7B-NWSO-5k-4ep-lr5
				
				
			
			Text Generation
			
• 
		
	
				Updated
					
				
				• 
					
					2