 
				cleanrl/EleutherAI_pythia-6.9b-deduped__ppo__tldr
				
				
			
			Text Generation
			
• 
		
				7B
			• 
	
				Updated
					
				
				• 
					
					2
				
	
				
				
 
				cleanrl/EleutherAI_pythia-2.8b-deduped__ppo__tldr
				
				
			
			Text Generation
			
• 
		
				3B
			• 
	
				Updated
					
				
				
				
	
				
				 
				cleanrl/EleutherAI_pythia-1b-deduped__ppo__tldr
				
				
			
			Text Generation
			
• 
		
				1B
			• 
	
				Updated
					
				
				• 
					
					2
				
	
				
				
 
				cleanrl/EleutherAI_pythia-2.8b-deduped__reward__tldr
				
				
			
			Text Classification
			
• 
		
	
				Updated
					
				
				• 
					
					2
				
	
				
				
 
				cleanrl/EleutherAI_pythia-1b-deduped__reward__tldr
				
				
			
			Text Classification
			
• 
		
	
				Updated
					
				
				• 
					
					997
				
	
				
				
 
				cleanrl/EleutherAI_pythia-1b-deduped__sft__tldr
				
				
			
			Text Generation
			
• 
		
	
				Updated
					
				
				• 
					
					1.21k
				
	
				
				
 
				cleanrl/EleutherAI_pythia-2.8b-deduped__sft__tldr
				
				
			
			Text Generation
			
• 
		
	
				Updated
					
				
				• 
					
					1
				
	
				
				
 
				cleanrl/EleutherAI_pythia-6.9b-deduped__sft__tldr
				
				
			
			Text Generation
			
• 
		
	
				Updated
					
				
				• 
					
					347
				
	
				
				
 
				cleanrl/EleutherAI_pythia-6.9b-deduped__reward__tldr
				
				
			
			Text Classification
			
• 
		
	
				Updated
					
				
				• 
					
					181
				
	
				
				
 
				cleanrl/ppo_zephyr310
				
				
			
			Text Generation
			
• 
		
				7B
			• 
	
				Updated
					
				
				
				
	
				
				 
			datasets
			15
		
	
				cleanrl/summarize_from_feedback_oai_preprocessing_1705009345
				
				
			
			Viewer
			
• 
	
				Updated
					
				• 
			
			179k
	
				• 
					
					146
				
				
				
 
		
				cleanrl/summarize_from_feedback_tldr_3_filtered_oai_preprocessing_1705009345
				
				
			
			Viewer
			
• 
	
				Updated
					
				• 
			
			130k
	
				• 
					
					52
				
				
				
 
		
				cleanrl/summarize_from_feedback_oai_preprocessing_1704578687
				
				
			
			Viewer
			
• 
	
				Updated
					
				• 
			
			179k
	
				• 
					
					78
				
				
				
 
		
				cleanrl/summarize_from_feedback_tldr_3_filtered_oai_preprocessing_1704578687
				
				
			
			Viewer
			
• 
	
				Updated
					
				• 
			
			130k
	
				• 
					
					29
				
				
				
 
		
				cleanrl/summarize_from_feedback_oai_preprocessing_1704563162
				
				
			
			Viewer
			
• 
	
				Updated
					
				• 
			
			179k
	
				• 
					
					61
				
				
				
 
		
				cleanrl/summarize_from_feedback_tldr_3_filtered_oai_preprocessing_1704563162
				
				
			
			Viewer
			
• 
	
				Updated
					
				• 
			
			130k
	
				• 
					
					129
				
				
				
 
		
				cleanrl/summarize_from_feedback_oai_preprocessing_1704496365
				
				
			
			Viewer
			
• 
	
				Updated
					
				• 
			
			179k
	
				• 
					
					12
				
				
				
 
		
				cleanrl/summarize_from_feedback_tldr_3_filtered_oai_preprocessing_1704496365
				
				
			
			Viewer
			
• 
	
				Updated
					
				• 
			
			130k
	
				• 
					
					74
				
				
				
 
		
				cleanrl/summarize_from_feedback_oai_preprocessing_1704427060
				
				
			
			Viewer
			
• 
	
				Updated
					
				• 
			
			179k
	
				• 
					
					22
				
				
				
 
		
				cleanrl/summarize_from_feedback_tldr_3_filtered_oai_preprocessing_1704427060
				
				
			
			Viewer
			
• 
	
				Updated
					
				• 
			
			130k
	
				• 
					
					17