{
  "model_name": "llama2_lora",
  "finetuning_config": {
    "learning_rate": 5e-05,
    "gradient_accumulation_steps": 1,
    "batch_size": 1,
    "weight_decay": 0.01,
    "warmup_steps": 50,
    "eval_steps": 5000,
    "save_steps": 5000,
    "max_length": 512,
    "num_train_epochs": 3,
    "logging_steps": 10,
    "max_grad_norm": 2.0,
    "save_total_limit": 4,
    "optimizer_name": "adamw",
    "output_dir": "./checkpoints/llama2-lora_nq-mctx_em-top1"
  },
  "generation_config": {
    "penalty_alpha": 0.6,
    "top_k": 4,
    "max_new_tokens": 256,
    "do_sample": false,
    "top_p": null
  }
}
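As a rough illustration only (the file name `finetune_config.json`, the loader below, and the mapping of fields onto Hugging Face arguments are assumptions, not part of the original setup), the `finetuning_config` block maps naturally onto `transformers.TrainingArguments`, while `generation_config` (a positive `penalty_alpha` with a small `top_k` and `do_sample: false` corresponds to contrastive-search decoding) maps onto `transformers.GenerationConfig`:

```python
import json

from transformers import TrainingArguments, GenerationConfig

# Hypothetical loader: the file name and the field-to-argument mapping
# below are assumptions for illustration, not the original training code.
with open("finetune_config.json") as f:
    cfg = json.load(f)

ft = cfg["finetuning_config"]

# Assumptions: "batch_size" is treated as the per-device train batch size,
# and "optimizer_name": "adamw" as the default AdamW optimizer in
# transformers. "max_length" is not a TrainingArguments field; it would be
# applied when tokenizing the inputs.
training_args = TrainingArguments(
    output_dir=ft["output_dir"],
    learning_rate=ft["learning_rate"],
    per_device_train_batch_size=ft["batch_size"],
    gradient_accumulation_steps=ft["gradient_accumulation_steps"],
    weight_decay=ft["weight_decay"],
    warmup_steps=ft["warmup_steps"],
    eval_steps=ft["eval_steps"],
    save_steps=ft["save_steps"],
    num_train_epochs=ft["num_train_epochs"],
    logging_steps=ft["logging_steps"],
    max_grad_norm=ft["max_grad_norm"],
    save_total_limit=ft["save_total_limit"],
)

gen = cfg["generation_config"]

# penalty_alpha > 0 together with an integer top_k and do_sample=False
# selects contrastive-search decoding in model.generate(). top_p is null
# in the config and is left at its default here, since it only matters
# when sampling is enabled.
generation_config = GenerationConfig(
    penalty_alpha=gen["penalty_alpha"],
    top_k=gen["top_k"],
    max_new_tokens=gen["max_new_tokens"],
    do_sample=gen["do_sample"],
)
```

The `training_args` object would then be passed to a `Trainer` together with the LoRA-wrapped model, and `generation_config` to `model.generate()` at evaluation time; both of those wiring steps are outside this config file.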