```yaml
checkpoint_dir: /teamspace/studios/this_studio/out/finetune/llama-8b-dataset12/final
out_dir: out/finetune-2/llama-8b-dataset12-cot
precision: bf16-true
devices: 1
num_nodes: 1

# LoRA hyperparameters: adapters on the attention query and value
# projections only (r=8, alpha=16, dropout=0.1).
lora_r: 8
lora_alpha: 16
lora_dropout: 0.1
lora_query: true
lora_key: false
lora_value: true
lora_projection: false
lora_mlp: false
lora_head: false

data:
  class_path: litgpt.data.JSON
  init_args:
    json_path: cot_satcom_litgpt.json
    mask_prompt: false
    val_split_fraction: 0.05
    prompt_style: alpaca
    ignore_index: -100
    seed: 42
    num_workers: 4

train:
  save_interval: 25
  log_interval: 1
  global_batch_size: 32
  micro_batch_size: 4
  lr_warmup_steps: 25
  epochs: 12
  max_seq_length: 2048
  min_lr: 2.0e-05

log: {}

eval:
  interval: 20
  max_new_tokens: 100
  max_iters: 100
  initial_validation: true
  final_validation: true
  evaluate_example: first

optimizer:
  class_path: torch.optim.AdamW
  init_args:
    lr: 2.0e-05
    weight_decay: 0.0
    betas:
    - 0.9
    - 0.999

logger_name: wandb
seed: 1337
```
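With `global_batch_size: 32` and `micro_batch_size: 4` on a single device, LitGPT accumulates gradients over 32 / 4 = 8 micro-batches per optimizer step. To launch a run with this configuration, save it to a file and pass it to the LitGPT CLI. The sketch below is a minimal example, assuming the config is saved as `lora-cot.yaml` (the filename is arbitrary); note that the subcommand name varies by LitGPT version (`finetune_lora` in recent releases, `finetune lora` in older ones):

```bash
# Minimal launch sketch; assumes this config was saved as lora-cot.yaml.
# checkpoint_dir, out_dir, data, etc. are all taken from the config file.
litgpt finetune_lora --config lora-cot.yaml

# Individual values can be overridden on the command line, e.g.:
litgpt finetune_lora --config lora-cot.yaml --train.epochs 6
```

Since `logger_name: wandb` is set, the run logs to Weights & Biases, so `wandb` must be installed and authenticated (`wandb login`) before launching.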