Spaces:
Sleeping
Sleeping
| import torch | |
def get_device_map():
    """Return a Hugging Face-style device map for model placement.

    When a CUDA device is available, the whole model (the ``''`` key)
    is mapped onto the current CUDA device; otherwise an empty map is
    returned as the fallback configuration.
    """
    if not torch.cuda.is_available():
        # No GPU present — fall back to an empty device map.
        return {}
    return {'': torch.cuda.current_device()}
# --- General configuration ---------------------------------------------------

# Maximum sequence length for tokenization/training.
# NOTE(review): 2**4 == 16 is unusually small for LLM fine-tuning (2048 is
# typical) — confirm this value is intentional before training.
MAX_SEQ_LENGTH = 2**4

# Model dtype; None lets the loading library auto-detect an appropriate dtype.
DTYPE = None

# Load the base model with 4-bit quantization.
LOAD_IN_4BIT = True

# BUG FIX: get_device_map() already returns a complete device map
# ({'': device} or {}). Wrapping it again produced the invalid nested map
# {'': {'': device}} — use its return value directly.
DEVICE_MAP = get_device_map()

# Set dynamically from the tokenizer once it is loaded.
EOS_TOKEN = None
# Alpaca-style prompt template with three positional placeholders:
#   {0} instruction, {1} input/context, {2} response (left empty at inference).
# NOTE(review): the canonical Alpaca template uses "### Instruction:" (space
# after ###) and blank lines between sections — confirm this compact variant
# is intentional and matches whatever code splits on these markers downstream.
ALPACA_PROMPT_TEMPLATE = """Below is an instruction that describes a task, paired with an input that provides further context. Write a response that appropriately completes the request.
###Instruction:
{}
###Input:
{}
###Response:
{}"""
# --- Training arguments ------------------------------------------------------
# NOTE(review): presumably unpacked into transformers.TrainingArguments /
# the SFT trainer config — verify against the caller.
#
# BUG FIX: the original evaluated torch.cuda.is_bf16_supported()
# unconditionally at import time. On CPU-only hosts that call is only
# meaningful with CUDA present (and on some torch versions raises), and it
# silently enabled fp16 for CPU runs. Guard on CUDA availability so neither
# mixed-precision flag is set when no GPU exists.
_CUDA_BF16 = torch.cuda.is_available() and torch.cuda.is_bf16_supported()

TRAIN_ARGS = {
    "per_device_train_batch_size": 2,
    "gradient_accumulation_steps": 4,   # effective batch size = 2 * 4 = 8
    "warmup_steps": 5,
    "max_steps": 60,                    # short demo run; raise for real training
    "learning_rate": 2e-4,
    # Prefer bf16 on GPUs that support it, fall back to fp16 on older GPUs,
    # and disable both on CPU-only machines.
    "fp16": torch.cuda.is_available() and not _CUDA_BF16,
    "bf16": _CUDA_BF16,
    "logging_steps": 1,
    "optim": "adamw_8bit",              # 8-bit AdamW (bitsandbytes) to save memory
    "weight_decay": 0.01,
    "lr_scheduler_type": "linear",
    "seed": 3407,
    "output_dir": "outputs",
}