@@ -16,12 +16,11 @@ class Gemma3(BaseLM):
     - Total input context of 128K tokens for the 4B, 12B, and 27B sizes, and 32K tokens for the 1B size
     """

-    def __init__(self, model_name="google/gemma-3-1b-it", temp=0.1, device='cpu',
-                 max_new_tokens=None, api_token=None, use_bf16=False, **kwargs):
-        super(Gemma, self).__init__(name=model_name, support_batching=True, **kwargs)
+    def __init__(self, model_name="google/gemma-3-1b-it", temp=0.1, device='cuda',
+                 max_new_tokens=None, api_token=None, **kwargs):
+        super(Gemma3, self).__init__(name=model_name, support_batching=True, **kwargs)
         self.__device = device
-        self.__model = AutoModelForCausalLM.from_pretrained(
-            model_name, torch_dtype=torch.bfloat16 if use_bf16 else "auto", token=api_token)
+        self.__model = AutoModelForCausalLM.from_pretrained(model_name, torch_dtype="auto", token=api_token)
         self.__max_new_tokens = max_new_tokens
         self.__model.to(device)
         self.__tokenizer = AutoTokenizer.from_pretrained(model_name, token=api_token)
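
For reference, a minimal usage sketch of the constructor after this change. The module path `models.gemma3` is an assumption (import `Gemma3` from wherever it lives in this repo); the point is that the default device is now `'cuda'`, so CPU-only hosts must pass `device='cpu'` explicitly:

```python
# Hypothetical usage sketch: the module path below is an assumption.
from models.gemma3 import Gemma3

# Default device is now 'cuda'; override it on CPU-only machines.
lm = Gemma3(model_name="google/gemma-3-1b-it", temp=0.1, device="cpu",
            max_new_tokens=256, api_token=None)
```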