Spaces:

Koios-API
/

KoiosAPI-codegemma-7b-it

Runtime error

stakelovelace committed on Apr 29

Commit

457f3a4

•

1 Parent(s): acc7015

commit from tesla

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,5 +1,5 @@
 import torch
-from transformers import AutoModelForCausalLM, AutoTokenizer, TrainingArguments, Trainer, BertLMHeadModel, BertForSequenceClassification
 from datasets import Dataset
 import pandas as pd
 import csv
@@ -67,6 +67,11 @@ def main(api_name, base_url):
     device = get_device()  # Get the appropriate device
     data = load_data_and_config("train2.csv")
     tokenizer = AutoTokenizer.from_pretrained("google/codegemma-2b")
     model = AutoModelForCausalLM.from_pretrained('google/codegemma-2b', is_decoder=True)
     #model = BertLMHeadModel.from_pretrained('google/codegemma-2b', is_decoder=True)
     # Example assuming you have a prepared dataset for classification
@@ -74,7 +79,8 @@ def main(api_name, base_url):
     model.to(device)  # Move model to the appropriate device
     train_model(model, tokenizer, data, device)
     model.save_pretrained("./fine_tuned_model")
     tokenizer.save_pretrained("./fine_tuned_model")

 import torch
+from transformers import AutoModelForCausalLM, AutoTokenizer, AutoConfig, TrainingArguments, Trainer, BertLMHeadModel, BertForSequenceClassification
 from datasets import Dataset
 import pandas as pd
 import csv
     device = get_device()  # Get the appropriate device
     data = load_data_and_config("train2.csv")
     tokenizer = AutoTokenizer.from_pretrained("google/codegemma-2b")
+    # Load the configuration for a specific model
+    config = AutoConfig.from_pretrained('google/codegemma-2b')
+    # Update the activation function
+    config.hidden_act = 'gelu_pytorch_tanh'  # Set to use approximate GeLU
     model = AutoModelForCausalLM.from_pretrained('google/codegemma-2b', is_decoder=True)
     #model = BertLMHeadModel.from_pretrained('google/codegemma-2b', is_decoder=True)
     # Example assuming you have a prepared dataset for classification
     model.to(device)  # Move model to the appropriate device
     train_model(model, tokenizer, data, device)
     model.save_pretrained("./fine_tuned_model")
     tokenizer.save_pretrained("./fine_tuned_model")