Jeff Myers II committed on
Commit
acf540f
·
1 Parent(s): 5326dc3

Update space

Browse files
Files changed (1) hide show
  1. Gemma_Model.py +7 -7
Gemma_Model.py CHANGED
@@ -8,14 +8,14 @@ class GemmaLLM:
8
 
9
  def __init__(self):
10
  model_id = "google/gemma-3-1b-it"
11
- quantization_config = BitsAndBytesConfig(load_in_8bit=True)
12
 
13
  self.model = Gemma3ForCausalLM.from_pretrained(
14
  model_id,
15
  device_map="cpu",
16
- quantization_config=quantization_config,
17
- low_cpu_mem_usage=True,
18
- torch_dtype=torch.float16,
19
  ).eval()
20
 
21
  self.tokenizer = AutoTokenizer.from_pretrained(model_id)
@@ -73,9 +73,9 @@ class GemmaLLM:
73
 
74
  def get_questions_message(self, summary, num_questions, difficulty) -> dict:
75
  schema = json.dumps([
76
- dict(question=str.__name__, correct_answer=str.__name__, false_answers=[str.__name__, str.__name__, str.__name__]),
77
- dict(question=str.__name__, correct_answer=str.__name__, false_answers=[str.__name__, str.__name__, str.__name__]),
78
- dict(question=str.__name__, correct_answer=str.__name__, false_answers=[str.__name__, str.__name__, str.__name__])], indent=4)
79
 
80
  question = "You are a helpful assistant. Your main task is to generate " + str(num_questions) + " multiple choice questions from an article. Respond in the following JSON structure and schema:\n\njson\n```\n" + schema + "\n```\n\nThere should only be " + str(num_questions) + " questions generated. Each question should only have 3 false answers and 1 correct answer. The correct answer should be the most relevant answer based on the context derived from the article. False answers should not contain the correct answer. False answers should contain false information but also be reasonably plausible for answering the question. ONLY RESPOND WITH RAW JSON!!!"
81
 
 
8
 
9
  def __init__(self):
10
  model_id = "google/gemma-3-1b-it"
11
+ # quantization_config = BitsAndBytesConfig(load_in_8bit=True)
12
 
13
  self.model = Gemma3ForCausalLM.from_pretrained(
14
  model_id,
15
  device_map="cpu",
16
+ # quantization_config=quantization_config,
17
+ # low_cpu_mem_usage=True,
18
+ # torch_dtype=torch.float16,
19
  ).eval()
20
 
21
  self.tokenizer = AutoTokenizer.from_pretrained(model_id)
 
73
 
74
  def get_questions_message(self, summary, num_questions, difficulty) -> dict:
75
  schema = json.dumps([
76
+ dict(question=str.__name__, correct_answer=str.__name__, false_answers=[str.__name__, str.__name__, str.__name__]),
77
+ dict(question=str.__name__, correct_answer=str.__name__, false_answers=[str.__name__, str.__name__, str.__name__]),
78
+ dict(question=str.__name__, correct_answer=str.__name__, false_answers=[str.__name__, str.__name__, str.__name__])], indent=4)
79
 
80
  question = "You are a helpful assistant. Your main task is to generate " + str(num_questions) + " multiple choice questions from an article. Respond in the following JSON structure and schema:\n\njson\n```\n" + schema + "\n```\n\nThere should only be " + str(num_questions) + " questions generated. Each question should only have 3 false answers and 1 correct answer. The correct answer should be the most relevant answer based on the context derived from the article. False answers should not contain the correct answer. False answers should contain false information but also be reasonably plausible for answering the question. ONLY RESPOND WITH RAW JSON!!!"
81