Spaces:

Fred808
/

808-GPT2

Running

Fred808 committed on Jan 9

Commit

8527515

verified ·

1 Parent(s): e91b142

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -26,7 +26,7 @@ model_id = "google/gemma-2b"  # Use Google Gemma 2B
 tokenizer = AutoTokenizer.from_pretrained(model_id)
 # Load the model without quantization for CPU
-logger.info("Loading model for CPU...")
 model = AutoModelForCausalLM.from_pretrained(
     model_id,
     torch_dtype=torch.float32,  # Use FP32 for CPU compatibility
@@ -37,8 +37,7 @@ model = AutoModelForCausalLM.from_pretrained(
 pipe = pipeline(
     "text-generation",
     model=model,
-    tokenizer=tokenizer,
-    device="cpu"  # Explicitly set device to CPU
 )
 # Define request body schema

 tokenizer = AutoTokenizer.from_pretrained(model_id)
 # Load the model without quantization for CPU
+logger.info("Loading model...")
 model = AutoModelForCausalLM.from_pretrained(
     model_id,
     torch_dtype=torch.float32,  # Use FP32 for CPU compatibility
 pipe = pipeline(
     "text-generation",
     model=model,
+    tokenizer=tokenizer
 )
 # Define request body schema