Fred808 committed on
Commit
df5b28a
·
verified ·
1 Parent(s): 8527515

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -21,8 +21,8 @@ app = FastAPI()
21
  logging.basicConfig(level=logging.INFO)
22
  logger = logging.getLogger(__name__)
23
 
24
- # Load the Google Gemma 2B model and tokenizer
25
- model_id = "google/gemma-2b" # Use Google Gemma 2B
26
  tokenizer = AutoTokenizer.from_pretrained(model_id)
27
 
28
  # Load the model without quantization for CPU
 
21
  logging.basicConfig(level=logging.INFO)
22
  logger = logging.getLogger(__name__)
23
 
24
+ # Load a smaller model (GPT-Neo-125M) and tokenizer
25
+ model_id = "EleutherAI/gpt-neo-125M" # Use GPT-Neo-125M for faster performance
26
  tokenizer = AutoTokenizer.from_pretrained(model_id)
27
 
28
  # Load the model without quantization for CPU