harismlnaslm committed on
Commit
7396832
·
1 Parent(s): b98c2d7

fix: handle serverless 404 by falling back to DialoGPT/distilgpt2; default serverless model to DialoGPT

Browse files
Files changed (1) hide show
  1. app.py +4 -2
app.py CHANGED
@@ -355,7 +355,8 @@ class TextilindoAI:
355
  self.endpoint_url = (os.getenv('HF_ENDPOINT_URL') or '').strip()
356
  # Normalize model: block unsupported/gated models; prefer widely available ones
357
  env_model = (os.getenv('DEFAULT_MODEL') or '').strip()
358
- default_supported = 'TinyLlama/TinyLlama-1.1B-Chat-v1.0'
 
359
  if env_model and (
360
  'gpt2' in env_model.lower()
361
  or 'meta-llama/llama-3.2-1b-instruct' in env_model.lower()
@@ -366,7 +367,8 @@ class TextilindoAI:
366
  else:
367
  # Safer default
368
  self.model = env_model or default_supported
369
- self._fallback_model = default_supported
 
370
  self.system_prompt = self.load_system_prompt()
371
  self.data_loader = TrainingDataLoader()
372
 
 
355
  self.endpoint_url = (os.getenv('HF_ENDPOINT_URL') or '').strip()
356
  # Normalize model: block unsupported/gated models; prefer widely available ones
357
  env_model = (os.getenv('DEFAULT_MODEL') or '').strip()
358
+ # Use a widely available serverless default to avoid 404s
359
+ default_supported = 'microsoft/DialoGPT-medium'
360
  if env_model and (
361
  'gpt2' in env_model.lower()
362
  or 'meta-llama/llama-3.2-1b-instruct' in env_model.lower()
 
367
  else:
368
  # Safer default
369
  self.model = env_model or default_supported
370
+ # Fallback model used on serverless 404s
371
+ self._fallback_model = 'distilgpt2'
372
  self.system_prompt = self.load_system_prompt()
373
  self.data_loader = TrainingDataLoader()
374