Fix LLM provider selection in podcast handlers
- Remove the hardcoded `preferred_provider="huggingface"` in the podcast handlers.
- Set `preferred_provider=None` so that the `GPT_PROVIDER` env var is respected.
- Change the default WaveSpeed model from `Qwen/Qwen2.5-7B-Instruct` to `openai/gpt-oss-120b:cerebras` (the model the user had access to).
- WaveSpeed will now use the gpt-oss-120b model instead of Qwen unless `WAVESPEED_TEXT_MODEL` is set.
This commit is contained in:
@@ -80,7 +80,7 @@ Return JSON with:
|
|||||||
prompt=prompt,
|
prompt=prompt,
|
||||||
user_id=user_id,
|
user_id=user_id,
|
||||||
json_struct=None,
|
json_struct=None,
|
||||||
preferred_provider="huggingface",
|
preferred_provider=None,
|
||||||
flow_type="premium_tool",
|
flow_type="premium_tool",
|
||||||
)
|
)
|
||||||
|
|
||||||
@@ -279,7 +279,7 @@ Requirements:
|
|||||||
prompt=prompt,
|
prompt=prompt,
|
||||||
user_id=user_id,
|
user_id=user_id,
|
||||||
json_struct=None,
|
json_struct=None,
|
||||||
preferred_provider="huggingface",
|
preferred_provider=None,
|
||||||
flow_type="premium_tool",
|
flow_type="premium_tool",
|
||||||
)
|
)
|
||||||
except HTTPException:
|
except HTTPException:
|
||||||
|
|||||||
@@ -94,7 +94,7 @@ def llm_text_gen(
|
|||||||
primary_provider = provider_list[0]
|
primary_provider = provider_list[0]
|
||||||
if primary_provider in ['wavespeed', 'wave']:
|
if primary_provider in ['wavespeed', 'wave']:
|
||||||
gpt_provider = "wavespeed"
|
gpt_provider = "wavespeed"
|
||||||
model = os.getenv('WAVESPEED_TEXT_MODEL', 'Qwen/Qwen2.5-7B-Instruct')
|
model = os.getenv('WAVESPEED_TEXT_MODEL', 'openai/gpt-oss-120b:cerebras')
|
||||||
elif primary_provider in ['gemini', 'google']:
|
elif primary_provider in ['gemini', 'google']:
|
||||||
gpt_provider = "google"
|
gpt_provider = "google"
|
||||||
model = "gemini-2.0-flash-001"
|
model = "gemini-2.0-flash-001"
|
||||||
@@ -111,7 +111,7 @@ def llm_text_gen(
|
|||||||
elif preferred_provider:
|
elif preferred_provider:
|
||||||
if preferred_provider in ['wavespeed', 'wave']:
|
if preferred_provider in ['wavespeed', 'wave']:
|
||||||
gpt_provider = "wavespeed"
|
gpt_provider = "wavespeed"
|
||||||
model = os.getenv('WAVESPEED_TEXT_MODEL', 'Qwen/Qwen2.5-7B-Instruct')
|
model = os.getenv('WAVESPEED_TEXT_MODEL', 'openai/gpt-oss-120b:cerebras')
|
||||||
elif preferred_provider in ['openai', 'gpt']:
|
elif preferred_provider in ['openai', 'gpt']:
|
||||||
gpt_provider = "openai"
|
gpt_provider = "openai"
|
||||||
model = os.getenv('OPENAI_MODEL', 'gpt-4o-mini')
|
model = os.getenv('OPENAI_MODEL', 'gpt-4o-mini')
|
||||||
@@ -363,7 +363,7 @@ def llm_text_gen(
|
|||||||
from services.llm_providers.wavespeed_provider import wavespeed_text_response
|
from services.llm_providers.wavespeed_provider import wavespeed_text_response
|
||||||
response_text = wavespeed_text_response(
|
response_text = wavespeed_text_response(
|
||||||
prompt=prompt,
|
prompt=prompt,
|
||||||
model=model or "Qwen/Qwen2.5-7B-Instruct",
|
model=model or "openai/gpt-oss-120b:cerebras",
|
||||||
temperature=temperature,
|
temperature=temperature,
|
||||||
max_tokens=max_tokens,
|
max_tokens=max_tokens,
|
||||||
top_p=top_p,
|
top_p=top_p,
|
||||||
|
|||||||
Reference in New Issue
Block a user