Skip to content

Commit fc91390

Browse files
committed
Lighten direct CPU AI smoke generation path
1 parent cf38639 commit fc91390

1 file changed

Lines changed: 2 additions & 2 deletions

File tree

run_ai_trading_smoke_direct.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -71,7 +71,7 @@ def _candidate_prompt(candidate):
71 71
def _load_runtime():
72 72
base_model = os.getenv("TRAINED_MODEL_BASE_MODEL", "Qwen/Qwen2.5-7B-Instruct")
73 73
adapter_path = os.getenv("TRAINED_MODEL_ADAPTER_PATH", "_smoke_artifacts/lora_solid_adapter")
74-
cpu_threads = max(1, int(os.getenv("TRAINED_MODEL_CPU_THREADS", "8") or 8))
74+
cpu_threads = max(1, int(os.getenv("TRAINED_MODEL_CPU_THREADS", "4") or 4))
75 75
torch.set_num_threads(cpu_threads)
76 76
tokenizer = AutoTokenizer.from_pretrained(base_model, trust_remote_code=True)
77 77
if tokenizer.pad_token is None:
@@ -102,7 +102,7 @@ def _predict_one(model, tokenizer, candidate):
102 102
with torch.no_grad():
103 103
output = model.generate(
104 104
**encoded,
105-
max_new_tokens=24,
105+
max_new_tokens=16,
106 106
do_sample=False,
107 107
pad_token_id=tokenizer.eos_token_id,
108 108
)

0 commit comments

Comments
 (0)