aider/aider/models.py at main · Aider-AI/aider

History

1331 lines (1111 loc) · 45.1 KB

Raw

100

101

102

103

104

105

106

107

108

109

110

111

112

113

114

115

116

117

118

119

120

121

122

123

124

125

126

127

128

129

130

131

132

133

134

135

136

137

138

139

140

141

142

143

144

145

146

147

148

149

150

151

152

153

154

155

156

157

158

159

160

161

162

163

164

165

166

167

168

169

170

171

172

173

174

175

176

177

178

179

180

181

182

183

184

185

186

187

188

189

190

191

192

193

194

195

196

197

198

199

200

201

202

203

204

205

206

207

208

209

210

211

212

213

214

215

216

217

218

219

220

221

222

223

224

225

226

227

228

229

230

231

232

233

234

235

236

237

238

239

240

241

242

243

244

245

246

247

248

249

250

251

252

253

254

255

256

257

258

259

260

261

262

263

264

265

266

267

268

269

270

271

272

273

274

275

276

277

278

279

280

281

282

283

284

285

286

287

288

289

290

291

292

293

294

295

296

297

298

299

300

301

302

303

304

305

306

307

308

309

310

311

312

313

314

315

316

317

318

319

320

321

322

323

324

325

326

327

328

329

330

331

332

333

334

335

336

337

338

339

340

341

342

343

344

345

346

347

348

349

350

351

352

353

354

355

356

357

358

359

360

361

362

363

364

365

366

367

368

369

370

371

372

373

374

375

376

377

378

379

380

381

382

383

384

385

386

387

388

389

390

391

392

393

394

395

396

397

398

399

400

401

402

403

404

405

406

407

408

409

410

411

412

413

414

415

416

417

418

419

420

421

422

423

424

425

426

427

428

429

430

431

432

433

434

435

436

437

438

439

440

441

442

443

444

445

446

447

448

449

450

451

452

453

454

455

456

457

458

459

460

461

462

463

464

465

466

467

468

469

470

471

472

473

474

475

476

477

478

479

480

481

482

483

484

485

486

487

488

489

490

491

492

493

494

495

496

497

498

499

500

501

502

503

504

505

506

507

508

509

510

511

512

513

514

515

516

517

518

519

520

521

522

523

524

525

526

527

528

529

530

531

532

533

534

535

536

537

538

539

540

541

542

543

544

545

546

547

548

549

550

551

552

553

554

555

556

557

558

559

560

561

562

563

564

565

566

567

568

569

570

571

572

573

574

575

576

577

578

579

580

581

582

583

584

585

586

587

588

589

590

591

592

593

594

595

596

597

598

599

600

601

602

603

604

605

606

607

608

609

610

611

612

613

614

615

616

617

618

619

620

621

622

623

624

625

626

627

628

629

630

631

632

633

634

635

636

637

638

639

640

641

642

643

644

645

646

647

648

649

650

651

652

653

654

655

656

657

658

659

660

661

662

663

664

665

666

667

668

669

670

671

672

673

674

675

676

677

678

679

680

681

682

683

684

685

686

687

688

689

690

691

692

693

694

695

696

697

698

699

700

701

702

703

704

705

706

707

708

709

710

711

712

713

714

715

716

717

718

719

720

721

722

723

724

725

726

727

728

729

730

731

732

733

734

735

736

737

738

739

740

741

742

743

744

745

746

747

748

749

750

751

752

753

754

755

756

757

758

759

760

761

762

763

764

765

766

767

768

769

770

771

772

773

774

775

776

777

778

779

780

781

782

783

784

785

786

787

788

789

790

791

792

793

794

795

796

797

798

799

800

801

802

803

804

805

806

807

808

809

810

811

812

813

814

815

816

817

818

819

820

821

822

823

824

825

826

827

828

829

830

831

832

833

834

835

836

837

838

839

840

841

842

843

844

845

846

847

848

849

850

851

852

853

854

855

856

857

858

859

860

861

862

863

864

865

866

867

868

869

870

871

872

873

874

875

876

877

878

879

880

881

882

883

884

885

886

887

888

889

890

891

892

893

894

895

896

897

898

899

900

901

902

903

904

905

906

907

908

909

910

911

912

913

914

915

916

917

918

919

920

921

922

923

924

925

926

927

928

929

930

931

932

933

934

935

936

937

938

939

940

941

942

943

944

945

946

947

948

949

950

951

952

953

954

955

956

957

958

959

960

961

962

963

964

965

966

967

968

969

970

971

972

973

974

975

976

977

978

979

980

981

982

983

984

985

986

987

988

989

990

991

992

993

994

995

996

997

998

999

1000

import difflib

import hashlib

import importlib.resources

import json

import math

import os

import platform

import sys

import time

from dataclasses import dataclass, fields

from datetime import datetime

from pathlib import Path

from typing import Optional, Union

import json5

import yaml

from PIL import Image

from aider import __version__

from aider.dump import dump # noqa: F401

from aider.llm import litellm

from aider.openrouter import OpenRouterModelManager

from aider.sendchat import ensure_alternating_roles, sanity_check_messages

from aider.utils import check_pip_install_extra

# Retry budget for failed requests.
# NOTE(review): presumably seconds; it is not used in the visible part of this file - confirm.
RETRY_TIMEOUT = 60

# Module-level request timeout (lower-case because callers may rebind it).
# NOTE(review): presumably seconds - confirm against the call sites.
request_timeout = 600

# Model name used when the caller does not pick one.
# NOTE(review): not referenced in the visible part of this file - confirm usage.
DEFAULT_MODEL_NAME = "gpt-4o"

# Comma-separated list of Anthropic beta feature flags.
# NOTE(review): presumably sent as the `anthropic-beta` HTTP header - confirm.
ANTHROPIC_BETA_HEADER = "prompt-caching-2024-07-31,pdfs-2024-09-25"

# Bare model names (no "provider/" prefix) that are authenticated with
# OPENAI_API_KEY.  Written as one name per line and split into a list below.
OPENAI_MODELS = """
o1-preview
o1-mini
o3-mini
gpt-4
gpt-4o
gpt-4o-2024-05-13
gpt-4-turbo-preview
gpt-4-0314
gpt-4-0613
gpt-4-32k
gpt-4-32k-0314
gpt-4-32k-0613
gpt-4-turbo
gpt-4-turbo-2024-04-09
gpt-4-1106-preview
gpt-4-0125-preview
gpt-4-vision-preview
gpt-4-1106-vision-preview
gpt-4o-mini
gpt-4o-mini-2024-07-18
gpt-5.5
gpt-5.5-pro
gpt-5.5-chat-latest
gpt-3.5-turbo
gpt-3.5-turbo-0301
gpt-3.5-turbo-0613
gpt-3.5-turbo-1106
gpt-3.5-turbo-0125
gpt-3.5-turbo-16k
gpt-3.5-turbo-16k-0613
"""

# Turn the text block into a list of names, dropping blank lines.
OPENAI_MODELS = [
    name for name in (raw.strip() for raw in OPENAI_MODELS.splitlines()) if name
]

# Bare model names (no "provider/" prefix) that are authenticated with
# ANTHROPIC_API_KEY.  Written as one name per line and split into a list below.
ANTHROPIC_MODELS = """
claude-2
claude-2.1
claude-3-haiku-20240307
claude-3-5-haiku-20241022
claude-3-opus-20240229
claude-3-sonnet-20240229
claude-3-5-sonnet-20240620
claude-3-5-sonnet-20241022
claude-sonnet-4-20250514
claude-opus-4-20250514
claude-opus-4-6
claude-opus-4-7
claude-sonnet-4-5
claude-sonnet-4-5-20250929
claude-sonnet-4-6
claude-haiku-4-5
claude-haiku-4-5-20251001
"""

# Turn the text block into a list of names, dropping blank lines.
ANTHROPIC_MODELS = [
    name for name in (raw.strip() for raw in ANTHROPIC_MODELS.splitlines()) if name
]

# Mapping of model aliases to their canonical names.
# Model.__init__ looks the requested name up here first and falls back to the
# name as given when there is no alias for it.
MODEL_ALIASES = {
    # Claude models
    "sonnet": "claude-sonnet-4-6",
    "haiku": "claude-haiku-4-5",
    "opus": "claude-opus-4-7",
    # GPT models
    "4": "gpt-4-0613",
    "4o": "gpt-4o",
    "4-turbo": "gpt-4-1106-preview",
    "35turbo": "gpt-3.5-turbo",
    "35-turbo": "gpt-3.5-turbo",
    "3": "gpt-3.5-turbo",
    # Other models
    "deepseek": "deepseek/deepseek-chat",
    "flash": "gemini/gemini-flash-latest",
    "flash-lite": "gemini/gemini-2.5-flash-lite",
    "quasar": "openrouter/openrouter/quasar-alpha",
    "r1": "deepseek/deepseek-reasoner",
    "gemini-2.5-pro": "gemini/gemini-2.5-pro",
    "gemini-3-pro-preview": "gemini/gemini-3-pro-preview",
    "gemini": "gemini/gemini-3-pro-preview",
    "gemini-exp": "gemini/gemini-2.5-pro-exp-03-25",
    "grok3": "xai/grok-3-beta",
    "optimus": "openrouter/openrouter/optimus-alpha",
}

# Model metadata loaded from resources and user's files.

@dataclass
class ModelSettings:
    """Per-model configuration record.

    Instances are built from the entries of ``model-settings.yml`` and their
    fields are copied onto ``Model`` objects by ``Model._copy_fields``.
    """

    # Model class needs to have each of these as well

    # Name that Model.configure_model_settings compares against the requested model.
    name: str
    edit_format: str = "whole"
    # Name used to build the secondary "weak" Model (see Model.get_weak_model).
    weak_model_name: Optional[str] = None
    use_repo_map: bool = False
    send_undo_reply: bool = False
    lazy: bool = False
    overeager: bool = False
    reminder: str = "user"
    examples_as_sys_msg: bool = False
    # Extra request parameters; merged with the "aider/extra_params" entry and
    # updated by the thinking/reasoning setters on Model.
    extra_params: Optional[dict] = None
    cache_control: bool = False
    caches_by_default: bool = False
    use_system_prompt: bool = True
    # False: no temperature is sent.  True: temperature defaults to 0.
    # A float: that value is the default temperature (see Model.send_completion).
    use_temperature: Union[bool, float] = True
    streaming: bool = True
    # Name used to build the secondary editor Model (see Model.get_editor_model).
    editor_model_name: Optional[str] = None
    editor_edit_format: Optional[str] = None
    reasoning_tag: Optional[str] = None
    remove_reasoning: Optional[str] = None  # Deprecated alias for reasoning_tag
    system_prompt_prefix: Optional[str] = None
    # Names of optional settings the model accepts; the code in this file uses
    # "thinking_tokens" and "reasoning_effort".
    accepts_settings: Optional[list] = None

# Load model settings from package resource.
# Each entry of the YAML list is expanded as keyword arguments to
# ModelSettings, so a key that is not a ModelSettings field raises TypeError
# at import time.
MODEL_SETTINGS = []
with importlib.resources.open_text("aider.resources", "model-settings.yml") as f:
    model_settings_list = yaml.safe_load(f)
    for model_settings_dict in model_settings_list:
        MODEL_SETTINGS.append(ModelSettings(**model_settings_dict))

class ModelInfoManager:
    """Look up model metadata (context window, prices) from several sources.

    Sources, in the order they are consulted by ``get_model_info``:
    locally registered metadata, an on-disk cached copy of litellm's
    ``model_prices_and_context_window.json``, litellm itself, and for
    ``openrouter/`` models the OpenRouter model database or a scrape of the
    model's web page.
    """

    MODEL_INFO_URL = (
        "https://raw.githubusercontent.com/BerriAI/litellm/main/"
        "model_prices_and_context_window.json"
    )
    CACHE_TTL = 60 * 60 * 24  # 24 hours

    def __init__(self):
        self.cache_dir = Path.home() / ".aider" / "caches"
        self.cache_file = self.cache_dir / "model_prices_and_context_window.json"
        self.content = None
        self.local_model_metadata = {}
        self.verify_ssl = True
        self._cache_loaded = False

        # Manager for the cached OpenRouter model database
        self.openrouter_manager = OpenRouterModelManager()

    def set_verify_ssl(self, verify_ssl):
        """Set SSL verification for this manager and its OpenRouter manager."""
        self.verify_ssl = verify_ssl
        if hasattr(self, "openrouter_manager"):
            self.openrouter_manager.set_verify_ssl(verify_ssl)

    def _load_cache(self):
        """Load the on-disk cache into ``self.content`` once per instance.

        The file is only used when it is younger than ``CACHE_TTL``.  File
        system errors are ignored and a corrupt file is treated as missing.
        """
        if self._cache_loaded:
            return

        try:
            self.cache_dir.mkdir(parents=True, exist_ok=True)
            if self.cache_file.exists():
                cache_age = time.time() - self.cache_file.stat().st_mtime
                if cache_age < self.CACHE_TTL:
                    try:
                        self.content = json.loads(self.cache_file.read_text())
                    except json.JSONDecodeError:
                        # If the cache file is corrupted, treat it as missing
                        self.content = None
        except OSError:
            pass

        # Mark as loaded even on failure so the disk is not probed again.
        self._cache_loaded = True

    def _update_cache(self):
        """Download the metadata JSON and store it in memory and on disk.

        Any failure is printed, and an empty JSON object is written to the
        cache file in its place.
        """
        try:
            import requests

            # Respect the --no-verify-ssl switch
            response = requests.get(self.MODEL_INFO_URL, timeout=5, verify=self.verify_ssl)
            if response.status_code == 200:
                self.content = response.json()
                try:
                    self.cache_file.write_text(json.dumps(self.content, indent=4))
                except OSError:
                    pass
        except Exception as ex:
            print(str(ex))
            try:
                # Save empty dict to cache file on failure
                self.cache_file.write_text("{}")
            except OSError:
                pass

    def get_model_from_cached_json_db(self, model):
        """Return metadata for ``model`` from local or cached data.

        Locally registered metadata wins.  Otherwise the cached JSON is
        searched by the full name, and for a two-part ``provider/name`` also
        by ``name`` when the entry's ``litellm_provider`` equals ``provider``.
        Returns an empty dict when nothing matches.
        """
        data = self.local_model_metadata.get(model)
        if data:
            return data

        # Ensure cache is loaded before checking content
        self._load_cache()

        if not self.content:
            self._update_cache()

        if not self.content:
            return dict()

        info = self.content.get(model, dict())
        if info:
            return info

        pieces = model.split("/")
        if len(pieces) == 2:
            info = self.content.get(pieces[1])
            if info and info.get("litellm_provider") == pieces[0]:
                return info

        return dict()

    def get_model_info(self, model):
        """Return the best available metadata dict for ``model``.

        litellm is asked when it is already imported (``_lazy_module`` is set)
        or when the cache has nothing; a truthy litellm answer wins over the
        cached one.  ``openrouter/`` models with no cached data then fall back
        to the OpenRouter sources.
        """
        cached_info = self.get_model_from_cached_json_db(model)

        litellm_info = None
        if litellm._lazy_module or not cached_info:
            try:
                litellm_info = litellm.get_model_info(model)
            except Exception as ex:
                # Errors that mention the metadata file itself are not shown.
                if "model_prices_and_context_window.json" not in str(ex):
                    print(str(ex))

        if litellm_info:
            return litellm_info

        if not cached_info and model.startswith("openrouter/"):
            # First try using the locally cached OpenRouter model database
            openrouter_info = self.openrouter_manager.get_model_info(model)
            if openrouter_info:
                return openrouter_info

            # Fallback to legacy web-scraping if the API cache does not contain the model
            openrouter_info = self.fetch_openrouter_model_info(model)
            if openrouter_info:
                return openrouter_info

        return cached_info

    def fetch_openrouter_model_info(self, model):
        """
        Fetch model info by scraping the openrouter model page.
        Expected URL: https://openrouter.ai/<model_route>
        Example: openrouter/qwen/qwen-2.5-72b-instruct:free
        Returns a dict with keys: max_tokens, max_input_tokens, max_output_tokens,
        input_cost_per_token, output_cost_per_token.

        Returns an empty dict when the page cannot be fetched, reports the
        model as unavailable, or lacks any of the three scraped values.
        """
        url_part = model[len("openrouter/") :]
        url = "https://openrouter.ai/" + url_part
        try:
            import requests

            response = requests.get(url, timeout=5, verify=self.verify_ssl)
            if response.status_code != 200:
                return {}
            html = response.text
            import re

            if re.search(
                rf"The model\s*.*{re.escape(url_part)}.* is not available", html, re.IGNORECASE
            ):
                print(f"\033[91mError: Model '{url_part}' is not available\033[0m")
                return {}

            # Strip the tags so the patterns below match the visible text.
            text = re.sub(r"<[^>]+>", " ", html)
            context_match = re.search(r"([\d,]+)\s*context", text)
            if context_match:
                context_str = context_match.group(1).replace(",", "")
                context_size = int(context_str)
            else:
                context_size = None

            input_cost_match = re.search(r"\$\s*([\d.]+)\s*/M input tokens", text, re.IGNORECASE)
            output_cost_match = re.search(r"\$\s*([\d.]+)\s*/M output tokens", text, re.IGNORECASE)
            # Page prices are per million tokens; convert to per-token.
            input_cost = float(input_cost_match.group(1)) / 1000000 if input_cost_match else None
            output_cost = float(output_cost_match.group(1)) / 1000000 if output_cost_match else None
            if context_size is None or input_cost is None or output_cost is None:
                return {}

            # The page gives a single context figure; it is used for all three limits.
            params = {
                "max_input_tokens": context_size,
                "max_tokens": context_size,
                "max_output_tokens": context_size,
                "input_cost_per_token": input_cost,
                "output_cost_per_token": output_cost,
            }
            return params
        except Exception as e:
            print("Error fetching openrouter info:", str(e))
            return {}

# Module-level ModelInfoManager instance; Model.get_model_info delegates to it.
model_info_manager = ModelInfoManager()

class Model(ModelSettings):

def __init__(
    self, model, weak_model=None, editor_model=None, editor_edit_format=None, verbose=False
):
    """Resolve ``model`` and configure this instance for it.

    Args:
        model: Model name or an alias from ``MODEL_ALIASES``.
        weak_model: Name of the weak model to use; ``None`` keeps the name
            from the model's settings, ``False`` skips weak-model setup.
        editor_model: Name of the editor model to use; ``None`` keeps the
            name from the model's settings, ``False`` skips editor setup.
        editor_edit_format: Edit format override for the editor model.
        verbose: Stored on the instance as ``self.verbose``.
    """
    # Map any alias to its canonical name
    model = MODEL_ALIASES.get(model, model)

    self.name = model
    self.verbose = verbose

    self.max_chat_history_tokens = 1024
    self.weak_model = None
    self.editor_model = None

    # Find the extra settings
    self.extra_model_settings = next(
        (ms for ms in MODEL_SETTINGS if ms.name == "aider/extra_params"), None
    )

    self.info = self.get_model_info(model)

    # Are all needed keys/params available?
    res = self.validate_environment()
    self.missing_keys = res.get("missing_keys")
    self.keys_in_environment = res.get("keys_in_environment")

    max_input_tokens = self.info.get("max_input_tokens") or 0
    # Calculate max_chat_history_tokens as 1/16th of max_input_tokens,
    # with minimum 1k and maximum 8k
    self.max_chat_history_tokens = min(max(max_input_tokens / 16, 1024), 8192)

    self.configure_model_settings(model)

    # ``False`` (not merely falsy) is the explicit "no secondary model" marker.
    if weak_model is False:
        self.weak_model_name = None
    else:
        self.get_weak_model(weak_model)

    if editor_model is False:
        self.editor_model_name = None
    else:
        self.get_editor_model(editor_model, editor_edit_format)

def get_model_info(self, model):
    """Return the metadata dict for ``model`` from the shared info manager."""
    info = model_info_manager.get_model_info(model)
    return info

def _copy_fields(self, source):
    """Copy every ModelSettings field from ``source`` onto ``self``.

    Values are deep-copied.  ``source`` is normally a shared entry of
    ``MODEL_SETTINGS``, and this class later edits ``extra_params`` and
    ``accepts_settings`` in place; copying by reference would leak those
    edits into the shared entry and into every Model built from it afterwards.

    Args:
        source: A ModelSettings instance to copy from.
    """
    import copy

    for field in fields(ModelSettings):
        setattr(self, field.name, copy.deepcopy(getattr(source, field.name)))

    # Handle backward compatibility: if remove_reasoning is set but reasoning_tag isn't,
    # use remove_reasoning's value for reasoning_tag
    if self.reasoning_tag is None and self.remove_reasoning is not None:
        self.reasoning_tag = self.remove_reasoning

def configure_model_settings(self, model):
    """Apply settings for ``model``: exact match, generic rules, then overrides.

    Steps, in order:
      1. Copy the MODEL_SETTINGS entry whose name equals ``model`` exactly.
      2. If there was none, apply the name-based generic rules to the
         lower-cased name.
      3. Merge the ``aider/extra_params`` override entry into ``extra_params``.
      4. For ``openrouter/`` models, make sure the reasoning settings are
         listed in ``accepts_settings``.

    Args:
        model: The canonical model name.
    """
    # Look for exact model match
    exact_match = False
    for ms in MODEL_SETTINGS:
        # direct match, or match "provider/<model>"
        if model == ms.name:
            self._copy_fields(ms)
            exact_match = True
            break  # Continue to apply overrides

    # Initialize accepts_settings if it's None
    if self.accepts_settings is None:
        self.accepts_settings = []

    model = model.lower()

    # If no exact match, try generic settings
    if not exact_match:
        self.apply_generic_model_settings(model)

    # Apply override settings last if they exist
    if (
        self.extra_model_settings
        and self.extra_model_settings.extra_params
        and self.extra_model_settings.name == "aider/extra_params"
    ):
        # Initialize extra_params if it doesn't exist
        if not self.extra_params:
            self.extra_params = {}

        # Merge the override dict; nested dicts are merged one level deep
        for key, value in self.extra_model_settings.extra_params.items():
            if isinstance(value, dict) and isinstance(self.extra_params.get(key), dict):
                # For nested dicts, the override's keys win
                self.extra_params[key] = {**self.extra_params[key], **value}
            else:
                # For non-dict values, simply update
                self.extra_params[key] = value

    # Ensure OpenRouter models accept thinking_tokens and reasoning_effort
    if self.name.startswith("openrouter/"):
        if self.accepts_settings is None:
            self.accepts_settings = []
        # thinking_tokens is not added for names containing claude-opus-4.7 / 4-7.
        if (
            "thinking_tokens" not in self.accepts_settings
            and "claude-opus-4.7" not in self.name
            and "claude-opus-4-7" not in self.name
        ):
            self.accepts_settings.append("thinking_tokens")
        if "reasoning_effort" not in self.accepts_settings:
            self.accepts_settings.append("reasoning_effort")

def apply_generic_model_settings(self, model):
    """Set defaults from substrings of the model name.

    Used when no MODEL_SETTINGS entry matches exactly.  The rules are tried
    top to bottom and the first match wins, so more specific names must stay
    above the broader ones they overlap with (e.g. "gpt-4.1-mini" before
    "gpt-4.1", "/o1-mini" before "/o1").

    Args:
        model: The lower-cased model name.
    """
    if "/o3-mini" in model:
        self.edit_format = "diff"
        self.use_repo_map = True
        self.use_temperature = False
        self.system_prompt_prefix = "Formatting re-enabled. "
        if "reasoning_effort" not in self.accepts_settings:
            self.accepts_settings.append("reasoning_effort")
        return  # <--

    if "gpt-4.1-mini" in model:
        self.edit_format = "diff"
        self.use_repo_map = True
        self.reminder = "sys"
        self.examples_as_sys_msg = False
        return  # <--

    if "gpt-4.1" in model:
        self.edit_format = "diff"
        self.use_repo_map = True
        self.reminder = "sys"
        self.examples_as_sys_msg = False
        return  # <--

    last_segment = model.split("/")[-1]
    if last_segment in ("gpt-5", "gpt-5-2025-08-07"):
        self.use_temperature = False
        self.edit_format = "diff"
        if "reasoning_effort" not in self.accepts_settings:
            self.accepts_settings.append("reasoning_effort")
        return  # <--

    if "/o1-mini" in model:
        self.use_repo_map = True
        self.use_temperature = False
        self.use_system_prompt = False
        return  # <--

    if "/o1-preview" in model:
        self.edit_format = "diff"
        self.use_repo_map = True
        self.use_temperature = False
        self.use_system_prompt = False
        return  # <--

    if "/o1" in model:
        self.edit_format = "diff"
        self.use_repo_map = True
        self.use_temperature = False
        self.streaming = False
        self.system_prompt_prefix = "Formatting re-enabled. "
        if "reasoning_effort" not in self.accepts_settings:
            self.accepts_settings.append("reasoning_effort")
        return  # <--

    if "deepseek" in model and "v3" in model:
        self.edit_format = "diff"
        self.use_repo_map = True
        self.reminder = "sys"
        self.examples_as_sys_msg = True
        return  # <--

    if "deepseek" in model and ("r1" in model or "reasoning" in model):
        self.edit_format = "diff"
        self.use_repo_map = True
        self.examples_as_sys_msg = True
        self.use_temperature = False
        self.reasoning_tag = "think"
        return  # <--

    if ("llama3" in model or "llama-3" in model) and "70b" in model:
        self.edit_format = "diff"
        self.use_repo_map = True
        self.send_undo_reply = True
        self.examples_as_sys_msg = True
        return  # <--

    if "gpt-4-turbo" in model or ("gpt-4-" in model and "-preview" in model):
        self.edit_format = "udiff"
        self.use_repo_map = True
        self.send_undo_reply = True
        return  # <--

    if "gpt-4" in model or "claude-3-opus" in model:
        self.edit_format = "diff"
        self.use_repo_map = True
        self.send_undo_reply = True
        return  # <--

    # NOTE: the '"gpt-4" in model' half can never be true here, because the
    # rule above already returned for every name containing "gpt-4".
    if "gpt-3.5" in model or "gpt-4" in model:
        self.reminder = "sys"
        return  # <--

    if "sonnet-4-" in model or "opus-4-" in model or "haiku-4-" in model:
        self.edit_format = "diff"
        self.use_repo_map = True
        self.examples_as_sys_msg = False
        if "opus-4-" in model:
            self.use_temperature = False
        # NOTE(review): nesting reconstructed from a copy that had lost its
        # indentation; this check is assumed to apply to all three families,
        # not only to opus - confirm against the upstream file.
        if (
            "thinking_tokens" not in self.accepts_settings
            and "4.7" not in model
            and "4-7" not in model
        ):
            self.accepts_settings.append("thinking_tokens")
        return  # <--

    if "3-7-sonnet" in model:
        self.edit_format = "diff"
        self.use_repo_map = True
        self.examples_as_sys_msg = True
        self.reminder = "user"
        if "thinking_tokens" not in self.accepts_settings:
            self.accepts_settings.append("thinking_tokens")
        return  # <--

    if "3.5-sonnet" in model or "3-5-sonnet" in model:
        self.edit_format = "diff"
        self.use_repo_map = True
        self.examples_as_sys_msg = True
        self.reminder = "user"
        return  # <--

    # NOTE: names containing "/o1-" were already handled by the "/o1" rule
    # above, so only the startswith("o1-") half can match here.
    if model.startswith("o1-") or "/o1-" in model:
        self.use_system_prompt = False
        self.use_temperature = False
        return  # <--

    if (
        "qwen" in model
        and "coder" in model
        and ("2.5" in model or "2-5" in model)
        and "32b" in model
    ):
        self.edit_format = "diff"
        self.editor_edit_format = "editor-diff"
        self.use_repo_map = True
        return  # <--

    if "qwq" in model and "32b" in model and "preview" not in model:
        self.edit_format = "diff"
        self.editor_edit_format = "editor-diff"
        self.use_repo_map = True
        self.reasoning_tag = "think"
        self.examples_as_sys_msg = True
        self.use_temperature = 0.6
        self.extra_params = dict(top_p=0.95)
        return  # <--

    if "qwen3" in model and "235b" in model:
        self.edit_format = "diff"
        self.use_repo_map = True
        self.system_prompt_prefix = "/no_think"
        self.use_temperature = 0.7
        self.extra_params = {"top_p": 0.8, "top_k": 20, "min_p": 0.0}
        return  # <--

    # use the defaults
    if self.edit_format == "diff":
        self.use_repo_map = True
        return  # <--

def __str__(self):

return self.name

def get_weak_model(self, provided_weak_model_name):
    """Set ``self.weak_model`` and return it.

    The model itself serves as its own weak model when no weak model name is
    configured or when that name is the model's own name.  Every path returns
    the chosen model, matching ``get_editor_model``.

    Args:
        provided_weak_model_name: Name that overrides the configured
            ``weak_model_name`` when truthy.

    Returns:
        The Model stored in ``self.weak_model``.
    """
    # If weak_model_name is provided, override the model settings
    if provided_weak_model_name:
        self.weak_model_name = provided_weak_model_name

    if not self.weak_model_name or self.weak_model_name == self.name:
        self.weak_model = self
        return self.weak_model

    # weak_model=False stops the new instance from building its own weak model.
    self.weak_model = Model(
        self.weak_model_name,
        weak_model=False,
    )
    return self.weak_model

def commit_message_models(self):
    """Return the weak model followed by this model, as a two-item list."""
    candidates = [self.weak_model]
    candidates.append(self)
    return candidates

def get_editor_model(self, provided_editor_model_name, editor_edit_format):
    """Set ``self.editor_model`` and ``self.editor_edit_format``; return the model.

    Truthy arguments override the configured editor model name and edit
    format.  The model is its own editor when no editor name is configured or
    the name is its own.  When no editor edit format is set, the editor
    model's edit format is used, prefixed with "editor-" for the "diff",
    "whole" and "diff-fenced" formats.
    """
    # If editor_model_name is provided, override the model settings
    if provided_editor_model_name:
        self.editor_model_name = provided_editor_model_name
    if editor_edit_format:
        self.editor_edit_format = editor_edit_format

    needs_separate_model = bool(self.editor_model_name) and self.editor_model_name != self.name
    if needs_separate_model:
        # editor_model=False stops the new instance from building its own editor.
        self.editor_model = Model(
            self.editor_model_name,
            editor_model=False,
        )
    else:
        self.editor_model = self

    if not self.editor_edit_format:
        inherited = self.editor_model.edit_format
        if inherited in ("diff", "whole", "diff-fenced"):
            inherited = "editor-" + inherited
        self.editor_edit_format = inherited

    return self.editor_model

def tokenizer(self, text):
    """Encode ``text`` with litellm's encoder for this model and return the result."""
    encoded = litellm.encode(model=self.name, text=text)
    return encoded

def token_count(self, messages):
    """Count the tokens in ``messages``.

    A list is counted by litellm's message token counter.  Anything else is
    tokenized as text: a ``str`` as-is, other values after ``json.dumps``.
    A counting error is printed and 0 is returned.  Returns ``None`` when
    ``self.tokenizer`` is falsy.
    """
    if type(messages) is list:
        try:
            return litellm.token_counter(model=self.name, messages=messages)
        except Exception as err:
            print(f"Unable to count tokens: {err}")
            return 0

    if not self.tokenizer:
        return

    text = messages if type(messages) is str else json.dumps(messages)

    try:
        tokens = self.tokenizer(text)
        return len(tokens)
    except Exception as err:
        print(f"Unable to count tokens: {err}")
        return 0

def token_count_for_image(self, fname):
    """
    Calculate the token cost for an image assuming high detail.

    The image is first shrunk to fit within 2048x2048 if needed, then scaled
    so its shortest side is 768 pixels, then covered with 512x512 tiles.

    :param fname: The filename of the image.
    :return: The token cost for the image: 170 per tile plus a fixed 85.
    """
    width, height = self.get_image_size(fname)

    # Fit within 2048x2048 when either side is larger than that
    longest = max(width, height)
    if longest > 2048:
        shrink = 2048 / longest
        width, height = int(width * shrink), int(height * shrink)

    # Scale so that the shortest side is 768 pixels long
    to_768 = 768 / min(width, height)
    width, height = int(width * to_768), int(height * to_768)

    # Number of 512x512 tiles needed to cover the image
    tile_count = math.ceil(width / 512) * math.ceil(height / 512)

    # Each tile costs 170 tokens, and there's an additional fixed cost of 85 tokens
    return tile_count * 170 + 85

def get_image_size(self, fname):
    """
    Retrieve the size of an image.

    :param fname: The filename of the image.
    :return: A tuple (width, height) representing the image size in pixels.
    """
    with Image.open(fname) as picture:
        dimensions = picture.size
    return dimensions

def fast_validate_environment(self):
    """Fast path for common models. Avoids forcing litellm import.

    Picks the API key variable from the bare model name or from the provider
    prefix.  Returns a result dict when that variable is set in the
    environment, otherwise ``None``.
    """
    model = self.name

    # The provider is the text before the first "/", if there is one.
    prefix, slash, _rest = model.partition("/")
    provider = prefix if slash else None

    provider_keys = {
        "openrouter": "OPENROUTER_API_KEY",
        "openai": "OPENAI_API_KEY",
        "deepseek": "DEEPSEEK_API_KEY",
        "gemini": "GEMINI_API_KEY",
        "anthropic": "ANTHROPIC_API_KEY",
        "groq": "GROQ_API_KEY",
        "fireworks_ai": "FIREWORKS_API_KEY",
    }

    if model in OPENAI_MODELS:
        var = "OPENAI_API_KEY"
    elif model in ANTHROPIC_MODELS:
        var = "ANTHROPIC_API_KEY"
    else:
        var = provider_keys.get(provider)

    if var and os.environ.get(var):
        return {"keys_in_environment": [var], "missing_keys": []}

def validate_environment(self):
    """Report which API keys the model needs and whether they are present.

    Tries the fast path first, then asks litellm.  AWS key pairs reported
    missing are dropped for Bedrock-style models when ``AWS_PROFILE`` is set.
    If litellm reports neither present nor missing keys, the provider from
    the model metadata selects a known key to check.

    Returns:
        A dict with ``keys_in_environment`` and ``missing_keys`` entries.
    """
    res = self.fast_validate_environment()
    if res:
        return res

    # https://github.com/BerriAI/litellm/issues/3190

    model = self.name
    res = litellm.validate_environment(model)

    # If missing AWS credential keys but AWS_PROFILE is set, consider AWS credentials valid
    if res["missing_keys"] and any(
        key in ["AWS_ACCESS_KEY_ID", "AWS_SECRET_ACCESS_KEY"] for key in res["missing_keys"]
    ):
        if model.startswith("bedrock/") or model.startswith("us.anthropic."):
            if os.environ.get("AWS_PROFILE"):
                res["missing_keys"] = [
                    k
                    for k in res["missing_keys"]
                    if k not in ["AWS_ACCESS_KEY_ID", "AWS_SECRET_ACCESS_KEY"]
                ]
                if not res["missing_keys"]:
                    res["keys_in_environment"] = True

    if res["keys_in_environment"]:
        return res
    if res["missing_keys"]:
        return res

    provider = self.info.get("litellm_provider", "").lower()
    if provider == "cohere_chat":
        return validate_variables(["COHERE_API_KEY"])
    if provider == "gemini":
        return validate_variables(["GEMINI_API_KEY"])
    if provider == "groq":
        return validate_variables(["GROQ_API_KEY"])

    return res

def get_repo_map_tokens(self):
    """Return the repo-map token budget for this model.

    The budget is one eighth of ``max_input_tokens`` from the model info,
    clamped to the range 1024..4096, or 1024 when that value is unknown.
    """
    max_inp_tokens = self.info.get("max_input_tokens")
    if not max_inp_tokens:
        return 1024

    budget = min(max_inp_tokens / 8, 4096)
    return max(budget, 1024)

def set_reasoning_effort(self, effort):
    """Set the reasoning effort parameter for models that support it

    The value is stored under ``extra_params["extra_body"]``: as
    ``reasoning = {"effort": ...}`` for ``openrouter/`` models and as
    ``reasoning_effort`` for all others.  ``None`` leaves everything untouched.
    """
    if effort is None:
        return

    if not self.extra_params:
        self.extra_params = {}
    extra_body = self.extra_params.setdefault("extra_body", {})

    if self.name.startswith("openrouter/"):
        extra_body["reasoning"] = {"effort": effort}
    else:
        extra_body["reasoning_effort"] = effort

def parse_token_value(self, value):
    """
    Parse a token value string into an integer.
    Accepts formats: 8096, "8k", "10.5k", "0.5M", "10K", etc.

    A trailing "K" means x1024 and a trailing "M" means x1024*1024; the
    suffix is case-insensitive.

    Args:
        value: String or int token value

    Returns:
        Integer token value
    """
    if isinstance(value, int):
        return value

    if not isinstance(value, str):
        return int(value)  # Try to convert to int

    text = value.strip().upper()
    suffix_scale = {"K": 1024, "M": 1024 * 1024}
    scale = suffix_scale.get(text[-1:], 1)
    if scale != 1:
        text = text[:-1]

    # Convert to float first to handle decimal values like "10.5k"
    return int(float(text) * scale)

def set_thinking_tokens(self, value):
    """
    Set the thinking token budget for models that support it.
    Accepts formats: 8096, "8k", "10.5k", "0.5M", "10K", etc.
    Pass "0" to disable thinking tokens.

    Any non-None value also sets ``use_temperature`` to False.
    """
    if value is None:
        return

    num_tokens = self.parse_token_value(value)
    self.use_temperature = False
    if not self.extra_params:
        self.extra_params = {}

    enable = num_tokens > 0

    # OpenRouter models use 'reasoning' instead of 'thinking'
    if self.name.startswith("openrouter/"):
        extra_body = self.extra_params.setdefault("extra_body", {})
        if enable:
            extra_body["reasoning"] = {"max_tokens": num_tokens}
        else:
            extra_body.pop("reasoning", None)
        return

    if enable:
        self.extra_params["thinking"] = {"type": "enabled", "budget_tokens": num_tokens}
    else:
        self.extra_params.pop("thinking", None)

def get_raw_thinking_tokens(self):
    """Return the configured thinking token budget, or ``None`` if unset.

    For ``openrouter/`` models only
    ``extra_params["extra_body"]["reasoning"]["max_tokens"]`` is consulted.
    For all other models only ``extra_params["thinking"]["budget_tokens"]`` is.
    """
    budget = None

    if self.extra_params:
        # Check for OpenRouter reasoning format
        if self.name.startswith("openrouter/"):
            if (
                "extra_body" in self.extra_params
                and "reasoning" in self.extra_params["extra_body"]
                and "max_tokens" in self.extra_params["extra_body"]["reasoning"]
            ):
                budget = self.extra_params["extra_body"]["reasoning"]["max_tokens"]
        # Check for standard thinking format
        elif (
            "thinking" in self.extra_params and "budget_tokens" in self.extra_params["thinking"]
        ):
            budget = self.extra_params["thinking"]["budget_tokens"]

    return budget

def get_thinking_tokens(self):
    """Get formatted thinking token budget if available

    The budget is shown in units of 1024 ("k") or 1024*1024 ("M"), as a whole
    number when exact and with one decimal place otherwise.  Returns ``None``
    when no budget is set.
    """
    budget = self.get_raw_thinking_tokens()
    if budget is None:
        return None

    mega = 1024 * 1024
    if budget >= mega:
        scaled, suffix = budget / mega, "M"
    else:
        scaled, suffix = budget / 1024, "k"

    if scaled == int(scaled):
        return f"{int(scaled)}{suffix}"
    return f"{scaled:.1f}{suffix}"

def get_reasoning_effort(self):
    """Get reasoning effort value if available

    For ``openrouter/`` models only
    ``extra_params["extra_body"]["reasoning"]["effort"]`` is consulted.
    For all other models only ``extra_params["extra_body"]["reasoning_effort"]``
    is.  Returns ``None`` when the value is not set.
    """
    if self.extra_params:
        # Check for OpenRouter reasoning format
        if self.name.startswith("openrouter/"):
            if (
                "extra_body" in self.extra_params
                and "reasoning" in self.extra_params["extra_body"]
                and "effort" in self.extra_params["extra_body"]["reasoning"]
            ):
                return self.extra_params["extra_body"]["reasoning"]["effort"]
        # Check for standard reasoning_effort format (e.g. in extra_body)
        elif (
            "extra_body" in self.extra_params
            and "reasoning_effort" in self.extra_params["extra_body"]
        ):
            return self.extra_params["extra_body"]["reasoning_effort"]
    return None

def is_deepseek_r1(self):
    """Tell whether the name looks like a DeepSeek R1 / reasoner model.

    Returns ``None`` when the lower-cased name does not contain "deepseek",
    otherwise a bool saying whether it also contains "r1" or "reasoner".
    """
    lowered = self.name.lower()
    if "deepseek" in lowered:
        return any(marker in lowered for marker in ("r1", "reasoner"))
    return None

def is_ollama(self):
    """Return True when the model name starts with "ollama/" or "ollama_chat/"."""
    return self.name.startswith(("ollama/", "ollama_chat/"))

def github_copilot_token_to_open_ai_key(self, extra_headers):
    """Exchange the GitHub Copilot token for an API key when needed.

    Does nothing when ``OPENAI_API_KEY`` is set and its ``exp`` field is not
    in the past.  Otherwise requests a fresh token from GitHub using
    ``GITHUB_COPILOT_TOKEN`` and stores it in ``OPENAI_API_KEY``.

    Args:
        extra_headers: Mapping that provides the "Editor-Version" and
            "Copilot-Integration-Id" header values.

    Raises:
        KeyError: ``GITHUB_COPILOT_TOKEN`` is missing or blank.
        GitHubCopilotTokenError: GitHub answered with a non-200 status or a
            body without a ``token`` field (the class is local to this call).
    """
    # check to see if there's an openai api key
    # If so, check to see if it's expired
    openai_api_key = "OPENAI_API_KEY"

    # The stored key is a ";"-separated list of name=value pairs.  Split on the
    # first "=" only, so a value that itself contains "=" does not break parsing.
    if openai_api_key not in os.environ or (
        int(dict(x.split("=", 1) for x in os.environ[openai_api_key].split(";"))["exp"])
        < int(datetime.now().timestamp())
    ):
        import requests

        class GitHubCopilotTokenError(Exception):
            """Custom exception for GitHub Copilot token-related errors."""

            pass

        # Validate GitHub Copilot token exists
        if "GITHUB_COPILOT_TOKEN" not in os.environ:
            raise KeyError("GITHUB_COPILOT_TOKEN environment variable not found")

        github_token = os.environ["GITHUB_COPILOT_TOKEN"]
        if not github_token.strip():
            raise KeyError("GITHUB_COPILOT_TOKEN environment variable is empty")

        headers = {
            "Authorization": f"Bearer {github_token}",
            "Editor-Version": extra_headers["Editor-Version"],
            "Copilot-Integration-Id": extra_headers["Copilot-Integration-Id"],
            "Content-Type": "application/json",
        }

        url = "https://api.github.com/copilot_internal/v2/token"
        # Bound the wait: without a timeout an unresponsive server would hang
        # this call forever.
        res = requests.get(url, headers=headers, timeout=30)
        if res.status_code != 200:
            # Never put the full token into the error message.
            safe_headers = {k: v for k, v in headers.items() if k != "Authorization"}
            token_preview = github_token[:5] + "..." if len(github_token) >= 5 else github_token
            safe_headers["Authorization"] = f"Bearer {token_preview}"
            raise GitHubCopilotTokenError(
                f"GitHub Copilot API request failed (Status: {res.status_code})\n"
                f"URL: {url}\n"
                f"Headers: {json.dumps(safe_headers, indent=2)}\n"
                f"JSON: {res.text}"
            )

        response_data = res.json()
        token = response_data.get("token")
        if not token:
            raise GitHubCopilotTokenError("Response missing 'token' field")

        os.environ[openai_api_key] = token

def send_completion(self, messages, functions, stream, temperature=None):

if os.environ.get("AIDER_SANITY_CHECK_TURNS"):

sanity_check_messages(messages)

if self.is_deepseek_r1():

messages = ensure_alternating_roles(messages)

kwargs = dict(

model=self.name,

stream=stream,

)

if self.use_temperature is not False:

if temperature is None:

if isinstance(self.use_temperature, bool):

temperature = 0

else:

temperature = float(self.use_temperature)

kwargs["temperature"] = temperature

if functions is not None:

function = functions[0]

View remainder of file in raw view

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

FilesExpand file tree

models.py

Latest commit

History

models.py

File metadata and controls