Skip to content

Commit b9012fb

Browse files
Merge pull request #1 from winglian/longchat-args
Add RoPE scaling as a CLI argument so the OpenAI-compatible server can load RoPE-scaled models
2 parents 58e7121 + bb8e153 commit b9012fb

File tree

1 file changed

+5
-0
lines changed

1 file changed

+5
-0
lines changed

vllm/engine/arg_utils.py

Lines changed: 5 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1,5 +1,6 @@
11
import argparse
22
import dataclasses
3+
import json
34
from dataclasses import dataclass
45
from typing import Optional, Tuple
56

@@ -131,6 +132,10 @@ def add_cli_args(
131132
parser.add_argument('--disable-log-stats',
132133
action='store_true',
133134
help='disable logging statistics')
135+
parser.add_argument('--rope-scaling',
136+
default=None,
137+
type=json.loads,
138+
help='RoPE scaling configuration')
134139
return parser
135140

136141
@classmethod

0 commit comments

Comments
 (0)