-
Notifications
You must be signed in to change notification settings - Fork 391
/
Copy pathjson_schema.py
34 lines (32 loc) · 1.04 KB
/
json_schema.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
from mistralrs import Runner, Which, ChatCompletionRequest, Architecture
from json import dumps
runner = Runner(
which=Which.Plain(
model_id="microsoft/Phi-3.5-mini-instruct",
),
num_device_layers=["500"],
)
res = runner.send_chat_completion_request(
ChatCompletionRequest(
model="phi",
messages=[{"role": "user", "content": "Give me a sample address."}],
max_tokens=256,
temperature=0.1,
grammar_type="json_schema",
grammar=dumps(
{
"type": "object",
"properties": {
"street": {"type": "string"},
"city": {"type": "string"},
"state": {"type": "string", "pattern": "^[A-Z]{2}$"},
"zip": {"type": "integer", "minimum": 10000, "maximum": 99999},
},
"required": ["street", "city", "state", "zip"],
"additionalProperties": False,
}
),
)
)
print(res.choices[0].message.content)
print(res.usage)