Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
41 changes: 41 additions & 0 deletions models/z-ai/glm-4.5-air-subscription.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,41 @@
# yaml-language-server: $schema=https://modelparams.dev/api/v1/schema.json
# Tunable request parameters for z-ai's glm-4.5-air when used with
# subscription auth. This variant declares no do_sample or
# response_format.type entries, so the sampling parameters below carry no
# applicability rule.
provider: z-ai
authType: subscription
model: glm-4.5-air
params:
  # Only a lower bound is declared; no maximum or default is set here.
  - path: max_tokens
    type: integer
    label: Max tokens
    description: Maximum number of tokens to generate in the response.
    range:
      min: 1
    group: generation_length
  - path: temperature
    type: number
    label: Temperature
    description: Controls randomness. Lower values make outputs more focused; higher values make them more varied.
    default: 0.6
    range:
      min: 0
      max: 1
      step: 0.1
    group: sampling
  # Lower bound is 0.01 rather than 0.
  - path: top_p
    type: number
    label: Top P
    description: Controls nucleus sampling by limiting generation to tokens within the selected cumulative probability.
    default: 0.95
    range:
      min: 0.01
      max: 1
      step: 0.01
    group: sampling
  # NOTE(review): the dotted path presumably addresses the `type` field of
  # a nested `thinking` object in the request body - confirm against the
  # schema.
  - path: thinking.type
    type: enum
    label: Thinking mode
    description: Toggles the model's extended reasoning before it produces the final answer.
    default: enabled
    values:
      - enabled
      - disabled
    group: reasoning
62 changes: 62 additions & 0 deletions models/z-ai/glm-4.5-air.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,62 @@
# yaml-language-server: $schema=https://modelparams.dev/api/v1/schema.json
# Tunable request parameters for z-ai's glm-4.5-air when used with
# api_key auth.
provider: z-ai
authType: api_key
model: glm-4.5-air
params:
  # Only a lower bound is declared; no maximum or default is set here.
  - path: max_tokens
    type: integer
    label: Max tokens
    description: Maximum number of tokens to generate in the response.
    range:
      min: 1
    group: generation_length
  - path: temperature
    type: number
    label: Temperature
    description: Controls randomness. Lower values make outputs more focused; higher values make them more varied.
    default: 0.6
    range:
      min: 0
      max: 1
      step: 0.1
    group: sampling
    # Excluded when do_sample is false; per the do_sample description,
    # greedy decoding ignores temperature.
    # NOTE(review): exact `applicability.except` semantics come from the
    # schema - confirm.
    applicability:
      except:
        do_sample: false
  # Lower bound is 0.01 rather than 0.
  - path: top_p
    type: number
    label: Top P
    description: Controls nucleus sampling by limiting generation to tokens within the selected cumulative probability.
    default: 0.95
    range:
      min: 0.01
      max: 1
      step: 0.01
    group: sampling
    # Excluded when do_sample is false; per the do_sample description,
    # greedy decoding ignores top_p.
    applicability:
      except:
        do_sample: false
  # Referenced by the applicability rules on temperature and top_p above.
  - path: do_sample
    type: boolean
    label: Do sample
    description: When false, the model uses greedy decoding and ignores temperature and top_p.
    default: true
    group: sampling
  # NOTE(review): the dotted path presumably addresses the `type` field of
  # a nested `thinking` object in the request body - confirm against the
  # schema.
  - path: thinking.type
    type: enum
    label: Thinking mode
    description: Toggles the model's extended reasoning before it produces the final answer.
    default: enabled
    values:
      - enabled
      - disabled
    group: reasoning
  - path: response_format.type
    type: enum
    label: Response format
    description: Forces the response into plain text or a JSON object.
    default: text
    values:
      - text
      - json_object
    group: output_format
62 changes: 62 additions & 0 deletions models/z-ai/glm-4.5-airx.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,62 @@
# yaml-language-server: $schema=https://modelparams.dev/api/v1/schema.json
# Tunable request parameters for z-ai's glm-4.5-airx when used with
# api_key auth.
provider: z-ai
authType: api_key
model: glm-4.5-airx
params:
  # Only a lower bound is declared; no maximum or default is set here.
  - path: max_tokens
    type: integer
    label: Max tokens
    description: Maximum number of tokens to generate in the response.
    range:
      min: 1
    group: generation_length
  - path: temperature
    type: number
    label: Temperature
    description: Controls randomness. Lower values make outputs more focused; higher values make them more varied.
    default: 0.6
    range:
      min: 0
      max: 1
      step: 0.1
    group: sampling
    # Excluded when do_sample is false; per the do_sample description,
    # greedy decoding ignores temperature.
    # NOTE(review): exact `applicability.except` semantics come from the
    # schema - confirm.
    applicability:
      except:
        do_sample: false
  # Lower bound is 0.01 rather than 0.
  - path: top_p
    type: number
    label: Top P
    description: Controls nucleus sampling by limiting generation to tokens within the selected cumulative probability.
    default: 0.95
    range:
      min: 0.01
      max: 1
      step: 0.01
    group: sampling
    # Excluded when do_sample is false; per the do_sample description,
    # greedy decoding ignores top_p.
    applicability:
      except:
        do_sample: false
  # Referenced by the applicability rules on temperature and top_p above.
  - path: do_sample
    type: boolean
    label: Do sample
    description: When false, the model uses greedy decoding and ignores temperature and top_p.
    default: true
    group: sampling
  # NOTE(review): the dotted path presumably addresses the `type` field of
  # a nested `thinking` object in the request body - confirm against the
  # schema.
  - path: thinking.type
    type: enum
    label: Thinking mode
    description: Toggles the model's extended reasoning before it produces the final answer.
    default: enabled
    values:
      - enabled
      - disabled
    group: reasoning
  - path: response_format.type
    type: enum
    label: Response format
    description: Forces the response into plain text or a JSON object.
    default: text
    values:
      - text
      - json_object
    group: output_format
62 changes: 62 additions & 0 deletions models/z-ai/glm-4.5-flash.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,62 @@
# yaml-language-server: $schema=https://modelparams.dev/api/v1/schema.json
# Tunable request parameters for z-ai's glm-4.5-flash when used with
# api_key auth.
provider: z-ai
authType: api_key
model: glm-4.5-flash
params:
  # Only a lower bound is declared; no maximum or default is set here.
  - path: max_tokens
    type: integer
    label: Max tokens
    description: Maximum number of tokens to generate in the response.
    range:
      min: 1
    group: generation_length
  - path: temperature
    type: number
    label: Temperature
    description: Controls randomness. Lower values make outputs more focused; higher values make them more varied.
    default: 0.6
    range:
      min: 0
      max: 1
      step: 0.1
    group: sampling
    # Excluded when do_sample is false; per the do_sample description,
    # greedy decoding ignores temperature.
    # NOTE(review): exact `applicability.except` semantics come from the
    # schema - confirm.
    applicability:
      except:
        do_sample: false
  # Lower bound is 0.01 rather than 0.
  - path: top_p
    type: number
    label: Top P
    description: Controls nucleus sampling by limiting generation to tokens within the selected cumulative probability.
    default: 0.95
    range:
      min: 0.01
      max: 1
      step: 0.01
    group: sampling
    # Excluded when do_sample is false; per the do_sample description,
    # greedy decoding ignores top_p.
    applicability:
      except:
        do_sample: false
  # Referenced by the applicability rules on temperature and top_p above.
  - path: do_sample
    type: boolean
    label: Do sample
    description: When false, the model uses greedy decoding and ignores temperature and top_p.
    default: true
    group: sampling
  # NOTE(review): the dotted path presumably addresses the `type` field of
  # a nested `thinking` object in the request body - confirm against the
  # schema.
  - path: thinking.type
    type: enum
    label: Thinking mode
    description: Toggles the model's extended reasoning before it produces the final answer.
    default: enabled
    values:
      - enabled
      - disabled
    group: reasoning
  - path: response_format.type
    type: enum
    label: Response format
    description: Forces the response into plain text or a JSON object.
    default: text
    values:
      - text
      - json_object
    group: output_format
62 changes: 62 additions & 0 deletions models/z-ai/glm-4.5-x.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,62 @@
# yaml-language-server: $schema=https://modelparams.dev/api/v1/schema.json
# Tunable request parameters for z-ai's glm-4.5-x when used with
# api_key auth.
provider: z-ai
authType: api_key
model: glm-4.5-x
params:
  # Only a lower bound is declared; no maximum or default is set here.
  - path: max_tokens
    type: integer
    label: Max tokens
    description: Maximum number of tokens to generate in the response.
    range:
      min: 1
    group: generation_length
  - path: temperature
    type: number
    label: Temperature
    description: Controls randomness. Lower values make outputs more focused; higher values make them more varied.
    default: 0.6
    range:
      min: 0
      max: 1
      step: 0.1
    group: sampling
    # Excluded when do_sample is false; per the do_sample description,
    # greedy decoding ignores temperature.
    # NOTE(review): exact `applicability.except` semantics come from the
    # schema - confirm.
    applicability:
      except:
        do_sample: false
  # Lower bound is 0.01 rather than 0.
  - path: top_p
    type: number
    label: Top P
    description: Controls nucleus sampling by limiting generation to tokens within the selected cumulative probability.
    default: 0.95
    range:
      min: 0.01
      max: 1
      step: 0.01
    group: sampling
    # Excluded when do_sample is false; per the do_sample description,
    # greedy decoding ignores top_p.
    applicability:
      except:
        do_sample: false
  # Referenced by the applicability rules on temperature and top_p above.
  - path: do_sample
    type: boolean
    label: Do sample
    description: When false, the model uses greedy decoding and ignores temperature and top_p.
    default: true
    group: sampling
  # NOTE(review): the dotted path presumably addresses the `type` field of
  # a nested `thinking` object in the request body - confirm against the
  # schema.
  - path: thinking.type
    type: enum
    label: Thinking mode
    description: Toggles the model's extended reasoning before it produces the final answer.
    default: enabled
    values:
      - enabled
      - disabled
    group: reasoning
  - path: response_format.type
    type: enum
    label: Response format
    description: Forces the response into plain text or a JSON object.
    default: text
    values:
      - text
      - json_object
    group: output_format
62 changes: 62 additions & 0 deletions models/z-ai/glm-4.5.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,62 @@
# yaml-language-server: $schema=https://modelparams.dev/api/v1/schema.json
# Tunable request parameters for z-ai's glm-4.5 when used with
# api_key auth.
provider: z-ai
authType: api_key
model: glm-4.5
params:
  # Only a lower bound is declared; no maximum or default is set here.
  - path: max_tokens
    type: integer
    label: Max tokens
    description: Maximum number of tokens to generate in the response.
    range:
      min: 1
    group: generation_length
  - path: temperature
    type: number
    label: Temperature
    description: Controls randomness. Lower values make outputs more focused; higher values make them more varied.
    default: 0.6
    range:
      min: 0
      max: 1
      step: 0.1
    group: sampling
    # Excluded when do_sample is false; per the do_sample description,
    # greedy decoding ignores temperature.
    # NOTE(review): exact `applicability.except` semantics come from the
    # schema - confirm.
    applicability:
      except:
        do_sample: false
  # Lower bound is 0.01 rather than 0.
  - path: top_p
    type: number
    label: Top P
    description: Controls nucleus sampling by limiting generation to tokens within the selected cumulative probability.
    default: 0.95
    range:
      min: 0.01
      max: 1
      step: 0.01
    group: sampling
    # Excluded when do_sample is false; per the do_sample description,
    # greedy decoding ignores top_p.
    applicability:
      except:
        do_sample: false
  # Referenced by the applicability rules on temperature and top_p above.
  - path: do_sample
    type: boolean
    label: Do sample
    description: When false, the model uses greedy decoding and ignores temperature and top_p.
    default: true
    group: sampling
  # NOTE(review): the dotted path presumably addresses the `type` field of
  # a nested `thinking` object in the request body - confirm against the
  # schema.
  - path: thinking.type
    type: enum
    label: Thinking mode
    description: Toggles the model's extended reasoning before it produces the final answer.
    default: enabled
    values:
      - enabled
      - disabled
    group: reasoning
  - path: response_format.type
    type: enum
    label: Response format
    description: Forces the response into plain text or a JSON object.
    default: text
    values:
      - text
      - json_object
    group: output_format
Loading
Loading