Configuration Description

ms_coordinator.json Startup Configuration File

The following is an example of the ms_coordinator.json startup configuration file. For details about the parameters, see Parameters in the ms_coordinator.json Startup Configuration File.
{
    "http_config": {
        "allow_all_zero_ip_listening": false,        
        "predict_ip": "127.0.0.1",
        "predict_port": "1025",
        "manage_ip": "127.0.0.1",
        "manage_port": "1026",
        "alarm_port": "1027",
        "external_port": "1028",
        "status_port": "1029",
        "server_thread_num": 10,
        "client_thread_num": 10,
        "http_timeout_seconds": 600,
        "keep_alive_seconds": 180,
        "server_name": "MindIE-MS",
        "user_agent": "Coordinator/1.0"
    },
    "request_limit": {
        "single_node_max_requests": 1000,
        "max_requests": 10000,
        "body_limit": 1
    },
    "metrics_config": {
        "enable": false,
        "trigger_size": 100
    },
    "prometheus_metrics_config": {
        "reuse_time": 3
    },
    "exception_config": {
        "max_retry": 5,
        "schedule_timeout": 600,
        "first_token_timeout": 600,
        "infer_timeout": 600,
        "tokenizer_timeout": 300
    },
    "log_info": {
        "log_level": "INFO",
        "to_file": true,
        "to_stdout": true,
        "run_log_path": "./logs/ms_coordinator_run_log.txt",
        "operation_log_path": "./logs/ms_coordinator_operation_log.txt",
        "max_log_str_size": 4096,
        "max_log_file_size": 20,
        "max_log_file_num": 10
    },
    "digs_scheduler_config": {
        "deploy_mode": "pd_separate",
        "scheduler_type": "digs_scheduler",
        "algorithm_type": "load_balance",
        "cache_size": "100",
        "slots_thresh": "0.05",
        "block_thresh": "0.05",
        "max_schedule_count": "10000",
        "reordering_type": "1",
        "max_res_num": "5000",
        "res_limit_rate": "1.1",
        "select_type": "2",
        "load_cost_values": "1, 0",
        "load_cost_coefficient": "0, 0.22, 1024, 24, 6, 0, 1, 0, 1"
    },
    "string_token_rate": 4.02,
    "tls_config": {
        "controller_server_tls_enable": true,
        "controller_server_tls_items": {
            "ca_cert" : "./security/controller/security/certs/ca.pem",
            "tls_cert": "./security/controller/security/certs/cert.pem",
            "tls_key": "./security/controller/security/keys/cert.key.pem",
            "tls_passwd": "./security/controller/security/pass/key_pwd.txt",
            "kmcKsfMaster": "./security/controller/tools/pmt/master/ksfa",
            "kmcKsfStandby": "./security/controller/tools/pmt/standby/ksfb",
            "tls_crl": ""
        },
        "request_server_tls_enable": true,
        "request_server_tls_items": {
            "ca_cert" : "./security/request/security/certs/ca.pem",
            "tls_cert": "./security/request/security/certs/cert.pem",
            "tls_key": "./security/request/security/keys/cert.key.pem",
            "tls_passwd": "./security/request/security/pass/key_pwd.txt",
            "kmcKsfMaster": "./security/request/tools/pmt/master/ksfa",
            "kmcKsfStandby": "./security/request/tools/pmt/standby/ksfb",
            "tls_crl": ""
        },
        "mindie_client_tls_enable": true,
        "mindie_client_tls_items": {
            "ca_cert" : "./security/mindie/security/certs/ca.pem",
            "tls_cert": "./security/mindie/security/certs/cert.pem",
            "tls_key": "./security/mindie/security/keys/cert.key.pem",
            "tls_passwd": "./security/mindie/security/pass/key_pwd.txt",
            "kmcKsfMaster": "./security/mindie/tools/pmt/master/ksfa",
            "kmcKsfStandby": "./security/mindie/tools/pmt/standby/ksfb",
            "tls_crl": ""
        },
        "mindie_mangment_tls_enable": true,
        "mindie_mangment_tls_items": {
            "ca_cert" : "./security/mindie_mgmt/security/certs/ca.pem",
            "tls_cert": "./security/mindie_mgmt/security/certs/cert.pem",
            "tls_key": "./security/mindie_mgmt/security/keys/cert.key.pem",
            "tls_passwd": "./security/mindie_mgmt/security/pass/key_pwd.txt",
            "kmcKsfMaster": "./security/mindie_mgmt/tools/pmt/master/ksfa",
            "kmcKsfStandby": "./security/mindie_mgmt/tools/pmt/standby/ksfb",
            "tls_crl": ""
        },
        "external_tls_enable": true,
        "external_tls_items": {
            "ca_cert" : "./security/external/security/certs/ca.pem",
            "tls_cert": "./security/external/security/certs/cert.pem",
            "tls_key": "./security/external/security/keys/cert.key.pem",
            "tls_passwd": "./security/external/security/pass/key_pwd.txt",
            "kmcKsfMaster": "./security/external/tools/pmt/master/ksfa",
            "kmcKsfStandby": "./security/external/tools/pmt/standby/ksfb",
            "tls_crl": ""
        },
        "status_tls_enable": true,
        "status_tls_items": {
            "ca_cert" : "./security/status/security/certs/ca.pem",
            "tls_cert": "./security/status/security/certs/cert.pem",
            "tls_key": "./security/status/security/keys/cert.key.pem",
            "tls_passwd": "./security/status/security/pass/key_pwd.txt",
            "kmcKsfMaster": "./security/status/tools/pmt/master/ksfa",
            "kmcKsfStandby": "./security/status/tools/pmt/standby/ksfb",
            "tls_crl": ""
        },
        "etcd_server_tls_enable": true,
        "etcd_server_tls_items": {
            "ca_cert" : "./security/etcd_server/security/certs/ca.pem",
            "tls_cert": "./security/etcd_server/security/certs/cert.pem",
            "tls_key": "./security/etcd_server/security/keys/cert.key.pem",
            "tls_passwd": "./security/etcd_server/security/pass/key_pwd.txt",
            "kmcKsfMaster": "./security/etcd_server/tools/pmt/master/ksfa",
            "kmcKsfStandby": "./security/etcd_server/tools/pmt/standby/ksfb",
            "tls_crl": ""
        },
        "alarm_client_tls_enable": true,
        "alarm_client_tls_items": {
            "ca_cert" : "./security/alarm/security/certs/ca.pem",
            "tls_cert": "./security/alarm/security/certs/cert.pem",
            "tls_key": "./security/alarm/security/keys/cert.key.pem",
            "tls_passwd": "./security/alarm/security/pass/key_pwd.txt",
            "kmcKsfMaster": "./security/alarm/tools/pmt/master/ksfa",
            "kmcKsfStandby": "./security/alarm/tools/pmt/standby/ksfb",
            "tls_crl": ""
        }
    },
    "backup_config":{
        "database_server_dns":"etcd.default.svc.cluster.local",
        "database_server_port":2379,
        "function_enable": false
    }
}

Parameters in the ms_coordinator.json Startup Configuration File

The fields in the ms_coordinator.json configuration file are described in Table 1. You can configure the fields as needed.

Table 1 Parameters in the ms_coordinator.json startup configuration file

Parameter Name

Supported Features

Value Range

Configuration Description

http_config: communication configuration

allow_all_zero_ip_listening

Prefill-decode disaggregation

Prefix Cache (single-node system)

  • true: Listening on the all-zero IP address (0.0.0.0) is allowed.
  • false: Listening on the all-zero IP address (0.0.0.0) is not allowed.

Mandatory. The default value is false.

Whether to allow listening on the all-zero IP address (0.0.0.0). If the value is false and a listening IP address is set to 0.0.0.0, the program fails to run and an error is reported.

NOTE:

If listening on the all-zero IP address is enabled, triple-plane isolation becomes ineffective, which does not meet security configuration requirements. Therefore, the IP address cannot be set to 0.0.0.0 by default. If the IP address must be set to 0.0.0.0, set this parameter to true only after confirming that the environment is secure.

predict_ip

Prefill-decode disaggregation

Prefix Cache (single-node system)

IPv4 or IPv6

Mandatory. The default value is "127.0.0.1".

Listening IP address of the user API.

predict_port

Prefill-decode disaggregation

Prefix Cache (single-node system)

[1024, 65535]

Mandatory. The default value is "1025".

Listening port of the user API.

manage_ip

Prefill-decode disaggregation

Prefix Cache (single-node system)

IPv4 or IPv6

Mandatory. The default value is "127.0.0.1".

Listening IP address of the communication API in the cluster.

manage_port

Prefill-decode disaggregation

Prefix Cache (single-node system)

[1024, 65535]

Mandatory. The default value is "1026".

Listening port of the communication API in the cluster.

alarm_port

Prefill-decode disaggregation

[1024, 65535]

Mandatory. The default value is "1027".

Port used by the Coordinator to report alarms to the Controller.

external_port

Prefill-decode disaggregation

Prefix Cache (single-node system)

[1024, 65535]

Mandatory. The default value is "1028".

External port of the Coordinator.

status_port

Prefill-decode disaggregation

Prefix Cache (single-node system)

[1024, 65535]

Mandatory. The default value is "1029".

Port for querying the Coordinator status.

server_thread_num

Prefill-decode disaggregation

Prefix Cache (single-node system)

[1, 10000]

Mandatory. The default value is 10.

Number of threads in the HTTP Server thread pool. It is recommended that the value be less than or equal to 1/4 of the maximum number of threads in the system.

client_thread_num

Prefill-decode disaggregation

Prefix Cache (single-node system)

[1, 10000]

Mandatory. The default value is 10.

Number of threads in the HTTP Client thread pool. It is recommended that the value be less than or equal to 1/4 of the maximum number of threads in the system.

http_timeout_seconds

Prefill-decode disaggregation

Prefix Cache (single-node system)

[0, 3600], in seconds.

Mandatory. The default value is 600. The value 0 indicates that timeout is triggered immediately.

HTTP communication timeout interval.

keep_alive_seconds

Prefill-decode disaggregation

[0, 3600], in seconds.

Mandatory. The default value is 180. 0 disables the keepalive check for persistent connections.

Keepalive check period of a persistent connection. If no message is detected within the keepalive check period, the persistent connection is closed.

NOTE:

You are advised to set this parameter to a value greater than 0 to protect the Coordinator against DoS attacks.

server_name

Prefill-decode disaggregation

Prefix Cache (single-node system)

-

Mandatory. The default value is MindIE-MS.

Server name.

user_agent

Prefill-decode disaggregation

Prefix Cache (single-node system)

-

Mandatory. The default value is Coordinator/1.0.

Software version number.

request_limit: request limit

single_node_max_requests

Prefill-decode disaggregation

Prefix Cache (single-node system)

[1, 2000]

Mandatory. The default value is 1000.

Maximum number of requests that can be processed by a single Server node. The value of this parameter cannot exceed the maximum number of requests supported by the Server.

If the environment variable MINDIE_MS_COORDINATOR_CONFIG_SINGLE_NODE_MAX_REQ is set, the value of the environment variable is read first.

max_requests

Prefill-decode disaggregation

Prefix Cache (single-node system)

[1, 90000]

Mandatory. The default value is 10000.

Maximum number of requests that can be processed.

  • Prefill-decode disaggregation: (recommended) single_node_max_requests × Prefill node count + Margin of about 1000
  • Prefill-decode hybrid deployment: (recommended) single_node_max_requests × Node count + Margin of about 1000

If the environment variable MINDIE_MS_COORDINATOR_CONFIG_MAX_REQ is set, the value of the environment variable is read first.

NOTE:
  • Any requests exceeding the specified value will be rejected.
  • The maximum number of external connections allowed by the Coordinator is 3 × max_requests. After the number of connections exceeds this upper limit, the Coordinator rejects new external connections to prevent DoS attacks.

body_limit

Prefill-decode disaggregation

Prefix Cache (single-node system)

[1, 20], in MB.

Mandatory. The default value is 1.

Maximum size of a request body. If the size of a request body exceeds the value, the request fails to be sent.

metrics_config: performance statistics

enable

Prefill-decode disaggregation

Prefix Cache (single-node system)

  • true: enabled
  • false: disabled

Mandatory. The default value is false.

Whether to enable performance statistics.

This parameter is used to assist fault locating. Enabling this function may affect service performance. You are advised to disable this function in normal service scenarios.

trigger_size

Prefill-decode disaggregation

Prefix Cache (single-node system)

[1, 10000]

Mandatory. This parameter takes effect when enable is set to true. The default value is 100.

Number of requests for triggering performance statistics.

prometheus_metrics_config: serving management and control metrics

reuse_time

Prefill-decode disaggregation

Prefix Cache (single-node system)

[1, 100], in seconds.

Mandatory. The default value is 3.

Used by the API for querying management and control metrics. If the interval between the current time and the previous query time is less than the value of reuse_time, the previously obtained management and control metrics are reused. When a reused result is returned, the previous query time is not updated.

exception_config: exception configuration

max_retry

Prefill-decode disaggregation

Prefix Cache (single-node system)

[0, 10]

Mandatory. The default value is 5.

Maximum number of retries upon a communication exception.

schedule_timeout

Prefill-decode disaggregation

Prefix Cache (single-node system)

[0, 3600], in seconds.

Mandatory. The default value is 600. The value 0 indicates that the scheduling timeout check is disabled.

Scheduling timeout interval. If a request is not scheduled within the timeout interval, an error is returned to the user.

first_token_timeout

Prefill-decode disaggregation

Prefix Cache (single-node system)

[0, 3600], in seconds.

Mandatory. The default value is 600. The value 0 indicates that the timeout check for the first token is disabled.

Timeout interval of the first token. If the first token inference is not complete within the timeout interval, an error is returned to the user.

infer_timeout

Prefill-decode disaggregation

Prefix Cache (single-node system)

[0, 65535], in seconds.

Mandatory. The default value is 600. The value 0 indicates that the inference timeout check is disabled.

Timeout interval for requesting inference. If the inference is not complete within the timeout interval, an error is returned to the user.

tokenizer_timeout

Prefill-decode disaggregation

[0, 3600], in seconds.

Mandatory. The default value is 300. The value 0 indicates that the timeout check for token calculation is disabled.

Timeout interval for token calculation. If the tokenizer job is not completed within the timeout interval, an error is returned to the user.

log_info: log configuration (You are advised to use environment variables to configure logs. For details, see Log Configuration.)

log_level

Prefill-decode disaggregation

Prefix Cache (single-node system)

  • CRITICAL
  • ERROR
  • WARN
  • INFO
  • DEBUG

Optional. The default value is INFO.

Sets the log level.

If the environment variable MINDIE_LOG_LEVEL or MINDIEMS_LOG_LEVEL is set, the value of the environment variable is read first.

NOTE:

This parameter has a significant impact on service performance. Performance is best when the parameter is set to ERROR and worst when it is set to DEBUG. The performance difference between the two settings is about tenfold.

to_file

Prefill-decode disaggregation

Prefix Cache (single-node system)

  • true: Output logs to a file.
  • false: Do not output logs to a file.

Optional. The default value is true.

Whether to output logs to a file.

If the environment variable MINDIE_LOG_TO_FILE is set, the value of the environment variable is read first.

to_stdout

Prefill-decode disaggregation

Prefix Cache (single-node system)

  • true: Output logs to the standard output stream.
  • false: Do not output logs to the standard output stream.

Optional. The default value is false.

Whether to output logs to the standard output stream.

If the MINDIE_LOG_TO_STDOUT environment variable is set, the value of the environment variable is read first.

run_log_path

Prefill-decode disaggregation

Prefix Cache (single-node system)

-

Optional. The default path is the same as that of the MINDIE_LOG_PATH environment variable. For details, see Log Configuration. If the MINDIE_LOG_PATH environment variable is set, the value of the environment variable is read first. This parameter takes effect when to_file is set to true.

Run log path. The path must exist and be readable. The file is automatically created during running.

operation_log_path

Prefill-decode disaggregation

Prefix Cache (single-node system)

-

Optional. The default path is the same as that of the MINDIE_LOG_PATH environment variable. For details, see Log Configuration. If the MINDIE_LOG_PATH environment variable is set, the value of the environment variable is read first. This parameter takes effect when to_file is set to true.

Audit log path. The path must exist and be readable. The file is automatically created during running.

max_log_str_size

Prefill-decode disaggregation

Prefix Cache (single-node system)

[128, 65535]

Optional. The default value is 4096.

Maximum length of a log.

max_log_file_size

Prefill-decode disaggregation

Prefix Cache (single-node system)

[1, 500], in MB.

Optional. The default value is 20.

Maximum size of a log file. If the MINDIE_LOG_ROTATE environment variable is set, the value of the environment variable is read first.

max_log_file_num

Prefill-decode disaggregation

Prefix Cache (single-node system)

[1, 64]

Optional. The default value is 10.

Maximum number of log files that can be stored. If the MINDIE_LOG_ROTATE environment variable is set, the value of the environment variable is read first.

digs_scheduler_config: scheduler configuration

deploy_mode

Prefill-decode disaggregation

Prefix Cache (single-node system)

  • Prefill-decode disaggregation

    pd_separate or pd_disaggregation: multi-node prefill-decode disaggregation deployment

    pd_disaggregation_single_container: single-node prefill-decode disaggregation deployment

  • Prefix Cache (single-node system)

    single_node: single-node deployment

Mandatory. The default value is "pd_separate".

Deployment mode.

scheduler_type

Prefill-decode disaggregation

Prefix Cache (single-node system)

  • Prefill-decode disaggregation

    digs_scheduler: digs scheduler

  • Prefix Cache (single-node system)

    default_scheduler: default scheduler

Mandatory. The default value is "digs_scheduler".

Scheduler type.

  • If deploy_mode is set to "pd_separate", this parameter must be set to "digs_scheduler".
  • If deploy_mode is set to "single_node", this parameter must be set to "default_scheduler".

algorithm_type

Prefill-decode disaggregation

Prefix Cache (single-node system)

  • Prefill-decode disaggregation

    load_balance: load balancing. Inference requests are scheduled to instances with more resources.

  • Prefix Cache (single-node system)

    cache_affinity: cache affinity algorithm. In the OpenAI multi-round session scenario, inference requests are scheduled to instances that have processed historical rounds of sessions.

Mandatory. The default value is "load_balance".

Scheduling algorithm.

  • If scheduler_type is set to "digs_scheduler", this parameter must be set to "load_balance".
  • If scheduler_type is set to "default_scheduler", this parameter must be set to "cache_affinity".

cache_size

Prefix Cache (single-node system)

["1", "10000"]

This parameter is mandatory when algorithm_type is set to "cache_affinity". The default value is "100".

Upper limit of the cache. (Only the Prefix Cache algorithm is supported.)

slots_thresh

Prefix Cache (single-node system)

["0.0", "1.0"]

This parameter is mandatory when algorithm_type is set to "cache_affinity". The default value is "0.05".

Slot resource warning threshold, expressed as the ratio of available slots to total slots. (Only the Prefix Cache algorithm is supported.)

block_thresh

Prefix Cache (single-node system)

["0.0", "1.0"]

This parameter is mandatory when algorithm_type is set to "cache_affinity". The default value is "0.05".

Block resource warning threshold, expressed as the ratio of available blocks to total blocks. (Only the Prefix Cache algorithm is supported.)

max_schedule_count

Prefill-decode disaggregation

["1", "90000"]

This parameter is mandatory when scheduler_type is set to "digs_scheduler". The default value is "10000".

Maximum number of requests that can be scheduled at the same time. It is recommended that the value be the same as that of max_requests. (Only the prefill-decode disaggregation load balancing algorithm is supported.)

reordering_type

Prefill-decode disaggregation

  • "1": FCFS, first-come, first-served.
  • "2": SJF, shortest job first.
  • "3": LJF, longest job first.

This parameter is mandatory when scheduler_type is set to "digs_scheduler". The default value is "1".

max_res_num

Prefill-decode disaggregation

["1", "10000"]

This parameter is mandatory when scheduler_type is set to "digs_scheduler". The default value is "5000".

Maximum number of nodes that can be registered with the Coordinator.

res_limit_rate

Prefill-decode disaggregation

[0.0, 2000.0]

This parameter takes effect only when "select_type" is set to "2". It indicates the upper limit of the ratio of the total number of resources occupied by requests to the actual total number of resources.

select_type

Prefill-decode disaggregation

  • "1": simple load balancing, without upper limit control.
  • "2": load balancing with resource upper limit control.

This parameter specifies the resource scheduling policy. The default value is "2".

load_cost_values

Prefill-decode disaggregation

  • "1, 0": indicates that the number of slots required by each request is 1, and the number of blocks required by each request is determined based on the actual situation.
  • "1, 1": indicates that the number of blocks required by each request is fixed to 1.

Optional. The default value is "1, 0".

Resources required by each request, expressed in the slots and blocks dimensions.

  • If this parameter is set to "1, 0", the normal load balancing scheduling policy is configured.
  • If this parameter is set to "1, 1", the resource difference of requests in the blocks dimension is ignored, and the scheduling policy is degraded to round-robin.

load_cost_coefficient

Prefill-decode disaggregation

The meanings and value ranges of the values from left to right are as follows (the upper limits of the value ranges can be adjusted based on the site requirements):

  • Coefficient of the sequence length sensed by the AI Core: [0, 1000]
  • Coefficient of the request input length: [0, 1000]
  • Fixed output length of the request: [0, 100 MB]
  • Number of AI Cores: [1, 1000]
  • Number of cores in each AI Core group: [1, 1000]
  • Coefficient of maxBatchSize: [0, 1000]
  • Coefficient of the actually reported sequence length: [0, 1000]
  • Coefficient of slots: [0, 1000]
  • Coefficient of blocks: [0, 1000]

Optional. The default value is "0, 0.22, 1024, 24, 6, 0, 1, 0, 1".

Customized configuration of each parameter or coefficient in the load balancing scheduling policy formula.

string_token_rate

Prefill-decode disaggregation

[1.0, 100.0]

Conversion ratio between the length of the input character string and the number of tokens it is converted into.

tls_config: certificate configuration

Certificate configuration for communication with the Coordinator management port

controller_server_tls_enable

Prefill-decode disaggregation

Prefix Cache (single-node system)

Whether to enable TLS verification for the communication with the Coordinator management port.

You are advised to enable this function to ensure communication security between the Controller or user and the management port. If this function is disabled, high network security risks exist.

Mandatory. The default value is true.

ca_cert

Prefill-decode disaggregation

Prefix Cache (single-node system)

Path of the CA root certificate.

Mandatory when TLS verification is enabled.

tls_cert

Prefill-decode disaggregation

Prefix Cache (single-node system)

TLS certificate path.

Mandatory when TLS verification is enabled.

tls_key

Prefill-decode disaggregation

Prefix Cache (single-node system)

Path of the TLS private key certificate encrypted using a password.

Mandatory when TLS verification is enabled.

tls_passwd

Prefill-decode disaggregation

Prefix Cache (single-node system)

Encrypted password of the TLS private key certificate. The password is encrypted by KMC and written into the ciphertext path.

Mandatory when TLS verification is enabled.

kmcKsfMaster

Prefill-decode disaggregation

Prefix Cache (single-node system)

Path of the root key for KMC encryption.

Mandatory when TLS verification is enabled.

kmcKsfStandby

Prefill-decode disaggregation

Prefix Cache (single-node system)

Working key path for KMC encryption.

Mandatory when TLS verification is enabled.

tls_crl

Prefill-decode disaggregation

Prefix Cache (single-node system)

CRL path.

Mandatory when TLS verification is enabled.

Path of the CRL file. The file must exist and be readable. If the value is empty, revocation verification is not performed.

Certificate configuration for communication between the Coordinator data port and users

request_server_tls_enable

Prefill-decode disaggregation

Prefix Cache (single-node system)

Whether to enable TLS verification for the input of the inference request.

You are advised to enable this function to ensure communication security with inference users. If this function is disabled, high network security risks exist.

Mandatory. The default value is true.

ca_cert

Prefill-decode disaggregation

Prefix Cache (single-node system)

Path of the CA root certificate.

Mandatory when TLS verification is enabled.

tls_cert

Prefill-decode disaggregation

Prefix Cache (single-node system)

TLS certificate path.

Mandatory when TLS verification is enabled.

tls_key

Prefill-decode disaggregation

Prefix Cache (single-node system)

Path of the TLS private key certificate encrypted using a password.

Mandatory when TLS verification is enabled.

tls_passwd

Prefill-decode disaggregation

Prefix Cache (single-node system)

Encrypted password of the TLS private key certificate. The password is encrypted by KMC and written into the ciphertext path.

Mandatory when TLS verification is enabled.

kmcKsfMaster

Prefill-decode disaggregation

Prefix Cache (single-node system)

Path of the root key for KMC encryption.

Mandatory when TLS verification is enabled.

kmcKsfStandby

Prefill-decode disaggregation

Prefix Cache (single-node system)

Working key path for KMC encryption.

Mandatory when TLS verification is enabled.

tls_crl

Prefill-decode disaggregation

Prefix Cache (single-node system)

CRL path.

Mandatory when TLS verification is enabled.

Path of the CRL file. The file must exist and be readable. If the value is empty, revocation verification is not performed.

Certificate configuration for communication between the Coordinator and Server data ports

mindie_client_tls_enable

Prefill-decode disaggregation

Prefix Cache (single-node system)

Whether to enable TLS verification for communication with the Server.

You are advised to enable this function to ensure secure communication with the Server. If this function is disabled, high network security risks exist.

Mandatory. The default value is true.

ca_cert

Prefill-decode disaggregation

Prefix Cache (single-node system)

Path of the CA root certificate.

Mandatory when TLS verification is enabled.

tls_cert

Prefill-decode disaggregation

Prefix Cache (single-node system)

TLS certificate path.

Mandatory when TLS verification is enabled.

tls_key

Prefill-decode disaggregation

Prefix Cache (single-node system)

Path of the TLS private key certificate encrypted using a password.

Mandatory when TLS verification is enabled.

tls_passwd

Prefill-decode disaggregation

Prefix Cache (single-node system)

Encrypted password of the TLS private key certificate. The password is encrypted by KMC and written into the ciphertext path.

Mandatory when TLS verification is enabled.

kmcKsfMaster

Prefill-decode disaggregation

Prefix Cache (single-node system)

Path of the root key for KMC encryption.

Mandatory when TLS verification is enabled.

kmcKsfStandby

Prefill-decode disaggregation

Prefix Cache (single-node system)

Working key path for KMC encryption.

Mandatory when TLS verification is enabled.

tls_crl

Prefill-decode disaggregation

Prefix Cache (single-node system)

CRL path.

Mandatory when TLS verification is enabled.

Path of the CRL file. The file must exist and be readable. If the value is empty, revocation verification is not performed.

Certificate configuration for communication between the Coordinator and Server management ports

mindie_mangment_tls_enable

Prefill-decode disaggregation

Prefix Cache (single-node system)

Whether to enable TLS verification for communication that allows users to query serving management and control metrics.

You are advised to enable this function to ensure communication security with management and control metric users. If this function is disabled, high network security risks exist.

Mandatory. The default value is true.

ca_cert

Prefill-decode disaggregation

Prefix Cache (single-node system)

Path of the CA root certificate.

Mandatory when TLS verification is enabled.

tls_cert

Prefill-decode disaggregation

Prefix Cache (single-node system)

TLS certificate path.

Mandatory when TLS verification is enabled.

tls_key

Prefill-decode disaggregation

Prefix Cache (single-node system)

Path of the TLS private key certificate encrypted using a password.

Mandatory when TLS verification is enabled.

tls_passwd

Prefill-decode disaggregation

Prefix Cache (single-node system)

Encrypted password of the TLS private key certificate. The password is encrypted by KMC and written into the ciphertext path.

Mandatory when TLS verification is enabled.

kmcKsfMaster

Prefill-decode disaggregation

Prefix Cache (single-node system)

Path of the root key for KMC encryption.

Mandatory when TLS verification is enabled.

kmcKsfStandby

Prefill-decode disaggregation

Prefix Cache (single-node system)

Working key path for KMC encryption.

Mandatory when TLS verification is enabled.

tls_crl

Prefill-decode disaggregation

Prefix Cache (single-node system)

CRL path.

Mandatory when TLS verification is enabled.

Path of the CRL file. The file must exist and be readable. If the value is empty, revocation verification is not performed.

Communication certificate configuration for users to query the Coordinator information

external_tls_enable

Prefill-decode disaggregation

Prefix Cache (single-node system)

Whether to enable TLS verification for the communication through which users query the Coordinator information.

You are advised to enable this function to ensure secure communication with the Coordinator. If this function is disabled, high network security risks exist.

Mandatory. The default value is true.

ca_cert

Prefill-decode disaggregation

Prefix Cache (single-node system)

Path of the CA root certificate.

Mandatory when TLS verification is enabled.

tls_cert

Prefill-decode disaggregation

Prefix Cache (single-node system)

TLS certificate path.

Mandatory when TLS verification is enabled.

tls_key

Prefill-decode disaggregation

Prefix Cache (single-node system)

Path of the TLS private key certificate encrypted using a password.

Mandatory when TLS verification is enabled.

tls_passwd

Prefill-decode disaggregation

Prefix Cache (single-node system)

Encrypted password of the TLS private key certificate. The password is encrypted by KMC and written into the ciphertext path.

Mandatory when TLS verification is enabled.

kmcKsfMaster

Prefill-decode disaggregation

Prefix Cache (single-node system)

Path of the root key for KMC encryption.

Mandatory when TLS verification is enabled.

kmcKsfStandby

Prefill-decode disaggregation

Prefix Cache (single-node system)

Working key path for KMC encryption.

Mandatory when TLS verification is enabled.

tls_crl

Prefill-decode disaggregation

Prefix Cache (single-node system)

CRL path.

Mandatory when TLS verification is enabled.

Path of the CRL file. If a path is specified, the file must exist and be readable. If the value is empty, revocation verification is not performed.

Communication certificate configuration for querying the Coordinator status information

status_tls_enable

Prefill-decode disaggregation

Prefix Cache (single-node system)

Whether to enable TLS verification for querying the Coordinator status.

You are advised to enable this function to ensure secure communication with the Coordinator. If this function is disabled, high network security risks exist.

Mandatory. The default value is true.

ca_cert

Prefill-decode disaggregation

Prefix Cache (single-node system)

Path of the CA root certificate.

Mandatory when TLS verification is enabled.

tls_cert

Prefill-decode disaggregation

Prefix Cache (single-node system)

TLS certificate path.

Mandatory when TLS verification is enabled.

tls_key

Prefill-decode disaggregation

Prefix Cache (single-node system)

Path of the TLS private key certificate encrypted using a password.

Mandatory when TLS verification is enabled.

tls_passwd

Prefill-decode disaggregation

Prefix Cache (single-node system)

Encrypted password of the TLS private key certificate. The password is encrypted by KMC and written into the ciphertext path.

Mandatory when TLS verification is enabled.

kmcKsfMaster

Prefill-decode disaggregation

Prefix Cache (single-node system)

Path of the root key for KMC encryption.

Mandatory when TLS verification is enabled.

kmcKsfStandby

Prefill-decode disaggregation

Prefix Cache (single-node system)

Working key path for KMC encryption.

Mandatory when TLS verification is enabled.

tls_crl

Prefill-decode disaggregation

Prefix Cache (single-node system)

CRL path.

Mandatory when TLS verification is enabled.

Path of the CRL file. If a path is specified, the file must exist and be readable. If the value is empty, revocation verification is not performed.

Communication certificate configuration for querying the etcd status information

etcd_server_tls_enable

Prefill-decode disaggregation

Whether to enable TLS verification for querying the etcd status.

You are advised to enable this function to ensure secure communication with etcd. If this function is disabled, high network security risks exist.

Mandatory. The default value is true.

ca_cert

Prefill-decode disaggregation

Path of the CA root certificate.

Mandatory when TLS verification is enabled.

tls_cert

Prefill-decode disaggregation

TLS certificate path.

Mandatory when TLS verification is enabled.

tls_key

Prefill-decode disaggregation

Path of the TLS private key certificate encrypted using a password.

Mandatory when TLS verification is enabled.

tls_passwd

Prefill-decode disaggregation

Encrypted password of the TLS private key certificate. The password is encrypted by KMC and written into the ciphertext path.

Mandatory when TLS verification is enabled.

kmcKsfMaster

Prefill-decode disaggregation

Path of the root key for KMC encryption.

Mandatory when TLS verification is enabled.

kmcKsfStandby

Prefill-decode disaggregation

Working key path for KMC encryption.

Mandatory when TLS verification is enabled.

tls_crl

Prefill-decode disaggregation

CRL path.

Mandatory when TLS verification is enabled.

Path of the CRL file. If a path is specified, the file must exist and be readable. If the value is empty, revocation verification is not performed.

Communication certificate configuration for the Coordinator to report alarms to the Controller port

alarm_client_tls_enable

Prefill-decode disaggregation

Whether to enable TLS verification for communication used by the Coordinator to report alarms to the Controller.

You are advised to enable this function to ensure secure communication with the Controller. If this function is disabled, high network security risks exist.

Mandatory. The default value is true.

ca_cert

Prefill-decode disaggregation

Path of the CA root certificate.

Mandatory when TLS verification is enabled.

tls_cert

Prefill-decode disaggregation

TLS certificate path.

Mandatory when TLS verification is enabled.

tls_key

Prefill-decode disaggregation

Path of the TLS private key certificate encrypted using a password.

Mandatory when TLS verification is enabled.

tls_passwd

Prefill-decode disaggregation

Encrypted password of the TLS private key certificate. The password is encrypted by KMC and written into the ciphertext path.

Mandatory when TLS verification is enabled.

kmcKsfMaster

Prefill-decode disaggregation

Path of the root key for KMC encryption.

Mandatory when TLS verification is enabled.

kmcKsfStandby

Prefill-decode disaggregation

Working key path for KMC encryption.

Mandatory when TLS verification is enabled.

tls_crl

Prefill-decode disaggregation

CRL path.

Mandatory when TLS verification is enabled.

Path of the CRL file. If a path is specified, the file must exist and be readable. If the value is empty, revocation verification is not performed.

backup_config: controlling whether to enable master/slave switchover of the Coordinator

database_server_dns

Prefill-decode disaggregation

Domain name of the etcd service.

This parameter is mandatory when master/slave switchover is enabled. The default value is etcd.default.svc.cluster.local, indicating the etcd service deployed in the default namespace.

database_server_port

Prefill-decode disaggregation

Port number of the etcd service.

Mandatory when master/slave switchover is enabled. The default value is 2379.

function_enable

Prefill-decode disaggregation

  • true: master/slave switchover of the Coordinator is enabled.
  • false: master/slave switchover of the Coordinator is disabled.

Optional. The default value is false.

Whether to enable master/slave switchover of the Coordinator.

EnableDynamicAdjustTimeoutConfig: configuration for dynamically adjusting timeouts

By default, the ms_coordinator.json configuration file does not contain this parameter. If you need to enable this parameter, add it as required. The following is an example:

"EnableDynamicAdjustTimeoutConfig" : true,

If the compute node where the inference service runs is connected to both a WAN and a LAN, binding the IP address to 0.0.0.0 could compromise network isolation and introduce significant security vulnerabilities. Therefore, by default, the EndPoint IP address cannot be bound to 0.0.0.0 in this scenario. If you still need to use 0.0.0.0, ensure that the environment is protected against the risks of all-zero IP listening, and set allow_all_zero_ip_listening to true to explicitly allow it. You bear the security risks of enabling all-zero IP listening.

Environment Variable

The following table lists the environment variables supported by the Coordinator.

Table 2 Environment variables supported by the Coordinator

Environment Variable

Description

MINDIE_MS_COORDINATOR_CONFIG_FILE_PATH

Path for reading the ms_coordinator configuration file.

MINDIE_MS_COORDINATOR_CONFIG_SINGLE_NODE_MAX_REQ

Maximum number of requests that can be processed by a single node.

MINDIE_MS_COORDINATOR_CONFIG_MAX_REQ

Maximum number of requests that can be processed.

MINDIE_CHECK_INPUTFILES_PERMISSION

Specifies whether to check the permissions of externally mounted files, including ms_coordinator.json and certificate-related files. The default value is empty, indicating that permission verification is performed.

  • 0: Permission verification is not performed on externally mounted files.
  • Other values: Permission verification is performed on externally mounted files.
NOTE:

When you use MINDIE_MS_COORDINATOR_CONFIG_FILE_PATH to set the configuration file path, ms_coordinator.json is treated as an externally mounted file.

HSECEASY_PATH

Path of the dependency library for the KMC decryption tool. By default, this environment variable is empty. It is mandatory when TLS verification is enabled.

Note: For details about log-related environment variables, see Log Configuration.