o
    `۷iV                  
   @   s  U d dl Z d dlmZ d dlmZmZmZmZmZm	Z	m
Z
mZmZmZ dZdZdZdZdZd	Zd
ZdZdZedZeddZdZeddZg dZeededdeZeededdeZg dZeeddeZ eZ!eZ"g dZ#eedde#Z$g dZ%eedde%Z&dZ'd Z(e
d!d"Z)e
d#d$Z*d%Z+d&Z,d'Z-d(Z.d)Z/d&Z0e/Z1d%Z2ed*d+Z3ed,d+Z4ed-d.Z5dZ6ed/d0Z7d)Z8dZ9d1Z:dZ;ed2dZ<d3Z=d+Z>dZ?d4Z@d5ZAed6d7ZBd8ZCd9ZDd:ZEd;ZFd<ZGd=ZHd>ZId?ZJd@ZKdAZLeCdBeEdCeJdDeKdEeLdFiZMh dGZNe	dHd ZOdIZPdJZQdKZRdLZSedMd7ZTedNd7ZUedOdZVedPdZWedQd+ZXedRdSZYedTd+ZZedUdSZ[edVd+Z\edWd1Z]edXdYZ^d"Z_dZZ`ed[dYZaed\dZbed]d1Zced^d+Zded_dZeed`daZfedbd&ZgedcdSZhddZieded7Zjedfd+ZkedgdhZledidjZmdkelfdlelfgZnd'ZoedmdYZpedndYZqedoe jrsdndYZteedpdZueev ewdp< edqdYZxedrdYZydsZzedtd7Z{edudvZ|edwd"Z}dxZ~d'Zd(ZdyZedzd7Zed{d7Ze jrsd|dYd7kZe jrsd}d7kpe jrsd}dYk oeZed~dZeddYZdZe jrsddYd7kZee jrsddZee jrsddZee jrsddZee jrsddZee jrsddZee jrsddZdZdZeddYZerbedzdYZed~dZed{dYZed6dYZBdZeddYZdZedd.Zg dZdS )    N)List)
get_env_boolget_env_floatget_env_float_non_negativeget_env_float_positiveget_env_intget_env_int_non_negativeget_env_int_positiveget_env_strparse_latency_bucketsstr_to_listz	ray.serveSERVE_CONTROLLER_ACTORSERVE_PROXY_ACTORservez	127.0.0.1i@  Z   i(#  defaultg    .A!RAY_SERVE_CONTROL_LOOP_INTERVAL_Sg?<   %RAY_SERVE_MAX_PER_REPLICA_RETRY_COUNT   )         
      2   d      i,  i          '  `   i i'	 $RAY_SERVE_REQUEST_LATENCY_BUCKETS_MSREQUEST_LATENCY_BUCKETS_MS 'RAY_SERVE_MODEL_LOAD_LATENCY_BUCKETS_MSMODEL_LOAD_LATENCY_BUCKETS_MS)r   r   r   r      r   r   r    r!   r"   i N  i0u  r#   r$   i 5RAY_SERVE_REPLICA_STARTUP_SHUTDOWN_LATENCY_BUCKETS_MS)r   r   r      (   r   r   F   P   r   _   c   r   +RAY_SERVE_BATCH_UTILIZATION_BUCKETS_PERCENT)r   r                @         i   i   RAY_SERVE_BATCH_SIZE_BUCKETScheck_healthreconfigureRAY_SERVE_MAX_CACHED_HANDLESr   $RAY_SERVE_CONTROLLER_MAX_CONCURRENCYi:  r   r   r   r,   r   &RAY_SERVE_PROXY_HEALTH_CHECK_TIMEOUT_Sg      $@%RAY_SERVE_PROXY_HEALTH_CHECK_PERIOD_S%RAY_SERVE_PROXY_READY_CHECK_TIMEOUT_Sg      @%RAY_SERVE_PROXY_MIN_DRAINING_PERIOD_Sg      >@g      ?RAY_SERVE_KV_TIMEOUT_Sg      @zHSee https://docs.ray.io/en/latest/serve/index.html for more information.TEXTRAY_SERVE_LOG_TO_STDERR1
request_idrouteapplication
deploymentreplicacomponent_namecomponent_idmessage	levelnameasctimez%(request_id)sz%(application)sz-- %(message)sz%(levelname)sz%(asctime)s>   job_idtask_idserve_access_logskip_context_filter#RAY_SERVE_HTTP_KEEP_ALIVE_TIMEOUT_Sg        ray_serve_extra_fieldsserve_multiplexed_model_idzx-request-id)RAY_SERVE_PROXY_PREFER_LOCAL_NODE_ROUTING'RAY_SERVE_PROXY_PREFER_LOCAL_AZ_ROUTING)RAY_SERVE_HTTP_PROXY_CALLBACK_IMPORT_PATH)RAY_SERVE_CONTROLLER_CALLBACK_IMPORT_PATH,RAY_SERVE_RECORD_AUTOSCALING_STATS_TIMEOUT_S6RAY_SERVE_REPLICA_AUTOSCALING_METRIC_RECORD_INTERVAL_Sg      ?4RAY_SERVE_REPLICA_AUTOSCALING_METRIC_PUSH_INTERVAL_S5RAY_SERVE_HANDLE_AUTOSCALING_METRIC_RECORD_INTERVAL_S3RAY_SERVE_HANDLE_AUTOSCALING_METRIC_PUSH_INTERVAL_S1RAY_SERVE_MULTIPLEXED_MODEL_ID_MATCHING_TIMEOUT_S!RAY_SERVE_ENABLE_MEMORY_PROFILING0grpc_context'RAY_SERVE_FORCE_STOP_UNHEALTHY_REPLICAS*RAY_SERVE_QUEUE_LENGTH_RESPONSE_DEADLINE_S.RAY_SERVE_MAX_QUEUE_LENGTH_RESPONSE_DEADLINE_S&RAY_SERVE_QUEUE_LENGTH_CACHE_TIMEOUT_S+RAY_SERVE_ROUTER_QUEUE_LEN_GAUGE_THROTTLE_S(RAY_SERVE_ROUTER_RETRY_INITIAL_BACKOFF_Sg?)RAY_SERVE_ROUTER_RETRY_BACKOFF_MULTIPLIER$RAY_SERVE_ROUTER_RETRY_MAX_BACKOFF_Sz7ray.serve.autoscaling_policy:default_autoscaling_policy/RAY_SERVE_COLLECT_AUTOSCALING_METRICS_ON_HANDLE&RAY_SERVE_MIN_HANDLE_METRICS_TIMEOUT_SRAY_SERVE_GRPC_MAX_MESSAGE_SIZEi)RAY_SERVE_REPLICA_GRPC_MAX_MESSAGE_LENGTHi  @ zgrpc.max_send_message_lengthzgrpc.max_receive_message_lengthRAY_SERVE_ENABLE_TASK_EVENTS)RAY_SERVE_USE_COMPACT_SCHEDULING_STRATEGY&RAY_SERVE_USE_PACK_SCHEDULING_STRATEGY(RAY_SERVE_HIGH_PRIORITY_CUSTOM_RESOURCES"RAY_SERVE_FORCE_LOCAL_TESTING_MODE RAY_SERVE_RUN_SYNC_IN_THREADPOOLa7  Calling sync method '{method_name}' directly on the asyncio loop. In a future version, sync methods will be run in a threadpool by default. Ensure your sync methods are thread safe or keep the existing behavior by making them `async def`. Opt into the new behavior by setting RAY_SERVE_RUN_SYNC_IN_THREADPOOL=1.'RAY_SERVE_ENABLE_PROXY_GC_OPTIMIZATIONSRAY_SERVE_PROXY_GC_THRESHOLDi  $RAY_SERVE_METRICS_EXPORT_INTERVAL_MSz@ray.serve._private.request_router:PowerOfTwoChoicesRequestRouterrecord_routing_stats*RAY_SERVE_RUN_USER_CODE_IN_SEPARATE_THREAD%RAY_SERVE_RUN_ROUTER_IN_SEPARATE_LOOPRAY_SERVE_USE_GRPC_BY_DEFAULTRAY_SERVE_PROXY_USE_GRPC&RAY_SERVE_REQUEST_PATH_LOG_BUFFER_SIZEr   RAY_SERVE_FAIL_ON_RANK_ERRORsuccessRAY_SERVE_ENABLE_DIRECT_INGRESS&RAY_SERVE_DIRECT_INGRESS_MIN_HTTP_PORT30000&RAY_SERVE_DIRECT_INGRESS_MIN_GRPC_PORT40000&RAY_SERVE_DIRECT_INGRESS_MAX_HTTP_PORT31000&RAY_SERVE_DIRECT_INGRESS_MAX_GRPC_PORT41000)RAY_SERVE_DIRECT_INGRESS_PORT_RETRY_COUNT100.RAY_SERVE_DIRECT_INGRESS_MIN_DRAINING_PERIOD_S30zx-request-timeout-secondszx-request-disconnect-disabledRAY_SERVE_THROUGHPUT_OPTIMIZEDr   r    )RAY_SERVE_AGGREGATE_METRICS_AT_CONTROLLER__decision_counters*RAY_SERVE_EVENT_LOOP_MONITORING_INTERVAL_S)r   r   r      r   r   r*   r   r   i	  r!   r"   )ostypingr   "ray.serve._private.constants_utilsr   r   r   r   r   r   r	   r
   r   r   SERVE_LOGGER_NAMESERVE_CONTROLLER_NAMESERVE_PROXY_NAMESERVE_NAMESPACEDEFAULT_HTTP_HOSTDEFAULT_HTTP_PORT$DEFAULT_UVICORN_KEEP_ALIVE_TIMEOUT_SDEFAULT_GRPC_PORTSERVE_DEFAULT_APP_NAMEintASYNC_CONCURRENCYCONTROL_LOOP_INTERVAL_SHTTP_PROXY_TIMEOUTMAX_PER_REPLICA_RETRY_COUNTDEFAULT_LATENCY_BUCKET_MSr&   r)   3DEFAULT_REPLICA_STARTUP_SHUTDOWN_LATENCY_BUCKETS_MS+REPLICA_STARTUP_SHUTDOWN_LATENCY_BUCKETS_MSBATCH_EXECUTION_TIME_BUCKETS_MSBATCH_WAIT_TIME_BUCKETS_MS)DEFAULT_BATCH_UTILIZATION_BUCKETS_PERCENT!BATCH_UTILIZATION_BUCKETS_PERCENTDEFAULT_BATCH_SIZE_BUCKETSBATCH_SIZE_BUCKETSHEALTH_CHECK_METHODRECONFIGURE_METHODMAX_CACHED_HANDLESCONTROLLER_MAX_CONCURRENCY#DEFAULT_GRACEFUL_SHUTDOWN_TIMEOUT_S%DEFAULT_GRACEFUL_SHUTDOWN_WAIT_LOOP_SDEFAULT_HEALTH_CHECK_PERIOD_SDEFAULT_HEALTH_CHECK_TIMEOUT_SDEFAULT_MAX_ONGOING_REQUESTSDEFAULT_TARGET_ONGOING_REQUESTSDEFAULT_CONSUMER_CONCURRENCYDEFAULT_CONSTRUCTOR_RETRY_COUNTPROXY_HEALTH_CHECK_TIMEOUT_SPROXY_HEALTH_CHECK_PERIOD_SPROXY_READY_CHECK_TIMEOUT_S&PROXY_HEALTH_CHECK_UNHEALTHY_THRESHOLDPROXY_MIN_DRAINING_PERIOD_SPROXY_DRAIN_CHECK_PERIOD_S(REPLICA_HEALTH_CHECK_UNHEALTHY_THRESHOLDCLIENT_POLLING_INTERVAL_S(CLIENT_CHECK_CREATION_POLLING_INTERVAL_SrC   RAY_GCS_RPC_TIMEOUT_S(RECOVERING_LONG_POLL_BROADCAST_TIMEOUT_S%PUSH_MULTIPLEXED_MODEL_IDS_INTERVAL_SMIGRATION_MESSAGERAY_SERVE_LOG_ENCODINGrE   SERVE_LOG_REQUEST_IDSERVE_LOG_ROUTESERVE_LOG_APPLICATIONSERVE_LOG_DEPLOYMENTSERVE_LOG_REPLICASERVE_LOG_COMPONENTSERVE_LOG_COMPONENT_IDSERVE_LOG_MESSAGESERVE_LOG_LEVEL_NAMESERVE_LOG_TIMESERVE_LOG_RECORD_FORMATSERVE_LOG_UNWANTED_ATTRSrU   &RAY_SERVE_REQUEST_PROCESSING_TIMEOUT_SSERVE_LOG_EXTRA_FIELDSSERVE_MULTIPLEXED_MODEL_IDSERVE_HTTP_REQUEST_ID_HEADERrX   rY   rZ   r[   r\   r]   r^   r_   r`   ra   rb   MAX_REPLICAS_PER_NODE_MAX_VALUEGRPC_CONTEXT_ARG_NAMEre   rf   rg   rh   ri   rj   rk   rl   DEFAULT_AUTOSCALING_POLICY_NAMErm   rn   ro   rp   DEFAULT_GRPC_SERVER_OPTIONS*METRICS_PUSHER_GRACEFUL_SHUTDOWN_TIMEOUT_Srq   rr   environgetrs   rt   str__annotations__ru   rv   (RAY_SERVE_RUN_SYNC_IN_THREADPOOL_WARNINGrw   rx   ry   DEFAULT_REQUEST_ROUTER_PATH&DEFAULT_REQUEST_ROUTING_STATS_PERIOD_S'DEFAULT_REQUEST_ROUTING_STATS_TIMEOUT_SREQUEST_ROUTING_STATS_METHODr{   r|   r}   r~   r   r   HEALTHY_MESSAGEr   r   r   r   r   r   floatr   #SERVE_HTTP_REQUEST_TIMEOUT_S_HEADER-SERVE_HTTP_REQUEST_DISCONNECT_DISABLED_HEADERr   *RAY_SERVE_RPC_LATENCY_WARNING_THRESHOLD_MSr   'SERVE_AUTOSCALING_DECISION_COUNTERS_KEYr   0SERVE_EVENT_LOOP_LATENCY_HISTOGRAM_BOUNDARIES_MS r   r   R/home/ubuntu/vllm_env/lib/python3.10/site-packages/ray/serve/_private/constants.py<module>   s>  
 0
	 
		



	


	


