{"users":[{"id":6,"username":"bill-anyscale","name":"Bill","avatar_template":"/user_avatar/discuss.ray.io/bill-anyscale/{size}/724_2.png","primary_group_name":"Ray-Team","flair_name":"Ray-Team","flair_url":"https://us1.discourse-cdn.com/flex020/uploads/ray/original/2X/7/796fedd2b646b5e9ea776cb6287afced709a5676.png","flair_bg_color":"fff","flair_group_id":41,"trust_level":1},{"id":7699,"username":"mgb","name":"Marco Giovanni Bignotti","avatar_template":"https://avatars.discourse-cdn.com/v4/letter/m/2bfe46/{size}.png","trust_level":1},{"id":7472,"username":"RunLLM","name":"RunLLM","avatar_template":"/user_avatar/discuss.ray.io/runllm/{size}/8249_2.png","primary_group_name":"Ray-Team","flair_name":"Ray-Team","flair_url":"https://us1.discourse-cdn.com/flex020/uploads/ray/original/2X/7/796fedd2b646b5e9ea776cb6287afced709a5676.png","flair_bg_color":"fff","flair_group_id":41,"trust_level":3},{"id":7646,"username":"psnilesh","name":"Nilesh PS","avatar_template":"/user_avatar/discuss.ray.io/psnilesh/{size}/8424_2.png","trust_level":1},{"id":7685,"username":"Jeffrey_Wang","name":"Jeffrey Wang","avatar_template":"/user_avatar/discuss.ray.io/jeffrey_wang/{size}/8464_2.png","primary_group_name":"Ray-Team","flair_name":"Ray-Team","flair_url":"https://us1.discourse-cdn.com/flex020/uploads/ray/original/2X/7/796fedd2b646b5e9ea776cb6287afced709a5676.png","flair_bg_color":"fff","flair_group_id":41,"trust_level":3},{"id":7668,"username":"bhartendu_kumar","name":"bhartendu kumar","avatar_template":"/user_avatar/discuss.ray.io/bhartendu_kumar/{size}/8452_2.png","trust_level":0},{"id":7583,"username":"AlaEddine","name":null,"avatar_template":"https://avatars.discourse-cdn.com/v4/letter/a/b9e5f3/{size}.png","trust_level":0},{"id":6939,"username":"Dekermanjian","name":"","avatar_template":"https://avatars.discourse-cdn.com/v4/letter/d/96bed5/{size}.png","trust_level":1},{"id":7620,"username":"glingleNxn","name":"","avatar_template":"https://avatars.discourse-cdn.com/v4/letter/g/8c91f0/{size}.png","trust_level":1},{"id":7637,"username":"ABINA_SRINIVASAN","name":"ABINA SRINIVASAN","avatar_template":"/user_avatar/discuss.ray.io/abina_srinivasan/{size}/8416_2.png","trust_level":1},{"id":7062,"username":"czjghost","name":"肇杰 陈","avatar_template":"/user_avatar/discuss.ray.io/czjghost/{size}/7800_2.png","trust_level":1},{"id":6812,"username":"christina","name":"Christina Zhu","avatar_template":"/user_avatar/discuss.ray.io/christina/{size}/7542_2.png","primary_group_name":"Ray-Team","flair_name":"staff","flair_url":"https://us1.discourse-cdn.com/flex020/uploads/ray/original/2X/7/796fedd2b646b5e9ea776cb6287afced709a5676.png","flair_bg_color":"fff","flair_group_id":3,"moderator":true,"trust_level":4},{"id":7605,"username":"manuel.ramblr","name":null,"avatar_template":"https://avatars.discourse-cdn.com/v4/letter/m/977dab/{size}.png","trust_level":0},{"id":7562,"username":"dmtryzarubin","name":"Dmitriy Zarubin","avatar_template":"/user_avatar/discuss.ray.io/dmtryzarubin/{size}/8333_2.png","trust_level":1},{"id":7560,"username":"Ishika_Sahu","name":"Ishika Sahu","avatar_template":"/user_avatar/discuss.ray.io/ishika_sahu/{size}/8332_2.png","trust_level":0},{"id":7558,"username":"wciq1208","name":"wciq1208","avatar_template":"https://avatars.discourse-cdn.com/v4/letter/w/b5a626/{size}.png","trust_level":1},{"id":2626,"username":"psydok","name":"Psydok","avatar_template":"/user_avatar/discuss.ray.io/psydok/{size}/3518_2.png","trust_level":1},{"id":4236,"username":"zhanghx0905","name":"Hexiao Zhang","avatar_template":"/user_avatar/discuss.ray.io/zhanghx0905/{size}/5565_2.png","trust_level":0},{"id":4291,"username":"Abhishek_Jaiswal","name":"Abhishek Jaiswal","avatar_template":"/user_avatar/discuss.ray.io/abhishek_jaiswal/{size}/5121_2.png","trust_level":1},{"id":4686,"username":"tej","name":"","avatar_template":"https://avatars.discourse-cdn.com/v4/letter/t/48db29/{size}.png","trust_level":0},{"id":7489,"username":"Ruckley","name":"Samuel Jones","avatar_template":"https://avatars.discourse-cdn.com/v4/letter/r/b3f665/{size}.png","trust_level":0},{"id":7512,"username":"G117","name":null,"avatar_template":"https://avatars.discourse-cdn.com/v4/letter/g/2acd7d/{size}.png","trust_level":0},{"id":1349,"username":"jjyao","name":"Jiajun Yao","avatar_template":"/user_avatar/discuss.ray.io/jjyao/{size}/1799_2.png","primary_group_name":"Ray-Team","flair_name":"Ray-Team","flair_url":"https://us1.discourse-cdn.com/flex020/uploads/ray/original/2X/7/796fedd2b646b5e9ea776cb6287afced709a5676.png","flair_bg_color":"fff","flair_group_id":41,"admin":true,"trust_level":4},{"id":1827,"username":"Abhi_Sharma","name":"Abhi Sharma","avatar_template":"/user_avatar/discuss.ray.io/abhi_sharma/{size}/2033_2.png","trust_level":1},{"id":4487,"username":"lorstrae","name":"","avatar_template":"https://avatars.discourse-cdn.com/v4/letter/l/e95f7d/{size}.png","trust_level":1},{"id":5221,"username":"dentiny","name":"Dentiny","avatar_template":"/user_avatar/discuss.ray.io/dentiny/{size}/6575_2.png","trust_level":1},{"id":7446,"username":"nimayu","name":"Nicola","avatar_template":"https://avatars.discourse-cdn.com/v4/letter/n/b9e5f3/{size}.png","trust_level":1},{"id":7190,"username":"michaelripa","name":"","avatar_template":"https://avatars.discourse-cdn.com/v4/letter/m/67e7ee/{size}.png","trust_level":1},{"id":7217,"username":"manickavela29","name":"Manickavela","avatar_template":"/user_avatar/discuss.ray.io/manickavela29/{size}/7966_2.png","trust_level":2},{"id":2809,"username":"Akshay_Malik","name":"Akshay Malik","avatar_template":"/user_avatar/discuss.ray.io/akshay_malik/{size}/3807_2.png","primary_group_name":"Ray-Team","flair_name":"Ray-Team","flair_url":"https://us1.discourse-cdn.com/flex020/uploads/ray/original/2X/7/796fedd2b646b5e9ea776cb6287afced709a5676.png","flair_bg_color":"fff","flair_group_id":41,"trust_level":4},{"id":7368,"username":"raphael","name":"","avatar_template":"https://avatars.discourse-cdn.com/v4/letter/r/edb3f5/{size}.png","trust_level":1},{"id":7399,"username":"vaporeon","name":"Sam Zhuo Li","avatar_template":"https://avatars.discourse-cdn.com/v4/letter/v/a87d85/{size}.png","trust_level":1},{"id":7416,"username":"jdwillard19","name":"Jared Willard","avatar_template":"/user_avatar/discuss.ray.io/jdwillard19/{size}/8167_2.png","trust_level":0},{"id":7136,"username":"abrarsheikh","name":"Abrar Sheikh","avatar_template":"/user_avatar/discuss.ray.io/abrarsheikh/{size}/8019_2.png","primary_group_name":"Ray-Team","flair_name":"Ray-Team","flair_url":"https://us1.discourse-cdn.com/flex020/uploads/ray/original/2X/7/796fedd2b646b5e9ea776cb6287afced709a5676.png","flair_bg_color":"fff","flair_group_id":41,"trust_level":4},{"id":7259,"username":"Dominic_Laflamme","name":"Dominic Laflamme","avatar_template":"/user_avatar/discuss.ray.io/dominic_laflamme/{size}/7394_2.png","trust_level":1},{"id":7390,"username":"LemurPwned","name":"Jakub","avatar_template":"/user_avatar/discuss.ray.io/lemurpwned/{size}/8145_2.png","trust_level":0},{"id":2001,"username":"kourosh","name":"kourosh","avatar_template":"/user_avatar/discuss.ray.io/kourosh/{size}/2130_2.png","primary_group_name":"Ray-Team","flair_name":"Ray-Team","flair_url":"https://us1.discourse-cdn.com/flex020/uploads/ray/original/2X/7/796fedd2b646b5e9ea776cb6287afced709a5676.png","flair_bg_color":"fff","flair_group_id":41,"trust_level":4},{"id":763,"username":"raywala","name":"Ashwani","avatar_template":"/user_avatar/discuss.ray.io/raywala/{size}/1035_2.png","trust_level":0},{"id":7,"username":"eoakes","name":"Edward Oakes","avatar_template":"/user_avatar/discuss.ray.io/eoakes/{size}/7825_2.png","primary_group_name":"Ray-Team","flair_name":"Ray-Team","flair_url":"https://us1.discourse-cdn.com/flex020/uploads/ray/original/2X/7/796fedd2b646b5e9ea776cb6287afced709a5676.png","flair_bg_color":"fff","flair_group_id":41,"admin":true,"trust_level":2},{"id":3638,"username":"tjedwards","name":"","avatar_template":"/user_avatar/discuss.ray.io/tjedwards/{size}/4896_2.png","trust_level":0},{"id":332,"username":"yic","name":"Yi","avatar_template":"/user_avatar/discuss.ray.io/yic/{size}/437_2.png","primary_group_name":"Ray-Team","flair_name":"Ray-Team","flair_url":"https://us1.discourse-cdn.com/flex020/uploads/ray/original/2X/7/796fedd2b646b5e9ea776cb6287afced709a5676.png","flair_bg_color":"fff","flair_group_id":41,"trust_level":2},{"id":9,"username":"sangcho","name":"sangcho","avatar_template":"/user_avatar/discuss.ray.io/sangcho/{size}/425_2.png","primary_group_name":"Ray-Team","flair_name":"Ray-Team","flair_url":"https://us1.discourse-cdn.com/flex020/uploads/ray/original/2X/7/796fedd2b646b5e9ea776cb6287afced709a5676.png","flair_bg_color":"fff","flair_group_id":41,"trust_level":4},{"id":7307,"username":"mirage","name":"Mirage","avatar_template":"https://avatars.discourse-cdn.com/v4/letter/m/eb9ed0/{size}.png","trust_level":1},{"id":7376,"username":"Best_Vincent","name":"Best Vincent","avatar_template":"/user_avatar/discuss.ray.io/best_vincent/{size}/8133_2.png","trust_level":0}],"primary_groups":[{"id":41,"name":"Ray-Team"}],"flair_groups":[{"id":41,"name":"Ray-Team","flair_url":"https://us1.discourse-cdn.com/flex020/uploads/ray/original/2X/7/796fedd2b646b5e9ea776cb6287afced709a5676.png","flair_bg_color":"fff","flair_color":""},{"id":3,"name":"staff","flair_url":"https://us1.discourse-cdn.com/flex020/uploads/ray/original/2X/7/796fedd2b646b5e9ea776cb6287afced709a5676.png","flair_bg_color":"fff","flair_color":""}],"topic_list":{"can_create_topic":false,"more_topics_url":"/c/ray-serve/6?page=1","per_page":30,"top_tags":[],"topics":[{"fancy_title":"About the Ray Serve category","id":48,"title":"About the Ray Serve category","slug":"about-the-ray-serve-category","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2020-11-17T00:02:52.418Z","last_posted_at":"2020-11-17T00:02:52.428Z","bumped":true,"bumped_at":"2025-03-05T19:51:32.897Z","archetype":"regular","unseen":false,"pinned":true,"unpinned":null,"excerpt":"Topics include model serving and inference. Use Serve to deploy and scale machine learning models with built-in support for APIs, batching, and multi-GPU inference. \nRay Serve is a scalable model serving library for buil&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":823,"like_count":0,"has_summary":false,"last_poster_username":"bill-anyscale","category_id":6,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_have_answer":true,"can_vote":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":6,"primary_group_id":41,"flair_group_id":41}]},{"fancy_title":"Load models from Docker volume without creating copies","id":23481,"title":"Load models from Docker volume without creating copies","slug":"load-models-from-docker-volume-without-creating-copies","posts_count":2,"reply_count":1,"highest_post_number":2,"image_url":null,"created_at":"2026-02-18T14:38:54.728Z","last_posted_at":"2026-02-18T14:39:17.988Z","bumped":true,"bumped_at":"2026-02-18T14:39:17.988Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":3,"like_count":0,"has_summary":false,"last_poster_username":"RunLLM","category_id":6,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_have_answer":true,"can_vote":false,"posters":[{"extras":null,"description":"Original Poster","user_id":7699,"primary_group_id":null,"flair_group_id":null},{"extras":"latest","description":"Most Recent Poster","user_id":7472,"primary_group_id":41,"flair_group_id":41}]},{"fancy_title":"Downloading models from custom sources when using LLMConfig","id":23473,"title":"Downloading models from custom sources when using LLMConfig","slug":"downloading-models-from-custom-sources-when-using-llmconfig","posts_count":6,"reply_count":4,"highest_post_number":6,"image_url":null,"created_at":"2026-02-11T18:28:46.159Z","last_posted_at":"2026-02-12T02:08:10.787Z","bumped":true,"bumped_at":"2026-02-12T02:08:10.787Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":11,"like_count":0,"has_summary":false,"last_poster_username":"psnilesh","category_id":6,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":true,"can_have_answer":true,"can_vote":false,"posters":[{"extras":"latest","description":"Original Poster, Most Recent Poster","user_id":7646,"primary_group_id":null,"flair_group_id":null},{"extras":null,"description":"Frequent Poster, Accepted Answer","user_id":7685,"primary_group_id":41,"flair_group_id":41},{"extras":null,"description":"Frequent Poster","user_id":7472,"primary_group_id":41,"flair_group_id":41}]},{"fancy_title":"Optimal redis cache size for ray gcs backup","id":23457,"title":"Optimal redis cache size for ray gcs backup","slug":"optimal-redis-cache-size-for-ray-gcs-backup","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2026-01-20T15:24:57.233Z","last_posted_at":"2026-01-20T15:24:57.287Z","bumped":true,"bumped_at":"2026-01-20T15:24:57.287Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":5,"like_count":0,"has_summary":false,"last_poster_username":"bhartendu_kumar","category_id":6,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_have_answer":true,"can_vote":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":7668,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"Setup api key to call LLM via rayserve","id":23319,"title":"Setup api key to call LLM via rayserve","slug":"setup-api-key-to-call-llm-via-rayserve","posts_count":15,"reply_count":12,"highest_post_number":15,"image_url":null,"created_at":"2025-11-12T11:25:22.349Z","last_posted_at":"2026-01-14T01:17:22.561Z","bumped":true,"bumped_at":"2026-01-14T01:17:22.561Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":56,"like_count":0,"has_summary":false,"last_poster_username":"RunLLM","category_id":29,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_have_answer":true,"can_vote":false,"posters":[{"extras":null,"description":"Original Poster","user_id":7583,"primary_group_id":null,"flair_group_id":null},{"extras":null,"description":"Frequent Poster","user_id":6939,"primary_group_id":null,"flair_group_id":null},{"extras":"latest","description":"Most Recent Poster","user_id":7472,"primary_group_id":41,"flair_group_id":41}]},{"fancy_title":"Example docker compose to run RayServe app","id":23409,"title":"Example docker compose to run RayServe app","slug":"example-docker-compose-to-run-rayserve-app","posts_count":2,"reply_count":1,"highest_post_number":2,"image_url":null,"created_at":"2025-12-23T20:23:25.517Z","last_posted_at":"2025-12-23T20:23:50.566Z","bumped":true,"bumped_at":"2025-12-23T20:23:50.566Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":66,"like_count":0,"has_summary":false,"last_poster_username":"RunLLM","category_id":6,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":true,"can_have_answer":true,"can_vote":false,"posters":[{"extras":null,"description":"Original Poster","user_id":7620,"primary_group_id":null,"flair_group_id":null},{"extras":"latest","description":"Most Recent Poster, Accepted Answer","user_id":7472,"primary_group_id":41,"flair_group_id":41}]},{"fancy_title":"Deploying Multiple Ray Serve Microservices on a Single Cluster with Separate Ports","id":23403,"title":"Deploying Multiple Ray Serve Microservices on a Single Cluster with Separate Ports","slug":"deploying-multiple-ray-serve-microservices-on-a-single-cluster-with-separate-ports","posts_count":2,"reply_count":1,"highest_post_number":2,"image_url":null,"created_at":"2025-12-22T07:04:19.101Z","last_posted_at":"2025-12-22T07:04:56.524Z","bumped":true,"bumped_at":"2025-12-22T07:04:56.524Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":19,"like_count":0,"has_summary":false,"last_poster_username":"RunLLM","category_id":6,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_have_answer":true,"can_vote":false,"posters":[{"extras":null,"description":"Original Poster","user_id":7637,"primary_group_id":null,"flair_group_id":null},{"extras":"latest","description":"Most Recent Poster","user_id":7472,"primary_group_id":41,"flair_group_id":41}]},{"fancy_title":"Programmatic lightweight update from rest call","id":23395,"title":"Programmatic lightweight update from rest call","slug":"programmatic-lightweight-update-from-rest-call","posts_count":2,"reply_count":1,"highest_post_number":2,"image_url":null,"created_at":"2025-12-20T05:01:52.944Z","last_posted_at":"2025-12-20T05:02:14.854Z","bumped":true,"bumped_at":"2025-12-20T05:02:14.854Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":15,"like_count":0,"has_summary":false,"last_poster_username":"RunLLM","category_id":6,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":true,"can_have_answer":true,"can_vote":false,"posters":[{"extras":null,"description":"Original Poster","user_id":7620,"primary_group_id":null,"flair_group_id":null},{"extras":"latest","description":"Most Recent Poster, Accepted Answer","user_id":7472,"primary_group_id":41,"flair_group_id":41}]},{"fancy_title":"About Ray DAG API for serve.deployment at Ray 2.44.1","id":23366,"title":"About Ray DAG API for serve.deployment at Ray 2.44.1","slug":"about-ray-dag-api-for-serve-deployment-at-ray-2-44-1","posts_count":5,"reply_count":4,"highest_post_number":7,"image_url":null,"created_at":"2025-12-08T09:22:34.798Z","last_posted_at":"2025-12-09T01:55:10.296Z","bumped":true,"bumped_at":"2025-12-09T01:55:10.296Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":41,"like_count":0,"has_summary":false,"last_poster_username":"czjghost","category_id":6,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_have_answer":true,"can_vote":false,"posters":[{"extras":"latest","description":"Original Poster, Most Recent Poster","user_id":7062,"primary_group_id":null,"flair_group_id":null},{"extras":null,"description":"Frequent Poster","user_id":7472,"primary_group_id":41,"flair_group_id":41},{"extras":null,"description":"Frequent Poster","user_id":6812,"primary_group_id":41,"flair_group_id":3}]},{"fancy_title":"Preprocessing in ray serve LLM","id":23346,"title":"Preprocessing in ray serve LLM","slug":"preprocessing-in-ray-serve-llm","posts_count":4,"reply_count":2,"highest_post_number":4,"image_url":"https://us1.discourse-cdn.com/flex020/uploads/ray/optimized/2X/2/26bce9c63b8ac9a93f2c0a535f7ddeef4ebbc4f7_2_1024x552.jpeg","created_at":"2025-12-01T13:26:14.414Z","last_posted_at":"2025-12-01T23:50:06.875Z","bumped":true,"bumped_at":"2025-12-01T23:50:06.875Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":56,"like_count":0,"has_summary":false,"last_poster_username":"christina","category_id":29,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":true,"can_have_answer":true,"can_vote":false,"posters":[{"extras":null,"description":"Original Poster","user_id":7605,"primary_group_id":null,"flair_group_id":null},{"extras":null,"description":"Frequent Poster, Accepted Answer","user_id":7472,"primary_group_id":41,"flair_group_id":41},{"extras":"latest","description":"Most Recent Poster","user_id":6812,"primary_group_id":41,"flair_group_id":3}]},{"fancy_title":"Memory not released to default levels: `ray::IDLE` Processes Not Released**","id":23295,"title":"Memory not released to default levels: `ray::IDLE` Processes Not Released**","slug":"memory-not-released-to-default-levels-ray-idle-processes-not-released","posts_count":47,"reply_count":28,"highest_post_number":47,"image_url":"https://us1.discourse-cdn.com/flex020/uploads/ray/optimized/2X/b/b35c0dbbcea2f4258bfca87085358e3c63d61c9b_2_1024x443.png","created_at":"2025-11-01T10:22:46.669Z","last_posted_at":"2025-11-14T12:21:19.496Z","bumped":true,"bumped_at":"2025-11-14T12:21:19.496Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":329,"like_count":1,"has_summary":false,"last_poster_username":"RunLLM","category_id":6,"op_like_count":1,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_have_answer":true,"can_vote":false,"posters":[{"extras":null,"description":"Original Poster","user_id":7562,"primary_group_id":null,"flair_group_id":null},{"extras":"latest","description":"Most Recent Poster","user_id":7472,"primary_group_id":41,"flair_group_id":41}]},{"fancy_title":"TypeError: Failed to serialize the ASGI app.:","id":23285,"title":"TypeError: Failed to serialize the ASGI app.:","slug":"typeerror-failed-to-serialize-the-asgi-app","posts_count":3,"reply_count":1,"highest_post_number":3,"image_url":null,"created_at":"2025-10-30T08:20:55.735Z","last_posted_at":"2025-10-30T09:27:28.118Z","bumped":true,"bumped_at":"2025-10-30T09:27:28.118Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":32,"like_count":0,"has_summary":false,"last_poster_username":"Ishika_Sahu","category_id":6,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":true,"can_have_answer":true,"can_vote":false,"posters":[{"extras":"latest","description":"Original Poster, Most Recent Poster, Accepted Answer","user_id":7560,"primary_group_id":null,"flair_group_id":null},{"extras":null,"description":"Frequent Poster","user_id":7472,"primary_group_id":41,"flair_group_id":41}]},{"fancy_title":"Serve deploy app support custom router with runtime_env","id":23284,"title":"Serve deploy app support custom router with runtime_env","slug":"serve-deploy-app-support-custom-router-with-runtime-env","posts_count":2,"reply_count":1,"highest_post_number":2,"image_url":null,"created_at":"2025-10-30T02:29:44.029Z","last_posted_at":"2025-10-30T02:30:49.185Z","bumped":true,"bumped_at":"2025-10-30T02:30:49.185Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":30,"like_count":0,"has_summary":false,"last_poster_username":"RunLLM","category_id":6,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_have_answer":true,"can_vote":false,"posters":[{"extras":null,"description":"Original Poster","user_id":7558,"primary_group_id":null,"flair_group_id":null},{"extras":"latest","description":"Most Recent Poster","user_id":7472,"primary_group_id":41,"flair_group_id":41}]},{"fancy_title":"[Serve] The `ray start &ndash;head &ndash;node-ip-address ip` is not working correctly in Docker. And it&rsquo;s not clear which ports to open","id":13214,"title":"[Serve] The `ray start --head --node-ip-address ip` is not working correctly in Docker. And it's not clear which ports to open","slug":"serve-the-ray-start-head-node-ip-address-ip-is-not-working-correctly-in-docker-and-its-not-clear-which-ports-to-open","posts_count":9,"reply_count":5,"highest_post_number":9,"image_url":null,"created_at":"2023-12-20T14:08:01.446Z","last_posted_at":"2025-10-25T11:41:22.000Z","bumped":true,"bumped_at":"2025-10-25T11:41:22.000Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":950,"like_count":1,"has_summary":false,"last_poster_username":"RunLLM","category_id":6,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_have_answer":true,"can_vote":false,"posters":[{"extras":null,"description":"Original Poster","user_id":2626,"primary_group_id":null,"flair_group_id":null},{"extras":null,"description":"Frequent Poster","user_id":4236,"primary_group_id":null,"flair_group_id":null},{"extras":null,"description":"Frequent Poster","user_id":4291,"primary_group_id":null,"flair_group_id":null},{"extras":null,"description":"Frequent Poster","user_id":4686,"primary_group_id":null,"flair_group_id":null},{"extras":"latest","description":"Most Recent Poster","user_id":7472,"primary_group_id":41,"flair_group_id":41}]},{"fancy_title":"Nvidea-smi errors when deploying ray serve head on cpu only node","id":23138,"title":"Nvidea-smi errors when deploying ray serve head on cpu only node","slug":"nvidea-smi-errors-when-deploying-ray-serve-head-on-cpu-only-node","posts_count":3,"reply_count":1,"highest_post_number":4,"image_url":null,"created_at":"2025-09-23T22:01:06.510Z","last_posted_at":"2025-10-24T17:51:48.016Z","bumped":true,"bumped_at":"2025-10-24T17:51:48.016Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":73,"like_count":1,"has_summary":false,"last_poster_username":"jjyao","category_id":6,"op_like_count":1,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_have_answer":true,"can_vote":false,"posters":[{"extras":null,"description":"Original Poster","user_id":7489,"primary_group_id":null,"flair_group_id":null},{"extras":null,"description":"Frequent Poster","user_id":7512,"primary_group_id":null,"flair_group_id":null},{"extras":"latest","description":"Most Recent Poster","user_id":1349,"primary_group_id":41,"flair_group_id":41}]},{"fancy_title":"Ray is creating hundreds of logs files under /tmp/ray/session_latest/logs/ causing disk space issue and I/O Spikes","id":12058,"title":"Ray is creating hundreds of logs files under /tmp/ray/session_latest/logs/ causing disk space issue and I/O Spikes","slug":"ray-is-creating-hundreds-of-logs-files-under-tmp-ray-session-latest-logs-causing-disk-space-issue-and-i-o-spikes","posts_count":11,"reply_count":3,"highest_post_number":11,"image_url":null,"created_at":"2023-09-06T18:57:58.505Z","last_posted_at":"2025-10-22T07:56:23.570Z","bumped":true,"bumped_at":"2025-10-22T07:56:23.570Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":1379,"like_count":2,"has_summary":false,"last_poster_username":"RunLLM","category_id":6,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_have_answer":true,"can_vote":false,"posters":[{"extras":null,"description":"Original Poster","user_id":1827,"primary_group_id":null,"flair_group_id":null},{"extras":null,"description":"Frequent Poster","user_id":4487,"primary_group_id":null,"flair_group_id":null},{"extras":null,"description":"Frequent Poster","user_id":5221,"primary_group_id":null,"flair_group_id":null},{"extras":null,"description":"Frequent Poster","user_id":7446,"primary_group_id":null,"flair_group_id":null},{"extras":"latest","description":"Most Recent Poster","user_id":7472,"primary_group_id":41,"flair_group_id":41}]},{"fancy_title":"Running Multiple Ray Heads on Same Node - Safety &amp; Best Practices?","id":23234,"title":"Running Multiple Ray Heads on Same Node - Safety & Best Practices?","slug":"running-multiple-ray-heads-on-same-node-safety-best-practices","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2025-10-07T19:48:02.242Z","last_posted_at":"2025-10-07T19:48:02.303Z","bumped":true,"bumped_at":"2025-10-07T19:48:02.303Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":54,"like_count":0,"has_summary":false,"last_poster_username":"michaelripa","category_id":6,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_have_answer":true,"can_vote":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":7190,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"Ray Serve not distributing load to all replicas equally","id":22589,"title":"Ray Serve not distributing load to all replicas equally","slug":"ray-serve-not-distributing-load-to-all-replicas-equally","posts_count":5,"reply_count":3,"highest_post_number":5,"image_url":null,"created_at":"2025-06-03T03:17:08.208Z","last_posted_at":"2025-09-19T14:53:37.115Z","bumped":true,"bumped_at":"2025-09-19T14:53:37.115Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":131,"like_count":0,"has_summary":false,"last_poster_username":"manickavela29","category_id":6,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_have_answer":true,"can_vote":false,"posters":[{"extras":"latest","description":"Original Poster, Most Recent Poster","user_id":7217,"primary_group_id":null,"flair_group_id":null},{"extras":null,"description":"Frequent Poster","user_id":2809,"primary_group_id":41,"flair_group_id":41}]},{"fancy_title":"Non-linear throughput when scaling Ray Serve replicas","id":22959,"title":"Non-linear throughput when scaling Ray Serve replicas","slug":"non-linear-throughput-when-scaling-ray-serve-replicas","posts_count":4,"reply_count":2,"highest_post_number":4,"image_url":null,"created_at":"2025-08-07T15:47:19.789Z","last_posted_at":"2025-09-19T14:50:15.400Z","bumped":true,"bumped_at":"2025-09-19T14:50:15.400Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":111,"like_count":1,"has_summary":false,"last_poster_username":"manickavela29","category_id":6,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_have_answer":true,"can_vote":false,"posters":[{"extras":null,"description":"Original Poster","user_id":7368,"primary_group_id":null,"flair_group_id":null},{"extras":null,"description":"Frequent Poster","user_id":6812,"primary_group_id":41,"flair_group_id":3},{"extras":"latest","description":"Most Recent Poster","user_id":7217,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"FastAPI backend + Ray Core vs Ray Serve","id":22972,"title":"FastAPI backend + Ray Core vs Ray Serve","slug":"fastapi-backend-ray-core-vs-ray-serve","posts_count":2,"reply_count":0,"highest_post_number":2,"image_url":null,"created_at":"2025-08-10T07:06:11.595Z","last_posted_at":"2025-08-18T20:21:38.675Z","bumped":true,"bumped_at":"2025-08-18T20:21:38.675Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":97,"like_count":0,"has_summary":false,"last_poster_username":"christina","category_id":6,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_have_answer":true,"can_vote":false,"posters":[{"extras":null,"description":"Original Poster","user_id":7399,"primary_group_id":null,"flair_group_id":null},{"extras":"latest","description":"Most Recent Poster","user_id":6812,"primary_group_id":41,"flair_group_id":3}]},{"fancy_title":"Stop Ray Serve from overwriting LD_LIBRARY_PATH?","id":23014,"title":"Stop Ray Serve from overwriting LD_LIBRARY_PATH?","slug":"stop-ray-serve-from-overwriting-ld-library-path","posts_count":2,"reply_count":0,"highest_post_number":2,"image_url":null,"created_at":"2025-08-18T15:55:24.541Z","last_posted_at":"2025-08-18T16:24:25.112Z","bumped":true,"bumped_at":"2025-08-18T16:24:25.112Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":33,"like_count":0,"has_summary":false,"last_poster_username":"abrarsheikh","category_id":6,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_have_answer":true,"can_vote":false,"posters":[{"extras":null,"description":"Original Poster","user_id":7416,"primary_group_id":null,"flair_group_id":null},{"extras":"latest","description":"Most Recent Poster","user_id":7136,"primary_group_id":41,"flair_group_id":41}]},{"fancy_title":"Trouble deploying simple app with uv","id":23003,"title":"Trouble deploying simple app with uv","slug":"trouble-deploying-simple-app-with-uv","posts_count":2,"reply_count":0,"highest_post_number":2,"image_url":null,"created_at":"2025-08-15T14:32:07.636Z","last_posted_at":"2025-08-17T14:59:57.229Z","bumped":true,"bumped_at":"2025-08-17T14:59:57.229Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":91,"like_count":0,"has_summary":false,"last_poster_username":"Dominic_Laflamme","category_id":6,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_have_answer":true,"can_vote":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":7259,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"Ray Serve vLLM multiple models per GPU in tensor parallelism","id":22973,"title":"Ray Serve vLLM multiple models per GPU in tensor parallelism","slug":"ray-serve-vllm-multiple-models-per-gpu-in-tensor-parallelism","posts_count":2,"reply_count":0,"highest_post_number":2,"image_url":null,"created_at":"2025-08-10T11:18:50.147Z","last_posted_at":"2025-08-14T18:37:52.267Z","bumped":true,"bumped_at":"2025-08-14T18:37:52.267Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":395,"like_count":0,"has_summary":false,"last_poster_username":"kourosh","category_id":29,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_have_answer":true,"can_vote":false,"posters":[{"extras":null,"description":"Original Poster","user_id":7390,"primary_group_id":null,"flair_group_id":null},{"extras":"latest","description":"Most Recent Poster","user_id":2001,"primary_group_id":41,"flair_group_id":41}]},{"fancy_title":"Dynamically scaling","id":2260,"title":"Dynamically scaling","slug":"dynamically-scaling","posts_count":3,"reply_count":1,"highest_post_number":3,"image_url":null,"created_at":"2021-05-23T07:22:38.487Z","last_posted_at":"2025-08-13T09:13:00.301Z","bumped":true,"bumped_at":"2025-08-13T09:13:00.301Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":477,"like_count":0,"has_summary":false,"last_poster_username":"raphael","category_id":6,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_have_answer":true,"can_vote":false,"posters":[{"extras":null,"description":"Original Poster","user_id":763,"primary_group_id":null,"flair_group_id":null},{"extras":null,"description":"Frequent Poster","user_id":7,"primary_group_id":41,"flair_group_id":41},{"extras":"latest","description":"Most Recent Poster","user_id":7368,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"Integrating GradioIngress and non-gradio endpoints","id":11728,"title":"Integrating GradioIngress and non-gradio endpoints","slug":"integrating-gradioingress-and-non-gradio-endpoints","posts_count":4,"reply_count":1,"highest_post_number":4,"image_url":null,"created_at":"2023-08-09T14:44:47.880Z","last_posted_at":"2025-08-09T13:09:44.198Z","bumped":true,"bumped_at":"2025-08-09T13:09:44.198Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":535,"like_count":0,"has_summary":false,"last_poster_username":"Dominic_Laflamme","category_id":6,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_have_answer":true,"can_vote":false,"posters":[{"extras":null,"description":"Original Poster","user_id":3638,"primary_group_id":null,"flair_group_id":null},{"extras":null,"description":"Frequent Poster","user_id":332,"primary_group_id":41,"flair_group_id":41},{"extras":null,"description":"Frequent Poster","user_id":9,"primary_group_id":41,"flair_group_id":41},{"extras":"latest","description":"Most Recent Poster","user_id":7259,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"Ray Serve kubernetes service also uses Head pod","id":22947,"title":"Ray Serve kubernetes service also uses Head pod","slug":"ray-serve-kubernetes-service-also-uses-head-pod","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2025-08-06T09:12:42.130Z","last_posted_at":"2025-08-06T09:12:42.182Z","bumped":true,"bumped_at":"2025-08-06T09:12:42.182Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":30,"like_count":0,"has_summary":false,"last_poster_username":"mirage","category_id":6,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_have_answer":true,"can_vote":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":7307,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"How to download a model from an authenticated S3 storage?","id":22937,"title":"How to download a model from an authenticated S3 storage?","slug":"how-to-download-a-model-from-an-authenticated-s3-storage","posts_count":2,"reply_count":0,"highest_post_number":2,"image_url":null,"created_at":"2025-08-04T14:52:03.823Z","last_posted_at":"2025-08-04T19:26:16.968Z","bumped":true,"bumped_at":"2025-08-04T19:26:16.968Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":36,"like_count":0,"has_summary":false,"last_poster_username":"christina","category_id":6,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_have_answer":true,"can_vote":false,"posters":[{"extras":null,"description":"Original Poster","user_id":7376,"primary_group_id":null,"flair_group_id":null},{"extras":"latest","description":"Most Recent Poster","user_id":6812,"primary_group_id":41,"flair_group_id":3}]},{"fancy_title":"How to Expose Ray Serve API with proxy_location=&ldquo;EveryNode&rdquo; Outside the Cluster","id":22906,"title":"How to Expose Ray Serve API with proxy_location=\"EveryNode\" Outside the Cluster","slug":"how-to-expose-ray-serve-api-with-proxy-location-everynode-outside-the-cluster","posts_count":2,"reply_count":0,"highest_post_number":2,"image_url":null,"created_at":"2025-07-29T11:27:17.133Z","last_posted_at":"2025-08-01T23:48:06.031Z","bumped":true,"bumped_at":"2025-08-01T23:48:06.031Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":46,"like_count":1,"has_summary":false,"last_poster_username":"Akshay_Malik","category_id":6,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_have_answer":true,"can_vote":false,"posters":[{"extras":null,"description":"Original Poster","user_id":7368,"primary_group_id":null,"flair_group_id":null},{"extras":"latest","description":"Most Recent Poster","user_id":2809,"primary_group_id":41,"flair_group_id":41}]},{"fancy_title":"Ray Replica take more time to healthy than EKS Pod","id":22909,"title":"Ray Replica take more time to healthy than EKS Pod","slug":"ray-replica-take-more-time-to-healthy-than-eks-pod","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2025-07-29T22:47:22.309Z","last_posted_at":"2025-07-29T22:47:22.454Z","bumped":true,"bumped_at":"2025-07-29T22:47:22.454Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":35,"like_count":0,"has_summary":false,"last_poster_username":"mirage","category_id":6,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_have_answer":true,"can_vote":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":7307,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"Does Ray Serve support PDB in EKS / Kubernetes","id":22899,"title":"Does Ray Serve support PDB in EKS / Kubernetes","slug":"does-ray-serve-support-pdb-in-eks-kubernetes","posts_count":2,"reply_count":0,"highest_post_number":2,"image_url":null,"created_at":"2025-07-27T13:28:02.510Z","last_posted_at":"2025-07-28T19:54:48.535Z","bumped":true,"bumped_at":"2025-07-28T19:54:48.535Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":45,"like_count":0,"has_summary":false,"last_poster_username":"christina","category_id":6,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_have_answer":true,"can_vote":false,"posters":[{"extras":null,"description":"Original Poster","user_id":7307,"primary_group_id":null,"flair_group_id":null},{"extras":"latest","description":"Most Recent Poster","user_id":6812,"primary_group_id":41,"flair_group_id":3}]}]}}