Skip to content
Closed
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
3 changes: 3 additions & 0 deletions .gitignore
Original file line number Diff line number Diff line change
Expand Up @@ -43,3 +43,6 @@ run-parallel-tests/
inference-chain/proto/github.com/
inference-chain/proto/api/
inference-chain/proto/**/module/*.pb.go

# Generated JSONLs
mlnode/packages/benchmarks/data/inference_results/*
3 changes: 2 additions & 1 deletion mlnode/.gitignore
Original file line number Diff line number Diff line change
Expand Up @@ -162,4 +162,5 @@ cython_debug/
#.idea/

**/*.jsonl
**/*.sqlite
**/*.sqlite
*.DS_Store

Large diffs are not rendered by default.

Large diffs are not rendered by default.

Large diffs are not rendered by default.

Original file line number Diff line number Diff line change
@@ -0,0 +1,89 @@
{
"timestamp": "2026-04-26T23:24:42.478379",
"artifact_dir": "/root/vlm-res/validation/fp8-enf_a100-h100",
"source_inference_artifact": "/root/vlm-res/inference/fp8-free_a100/inference_results.jsonl",
"validation_artifact": "/root/vlm-res/validation/fp8-enf_a100-h100/validation_results.jsonl",
"n_items": 1000,
"validation_model_info": {
"name": "/dev/shm/Qwen3-VL-235B-A22B-Instruct-FP8/",
"url": "http://localhost:8801/",
"deploy_params": {}
},
"request_params": {
"max_tokens": 3000,
"temperature": 0.99,
"seed": 42,
"additional_params": {},
"top_logprobs": 5,
"top_p": null,
"top_k": null,
"repetition_penalty": null,
"timeout_seconds": 300,
"retries_max_attempts": 3,
"retry_backoff_seconds_start": 1.0,
"retry_backoff_multiplier": 2.0
},
"vllm_runtime_probe": {
"base_url": "http://localhost:8801",
"models_url": "http://localhost:8801/v1/models",
"served_model_ids": [
"/dev/shm/Qwen3-VL-235B-A22B-Instruct-FP8/"
],
"raw_models_response": {
"object": "list",
"data": [
{
"id": "/dev/shm/Qwen3-VL-235B-A22B-Instruct-FP8/",
"object": "model",
"created": 1777245882,
"owned_by": "vllm",
"root": "/dev/shm/Qwen3-VL-235B-A22B-Instruct-FP8/",
"parent": null,
"max_model_len": 128000,
"permission": [
{
"id": "modelperm-bbf7c8fcbcb91ca1",
"object": "model_permission",
"created": 1777245882,
"allow_create_engine": false,
"allow_sampling": true,
"allow_logprobs": true,
"allow_search_indices": false,
"allow_view": true,
"allow_fine_tuning": false,
"organization": "*",
"group": null,
"is_blocking": false
}
]
}
]
},
"health_status_code": 200,
"version_status_code": 200,
"version_body": "{\"version\":\"0.8.2.dev8106+g9a6d76e05\"}",
"timestamp": "2026-04-26T23:24:42.478244"
},
"config_check_passed": true,
"config_diff_keys": [],
"cli": {
"validation_url": "http://localhost:8801",
"validation_model": "",
"max_workers": 64,
"wait_timeout_s": 120,
"max_attempts": 3,
"retry_backoff_start_s": 1.0,
"retry_backoff_mult": 2.0,
"artifact_tag": "",
"api_key_set": false,
"images_dir": "/root/flickr8k_images/test",
"fallback_images_count": 1000
},
"performance": {
"total_time_seconds": 244.051,
"n_prompts": 1000,
"total_output_tokens": 324684,
"output_tokens_per_second": 1330.39,
"average_time_per_prompt_seconds": 0.244
}
}
Original file line number Diff line number Diff line change
@@ -0,0 +1,89 @@
{
"timestamp": "2026-04-26T23:14:03.637249",
"artifact_dir": "/root/vlm-res/validation/fp8-enf_h100-h100",
"source_inference_artifact": "/root/vlm-res/inference/fp8-free_h100/inference_results.jsonl",
"validation_artifact": "/root/vlm-res/validation/fp8-enf_h100-h100/validation_results.jsonl",
"n_items": 1000,
"validation_model_info": {
"name": "/dev/shm/Qwen3-VL-235B-A22B-Instruct-FP8/",
"url": "http://localhost:8801/",
"deploy_params": {}
},
"request_params": {
"max_tokens": 3000,
"temperature": 0.99,
"seed": 42,
"additional_params": {},
"top_logprobs": 5,
"top_p": null,
"top_k": null,
"repetition_penalty": null,
"timeout_seconds": 300,
"retries_max_attempts": 3,
"retry_backoff_seconds_start": 1.0,
"retry_backoff_multiplier": 2.0
},
"vllm_runtime_probe": {
"base_url": "http://localhost:8801",
"models_url": "http://localhost:8801/v1/models",
"served_model_ids": [
"/dev/shm/Qwen3-VL-235B-A22B-Instruct-FP8/"
],
"raw_models_response": {
"object": "list",
"data": [
{
"id": "/dev/shm/Qwen3-VL-235B-A22B-Instruct-FP8/",
"object": "model",
"created": 1777245243,
"owned_by": "vllm",
"root": "/dev/shm/Qwen3-VL-235B-A22B-Instruct-FP8/",
"parent": null,
"max_model_len": 128000,
"permission": [
{
"id": "modelperm-aa87599cedc6d538",
"object": "model_permission",
"created": 1777245243,
"allow_create_engine": false,
"allow_sampling": true,
"allow_logprobs": true,
"allow_search_indices": false,
"allow_view": true,
"allow_fine_tuning": false,
"organization": "*",
"group": null,
"is_blocking": false
}
]
}
]
},
"health_status_code": 200,
"version_status_code": 200,
"version_body": "{\"version\":\"0.8.2.dev8106+g9a6d76e05\"}",
"timestamp": "2026-04-26T23:14:03.637111"
},
"config_check_passed": true,
"config_diff_keys": [],
"cli": {
"validation_url": "http://localhost:8801",
"validation_model": "",
"max_workers": 64,
"wait_timeout_s": 120,
"max_attempts": 3,
"retry_backoff_start_s": 1.0,
"retry_backoff_mult": 2.0,
"artifact_tag": "",
"api_key_set": false,
"images_dir": "/root/flickr8k_images/test",
"fallback_images_count": 1000
},
"performance": {
"total_time_seconds": 242.129,
"n_prompts": 1000,
"total_output_tokens": 323716,
"output_tokens_per_second": 1336.95,
"average_time_per_prompt_seconds": 0.242
}
}
Original file line number Diff line number Diff line change
@@ -0,0 +1,89 @@
{
"timestamp": "2026-04-26T23:19:36.261055",
"artifact_dir": "/root/vlm-res/validation/int4-enf_h100-h100",
"source_inference_artifact": "/root/vlm-res/inference/int4-free_h100/inference_results.jsonl",
"validation_artifact": "/root/vlm-res/validation/int4-enf_h100-h100/validation_results.jsonl",
"n_items": 1000,
"validation_model_info": {
"name": "/dev/shm/Qwen3-VL-235B-A22B-Instruct-FP8/",
"url": "http://localhost:8801/",
"deploy_params": {}
},
"request_params": {
"max_tokens": 3000,
"temperature": 0.99,
"seed": 42,
"additional_params": {},
"top_logprobs": 5,
"top_p": null,
"top_k": null,
"repetition_penalty": null,
"timeout_seconds": 300,
"retries_max_attempts": 3,
"retry_backoff_seconds_start": 1.0,
"retry_backoff_multiplier": 2.0
},
"vllm_runtime_probe": {
"base_url": "http://localhost:8801",
"models_url": "http://localhost:8801/v1/models",
"served_model_ids": [
"/dev/shm/Qwen3-VL-235B-A22B-Instruct-FP8/"
],
"raw_models_response": {
"object": "list",
"data": [
{
"id": "/dev/shm/Qwen3-VL-235B-A22B-Instruct-FP8/",
"object": "model",
"created": 1777245576,
"owned_by": "vllm",
"root": "/dev/shm/Qwen3-VL-235B-A22B-Instruct-FP8/",
"parent": null,
"max_model_len": 128000,
"permission": [
{
"id": "modelperm-8bb8cc4fd73a2099",
"object": "model_permission",
"created": 1777245576,
"allow_create_engine": false,
"allow_sampling": true,
"allow_logprobs": true,
"allow_search_indices": false,
"allow_view": true,
"allow_fine_tuning": false,
"organization": "*",
"group": null,
"is_blocking": false
}
]
}
]
},
"health_status_code": 200,
"version_status_code": 200,
"version_body": "{\"version\":\"0.8.2.dev8106+g9a6d76e05\"}",
"timestamp": "2026-04-26T23:19:36.260908"
},
"config_check_passed": true,
"config_diff_keys": [],
"cli": {
"validation_url": "http://localhost:8801",
"validation_model": "",
"max_workers": 64,
"wait_timeout_s": 120,
"max_attempts": 3,
"retry_backoff_start_s": 1.0,
"retry_backoff_mult": 2.0,
"artifact_tag": "",
"api_key_set": false,
"images_dir": "/root/flickr8k_images/test",
"fallback_images_count": 1000
},
"performance": {
"total_time_seconds": 231.601,
"n_prompts": 1000,
"total_output_tokens": 309206,
"output_tokens_per_second": 1335.08,
"average_time_per_prompt_seconds": 0.232
}
}
Loading
Loading