logo

InferX AI Function Platform (Lambda Function for Inference)

    --   Serve tens of models in one box with ultra-fast (<2 sec) cold start (contact: support@inferx.net)



Snapshots

Snapshot Id nodename state gpu pageable pinned docker image name build id
public/BAAI/Aquila-7B/426#node3 node3 Ready {'0': 9669967872, '1': 8636071936} 1674 MB 8192 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/Deci/DeciLM-7B-instruct/230#node3 node3 Ready {'0': 12333350912, '1': 12067012608} 1518 MB 8192 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/Deci/DeciLM-7B/227#node3 node3 Ready {'0': 12333350912, '1': 12067012608} 1558 MB 8192 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/EleutherAI/pythia-12b/243#node3 node3 Ready {'0': 13082034176, '1': 12610174976} 1558 MB 9216 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/OpenAssistant/oasst-sft-4-pythia-12b-epoch-3.5/254#node3 node3 Ready {'0': 13075742720, '1': 12605980672} 2520 MB 9216 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/Qwen/Qwen2.5-1.5B/128#node3 node3 Ready {'0': 7956594688} 1314 MB 7168 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/Qwen/Qwen2.5-7B-Instruct-1M/138#node3 node3 Ready {'0': 13056868352, '1': 11528044544} 1570 MB 14336 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/Qwen/Qwen2.5-7B-Instruct-GPTQ-Int8/126#node3 node3 Ready {'0': 14090764288} 1310 MB 7168 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/Qwen/Qwen2.5-Coder-1.5B-Instruct/121#node3 node3 Ready {'0': 7509901312} 1310 MB 7168 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/Qwen/Qwen2.5-Coder-14B-Instruct-GPTQ-Int8/124#node3 node3 Ready {'0': 13073645568, '1': 11546918912} 1666 MB 12288 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/Qwen/Qwen2.5-Coder-3B/119#node3 node3 Ready {'0': 13411287040} 1310 MB 4608 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/Qwen/Qwen2.5-Coder-7B-Instruct/117#node3 node3 Ready {'0': 13063159808, '1': 11534336000} 1570 MB 14336 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/Qwen/Qwen2.5-Math-1.5B-Instruct/130#node3 node3 Ready {'0': 6987710464} 1330 MB 7168 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/Qwen/Qwen2.5-Math-1.5B/132#node3 node3 Ready {'0': 7990149120} 1314 MB 7168 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/Qwen/Qwen2.5-Math-7B-Instruct/134#node3 node3 Ready {'0': 13052674048, '1': 11523850240} 1570 MB 14336 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/Qwen/Qwen2.5-Math-7B/136#node3 node3 Ready {'0': 13052674048, '1': 11523850240} 1594 MB 14336 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/Salesforce/codegen-2B-multi/278#node3 node3 Ready {'0': 5670699008} 542 MB 0 MB vllm-openai-upgraded:v0.1.0 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/THUDM/chatglm3-6b-128k/148#node3 node3 Ready {'0': 14380171264} 1260 MB 7168 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/THUDM/chatglm3-6b-32k/146#node3 node3 Ready {'0': 14409531392} 1098 MB 7168 MB vllm/vllm-openai:v0.4.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/THUDM/chatglm3-6b/144#node3 node3 Ready {'0': 14355005440} 1256 MB 7168 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/TinyLlama/TinyLlama-1.1B-Chat-v1.0/100#node3 node3 Ready {'0': 5970591744} 1254 MB 5632 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/TinyLlama/TinyLlama-1.1B-Chat-v1.0_13GB/106#node3 node3 Ready {'0': 13214154752} 1254 MB 5632 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/TinyLlama/TinyLlama-1.1B-Chat-v1.0_2gpu/109#node3 node3 Ready {'0': 13046382592, '1': 12746489856} 1546 MB 11264 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/allenai/OLMo-1B-hf/257#node3 node3 Ready {'0': 13065256960} 1270 MB 4096 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/allenai/OLMo-7B-hf/259#node3 node3 Ready {'0': 13077839872, '1': 12608077824} 1758 MB 8192 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/baichuan-inc/Baichuan-7B/158#node3 node3 Ready {'0': 13100908544, '1': 12505317376} 1566 MB 8192 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/baichuan-inc/Baichuan2-7B-Chat/160#node3 node3 Ready {'0': 13103005696, '1': 11804868608} 1890 MB 8192 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/bigcode/starcoder2-3b/284#node3 node3 Ready {'0': 13048479744} 1278 MB 7680 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/bigcode/starcoder2-7b/359#node3 node3 Ready {'0': 13046382592, '1': 12591300608} 1634 MB 8192 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/databricks/dolly-v2-12b/251#node3 node3 Ready {'0': 14673772544, '1': 14204010496} 2272 MB 9216 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/deepseek-ai/DeepSeek-R1-Distill-Llama-8B/262#node3 node3 Ready {'0': 13086228480, '1': 11765022720} 1644 MB 8192 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B/264#node3 node3 Ready {'0': 12534677504} 1354 MB 7168 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B/266#node3 node3 Ready {'0': 13079937024, '1': 11551113216} 1638 MB 14336 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/deepseek-ai/deepseek-llm-7b-chat/268#node3 node3 Ready {'0': 13071548416, '1': 12018778112} 1612 MB 15360 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/deepseek-ai/deepseek-math-7b-instruct/271#node3 node3 Ready {'0': 13071548416, '1': 12018778112} 1816 MB 15360 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/facebook/opt-iml-max-1.3b/113#node3 node3 Ready {'0': 3615490048} 1246 MB 6144 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/llava-hf/llava-1.5-7b-hf/281#node3 node3 Ready {'0': 14623440896} 584 MB 0 MB vllm-openai-upgraded:v0.1.0 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/microsoft/Phi-3-mini-128k-instruct/172#node3 node3 Ready {'0': 12708741120} 1246 MB 4096 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/microsoft/Phi-3-mini-4k-instruct/170#node3 node3 Ready {'0': 12696158208} 1250 MB 4096 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/mosaicml/mpt-7b-storywriter/349#node3 node3 Ready {'0': 13058965504, '1': 12587106304} 1984 MB 8192 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/mosaicml/mpt-7b/165#node3 node3 Ready {'0': 13058965504, '1': 12587106304} 1872 MB 8192 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/nomic-ai/gpt4all-j/240#node3 node3 Ready {'0': 13067354112, '1': 12597592064} 1562 MB 14336 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/openai-community/gpt2-xl/237#node3 node3 Ready {'0': 11444158464} 1390 MB 6144 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/openbmb/MiniCPM-2B-dpo-bf16/246#node3 node3 Ready {'0': 13100908544} 1304 MB 5120 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/openbmb/MiniCPM-2B-sft-bf16/248#node3 node3 Ready {'0': 8738832384} 1304 MB 5120 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]
public/tiiuae/falcon-rw-7b/234#node3 node3 Ready {'0': 13077839872, '1': 12471762944} 1526 MB 9216 MB vllm/vllm-openai:v0.6.2 [34, 121, 77, 38, 80, 210, 154, 247, 143, 238, 177, 92, 243, 246, 34, 235, 189, 139, 138, 34]