logo

InferX AI Function Platform (Lambda Function for Inference)

    --   Serve tens of models in one box with ultra-fast (<2 sec) cold start (contact: support@inferx.net)

Action

Snapshots

Snapshot Id nodename state gpu pageable pinned docker image name build id
public/BAAI/Aquila-7B/172#node2 node2 Ready {'0': 12702449664, '1': 11668553728} 1670 MB 8192 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/Deci/DeciLM-7B/190#node2 node2 Ready {'0': 12694061056, '1': 12427722752} 1574 MB 8192 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/EleutherAI/pythia-12b/205#node2 node2 Ready {'0': 13547601920, '1': 13075742720} 1546 MB 9216 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/OpenAssistant/oasst-sft-4-pythia-12b-epoch-3.5/216#node2 node2 Ready {'0': 13075742720, '1': 12605980672} 2196 MB 9216 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/Qwen/Qwen2.5-1.5B/146#node2 node2 Ready {'0': 7956594688} 1314 MB 7168 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/Qwen/Qwen2.5-7B-Instruct-1M/156#node2 node2 Ready {'0': 13467910144, '1': 11936989184} 1586 MB 14336 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/Qwen/Qwen2.5-7B-Instruct-GPTQ-Int8/144#node2 node2 Ready {'0': 13803454464} 1314 MB 7168 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/Qwen/Qwen2.5-Coder-1.5B-Instruct/1208#node2 node2 Ready {'0': 6041894912} 1314 MB 7168 MB vllm/vllm-openai:v0.6.2 [11, 149, 111, 145, 17, 231, 165, 63, 205, 24, 31, 149, 89, 235, 58, 88, 209, 98, 225, 173]
public/Qwen/Qwen2.5-Coder-14B-Instruct-GPTQ-Int8/142#node2 node2 Ready {'0': 14090764288, '1': 12564037632} 1626 MB 12288 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/Qwen/Qwen2.5-Coder-3B/137#node2 node2 Ready {'0': 10089398272} 1310 MB 4608 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/Qwen/Qwen2.5-Coder-7B-Instruct/140#node2 node2 Ready {'0': 13474201600, '1': 11943280640} 1574 MB 14336 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/Qwen/Qwen2.5-Math-1.5B-Instruct/825#node2 node2 Ready {'0': 7985954816} 1338 MB 7168 MB vllm/vllm-openai:v0.6.2 [11, 149, 111, 145, 17, 231, 165, 63, 205, 24, 31, 149, 89, 235, 58, 88, 209, 98, 225, 173]
public/Qwen/Qwen2.5-Math-1.5B/150#node2 node2 Ready {'0': 7990149120} 1314 MB 7168 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/Qwen/Qwen2.5-Math-7B-Instruct/841#node2 node2 Ready {'0': 13461618688, '1': 11932794880} 1574 MB 14336 MB vllm/vllm-openai:v0.6.2 [11, 149, 111, 145, 17, 231, 165, 63, 205, 24, 31, 149, 89, 235, 58, 88, 209, 98, 225, 173]
public/Qwen/Qwen2.5-Math-7B/154#node2 node2 Ready {'0': 13461618688, '1': 11932794880} 1586 MB 14336 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/Salesforce/codegen-2B-multi/239#node2 node2 Ready {'0': 5670699008} 538 MB 0 MB vllm-openai-upgraded:v0.1.0 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/THUDM/chatglm3-6b-128k/164#node2 node2 Ready {'0': 14380171264} 1264 MB 7168 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/THUDM/chatglm3-6b-32k/162#node2 node2 Ready {'0': 14409531392} 1102 MB 7168 MB vllm/vllm-openai:v0.4.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/THUDM/chatglm3-6b/160#node2 node2 Ready {'0': 14355005440} 1264 MB 7168 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/allenai/OLMo-1B-hf/219#node2 node2 Ready {'0': 14346616832} 1274 MB 4096 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/allenai/OLMo-1B-hf_2gpu/221#node2 node2 Ready {'0': 14162067456, '1': 13665042432} 1634 MB 8192 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/allenai/OLMo-7B-hf/223#node2 node2 Ready {'0': 13472104448, '1': 13002342400} 1790 MB 8192 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/baichuan-inc/Baichuan-7B/175#node2 node2 Ready {'0': 13449035776, '1': 12853444608} 1590 MB 8192 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/baichuan-inc/Baichuan2-7B-Chat/177#node2 node2 Ready {'0': 13451132928, '1': 12152995840} 1870 MB 8192 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/bigcode/starcoder2-3b/242#node2 node2 Ready {'0': 13428064256} 1298 MB 7680 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/bigcode/starcoder2-7b/244#node2 node2 Ready {'0': 13419675648, '1': 12941524992} 1534 MB 8192 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/databricks/dolly-v2-12b/213#node2 node2 Ready {'0': 14673772544, '1': 14204010496} 2420 MB 9216 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/deepseek-ai/DeepSeek-R1-Distill-Llama-8B/230#node2 node2 Ready {'0': 13472104448, '1': 12150898688} 1684 MB 8192 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B/232#node2 node2 Ready {'0': 12534677504} 1362 MB 7168 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B/234#node2 node2 Ready {'0': 13488881664, '1': 11960057856} 1630 MB 14336 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/deepseek-ai/deepseek-llm-7b-chat/226#node2 node2 Ready {'0': 15464398848} 1304 MB 7680 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/deepseek-ai/deepseek-llm-7b-chat_2gpu/228#node2 node2 Ready {'0': 13922992128, '1': 12870221824} 1784 MB 15360 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/deepseek-ai/deepseek-math-7b-instruct/236#node2 node2 Ready {'0': 13421772800, '1': 12366905344} 1888 MB 15360 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/facebook/opt-iml-max-1.3b/127#node2 node2 Ready {'0': 3810525184} 1254 MB 6144 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/microsoft/Phi-3-mini-128k-instruct/187#node2 node2 Ready {'0': 12708741120} 1254 MB 4096 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/microsoft/Phi-3-mini-4k-instruct/185#node2 node2 Ready {'0': 12696158208} 1258 MB 4096 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/mosaicml/mpt-7b-storywriter/182#node2 node2 Ready {'0': 13386121216, '1': 12914262016} 1892 MB 8192 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/mosaicml/mpt-7b/180#node2 node2 Ready {'0': 13386121216, '1': 12914262016} 1880 MB 8192 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/nomic-ai/gpt4all-j/202#node2 node2 Ready {'0': 13335789568, '1': 12857638912} 1570 MB 14336 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/openai-community/gpt2-xl/196#node2 node2 Ready {'0': 11630804992} 1386 MB 6144 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/openbmb/MiniCPM-2B-dpo-bf16/208#node2 node2 Ready {'0': 13321109504} 1308 MB 5120 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/openbmb/MiniCPM-2B-sft-bf16/210#node2 node2 Ready {'0': 8959033344} 1308 MB 5120 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]
public/tiiuae/falcon-rw-7b/193#node2 node2 Ready {'0': 13484687360, '1': 12878610432} 1538 MB 9216 MB vllm/vllm-openai:v0.6.2 [43, 39, 201, 188, 250, 119, 64, 240, 112, 67, 55, 122, 34, 122, 33, 57, 101, 188, 202, 126]