logo

InferX AI Function Platform (Lambda Function for Inference)

    --   Serve tens of models in one box with ultra-fast (<2 sec) cold start (contact: support@inferx.net)



Pods

tenant namespace pod name state Node name Req Gpu Count Req Gpu vRam Type Standby (gpu / pageable / pinned) allocated GPU vRam (MB) allocated GPU Slots
public BAAI public/BAAI/Aquila-7B/426/915 Standby node3 2 10000 MB Restore Blob : 17458 MB Blob : 1674 MB Blob : 8192 MB 0 {}
public Deci public/Deci/DeciLM-7B-instruct/230/916 Standby node3 2 13000 MB Restore Blob : 23270 MB Blob : 1518 MB Blob : 8192 MB 0 {}
public Deci public/Deci/DeciLM-7B/227/917 Standby node3 2 13000 MB Restore Blob : 23270 MB Blob : 1558 MB Blob : 8192 MB 0 {}
public EleutherAI public/EleutherAI/pythia-12b/243/964 Standby node3 2 13800 MB Restore Blob : 24502 MB Blob : 1558 MB Blob : 9216 MB 0 {}
public OpenAssistant public/OpenAssistant/oasst-sft-4-pythia-12b-epoch-3.5/254/919 Standby node3 2 13800 MB Restore Blob : 24492 MB Blob : 2520 MB Blob : 9216 MB 0 {}
public Qwen public/Qwen/Qwen2.5-1.5B/128/920 Ready node3 1 8000 MB Restore Blob : 7588 MB Blob : 1314 MB Blob : 7168 MB 8192 {'1': {'contextCnt': 1, 'slotCnt': 32}}
public Qwen public/Qwen/Qwen2.5-7B-Instruct-1M/138/963 Standby node3 2 13800 MB Restore Blob : 23446 MB Blob : 1570 MB Blob : 14336 MB 0 {}
public Qwen public/Qwen/Qwen2.5-7B-Instruct-GPTQ-Int8/126/965 Standby node3 1 13500 MB Restore Blob : 13438 MB Blob : 1310 MB Blob : 7168 MB 0 {}
public Qwen public/Qwen/Qwen2.5-Coder-1.5B-Instruct/121/923 Standby node3 1 7500 MB Restore Blob : 7162 MB Blob : 1310 MB Blob : 7168 MB 0 {}
public Qwen public/Qwen/Qwen2.5-Coder-14B-Instruct-GPTQ-Int8/124/966 Standby node3 2 13800 MB Restore Blob : 23480 MB Blob : 1666 MB Blob : 12288 MB 0 {}
public Qwen public/Qwen/Qwen2.5-Coder-3B/119/925 Standby node3 1 13800 MB Restore Blob : 12790 MB Blob : 1310 MB Blob : 4608 MB 0 {}
public Qwen public/Qwen/Qwen2.5-Coder-7B-Instruct/117/926 Standby node3 2 13800 MB Restore Blob : 23458 MB Blob : 1570 MB Blob : 14336 MB 0 {}
public Qwen public/Qwen/Qwen2.5-Math-1.5B-Instruct/130/927 Standby node3 1 7000 MB Restore Blob : 6664 MB Blob : 1330 MB Blob : 7168 MB 0 {}
public Qwen public/Qwen/Qwen2.5-Math-1.5B/132/928 Ready node3 1 8000 MB Restore Blob : 7620 MB Blob : 1314 MB Blob : 7168 MB 8192 {'0': {'contextCnt': 1, 'slotCnt': 32}}
public Qwen public/Qwen/Qwen2.5-Math-7B-Instruct/134/929 Standby node3 2 13800 MB Restore Blob : 23438 MB Blob : 1570 MB Blob : 14336 MB 0 {}
public Qwen public/Qwen/Qwen2.5-Math-7B/136/930 Standby node3 2 13800 MB Restore Blob : 23438 MB Blob : 1594 MB Blob : 14336 MB 0 {}
public Salesforce public/Salesforce/codegen-2B-multi/278/931 Standby node3 1 13000 MB Restore Blob : 5408 MB Blob : 542 MB Blob : 0 MB 0 {}
public THUDM public/THUDM/chatglm3-6b-128k/148/932 Standby node3 1 13800 MB Restore Blob : 13714 MB Blob : 1260 MB Blob : 7168 MB 0 {}
public THUDM public/THUDM/chatglm3-6b-32k/146/933 Standby node3 1 13800 MB Restore Blob : 13742 MB Blob : 1098 MB Blob : 7168 MB 0 {}
public THUDM public/THUDM/chatglm3-6b/144/934 Standby node3 1 13800 MB Restore Blob : 13690 MB Blob : 1256 MB Blob : 7168 MB 0 {}
public TinyLlama public/TinyLlama/TinyLlama-1.1B-Chat-v1.0/100/935 Standby node3 1 6000 MB Restore Blob : 5694 MB Blob : 1254 MB Blob : 5632 MB 0 {}
public TinyLlama public/TinyLlama/TinyLlama-1.1B-Chat-v1.0_13GB/106/936 Standby node3 1 13800 MB Restore Blob : 12602 MB Blob : 1254 MB Blob : 5632 MB 0 {}
public TinyLlama public/TinyLlama/TinyLlama-1.1B-Chat-v1.0_2gpu/109/937 Standby node3 2 13800 MB Restore Blob : 24598 MB Mem : 1546 MB Blob : 11264 MB 0 {}
public allenai public/allenai/OLMo-1B-hf/257/938 Standby node3 1 13800 MB Restore Blob : 12460 MB Blob : 1270 MB Blob : 4096 MB 0 {}
public allenai public/allenai/OLMo-7B-hf/259/939 Standby node3 2 13800 MB Restore Blob : 24496 MB Blob : 1758 MB Blob : 8192 MB 0 {}
public baichuan-inc public/baichuan-inc/Baichuan-7B/158/940 Standby node3 2 13800 MB Restore Blob : 24420 MB Blob : 1566 MB Blob : 8192 MB 0 {}
public baichuan-inc public/baichuan-inc/Baichuan2-7B-Chat/160/941 Standby node3 2 13800 MB Restore Blob : 23754 MB Blob : 1890 MB Blob : 8192 MB 0 {}
public bigcode public/bigcode/starcoder2-3b/284/942 Standby node3 1 13800 MB Restore Blob : 12444 MB Blob : 1278 MB Blob : 7680 MB 0 {}
public bigcode public/bigcode/starcoder2-7b/359/943 Standby node3 2 13800 MB Restore Blob : 24450 MB Blob : 1634 MB Blob : 8192 MB 0 {}
public databricks public/databricks/dolly-v2-12b/251/944 Standby node3 2 14000 MB Restore Blob : 27540 MB Blob : 2272 MB Blob : 9216 MB 0 {}
public deepseek-ai public/deepseek-ai/DeepSeek-R1-Distill-Llama-8B/262/945 Standby node3 2 13800 MB Restore Blob : 23700 MB Blob : 1644 MB Blob : 8192 MB 0 {}
public deepseek-ai public/deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B/264/946 Standby node3 1 13000 MB Restore Blob : 11954 MB Blob : 1354 MB Blob : 7168 MB 0 {}
public deepseek-ai public/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B/266/947 Standby node3 2 13800 MB Restore Blob : 23490 MB Blob : 1638 MB Blob : 14336 MB 0 {}
public deepseek-ai public/deepseek-ai/deepseek-llm-7b-chat/268/948 Standby node3 2 13800 MB Restore Blob : 23928 MB Blob : 1612 MB Blob : 15360 MB 0 {}
public deepseek-ai public/deepseek-ai/deepseek-math-7b-instruct/271/949 Standby node3 2 13800 MB Restore Blob : 23928 MB Blob : 1816 MB Blob : 15360 MB 0 {}
public facebook public/facebook/opt-iml-max-1.3b/113/950 Standby node3 1 3800 MB Restore Mem : 3448 MB File : 1246 MB Mem : 6144 MB 0 {}
public llava-hf public/llava-hf/llava-1.5-7b-hf/281/952 Standby node3 1 14000 MB Restore Blob : 13946 MB Blob : 584 MB Blob : 0 MB 0 {}
public microsoft public/microsoft/Phi-3-mini-128k-instruct/172/953 Standby node3 1 13000 MB Restore Blob : 12120 MB Blob : 1246 MB Blob : 4096 MB 0 {}
public microsoft public/microsoft/Phi-3-mini-4k-instruct/170/954 Standby node3 1 13000 MB Restore Blob : 12108 MB Blob : 1250 MB Blob : 4096 MB 0 {}
public mosaicml public/mosaicml/mpt-7b-storywriter/349/955 Standby node3 2 13800 MB Restore Blob : 24458 MB Blob : 1984 MB Blob : 8192 MB 0 {}
public mosaicml public/mosaicml/mpt-7b/165/956 Standby node3 2 13800 MB Restore Blob : 24458 MB Blob : 1872 MB Blob : 8192 MB 0 {}
public nomic-ai public/nomic-ai/gpt4all-j/240/957 Standby node3 2 13800 MB Restore Blob : 24476 MB Blob : 1562 MB Blob : 14336 MB 0 {}
public openai-community public/openai-community/gpt2-xl/237/958 Standby node3 1 12000 MB Restore Blob : 10914 MB Blob : 1390 MB Blob : 6144 MB 0 {}
public openbmb public/openbmb/MiniCPM-2B-dpo-bf16/246/959 Standby node3 1 13800 MB Restore Blob : 12494 MB Blob : 1304 MB Blob : 5120 MB 0 {}
public openbmb public/openbmb/MiniCPM-2B-sft-bf16/248/960 Standby node3 1 9000 MB Restore Blob : 8334 MB Blob : 1304 MB Blob : 5120 MB 0 {}
public tiiuae public/tiiuae/falcon-rw-7b/234/961 Standby node3 2 13800 MB Restore Blob : 24366 MB Blob : 1526 MB Blob : 9216 MB 0 {}