logo

InferX AI Function Platform (Lambda Function for Inference)

    --   Serve tens of models in one box with ultra-fast (<2 sec) cold start (contact: support@inferx.net)

Action

Pods

tenant | namespace | pod name | state | Node name | Req Gpu Count | Req Gpu vRam | Type | Standby (gpu) | Standby (pageable) | Standby (pinned) | allocated GPU vRam (MB) | allocated GPU Slots
public BAAI public/BAAI/Aquila-7B/172/1218 Standby node2 2 13000 MB Restore Blob : 23242 MB Blob : 1670 MB Blob : 8192 MB 0 {}
public Deci public/Deci/DeciLM-7B/190/1219 Standby node2 2 13000 MB Restore Blob : 23958 MB Blob : 1574 MB Blob : 8192 MB 0 {}
public EleutherAI public/EleutherAI/pythia-12b/205/1196 Standby node2 2 14200 MB Restore Blob : 25390 MB Blob : 1546 MB Blob : 9216 MB 0 {}
public OpenAssistant public/OpenAssistant/oasst-sft-4-pythia-12b-epoch-3.5/216/1151 Standby node2 2 13800 MB Restore Blob : 24492 MB Blob : 2196 MB Blob : 9216 MB 0 {}
public Qwen public/Qwen/Qwen2.5-1.5B/146/1152 Standby node2 1 8000 MB Restore Blob : 7588 MB Blob : 1314 MB Blob : 7168 MB 0 {}
public Qwen public/Qwen/Qwen2.5-7B-Instruct-1M/156/1213 Standby node2 2 13800 MB Restore Blob : 24228 MB Blob : 1586 MB Blob : 14336 MB 0 {}
public Qwen public/Qwen/Qwen2.5-7B-Instruct-GPTQ-Int8/144/1154 Standby node2 1 14200 MB Restore Blob : 13164 MB Blob : 1314 MB Blob : 7168 MB 0 {}
public Qwen public/Qwen/Qwen2.5-Coder-1.5B-Instruct/1208/1220 Standby node2 1 6000 MB Restore Blob : 5762 MB Blob : 1314 MB Blob : 7168 MB 0 {}
public Qwen public/Qwen/Qwen2.5-Coder-14B-Instruct-GPTQ-Int8/142/1228 Standby node2 2 13800 MB Restore Blob : 25420 MB Blob : 1626 MB Blob : 12288 MB 0 {}
public Qwen public/Qwen/Qwen2.5-Coder-3B/137/1222 Standby node2 1 10000 MB Restore Blob : 9622 MB Blob : 1310 MB Blob : 4608 MB 0 {}
public Qwen public/Qwen/Qwen2.5-Coder-7B-Instruct/140/1224 Standby node2 2 13800 MB Restore Blob : 24240 MB Blob : 1574 MB Blob : 14336 MB 0 {}
public Qwen public/Qwen/Qwen2.5-Math-1.5B-Instruct/825/1227 Standby node2 1 8000 MB Restore Blob : 7616 MB Blob : 1338 MB Blob : 7168 MB 0 {}
public Qwen public/Qwen/Qwen2.5-Math-1.5B/150/1215 Standby node2 1 8000 MB Restore Blob : 7620 MB Blob : 1314 MB Blob : 7168 MB 0 {}
public Qwen public/Qwen/Qwen2.5-Math-7B-Instruct/841/1161 Standby node2 2 13800 MB Restore Blob : 24218 MB Blob : 1574 MB Blob : 14336 MB 0 {}
public Qwen public/Qwen/Qwen2.5-Math-7B/154/1203 Standby node2 2 13800 MB Restore Blob : 24218 MB Blob : 1586 MB Blob : 14336 MB 0 {}
public Salesforce public/Salesforce/codegen-2B-multi/239/1163 Standby node2 1 13000 MB Restore Blob : 5408 MB Blob : 538 MB Blob : 0 MB 0 {}
public THUDM public/THUDM/chatglm3-6b-128k/164/1164 Standby node2 1 13800 MB Restore Blob : 13714 MB Blob : 1264 MB Blob : 7168 MB 0 {}
public THUDM public/THUDM/chatglm3-6b-32k/162/1165 Standby node2 1 13800 MB Restore Blob : 13742 MB Blob : 1102 MB Blob : 7168 MB 0 {}
public THUDM public/THUDM/chatglm3-6b/160/1201 Standby node2 1 13800 MB Restore Blob : 13690 MB Blob : 1264 MB Blob : 7168 MB 0 {}
public allenai public/allenai/OLMo-1B-hf/219/1170 Standby node2 1 14600 MB Restore Blob : 13682 MB Blob : 1274 MB Blob : 4096 MB 0 {}
public allenai public/allenai/OLMo-1B-hf_2gpu/221/1226 Standby node2 2 14600 MB Restore Blob : 26538 MB Blob : 1634 MB Blob : 8192 MB 0 {}
public allenai public/allenai/OLMo-7B-hf/223/1172 Standby node2 2 13800 MB Restore Blob : 25248 MB Blob : 1790 MB Blob : 8192 MB 0 {}
public baichuan-inc public/baichuan-inc/Baichuan-7B/175/1211 Standby node2 2 13800 MB Restore Blob : 25084 MB Blob : 1590 MB Blob : 8192 MB 0 {}
public baichuan-inc public/baichuan-inc/Baichuan2-7B-Chat/177/1174 Standby node2 2 13800 MB Restore Blob : 24418 MB Blob : 1870 MB Blob : 8192 MB 0 {}
public bigcode public/bigcode/starcoder2-3b/242/1175 Standby node2 1 13800 MB Restore Blob : 12806 MB Blob : 1298 MB Blob : 7680 MB 0 {}
public bigcode public/bigcode/starcoder2-7b/244/1176 Standby node2 2 13800 MB Restore Blob : 25140 MB Blob : 1534 MB Blob : 8192 MB 0 {}
public databricks public/databricks/dolly-v2-12b/213/1177 Standby node2 2 14000 MB Restore Blob : 27540 MB Blob : 2420 MB Blob : 9216 MB 0 {}
public deepseek-ai public/deepseek-ai/DeepSeek-R1-Distill-Llama-8B/230/1178 Standby node2 2 13800 MB Restore Blob : 24436 MB Blob : 1684 MB Blob : 8192 MB 0 {}
public deepseek-ai public/deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B/232/1179 Standby node2 1 13000 MB Restore Blob : 11954 MB Blob : 1362 MB Blob : 7168 MB 0 {}
public deepseek-ai public/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B/234/1223 Ready node2 2 13800 MB Restore Blob : 24270 MB Blob : 1630 MB Blob : 14336 MB 13824 {'0': {'contextCnt': 1, 'slotCnt': 54}, '1': {'contextCnt': 1, 'slotCnt': 54}}
public deepseek-ai public/deepseek-ai/deepseek-llm-7b-chat/226/1181 Standby node2 1 14600 MB Restore Blob : 14748 MB Blob : 1304 MB Blob : 7680 MB 0 {}
public deepseek-ai public/deepseek-ai/deepseek-llm-7b-chat_2gpu/228/1182 Standby node2 2 14200 MB Restore Blob : 25552 MB Blob : 1784 MB Blob : 15360 MB 0 {}
public deepseek-ai public/deepseek-ai/deepseek-math-7b-instruct/236/1195 Standby node2 2 13800 MB Restore Blob : 24594 MB Blob : 1888 MB Blob : 15360 MB 0 {}
public facebook public/facebook/opt-iml-max-1.3b/127/1184 Standby node2 1 3800 MB Restore Mem : 3634 MB File : 1254 MB Mem : 6144 MB 0 {}
public microsoft public/microsoft/Phi-3-mini-128k-instruct/187/1185 Standby node2 1 13000 MB Restore Blob : 12120 MB Blob : 1254 MB Blob : 4096 MB 0 {}
public microsoft public/microsoft/Phi-3-mini-4k-instruct/185/1186 Standby node2 1 13000 MB Restore Blob : 12108 MB Blob : 1258 MB Blob : 4096 MB 0 {}
public mosaicml public/mosaicml/mpt-7b-storywriter/182/1187 Standby node2 2 13800 MB Restore Blob : 25082 MB Blob : 1892 MB Blob : 8192 MB 0 {}
public mosaicml public/mosaicml/mpt-7b/180/1188 Standby node2 2 13800 MB Restore Blob : 25082 MB Blob : 1880 MB Blob : 8192 MB 0 {}
public nomic-ai public/nomic-ai/gpt4all-j/202/1189 Standby node2 2 13800 MB Restore Blob : 24980 MB Blob : 1570 MB Blob : 14336 MB 0 {}
public openai-community public/openai-community/gpt2-xl/196/1190 Standby node2 1 12000 MB Restore Blob : 11092 MB Blob : 1386 MB Blob : 6144 MB 0 {}
public openbmb public/openbmb/MiniCPM-2B-dpo-bf16/208/1191 Standby node2 1 13800 MB Restore Blob : 12704 MB Blob : 1308 MB Blob : 5120 MB 0 {}
public openbmb public/openbmb/MiniCPM-2B-sft-bf16/210/1205 Standby node2 1 9000 MB Restore Blob : 8544 MB Blob : 1308 MB Blob : 5120 MB 0 {}
public tiiuae public/tiiuae/falcon-rw-7b/193/1193 Standby node2 2 13800 MB Restore Blob : 25142 MB Blob : 1538 MB Blob : 9216 MB 0 {}