Using Microsoft Foundry Local models



To install Foundry Local using PowerShell, I’ll run `winget install Microsoft.FoundryLocal`.

| Alias | Device | Task | File Size | License | Model ID |
| --- | --- | --- | --- | --- | --- |
| phi-4 | GPU | chat-completion | 8.37 GB | MIT | Phi-4-cuda-gpu:1 |
| phi-4 | GPU | chat-completion | 8.37 GB | MIT | Phi-4-trtrtx-gpu:1 |
| phi-4 | GPU | chat-completion | 8.83 GB | MIT | phi-4-openvino-gpu:1 |
| phi-4 | GPU | chat-completion | 8.37 GB | MIT | Phi-4-generic-gpu:1 |
| phi-4 | CPU | chat-completion | 10.16 GB | MIT | Phi-4-generic-cpu:1 |
| phi-3.5-mini | GPU | chat-completion | 2.13 GB | MIT | Phi-3.5-mini-instruct-cuda-gpu:1 |
| phi-3.5-mini | GPU | chat-completion | 1.95 GB | MIT | Phi-3.5-mini-instruct-openvino-gpu:1 |
| phi-3.5-mini | GPU | chat-completion | 2.13 GB | MIT | phi-3.5-mini-instruct-trtrtx-gpu:1 |
| phi-3.5-mini | GPU | chat-completion | 2.16 GB | MIT | Phi-3.5-mini-instruct-generic-gpu:1 |
| phi-3.5-mini | CPU | chat-completion | 2.53 GB | MIT | Phi-3.5-mini-instruct-generic-cpu:1 |
| phi-3-mini-128k | GPU | chat-completion | 2.13 GB | MIT | Phi-3-mini-128k-instruct-cuda-gpu:1 |
| phi-3-mini-128k | GPU | chat-completion | 2.13 GB | MIT | phi-3-mini-128k-instruct-trtrtx-gpu:1 |
| phi-3-mini-128k | GPU | chat-completion | 2.27 GB | MIT | Phi-3-mini-128k-instruct-openvino-gpu:1 |
| phi-3-mini-128k | GPU | chat-completion | 2.13 GB | MIT | Phi-3-mini-128k-instruct-generic-gpu:1 |
| phi-3-mini-128k | CPU | chat-completion | 2.54 GB | MIT | Phi-3-mini-128k-instruct-generic-cpu:2 |
| phi-3-mini-4k | GPU | chat-completion | 2.13 GB | MIT | Phi-3-mini-4k-instruct-cuda-gpu:1 |
| phi-3-mini-4k | GPU | chat-completion | 2.13 GB | MIT | phi-3-mini-4k-instruct-trtrtx-gpu:1 |
| phi-3-mini-4k | GPU | chat-completion | 2.01 GB | MIT | Phi-3-mini-4k-instruct-openvino-gpu:1 |
| phi-3-mini-4k | GPU | chat-completion | 2.13 GB | MIT | Phi-3-mini-4k-instruct-generic-gpu:1 |
| phi-3-mini-4k | CPU | chat-completion | 2.53 GB | MIT | Phi-3-mini-4k-instruct-generic-cpu:2 |
| mistral-7b-v0.2 | GPU | chat-completion | 3.98 GB | apache-2.0 | mistralai-Mistral-7B-Instruct-v0-2-cuda-gpu:1 |
| mistral-7b-v0.2 | GPU | chat-completion | 4.27 GB | apache-2.0 | Mistral-7B-Instruct-v0-2-openvino-gpu:1 |
| mistral-7b-v0.2 | GPU | chat-completion | 3.98 GB | Apache-2.0 | mistralai-Mistral-7B-Instruct-v0-2-trtrtx-gpu:1 |
| mistral-7b-v0.2 | GPU | chat-completion | 4.07 GB | apache-2.0 | mistralai-Mistral-7B-Instruct-v0-2-generic-gpu:1 |
| mistral-7b-v0.2 | CPU | chat-completion | 4.07 GB | apache-2.0 | mistralai-Mistral-7B-Instruct-v0-2-generic-cpu:2 |
| deepseek-r1-14b | GPU | chat-completion | 9.83 GB | MIT | deepseek-r1-distill-qwen-14b-cuda-gpu:3 |
| deepseek-r1-14b | GPU | chat-completion | 9.83 GB | MIT | deepseek-r1-distill-qwen-14b-trtrtx-gpu:1 |
| deepseek-r1-14b | GPU | chat-completion | 7.87 GB | MIT | DeepSeek-R1-Distill-Qwen-14B-openvino-gpu:1 |
| deepseek-r1-14b | GPU | chat-completion | 10.27 GB | MIT | deepseek-r1-distill-qwen-14b-generic-gpu:3 |
| deepseek-r1-14b | CPU | chat-completion | 11.51 GB | MIT | deepseek-r1-distill-qwen-14b-generic-cpu:3 |
| deepseek-r1-7b | GPU | chat-completion | 5.28 GB | MIT | deepseek-r1-distill-qwen-7b-cuda-gpu:3 |
| deepseek-r1-7b | GPU | chat-completion | 4.19 GB | MIT | DeepSeek-R1-Distill-Qwen-7B-openvino-gpu:1 |
| deepseek-r1-7b | GPU | chat-completion | 5.58 GB | MIT | deepseek-r1-distill-qwen-7b-generic-gpu:3 |
| deepseek-r1-7b | CPU | chat-completion | 6.43 GB | MIT | deepseek-r1-distill-qwen-7b-generic-cpu:3 |
| deepseek-r1-7b | GPU | chat-completion | 5.28 GB | MIT | DeepSeek-R1-Distill-Qwen-7B-trtrtx-gpu:1 |
| qwen2.5-coder-0.5b | GPU | chat-completion | 0.52 GB | apache-2.0 | qwen2.5-coder-0.5b-instruct-cuda-gpu:4 |
| qwen2.5-coder-0.5b | GPU | chat-completion | 0.36 GB | apache-2.0 | qwen2.5-coder-0.5b-instruct-openvino-gpu:2 |
| qwen2.5-coder-0.5b | GPU | chat-completion | 0.52 GB | MIT | qwen2.5-coder-0.5b-instruct-trtrtx-gpu:2 |
| qwen2.5-coder-0.5b | GPU | chat-completion | 0.52 GB | apache-2.0 | qwen2.5-coder-0.5b-instruct-generic-gpu:4 |
| qwen2.5-coder-0.5b | CPU | chat-completion | 0.80 GB | apache-2.0 | qwen2.5-coder-0.5b-instruct-generic-cpu:4 |
| phi-4-mini-reasoning | GPU | chat-completion | 3.15 GB | MIT | Phi-4-mini-reasoning-cuda-gpu:3 |
| phi-4-mini-reasoning | GPU | chat-completion | 2.47 GB | MIT | Phi-4-mini-reasoning-openvino-gpu:2 |
| phi-4-mini-reasoning | GPU | chat-completion | 3.15 GB | MIT | Phi-4-mini-reasoning-generic-gpu:3 |
| phi-4-mini-reasoning | CPU | chat-completion | 4.52 GB | MIT | Phi-4-mini-reasoning-generic-cpu:3 |
| qwen2.5-0.5b | GPU | chat-completion | 0.52 GB | apache-2.0 | qwen2.5-0.5b-instruct-cuda-gpu:4 |
| qwen2.5-0.5b | GPU | chat-completion | 0.36 GB | apache-2.0 | qwen2.5-0.5b-instruct-openvino-gpu:2 |
| qwen2.5-0.5b | GPU | chat-completion | 0.52 GB | MIT | qwen2.5-0.5b-instruct-trtrtx-gpu:2 |
| qwen2.5-0.5b | GPU | chat-completion | 0.68 GB | apache-2.0 | qwen2.5-0.5b-instruct-generic-gpu:4 |
| qwen2.5-0.5b | CPU | chat-completion | 0.80 GB | apache-2.0 | qwen2.5-0.5b-instruct-generic-cpu:4 |
| qwen2.5-1.5b | GPU | chat-completion | 1.25 GB | apache-2.0 | qwen2.5-1.5b-instruct-cuda-gpu:4 |
| qwen2.5-1.5b | GPU | chat-completion | 1.00 GB | apache-2.0 | qwen2.5-1.5b-instruct-openvino-gpu:2 |
| qwen2.5-1.5b | GPU | chat-completion | 1.25 GB | MIT | qwen2.5-1.5b-instruct-trtrtx-gpu:2 |
| qwen2.5-1.5b | GPU | chat-completion | 1.51 GB | apache-2.0 | qwen2.5-1.5b-instruct-generic-gpu:4 |
| qwen2.5-1.5b | CPU | chat-completion | 1.78 GB | apache-2.0 | qwen2.5-1.5b-instruct-generic-cpu:4 |
| qwen2.5-coder-1.5b | GPU | chat-completion | 1.25 GB | apache-2.0 | qwen2.5-coder-1.5b-instruct-cuda-gpu:4 |
| qwen2.5-coder-1.5b | GPU | chat-completion | 0.99 GB | apache-2.0 | qwen2.5-coder-1.5b-instruct-openvino-gpu:2 |
| qwen2.5-coder-1.5b | GPU | chat-completion | 1.25 GB | MIT | qwen2.5-coder-1.5b-instruct-trtrtx-gpu:2 |
| qwen2.5-coder-1.5b | GPU | chat-completion | 1.25 GB | apache-2.0 | qwen2.5-coder-1.5b-instruct-generic-gpu:4 |
| qwen2.5-coder-1.5b | CPU | chat-completion | 1.78 GB | apache-2.0 | qwen2.5-coder-1.5b-instruct-generic-cpu:4 |
| phi-4-mini | GPU | chat-completion | 3.60 GB | MIT | Phi-4-mini-instruct-cuda-gpu:5 |
| phi-4-mini | GPU | chat-completion | 2.15 GB | MIT | phi-4-mini-instruct-openvino-gpu:2 |
| phi-4-mini | GPU | chat-completion | 3.72 GB | MIT | Phi-4-mini-instruct-generic-gpu:5 |
| phi-4-mini | CPU | chat-completion | 4.80 GB | MIT | Phi-4-mini-instruct-generic-cpu:5 |
| qwen2.5-14b | GPU | chat-completion | 8.79 GB | apache-2.0 | qwen2.5-14b-instruct-cuda-gpu:4 |
| qwen2.5-14b | GPU | chat-completion | 4.79 GB | apache-2.0 | qwen2.5-14b-instruct-openvino-gpu:2 |
| qwen2.5-14b | GPU | chat-completion | 8.79 GB | MIT | qwen2.5-14b-instruct-trtrtx-gpu:2 |
| qwen2.5-14b | GPU | chat-completion | 9.30 GB | apache-2.0 | qwen2.5-14b-instruct-generic-gpu:4 |
| qwen2.5-14b | CPU | chat-completion | 11.06 GB | apache-2.0 | qwen2.5-14b-instruct-generic-cpu:4 |
| qwen2.5-coder-14b | GPU | chat-completion | 8.79 GB | apache-2.0 | qwen2.5-coder-14b-instruct-cuda-gpu:4 |
| qwen2.5-coder-14b | GPU | chat-completion | 9.08 GB | apache-2.0 | qwen2.5-coder-14b-instruct-openvino-gpu:2 |
| qwen2.5-coder-14b | GPU | chat-completion | 8.79 GB | MIT | qwen2.5-coder-14b-instruct-trtrtx-gpu:2 |
| qwen2.5-coder-14b | GPU | chat-completion | 8.79 GB | apache-2.0 | qwen2.5-coder-14b-instruct-generic-gpu:4 |
| qwen2.5-coder-14b | CPU | chat-completion | 11.06 GB | apache-2.0 | qwen2.5-coder-14b-instruct-generic-cpu:4 |
| qwen2.5-coder-7b | GPU | chat-completion | 4.73 GB | apache-2.0 | qwen2.5-coder-7b-instruct-cuda-gpu:4 |
| qwen2.5-coder-7b | GPU | chat-completion | 4.80 GB | apache-2.0 | qwen2.5-coder-7b-instruct-openvino-gpu:2 |
| qwen2.5-coder-7b | GPU | chat-completion | 4.73 GB | MIT | qwen2.5-coder-7b-instruct-trtrtx-gpu:2 |
| qwen2.5-coder-7b | GPU | chat-completion | 4.73 GB | apache-2.0 | qwen2.5-coder-7b-instruct-generic-gpu:4 |
| qwen2.5-coder-7b | CPU | chat-completion | 6.16 GB | apache-2.0 | qwen2.5-coder-7b-instruct-generic-cpu:4 |
| qwen2.5-7b | GPU | chat-completion | 4.73 GB | apache-2.0 | qwen2.5-7b-instruct-cuda-gpu:4 |
| qwen2.5-7b | GPU | chat-completion | 4.79 GB | apache-2.0 | qwen2.5-7b-instruct-openvino-gpu:2 |
| qwen2.5-7b | GPU | chat-completion | 5.49 GB | MIT | qwen2.5-7b-instruct-trtrtx-gpu:2 |
| qwen2.5-7b | GPU | chat-completion | 5.20 GB | apache-2.0 | qwen2.5-7b-instruct-generic-gpu:4 |
| qwen2.5-7b | CPU | chat-completion | 6.16 GB | apache-2.0 | qwen2.5-7b-instruct-generic-cpu:4 |
| gpt-oss-20b | GPU | chat-completion | 9.65 GB | apache-2.0 | gpt-oss-20b-cuda-gpu:1 |
| deepseek-r1-1.5b | GPU | chat-completion | 1.43 GB | MIT | DeepSeek-R1-Distill-Qwen-1.5B-trtrtx-gpu:1 |