mirror of
https://github.com/NVIDIA/dgx-spark-playbooks.git
synced 2026-04-25 11:23:52 +00:00
chore: Regenerate all playbooks
This commit is contained in:
parent
e9a3f2a759
commit
e17deb3167
@ -23,6 +23,8 @@
|
|||||||
# See the License for the specific language governing permissions and
|
# See the License for the specific language governing permissions and
|
||||||
# limitations under the License.
|
# limitations under the License.
|
||||||
#
|
#
|
||||||
|
#
|
||||||
|
# Author: William Benton <wbention@nvidia.com>
|
||||||
|
|
||||||
import marimo
|
import marimo
|
||||||
|
|
||||||
|
|||||||
@ -14,6 +14,10 @@
|
|||||||
# See the License for the specific language governing permissions and
|
# See the License for the specific language governing permissions and
|
||||||
# limitations under the License.
|
# limitations under the License.
|
||||||
#
|
#
|
||||||
|
#
|
||||||
|
# Author: William Benton <wbention@nvidia.com>
|
||||||
|
|
||||||
|
|
||||||
FROM nvidia/cuda:13.0.1-runtime-ubuntu24.04
|
FROM nvidia/cuda:13.0.1-runtime-ubuntu24.04
|
||||||
|
|
||||||
RUN ldconfig
|
RUN ldconfig
|
||||||
|
|||||||
@ -23,6 +23,8 @@
|
|||||||
# See the License for the specific language governing permissions and
|
# See the License for the specific language governing permissions and
|
||||||
# limitations under the License.
|
# limitations under the License.
|
||||||
#
|
#
|
||||||
|
#
|
||||||
|
# Author: William Benton <wbention@nvidia.com>
|
||||||
|
|
||||||
import marimo
|
import marimo
|
||||||
|
|
||||||
|
|||||||
@ -24,6 +24,8 @@
|
|||||||
# See the License for the specific language governing permissions and
|
# See the License for the specific language governing permissions and
|
||||||
# limitations under the License.
|
# limitations under the License.
|
||||||
#
|
#
|
||||||
|
#
|
||||||
|
# Author: William Benton <wbention@nvidia.com>
|
||||||
|
|
||||||
|
|
||||||
import marimo
|
import marimo
|
||||||
|
|||||||
@ -26,6 +26,8 @@
|
|||||||
# See the License for the specific language governing permissions and
|
# See the License for the specific language governing permissions and
|
||||||
# limitations under the License.
|
# limitations under the License.
|
||||||
#
|
#
|
||||||
|
#
|
||||||
|
# Author: William Benton <wbention@nvidia.com>
|
||||||
|
|
||||||
import marimo
|
import marimo
|
||||||
|
|
||||||
|
|||||||
@ -97,6 +97,7 @@ The following models are supported with TensorRT-LLM on Spark. All listed models
|
|||||||
| **Qwen3-8B** | NVFP4 | ✅ | `nvidia/Qwen3-8B-FP4` |
|
| **Qwen3-8B** | NVFP4 | ✅ | `nvidia/Qwen3-8B-FP4` |
|
||||||
| **Qwen3-14B** | FP8 | ✅ | `nvidia/Qwen3-14B-FP8` |
|
| **Qwen3-14B** | FP8 | ✅ | `nvidia/Qwen3-14B-FP8` |
|
||||||
| **Qwen3-14B** | NVFP4 | ✅ | `nvidia/Qwen3-14B-FP4` |
|
| **Qwen3-14B** | NVFP4 | ✅ | `nvidia/Qwen3-14B-FP4` |
|
||||||
|
| **Qwen3-32B** | NVFP4 | ✅ | `nvidia/Qwen3-32B-FP4` |
|
||||||
| **Phi-4-multimodal-instruct** | FP8 | ✅ | `nvidia/Phi-4-multimodal-instruct-FP8` |
|
| **Phi-4-multimodal-instruct** | FP8 | ✅ | `nvidia/Phi-4-multimodal-instruct-FP8` |
|
||||||
| **Phi-4-multimodal-instruct** | NVFP4 | ✅ | `nvidia/Phi-4-multimodal-instruct-FP4` |
|
| **Phi-4-multimodal-instruct** | NVFP4 | ✅ | `nvidia/Phi-4-multimodal-instruct-FP4` |
|
||||||
| **Phi-4-reasoning-plus** | FP8 | ✅ | `nvidia/Phi-4-reasoning-plus-FP8` |
|
| **Phi-4-reasoning-plus** | FP8 | ✅ | `nvidia/Phi-4-reasoning-plus-FP8` |
|
||||||
|
|||||||
Loading…
Reference in New Issue
Block a user