Notes for setting up GPU support on OpenShift
- CentOS 7 or RHEL 7
- OpenShift 3.7+
- CUDA 9 and cuDNN 7
lspci -nn | grep VGA
lspci | grep -i --color 'vga\|3d\|2d'
| { | |
| "apiVersion": "v1", | |
| "kind": "Template", | |
| "labels": { | |
| "application": "oshinko-java-spark", | |
| "createdBy": "template-oshinko-java-build-dc" | |
| }, | |
| "metadata": { | |
| "annotations": { | |
| "description": "Create a buildconfig, imagestream and deploymentconfig using source-to-image and java spark source hosted in git", |
| ## Check the GPU model | |
| -------------------------------------- | |
| # lspci -nn | grep VGA | |
| 00:02.0 VGA compatible controller [0300]: Cirrus Logic GD 5446 [1013:00b8] | |
| 00:1e.0 VGA compatible controller [0300]: NVIDIA Corporation GM204GL [Tesla M60] [10de:13f2] (rev a1) | |
| # If lspci is not available, install it first: # yum install pciutils | |
| ## Check the kernel version. Not all kernel versions are supported by the drivers | |
| ------------------------------------------------------------------------------------- | |
| # uname -r |
| { | |
| "apiVersion": "tensorflow.org/v1alpha1", | |
| "kind": "TfJob", | |
| "metadata": { | |
| "name": "sample-tfjob" | |
| }, | |
| "spec": { | |
| "replicaSpecs": [ | |
| { | |
| "template": { |
| { | |
| "apiVersion":"v1", | |
| "kind":"Template", | |
| "template":"kubeflow-operator", | |
| "labels":{ | |
| "template":"kubeflow-operator" | |
| }, | |
| "message":"Kubeflow TfJob Operator", | |
| "metadata":{ | |
| "name":"kubeflow-operator", |
| { | |
| "apiVersion": "tensorflow.org/v1alpha1", | |
| "kind": "TfJob", | |
| "metadata": { | |
| "name": "distributed-job" | |
| }, | |
| "spec": { | |
| "replicaSpecs": [ | |
| { | |
| "replicas": 1, |
| import os | |
| import sys | |
| import tensorflow as tf | |
| import numpy as np | |
| from tensorflow.python.saved_model import builder as saved_model_builder | |
| from tensorflow.python.saved_model import signature_constants | |
| from tensorflow.python.saved_model import signature_def_utils | |
| from tensorflow.python.saved_model import tag_constants | |
| from tensorflow.python.saved_model import utils | |
| from tensorflow.python.util import compat |
| --- | |
| apiVersion: v1 | |
| data: | |
| jupyterhub_config.py: | | |
| import json | |
| import os | |
| from kubespawner.spawner import KubeSpawner | |
| from jhub_remote_user_authenticator.remote_user_auth import RemoteUserAuthenticator | |
| from oauthenticator.github import GitHubOAuthenticator |