Updates the notebooks with final validated results
This commit is contained in:
Родитель
a303331aab
Коммит
296254499a
|
@ -39,16 +39,16 @@
|
|||
"name": "stdout",
|
||||
"output_type": "stream",
|
||||
"text": [
|
||||
"--2018-04-10 10:16:47-- http://download.tensorflow.org/models/resnet_v1_152_2016_08_28.tar.gz\n",
|
||||
"--2018-04-11 09:14:36-- http://download.tensorflow.org/models/resnet_v1_152_2016_08_28.tar.gz\n",
|
||||
"Resolving download.tensorflow.org (download.tensorflow.org)... 216.58.216.176, 2607:f8b0:400a:807::2010\n",
|
||||
"Connecting to download.tensorflow.org (download.tensorflow.org)|216.58.216.176|:80... connected.\n",
|
||||
"HTTP request sent, awaiting response... 200 OK\n",
|
||||
"Length: 224342140 (214M) [application/x-tar]\n",
|
||||
"Saving to: ‘resnet_v1_152_2016_08_28.tar.gz.1’\n",
|
||||
"Saving to: ‘resnet_v1_152_2016_08_28.tar.gz’\n",
|
||||
"\n",
|
||||
"resnet_v1_152_2016_ 100%[===================>] 213.95M 57.1MB/s in 4.9s \n",
|
||||
"resnet_v1_152_2016_ 100%[===================>] 213.95M 56.7MB/s in 4.2s \n",
|
||||
"\n",
|
||||
"2018-04-10 10:16:52 (43.8 MB/s) - ‘resnet_v1_152_2016_08_28.tar.gz.1’ saved [224342140/224342140]\n",
|
||||
"2018-04-11 09:14:40 (50.6 MB/s) - ‘resnet_v1_152_2016_08_28.tar.gz’ saved [224342140/224342140]\n",
|
||||
"\n"
|
||||
]
|
||||
}
|
||||
|
@ -90,16 +90,16 @@
|
|||
"name": "stdout",
|
||||
"output_type": "stream",
|
||||
"text": [
|
||||
"--2018-04-10 10:16:54-- http://data.dmlc.ml/mxnet/models/imagenet/synset.txt\n",
|
||||
"--2018-04-11 09:14:43-- http://data.dmlc.ml/mxnet/models/imagenet/synset.txt\n",
|
||||
"Resolving data.dmlc.ml (data.dmlc.ml)... 54.208.175.7\n",
|
||||
"Connecting to data.dmlc.ml (data.dmlc.ml)|54.208.175.7|:80... connected.\n",
|
||||
"HTTP request sent, awaiting response... 200 OK\n",
|
||||
"Length: 31675 (31K) [text/plain]\n",
|
||||
"Saving to: ‘synset.txt.1’\n",
|
||||
"Saving to: ‘synset.txt’\n",
|
||||
"\n",
|
||||
"synset.txt.1 100%[===================>] 30.93K --.-KB/s in 0.03s \n",
|
||||
"synset.txt 100%[===================>] 30.93K --.-KB/s in 0.03s \n",
|
||||
"\n",
|
||||
"2018-04-10 10:16:55 (912 KB/s) - ‘synset.txt.1’ saved [31675/31675]\n",
|
||||
"2018-04-11 09:14:43 (909 KB/s) - ‘synset.txt’ saved [31675/31675]\n",
|
||||
"\n"
|
||||
]
|
||||
}
|
||||
|
@ -202,16 +202,16 @@
|
|||
"name": "stdout",
|
||||
"output_type": "stream",
|
||||
"text": [
|
||||
"--2018-04-10 10:17:17-- https://upload.wikimedia.org/wikipedia/commons/thumb/6/68/Lynx_lynx_poing.jpg/220px-Lynx_lynx_poing.jpg\n",
|
||||
"--2018-04-11 09:14:55-- https://upload.wikimedia.org/wikipedia/commons/thumb/6/68/Lynx_lynx_poing.jpg/220px-Lynx_lynx_poing.jpg\n",
|
||||
"Resolving upload.wikimedia.org (upload.wikimedia.org)... 208.80.153.240, 2620:0:860:ed1a::2:b\n",
|
||||
"Connecting to upload.wikimedia.org (upload.wikimedia.org)|208.80.153.240|:443... connected.\n",
|
||||
"HTTP request sent, awaiting response... 200 OK\n",
|
||||
"Length: 27183 (27K) [image/jpeg]\n",
|
||||
"Saving to: ‘220px-Lynx_lynx_poing.jpg’\n",
|
||||
"\n",
|
||||
"220px-Lynx_lynx_poi 100%[===================>] 26.55K --.-KB/s in 0.02s \n",
|
||||
"220px-Lynx_lynx_poi 100%[===================>] 26.55K --.-KB/s in 0.01s \n",
|
||||
"\n",
|
||||
"2018-04-10 10:17:18 (1.04 MB/s) - ‘220px-Lynx_lynx_poing.jpg’ saved [27183/27183]\n",
|
||||
"2018-04-11 09:14:55 (2.52 MB/s) - ‘220px-Lynx_lynx_poing.jpg’ saved [27183/27183]\n",
|
||||
"\n"
|
||||
]
|
||||
}
|
||||
|
|
|
@ -17,7 +17,7 @@
|
|||
"name": "stdout",
|
||||
"output_type": "stream",
|
||||
"text": [
|
||||
"Overwriting driver.py\n"
|
||||
"Writing driver.py\n"
|
||||
]
|
||||
}
|
||||
],
|
||||
|
@ -239,7 +239,7 @@
|
|||
"output_type": "stream",
|
||||
"text": [
|
||||
"INFO:tensorflow:Restoring parameters from resnet_v1_152.ckpt\n",
|
||||
"INFO:model_driver:Model loading time: 12726.69 ms\n"
|
||||
"INFO:model_driver:Model loading time: 12212.94 ms\n"
|
||||
]
|
||||
}
|
||||
],
|
||||
|
@ -262,7 +262,7 @@
|
|||
"DEBUG:PIL.PngImagePlugin:Compression method 0\n",
|
||||
"DEBUG:PIL.PngImagePlugin:STREAM b'IDAT' 345 65536\n",
|
||||
"INFO:model_driver:Predictions: {'image': [('n02127052 lynx, catamount', 0.99745172262191772), ('n02128385 leopard, Panthera pardus', 0.0015076899435371161), ('n02128757 snow leopard, ounce, Panthera uncia', 0.00051647447980940342)]}\n",
|
||||
"INFO:model_driver:Predictions took 920.8 ms\n"
|
||||
"INFO:model_driver:Predictions took 958.24 ms\n"
|
||||
]
|
||||
}
|
||||
],
|
||||
|
@ -285,7 +285,7 @@
|
|||
{
|
||||
"data": {
|
||||
"text/plain": [
|
||||
"'[{\"image\": [[\"n02127052 lynx, catamount\", 0.9974517226219177], [\"n02128385 leopard, Panthera pardus\", 0.001507689943537116], [\"n02128757 snow leopard, ounce, Panthera uncia\", 0.0005164744798094034]]}, \"Computed in 920.8 ms\"]'"
|
||||
"'[{\"image\": [[\"n02127052 lynx, catamount\", 0.9974517226219177], [\"n02128385 leopard, Panthera pardus\", 0.001507689943537116], [\"n02128757 snow leopard, ounce, Panthera uncia\", 0.0005164744798094034]]}, \"Computed in 958.24 ms\"]'"
|
||||
]
|
||||
},
|
||||
"execution_count": 11,
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
|
@ -68,7 +68,6 @@
|
|||
"cell_type": "code",
|
||||
"execution_count": null,
|
||||
"metadata": {
|
||||
"collapsed": true,
|
||||
"scrolled": false
|
||||
},
|
||||
"outputs": [],
|
||||
|
@ -133,7 +132,7 @@
|
|||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 4,
|
||||
"execution_count": 3,
|
||||
"metadata": {},
|
||||
"outputs": [
|
||||
{
|
||||
|
@ -166,7 +165,7 @@
|
|||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 5,
|
||||
"execution_count": 4,
|
||||
"metadata": {},
|
||||
"outputs": [
|
||||
{
|
||||
|
@ -191,9 +190,9 @@
|
|||
" }\n",
|
||||
" ],\n",
|
||||
" \"dnsPrefix\": \"msAKSTFClu-msaksrg-edf507\",\n",
|
||||
" \"fqdn\": \"msakstfclu-msaksrg-edf507-1f197d36.hcp.eastus.azmk8s.io\",\n",
|
||||
" \"fqdn\": \"msakstfclu-msaksrg-edf507-9dc6365c.hcp.eastus.azmk8s.io\",\n",
|
||||
" \"id\": \"/subscriptions/edf507a2-6235-46c5-b560-fd463ba2e771/resourcegroups/msaksrg/providers/Microsoft.ContainerService/managedClusters/msAKSTFCluster\",\n",
|
||||
" \"kubernetesVersion\": \"1.7.9\",\n",
|
||||
" \"kubernetesVersion\": \"1.8.10\",\n",
|
||||
" \"linuxProfile\": {\n",
|
||||
" \"additionalProperties\": {},\n",
|
||||
" \"adminUsername\": \"azureuser\",\n",
|
||||
|
@ -267,11 +266,17 @@
|
|||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": null,
|
||||
"metadata": {
|
||||
"collapsed": true
|
||||
},
|
||||
"outputs": [],
|
||||
"execution_count": 5,
|
||||
"metadata": {},
|
||||
"outputs": [
|
||||
{
|
||||
"name": "stdout",
|
||||
"output_type": "stream",
|
||||
"text": [
|
||||
"Merged \"msAKSTFCluster\" as current context in /home/mat/.kube/config\r\n"
|
||||
]
|
||||
}
|
||||
],
|
||||
"source": [
|
||||
"!az aks get-credentials --resource-group $resource_group --name $aks_name"
|
||||
]
|
||||
|
@ -285,11 +290,18 @@
|
|||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": null,
|
||||
"metadata": {
|
||||
"collapsed": true
|
||||
},
|
||||
"outputs": [],
|
||||
"execution_count": 6,
|
||||
"metadata": {},
|
||||
"outputs": [
|
||||
{
|
||||
"name": "stdout",
|
||||
"output_type": "stream",
|
||||
"text": [
|
||||
"NAME STATUS ROLES AGE VERSION\r\n",
|
||||
"aks-nodepool1-27496346-0 Ready agent 3m v1.8.10\r\n"
|
||||
]
|
||||
}
|
||||
],
|
||||
"source": [
|
||||
"!kubectl get nodes"
|
||||
]
|
||||
|
@ -303,11 +315,24 @@
|
|||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": null,
|
||||
"metadata": {
|
||||
"collapsed": true
|
||||
},
|
||||
"outputs": [],
|
||||
"execution_count": 7,
|
||||
"metadata": {},
|
||||
"outputs": [
|
||||
{
|
||||
"name": "stdout",
|
||||
"output_type": "stream",
|
||||
"text": [
|
||||
"NAMESPACE NAME READY STATUS RESTARTS AGE\r\n",
|
||||
"kube-system heapster-75f8df9884-vlt25 2/2 Running 0 1m\r\n",
|
||||
"kube-system kube-dns-v20-5bf84586f4-9jd9r 3/3 Running 0 1m\r\n",
|
||||
"kube-system kube-dns-v20-5bf84586f4-f8nsn 3/3 Running 0 1m\r\n",
|
||||
"kube-system kube-proxy-x64jp 1/1 Running 0 1m\r\n",
|
||||
"kube-system kube-svc-redirect-mkwss 1/1 Running 0 1m\r\n",
|
||||
"kube-system kubernetes-dashboard-665f768455-npsfh 1/1 Running 0 1m\r\n",
|
||||
"kube-system tunnelfront-5c48644fb8-4c6dt 1/1 Running 0 1m\r\n"
|
||||
]
|
||||
}
|
||||
],
|
||||
"source": [
|
||||
"!kubectl get pods --all-namespaces"
|
||||
]
|
||||
|
@ -324,7 +349,7 @@
|
|||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 1,
|
||||
"execution_count": 8,
|
||||
"metadata": {
|
||||
"collapsed": true
|
||||
},
|
||||
|
@ -348,7 +373,7 @@
|
|||
" \"containers\":[\n",
|
||||
" {\n",
|
||||
" \"name\": \"azure-dl\",\n",
|
||||
" \"image\": \"masalvar/tfresnet-gpu\",\n",
|
||||
" \"image\": image_name,\n",
|
||||
" \"env\":[\n",
|
||||
" {\n",
|
||||
" \"name\": \"LD_LIBRARY_PATH\",\n",
|
||||
|
@ -412,7 +437,7 @@
|
|||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 2,
|
||||
"execution_count": 9,
|
||||
"metadata": {
|
||||
"collapsed": true
|
||||
},
|
||||
|
@ -426,7 +451,7 @@
|
|||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 3,
|
||||
"execution_count": 10,
|
||||
"metadata": {
|
||||
"collapsed": true
|
||||
},
|
||||
|
@ -437,7 +462,7 @@
|
|||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 4,
|
||||
"execution_count": 11,
|
||||
"metadata": {
|
||||
"collapsed": true
|
||||
},
|
||||
|
@ -455,7 +480,7 @@
|
|||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 5,
|
||||
"execution_count": 12,
|
||||
"metadata": {},
|
||||
"outputs": [
|
||||
{
|
||||
|
@ -557,7 +582,7 @@
|
|||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 15,
|
||||
"execution_count": 13,
|
||||
"metadata": {},
|
||||
"outputs": [
|
||||
{
|
||||
|
@ -582,22 +607,22 @@
|
|||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 18,
|
||||
"execution_count": 14,
|
||||
"metadata": {},
|
||||
"outputs": [
|
||||
{
|
||||
"name": "stdout",
|
||||
"output_type": "stream",
|
||||
"text": [
|
||||
"NAMESPACE NAME READY STATUS RESTARTS AGE\r\n",
|
||||
"default azure-dl-3880299103-v5mb7 1/1 Running 0 4m\r\n",
|
||||
"kube-system heapster-2574232661-07lzh 2/2 Running 0 5m\r\n",
|
||||
"kube-system kube-dns-v20-2253765213-730n6 3/3 Running 0 6m\r\n",
|
||||
"kube-system kube-dns-v20-2253765213-m9d9q 3/3 Running 0 6m\r\n",
|
||||
"kube-system kube-proxy-3d25d 1/1 Running 0 6m\r\n",
|
||||
"kube-system kube-svc-redirect-psp3n 1/1 Running 0 6m\r\n",
|
||||
"kube-system kubernetes-dashboard-2898242510-7h28r 1/1 Running 0 6m\r\n",
|
||||
"kube-system tunnelfront-527646831-lj63z 1/1 Running 0 6m\r\n"
|
||||
"NAMESPACE NAME READY STATUS RESTARTS AGE\r\n",
|
||||
"default azure-dl-9db45b4f7-bqq5g 0/1 ImagePullBackOff 0 2m\r\n",
|
||||
"kube-system heapster-75f8df9884-vlt25 2/2 Running 0 4m\r\n",
|
||||
"kube-system kube-dns-v20-5bf84586f4-9jd9r 3/3 Running 0 5m\r\n",
|
||||
"kube-system kube-dns-v20-5bf84586f4-f8nsn 3/3 Running 0 5m\r\n",
|
||||
"kube-system kube-proxy-x64jp 1/1 Running 0 5m\r\n",
|
||||
"kube-system kube-svc-redirect-mkwss 1/1 Running 0 5m\r\n",
|
||||
"kube-system kubernetes-dashboard-665f768455-npsfh 1/1 Running 0 5m\r\n",
|
||||
"kube-system tunnelfront-5c48644fb8-4c6dt 1/1 Running 0 5m\r\n"
|
||||
]
|
||||
}
|
||||
],
|
||||
|
@ -614,35 +639,35 @@
|
|||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 19,
|
||||
"execution_count": 15,
|
||||
"metadata": {},
|
||||
"outputs": [
|
||||
{
|
||||
"name": "stdout",
|
||||
"output_type": "stream",
|
||||
"text": [
|
||||
"LAST SEEN FIRST SEEN COUNT NAME KIND SUBOBJECT TYPE REASON SOURCE MESSAGE\r\n",
|
||||
"9m 9m 1 aks-nodepool1-27496346-0.1520fb005972710f Node Normal Starting kubelet, aks-nodepool1-27496346-0 Starting kubelet.\r\n",
|
||||
"7m 8m 3 aks-nodepool1-27496346-0.1520fb08e765af3d Node Normal NodeHasSufficientDisk kubelet, aks-nodepool1-27496346-0 Node aks-nodepool1-27496346-0 status is now: NodeHasSufficientDisk\r\n",
|
||||
"7m 8m 3 aks-nodepool1-27496346-0.1520fb08e7663219 Node Normal NodeHasSufficientMemory kubelet, aks-nodepool1-27496346-0 Node aks-nodepool1-27496346-0 status is now: NodeHasSufficientMemory\r\n",
|
||||
"7m 8m 3 aks-nodepool1-27496346-0.1520fb08e7665b1e Node Normal NodeHasNoDiskPressure kubelet, aks-nodepool1-27496346-0 Node aks-nodepool1-27496346-0 status is now: NodeHasNoDiskPressure\r\n",
|
||||
"55s 8m 9 aks-nodepool1-27496346-0.1520fb08e780a4eb Node Warning FailedNodeAllocatableEnforcement kubelet, aks-nodepool1-27496346-0 Failed to update Node Allocatable Limits \"\": failed to set supported cgroup subsystems for cgroup : Failed to set config for supported subsystems : failed to write 59076296704 to memory.limit_in_bytes: write /var/lib/docker/overlay2/daad1bc683430e39749de19537b2702c53db1f36ba866537b8f76687375c368f/merged/sys/fs/cgroup/memory/memory.limit_in_bytes: invalid argument\r\n",
|
||||
"6m 6m 1 aks-nodepool1-27496346-0.1520fb2740f627b6 Node Normal RegisteredNode controllermanager Node aks-nodepool1-27496346-0 event: Registered Node aks-nodepool1-27496346-0 in NodeController\r\n",
|
||||
"6m 6m 1 aks-nodepool1-27496346-0.1520fb29877c82d1 Node Normal Starting kube-proxy, aks-nodepool1-27496346-0 Starting kube-proxy.\r\n",
|
||||
"6m 6m 1 aks-nodepool1-27496346-0.1520fb2d38a1c12c Node Normal NodeReady kubelet, aks-nodepool1-27496346-0 Node aks-nodepool1-27496346-0 status is now: NodeReady\r\n",
|
||||
"4m 4m 1 azure-dl-3880299103-v5mb7.1520fb46d4fdc9fa Pod Normal Scheduled default-scheduler Successfully assigned azure-dl-3880299103-v5mb7 to aks-nodepool1-27496346-0\r\n",
|
||||
"4m 4m 1 azure-dl-3880299103-v5mb7.1520fb46e1cd117d Pod Normal SuccessfulMountVolume kubelet, aks-nodepool1-27496346-0 MountVolume.SetUp succeeded for volume \"bin\" \r\n",
|
||||
"4m 4m 1 azure-dl-3880299103-v5mb7.1520fb46e1cf3b05 Pod Normal SuccessfulMountVolume kubelet, aks-nodepool1-27496346-0 MountVolume.SetUp succeeded for volume \"libcuda\" \r\n",
|
||||
"4m 4m 1 azure-dl-3880299103-v5mb7.1520fb46e1cf86ce Pod Normal SuccessfulMountVolume kubelet, aks-nodepool1-27496346-0 MountVolume.SetUp succeeded for volume \"lib\" \r\n",
|
||||
"4m 4m 1 azure-dl-3880299103-v5mb7.1520fb46e2516335 Pod Normal SuccessfulMountVolume kubelet, aks-nodepool1-27496346-0 MountVolume.SetUp succeeded for volume \"default-token-thxzk\" \r\n",
|
||||
"4m 4m 1 azure-dl-3880299103-v5mb7.1520fb47102b3c32 Pod spec.containers{azure-dl} Normal Pulling kubelet, aks-nodepool1-27496346-0 pulling image \"masalvar/tfresnet-gpu\"\r\n",
|
||||
"1m 1m 1 azure-dl-3880299103-v5mb7.1520fb73ea97742a Pod spec.containers{azure-dl} Normal Pulled kubelet, aks-nodepool1-27496346-0 Successfully pulled image \"masalvar/tfresnet-gpu\"\r\n",
|
||||
"1m 1m 1 azure-dl-3880299103-v5mb7.1520fb75bccdb1f5 Pod spec.containers{azure-dl} Normal Created kubelet, aks-nodepool1-27496346-0 Created container\r\n",
|
||||
"1m 1m 1 azure-dl-3880299103-v5mb7.1520fb76711f3dd5 Pod spec.containers{azure-dl} Normal Started kubelet, aks-nodepool1-27496346-0 Started container\r\n",
|
||||
"4m 4m 1 azure-dl-3880299103.1520fb46d46b36d8 ReplicaSet Normal SuccessfulCreate replicaset-controller Created pod: azure-dl-3880299103-v5mb7\r\n",
|
||||
"4m 4m 1 azure-dl.1520fb46d294f3d3 Deployment Normal ScalingReplicaSet deployment-controller Scaled up replica set azure-dl-3880299103 to 1\r\n",
|
||||
"4m 4m 1 azure-dl.1520fb46d8ebdb8a Service Normal CreatingLoadBalancer service-controller Creating load balancer\r\n",
|
||||
"2m 2m 1 azure-dl.1520fb66b2965ba7 Service Normal CreatedLoadBalancer service-controller Created load balancer\r\n"
|
||||
"LAST SEEN FIRST SEEN COUNT NAME KIND SUBOBJECT TYPE REASON SOURCE MESSAGE\r\n",
|
||||
"13m 13m 1 aks-nodepool1-27496346-0.152457f2d4c9a0c1 Node Normal Starting kubelet, aks-nodepool1-27496346-0 Starting kubelet.\r\n",
|
||||
"11m 13m 8 aks-nodepool1-27496346-0.152457f2d68e13e7 Node Normal NodeHasSufficientDisk kubelet, aks-nodepool1-27496346-0 Node aks-nodepool1-27496346-0 status is now: NodeHasSufficientDisk\r\n",
|
||||
"11m 13m 8 aks-nodepool1-27496346-0.152457f2d68e3bbf Node Normal NodeHasSufficientMemory kubelet, aks-nodepool1-27496346-0 Node aks-nodepool1-27496346-0 status is now: NodeHasSufficientMemory\r\n",
|
||||
"12m 13m 7 aks-nodepool1-27496346-0.152457f2d68ed1bf Node Normal NodeHasNoDiskPressure kubelet, aks-nodepool1-27496346-0 Node aks-nodepool1-27496346-0 status is now: NodeHasNoDiskPressure\r\n",
|
||||
"13m 13m 1 aks-nodepool1-27496346-0.152457f2d6a0f2ce Node Normal NodeAllocatableEnforced kubelet, aks-nodepool1-27496346-0 Updated Node Allocatable limit across pods\r\n",
|
||||
"9m 9m 1 aks-nodepool1-27496346-0.152458224f43e592 Node Normal RegisteredNode controllermanager Node aks-nodepool1-27496346-0 event: Registered Node aks-nodepool1-27496346-0 in Controller\r\n",
|
||||
"9m 9m 1 aks-nodepool1-27496346-0.15245824056578a2 Node Normal Starting kube-proxy, aks-nodepool1-27496346-0 Starting kube-proxy.\r\n",
|
||||
"6m 6m 1 azure-dl-9db45b4f7-bqq5g.152458484af7e9af Pod Normal Scheduled default-scheduler Successfully assigned azure-dl-9db45b4f7-bqq5g to aks-nodepool1-27496346-0\r\n",
|
||||
"6m 6m 1 azure-dl-9db45b4f7-bqq5g.1524584856327c4a Pod Normal SuccessfulMountVolume kubelet, aks-nodepool1-27496346-0 MountVolume.SetUp succeeded for volume \"nvidia\" \r\n",
|
||||
"6m 6m 1 azure-dl-9db45b4f7-bqq5g.1524584857145997 Pod Normal SuccessfulMountVolume kubelet, aks-nodepool1-27496346-0 MountVolume.SetUp succeeded for volume \"default-token-bb2wg\" \r\n",
|
||||
"4m 6m 2 azure-dl-9db45b4f7-bqq5g.1524584884dda263 Pod spec.containers{azure-dl} Normal Pulling kubelet, aks-nodepool1-27496346-0 pulling image \"masalvar/tfresnet-gpu\"\r\n",
|
||||
"5m 5m 1 azure-dl-9db45b4f7-bqq5g.152458607ea65616 Pod spec.containers{azure-dl} Warning Failed kubelet, aks-nodepool1-27496346-0 Failed to pull image \"masalvar/tfresnet-gpu\": rpc error: code = Canceled desc = context canceled\r\n",
|
||||
"5m 5m 2 azure-dl-9db45b4f7-bqq5g.152458607ea7d5af Pod Warning FailedSync kubelet, aks-nodepool1-27496346-0 Error syncing pod\r\n",
|
||||
"5m 5m 1 azure-dl-9db45b4f7-bqq5g.15245860c6aafe6f Pod spec.containers{azure-dl} Normal BackOff kubelet, aks-nodepool1-27496346-0 Back-off pulling image \"masalvar/tfresnet-gpu\"\r\n",
|
||||
"1m 1m 1 azure-dl-9db45b4f7-bqq5g.152458908b326961 Pod spec.containers{azure-dl} Normal Pulled kubelet, aks-nodepool1-27496346-0 Successfully pulled image \"masalvar/tfresnet-gpu\"\r\n",
|
||||
"1m 1m 1 azure-dl-9db45b4f7-bqq5g.152458909644c422 Pod spec.containers{azure-dl} Normal Created kubelet, aks-nodepool1-27496346-0 Created container\r\n",
|
||||
"1m 1m 1 azure-dl-9db45b4f7-bqq5g.152458909ed20818 Pod spec.containers{azure-dl} Normal Started kubelet, aks-nodepool1-27496346-0 Started container\r\n",
|
||||
"6m 6m 1 azure-dl-9db45b4f7.152458484a8f532a ReplicaSet Normal SuccessfulCreate replicaset-controller Created pod: azure-dl-9db45b4f7-bqq5g\r\n",
|
||||
"6m 6m 1 azure-dl.1524584848faa7c7 Deployment Normal ScalingReplicaSet deployment-controller Scaled up replica set azure-dl-9db45b4f7 to 1\r\n",
|
||||
"6m 6m 1 azure-dl.152458484c36803c Service Normal EnsuringLoadBalancer service-controller Ensuring load balancer\r\n",
|
||||
"3m 3m 1 azure-dl.152458762827d674 Service Normal EnsuredLoadBalancer service-controller Ensured load balancer\r\n"
|
||||
]
|
||||
}
|
||||
],
|
||||
|
@ -652,32 +677,32 @@
|
|||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 38,
|
||||
"execution_count": 16,
|
||||
"metadata": {},
|
||||
"outputs": [
|
||||
{
|
||||
"name": "stdout",
|
||||
"output_type": "stream",
|
||||
"text": [
|
||||
"2018-03-31 10:45:57,344 CRIT Supervisor running as root (no user in config file)\r\n",
|
||||
"2018-03-31 10:45:57,346 INFO supervisord started with pid 7\r\n",
|
||||
"2018-03-31 10:45:58,348 INFO spawned: 'program_exit' with pid 15\r\n",
|
||||
"2018-03-31 10:45:58,349 INFO spawned: 'nginx' with pid 16\r\n",
|
||||
"2018-03-31 10:45:58,351 INFO spawned: 'gunicorn' with pid 17\r\n",
|
||||
"2018-03-31 10:45:59,380 INFO success: program_exit entered RUNNING state, process has stayed up for > than 1 seconds (startsecs)\r\n",
|
||||
"2018-03-31 10:45:59.971916: I tensorflow/core/platform/cpu_feature_guard.cc:137] Your CPU supports instructions that this TensorFlow binary was not compiled to use: SSE4.1 SSE4.2 AVX AVX2 FMA\r\n",
|
||||
"2018-03-31 10:46:03,977 INFO success: nginx entered RUNNING state, process has stayed up for > than 5 seconds (startsecs)\r\n",
|
||||
"2018-03-31 10:46:11.453255: I tensorflow/core/common_runtime/gpu/gpu_device.cc:1030] Found device 0 with properties: \r\n",
|
||||
"2018-04-11 09:45:52,173 CRIT Supervisor running as root (no user in config file)\r\n",
|
||||
"2018-04-11 09:45:52,175 INFO supervisord started with pid 1\r\n",
|
||||
"2018-04-11 09:45:53,178 INFO spawned: 'program_exit' with pid 9\r\n",
|
||||
"2018-04-11 09:45:53,179 INFO spawned: 'nginx' with pid 10\r\n",
|
||||
"2018-04-11 09:45:53,180 INFO spawned: 'gunicorn' with pid 11\r\n",
|
||||
"2018-04-11 09:45:54,211 INFO success: program_exit entered RUNNING state, process has stayed up for > than 1 seconds (startsecs)\r\n",
|
||||
"2018-04-11 09:45:54.734234: I tensorflow/core/platform/cpu_feature_guard.cc:137] Your CPU supports instructions that this TensorFlow binary was not compiled to use: SSE4.1 SSE4.2 AVX AVX2 FMA\r\n",
|
||||
"2018-04-11 09:45:58,739 INFO success: nginx entered RUNNING state, process has stayed up for > than 5 seconds (startsecs)\r\n",
|
||||
"2018-04-11 09:46:01.556833: I tensorflow/core/common_runtime/gpu/gpu_device.cc:1030] Found device 0 with properties: \r\n",
|
||||
"name: Tesla K80 major: 3 minor: 7 memoryClockRate(GHz): 0.8235\r\n",
|
||||
"pciBusID: cff2:00:00.0\r\n",
|
||||
"pciBusID: 1705:00:00.0\r\n",
|
||||
"totalMemory: 11.17GiB freeMemory: 11.10GiB\r\n",
|
||||
"2018-03-31 10:46:11.453299: I tensorflow/core/common_runtime/gpu/gpu_device.cc:1120] Creating TensorFlow device (/device:GPU:0) -> (device: 0, name: Tesla K80, pci bus id: cff2:00:00.0, compute capability: 3.7)\r\n",
|
||||
"2018-04-11 09:46:01.556879: I tensorflow/core/common_runtime/gpu/gpu_device.cc:1120] Creating TensorFlow device (/device:GPU:0) -> (device: 0, name: Tesla K80, pci bus id: 1705:00:00.0, compute capability: 3.7)\r\n",
|
||||
"INFO:tensorflow:Restoring parameters from resnet_v1_152.ckpt\r\n",
|
||||
"{\"timestamp\": \"2018-03-31T10:46:17.203847Z\", \"level\": \"INFO\", \"stack_info\": null, \"host\": \"azure-dl-3880299103-v5mb7\", \"message\": \"Restoring parameters from resnet_v1_152.ckpt\", \"logger\": \"tensorflow\", \"msg\": \"Restoring parameters from %s\", \"tags\": [], \"path\": \"/opt/conda/envs/py3.5/lib/python3.5/site-packages/tensorflow/python/platform/tf_logging.py\"}\r\n",
|
||||
"{\"timestamp\": \"2018-03-31T10:46:19.060001Z\", \"level\": \"INFO\", \"stack_info\": null, \"host\": \"azure-dl-3880299103-v5mb7\", \"message\": \"Model loading time: 19089.38 ms\", \"logger\": \"model_driver\", \"tags\": [], \"path\": \"/code/driver.py\"}\r\n",
|
||||
"2018-03-31 10:46:19,060 INFO success: gunicorn entered RUNNING state, process has stayed up for > than 20 seconds (startsecs)\r\n",
|
||||
"{\"level\": \"INFO\", \"host\": \"azure-dl-9db45b4f7-bqq5g\", \"timestamp\": \"2018-04-11T09:46:07.076248Z\", \"path\": \"/opt/conda/envs/py3.5/lib/python3.5/site-packages/tensorflow/python/platform/tf_logging.py\", \"msg\": \"Restoring parameters from %s\", \"logger\": \"tensorflow\", \"message\": \"Restoring parameters from resnet_v1_152.ckpt\", \"stack_info\": null, \"tags\": []}\r\n",
|
||||
"{\"level\": \"INFO\", \"host\": \"azure-dl-9db45b4f7-bqq5g\", \"timestamp\": \"2018-04-11T09:46:08.969746Z\", \"path\": \"/code/driver.py\", \"logger\": \"model_driver\", \"message\": \"Model loading time: 14236.73 ms\", \"stack_info\": null, \"tags\": []}\r\n",
|
||||
"Initialising\r\n",
|
||||
"{\"timestamp\": \"2018-03-31T10:46:19.065300Z\", \"level\": \"INFO\", \"stack_info\": null, \"host\": \"azure-dl-3880299103-v5mb7\", \"message\": \" * Running on http://127.0.0.1:5000/ (Press CTRL+C to quit)\", \"logger\": \"werkzeug\", \"msg\": \" * Running on %s://%s:%d/ %s\", \"tags\": [], \"path\": \"/opt/conda/envs/py3.5/lib/python3.5/site-packages/werkzeug/_internal.py\"}\r\n"
|
||||
"{\"level\": \"INFO\", \"host\": \"azure-dl-9db45b4f7-bqq5g\", \"timestamp\": \"2018-04-11T09:46:08.974735Z\", \"path\": \"/opt/conda/envs/py3.5/lib/python3.5/site-packages/werkzeug/_internal.py\", \"msg\": \" * Running on %s://%s:%d/ %s\", \"logger\": \"werkzeug\", \"message\": \" * Running on http://127.0.0.1:5000/ (Press CTRL+C to quit)\", \"stack_info\": null, \"tags\": []}\r\n",
|
||||
"2018-04-11 09:46:13,980 INFO success: gunicorn entered RUNNING state, process has stayed up for > than 20 seconds (startsecs)\r\n"
|
||||
]
|
||||
}
|
||||
],
|
||||
|
@ -696,15 +721,15 @@
|
|||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 39,
|
||||
"execution_count": 17,
|
||||
"metadata": {},
|
||||
"outputs": [
|
||||
{
|
||||
"name": "stdout",
|
||||
"output_type": "stream",
|
||||
"text": [
|
||||
"NAME TYPE CLUSTER-IP EXTERNAL-IP PORT(S) AGE\r\n",
|
||||
"azure-dl LoadBalancer 10.0.204.221 40.71.172.160 80:32567/TCP 11m\r\n"
|
||||
"NAME TYPE CLUSTER-IP EXTERNAL-IP PORT(S) AGE\r\n",
|
||||
"azure-dl LoadBalancer 10.0.63.93 13.82.95.158 80:31941/TCP 7m\r\n"
|
||||
]
|
||||
}
|
||||
],
|
||||
|
@ -731,14 +756,14 @@
|
|||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 72,
|
||||
"execution_count": 18,
|
||||
"metadata": {},
|
||||
"outputs": [
|
||||
{
|
||||
"name": "stdout",
|
||||
"output_type": "stream",
|
||||
"text": [
|
||||
"deployment \"azure-dl\" deleted\n",
|
||||
"deployment.apps \"azure-dl\" deleted\n",
|
||||
"service \"azure-dl\" deleted\n"
|
||||
]
|
||||
}
|
||||
|
@ -749,7 +774,7 @@
|
|||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 75,
|
||||
"execution_count": 19,
|
||||
"metadata": {},
|
||||
"outputs": [
|
||||
{
|
||||
|
@ -766,7 +791,7 @@
|
|||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 76,
|
||||
"execution_count": 20,
|
||||
"metadata": {},
|
||||
"outputs": [
|
||||
{
|
||||
|
|
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
Различия файлов скрыты, потому что одна или несколько строк слишком длинны
Загрузка…
Ссылка в новой задаче