Deploy MXNet model serving with awslabs/mxnet-model-server
Requirements: Python, mxnet, mxnet-model-server, Docker, JMeter (for stress tests)
mxnet-model-export --model-name r50 --model-path model-r50-am-lfw
cd models
mxnet-model-server --models r50=r50.model ga=ga.model --service mxnet_vision_service.py --port=8080
nvidia-docker run --name mms -p 80:8080 -itd -v <full path to mxnet-serving/models>:/models deepinsight/mms_gpu mxnet-model-server start --mms-config /models/mms_app_gpu.conf
curl -X POST http://127.0.0.1/r50/predict -F "data=@models/image.jpg"
cd stress-test/threads-100-gpu
jmeter -n -t test-plan.jmx -e -l log -o output