From 23f53a1b879cc7c65c63385a8e12db86e9156c89 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Piotr=20Or=C5=82owski?= Date: Wed, 30 Oct 2024 16:38:07 +0100 Subject: [PATCH] Cosmetic documentation updates --- client/cpp/kserve-api/README.md | 2 +- client/python/kserve-api/samples/README.md | 2 +- docs/llm/quickstart.md | 2 +- 3 files changed, 3 insertions(+), 3 deletions(-) diff --git a/client/cpp/kserve-api/README.md b/client/cpp/kserve-api/README.md index bb62539357..550557f4fd 100644 --- a/client/cpp/kserve-api/README.md +++ b/client/cpp/kserve-api/README.md @@ -388,7 +388,7 @@ Usage: ```Bash ./http_model_metadata --http_port 8000 --http_address localhost -{"name":"dummy","versions":["1"],"platform":"OpenVINO","inputs":[{"name":"b","datatype":"FP32","shape":[1,10]}],"outputs":[{"name":"a","datatype":"FP32","shape":[1,10]}]} +{"name":"dummy","versions":["1"],"platform":"OpenVINO","inputs":[{"name":"b","datatype":"FP32","shape":[1,10]}],"outputs":[{"name":"a","datatype":"FP32","shape":[1,10]}],"rt_info":{"MO_version":"2020.1.0-61-gd349c3ba4a","conversion_parameters":{"blobs_as_inputs":"True","caffe_parser_path":"DIR","data_type":"float","disable_nhwc_to_nchw":"False"},"model_info":{"precision":"FP16","resolution":{"height":"200","width":"300"}},"optimization":{},"version":"10"}} ``` ### Run the Client to perform inference diff --git a/client/python/kserve-api/samples/README.md b/client/python/kserve-api/samples/README.md index ce79df2091..de93a6106f 100644 --- a/client/python/kserve-api/samples/README.md +++ b/client/python/kserve-api/samples/README.md @@ -624,7 +624,7 @@ optional arguments: ```Bash python3 ./http_model_metadata.py --http_port 8000 --http_address localhost --model_name resnet -{'name': 'resnet', 'versions': ['1'], 'platform': 'OpenVINO', 'inputs': [{'name': '0', 'datatype': 'FP32', 'shape': [1, 224, 224, 3]}], 'outputs': [{'name': '1463', 'datatype': 'FP32', 'shape': [1, 1000]}]} +{'name': 'resnet', 'versions': ['1'], 'platform': 'OpenVINO', 'inputs': [{'name': '0', 'datatype': 'FP32', 'shape': [1, 224, 224, 3]}], 'outputs': [{'name': '1463', 'datatype': 'FP32', 'shape': [1, 1000]}], 'rt_info': {'MO_version': '2022.1.0-6456-86faa257241', 'conversion_parameters': {'caffe_parser_path': 'DIR', 'compress_fp16': 'False', 'data_type': 'FP32', 'disable_nhwc_to_nchw': 'False', 'disable_omitting_optional': 'False', 'disable_resnet_optimization': 'False', 'disable_weights_compression': 'False', 'enable_concat_optimization': 'False', 'enable_flattening_nested_params': 'False', 'enable_ssd_gluoncv': 'False', 'extensions': 'DIR', 'framework': 'onnx', 'freeze_placeholder_with_value': '{}', 'generate_deprecated_IR_V7': 'False', 'input': '0', 'input_model': 'DIR/model_bin.onnx', 'input_model_is_text': 'False', 'input_shape': '[1,3,224,224]', 'k': 'DIR/CustomLayersMapping.xml', 'keep_shape_ops': 'True', 'layout': '0(nchw)', 'layout_values': "{'0': {'source_layout': 'nchw', 'target_layout': None, 'is_input': True}}", 'legacy_ir_generation': 'False', 'legacy_mxnet_model': 'False', 'log_level': 'ERROR', 'mean_scale_values': "{'0': {'mean': array([123.678, 116.28 , 103.53 ]), 'scale': array([58.3942, 57.12 , 57.3756])}}", 'mean_values': '0[123.678,116.28,103.53]', 'model_name': 'resnet50-binary-0001', 'output': "['1463']", 'output_dir': 'DIR', 'placeholder_data_types': '{}', 'placeholder_shapes': "{'0': (1, 3, 224, 224)}", 'progress': 'False', 'remove_memory': 'False', 'remove_output_softmax': 'False', 'reverse_input_channels': 'True', 'save_params_from_nd': 'False', 'scale_values': '0[58.3942,57.12,57.3756]', 'silent': 'False', 'source_layout': '()', 'static_shape': 'False', 'stream_output': 'False', 'target_layout': '()', 'transform': '', 'unset': 'batch, counts, disable_fusing, disable_gfusing, finegrain_fusing, input_checkpoint, input_meta_graph, input_proto, input_symbol, mean_file, mean_file_offsets, move_to_preprocess, nd_prefix_name, pretrained_model_name, saved_model_dir, saved_model_tags, scale, tensorboard_logdir, tensorflow_custom_layer_libraries, tensorflow_custom_operations_config_update, tensorflow_object_detection_api_pipeline_config, tensorflow_use_custom_operations_config, transformations_config', 'use_legacy_frontend': 'False', 'use_new_frontend': 'False'}, 'optimization': {}, 'version': '11'}} ``` ### Run the Client to perform inference diff --git a/docs/llm/quickstart.md b/docs/llm/quickstart.md index dc77227b73..57ea839747 100644 --- a/docs/llm/quickstart.md +++ b/docs/llm/quickstart.md @@ -38,7 +38,7 @@ node: { node_options: { [type.googleapis.com / mediapipe.LLMCalculatorOptions]: { models_path: "./", - plugin_config: '{"KV_CACHE_PRECISION": "u8", "DYNAMIC_QUANTIZATION_GROUP_SIZE": "32"}', + plugin_config: '\''{"KV_CACHE_PRECISION": "u8", "DYNAMIC_QUANTIZATION_GROUP_SIZE": "32"}'\'', cache_size: 4 } }