# Copyright (c) 2021, NVIDIA CORPORATION. All rights reserved. # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. # Created on 2024-01-01 # Author: GuAn Zhu name: "cif_search" backend: "python" max_batch_size: 128 sequence_batching{ max_sequence_idle_microseconds: 15000000 oldest { max_candidate_sequences: 1024 preferred_batch_size: [32, 64, 128] } control_input [ { name: "START", control [ { kind: CONTROL_SEQUENCE_START fp32_false_true: [0, 1] } ] }, { name: "READY" control [ { kind: CONTROL_SEQUENCE_READY fp32_false_true: [0, 1] } ] }, { name: "CORRID", control [ { kind: CONTROL_SEQUENCE_CORRID data_type: TYPE_UINT64 } ] }, { name: "END", control [ { kind: CONTROL_SEQUENCE_END fp32_false_true: [0, 1] } ] } ] } parameters [ { key: "vocabulary", value: { string_value: "model_repo_paraformer_large_online/feature_extractor/config.yaml"} }, { key: "FORCE_CPU_ONLY_INPUT_TENSORS" value: {string_value:"no"} } ] input [ { name: "enc" data_type: TYPE_FP32 dims: [-1, 512] }, { name: "enc_len" data_type: TYPE_INT32 dims: [1] reshape: { shape: [ ] } }, { name: 'alphas' data_type: TYPE_FP32 dims: [-1] } ] output [ { name: "transcripts" data_type: TYPE_STRING dims: [1] } ] instance_group [ { count: 6 kind: KIND_CPU } ]