Untitled

From Denim Iguana, 1 Year ago, written in Plain Text.

Embed

Download Paste or View Raw
Hits: 89

# Copyright (c) 2022, NVIDIA CORPORATION. All rights reserved.

#

# NVIDIA CORPORATION and its licensors retain all intellectual property

# and proprietary rights in and to this software, related documentation

# and any modifications thereto. Any use, reproduction, disclosure or

# distribution of this software and related documentation without an express

# license agreement from NVIDIA CORPORATION is strictly prohibited.

# GPU family of target platform. Supported values: tegra, non-tegra

riva_target_gpu_family="tegra"

# Name of tegra platform that is being used. Supported tegra platforms: orin, xavier

riva_tegra_platform="orin"

# Enable or Disable Riva Services

service_enabled_asr=true

service_enabled_nlp=true

service_enabled_tts=true

# Enable Riva Enterprise

# If enrolled in Enterprise, enable Riva Enterprise by setting configuration

# here. You must explicitly acknowledge you have read and agree to the EULA.

# RIVA_API_KEY=<ngc api key>

# RIVA_API_NGC_ORG=<ngc organization>

# RIVA_EULA=accept

# Language code to fetch models of a specify language

# Currently only ASR supports languages other than English

# Supported language codes: en-US, en-GB, de-DE, es-US, ru-RU, zh-CN, hi-IN, fr-FR, ko-KR, pt-BR

# for any language other than English, set service_enabled_nlp and service_enabled_tts to False

# for multiple languages enter space separated language codes.

language_code=("en-US")

# ASR acoustic model architecture

# Supported values are: conformer, citrinet_1024, citrinet_256 (en-US + arm64 only), jasper (en-US + amd64 only), quartznet (en-US + amd64 only)

asr_acoustic_model=("conformer")

# Specify one or more GPUs to use

# specifying more than one GPU is currently an experimental feature, and may result in undefined behaviours.

gpus_to_use="device=0"

# Specify the encryption key to use to deploy models

MODEL_DEPLOY_KEY="tlt_encode"

# Locations to use for storing models artifacts

#

# If an absolute path is specified, the data will be written to that location

# Otherwise, a docker volume will be used (default).

#

# riva_init.sh will create a `rmir` and `models` directory in the volume or

# path specified.

#

# RMIR ($riva_model_loc/rmir)

# Riva uses an intermediate representation (RMIR) for models

# that are ready to deploy but not yet fully optimized for deployment. Pretrained

# versions can be obtained from NGC (by specifying NGC models below) and will be

# downloaded to $riva_model_loc/rmir by `riva_init.sh`

#

# Custom models produced by NeMo or TLT and prepared using riva-build

# may also be copied manually to this location $(riva_model_loc/rmir).

#

# Models ($riva_model_loc/models)

# During the riva_init process, the RMIR files in $riva_model_loc/rmir

# are inspected and optimized for deployment. The optimized versions are

# stored in $riva_model_loc/models. The riva server exclusively uses these

# optimized versions.

riva_model_loc="riva-model-repo"

if [[ $riva_target_gpu_family == "tegra" ]]; then

riva_model_loc="`pwd`/model_repository"

fi

# The default RMIRs are downloaded from NGC by default in the above $riva_rmir_loc directory

# If you'd like to skip the download from NGC and use the existing RMIRs in the $riva_rmir_loc

# then set the below $use_existing_rmirs flag to true. You can also deploy your set of custom

# RMIRs by keeping them in the riva_rmir_loc dir and use this quickstart script with the

# below flag to deploy them all together.

use_existing_rmirs=false

# Ports to expose for Riva services

riva_speech_api_port="50051"

# NGC orgs

riva_ngc_org="nvidia"

riva_ngc_team="riva"

riva_ngc_image_version="2.7.0"

riva_ngc_model_version="2.7.0"

# Pre-built models listed below will be downloaded from NGC. If models already exist in $riva-rmir

# then models can be commented out to skip download from NGC

########## ASR MODELS ##########

models_asr=()

for lang_code in ${language_code[@]}; do

modified_lang_code="${lang_code/-/_}"

modified_lang_code=${modified_lang_code,,}

if [[ $riva_target_gpu_family == "tegra" ]]; then

if [[ ${asr_acoustic_model} == "jasper" || \

${asr_acoustic_model} == "quartznet" ]]; then

echo "Jasper and Quartznet models are not available for arm64 architecture"

exit 1

fi

if [[ ${asr_acoustic_model} == "citrinet_256" && ${lang_code} != "en-US" ]]; then

echo "For arm64 architecture, citrinet_256 acoustic model is only available for language code en-US."

exit 1

fi

models_asr+=(

"${riva_ngc_org}/${riva_ngc_team}/models_asr_${asr_acoustic_model}_${modified_lang_code}_str:${riva_ngc_model_version}-${riva_target_gpu_family}-${riva_tegra_platform}"

)

else

if [[ ${asr_acoustic_model} != "conformer" && \

${asr_acoustic_model} != "citrinet_1024" && \

${asr_acoustic_model} != "jasper" && \

${asr_acoustic_model} != "quartznet" ]]; then

echo "For amd64 architecture, valid acoustic models are conformer, citrinet_1024, jasper and quartznet."

exit 1

fi

if [[ (${asr_acoustic_model} == "jasper" || \

${asr_acoustic_model} == "quartznet") && \

${lang_code} != "en-US" ]]; then

echo "jasper and quartznet acoustic models are only available for language code en-US."

exit 1

fi

#Setting default Conformer Mandarin models to greedy decoder due to high high latency in os2s.

decoder=""

if [[ ${asr_acoustic_model} == "conformer" && ${lang_code} == "zh-CN" ]]; then

decoder="_gre"

fi

models_asr+=(

### Streaming w/ CPU decoder, best latency configuration

"${riva_ngc_org}/${riva_ngc_team}/rmir_asr_${asr_acoustic_model}_${modified_lang_code}_str${decoder}:${riva_ngc_model_version}"

### Streaming w/ CPU decoder, best throughput configuration

# "${riva_ngc_org}/${riva_ngc_team}/rmir_asr_${asr_acoustic_model}_${modified_lang_code}_str_thr${decoder}:${riva_ngc_model_version}"

### Offline w/ CPU decoder,

"${riva_ngc_org}/${riva_ngc_team}/rmir_asr_${asr_acoustic_model}_${modified_lang_code}_ofl${decoder}:${riva_ngc_model_version}"

)

fi

### Punctuation model

if [[ "${lang_code}" == "en-US" || "${lang_code}" == "de-DE" || "${lang_code}" == "hi-IN" || "${lang_code}" == "fr-FR" || "${lang_code}" == "es-US" || "${lang_code}" == "zh-CN" || "${lang_code}" == "en-GB" ]]; then

if [[ $riva_target_gpu_family == "tegra" ]]; then

models_asr+=(

"${riva_ngc_org}/${riva_ngc_team}/models_nlp_punctuation_bert_base_${modified_lang_code}:${riva_ngc_model_version}-${riva_target_gpu_family}-${riva_tegra_platform}"

)

else

models_asr+=(

"${riva_ngc_org}/${riva_ngc_team}/rmir_nlp_punctuation_bert_base_${modified_lang_code}:${riva_ngc_model_version}"

)

fi

fi

done

########## NLP MODELS ##########

if [[ $riva_target_gpu_family == "tegra" ]]; then

models_nlp=(

### BERT Base Intent Slot model for misty domain fine-tuned on weather, smalltalk/personality, poi/map datasets.

"${riva_ngc_org}/${riva_ngc_team}/models_nlp_intent_slot_misty_bert_base:${riva_ngc_model_version}-${riva_target_gpu_family}-${riva_tegra_platform}"

### DistilBERT Intent Slot model for misty domain fine-tuned on weather, smalltalk/personality, poi/map datasets.

# "${riva_ngc_org}/${riva_ngc_team}/models_nlp_intent_slot_misty_distilbert:${riva_ngc_model_version}-${riva_target_gpu_family}-${riva_tegra_platform}"

)

else

models_nlp=(

### Bert base Punctuation model

"${riva_ngc_org}/${riva_ngc_team}/rmir_nlp_punctuation_bert_base_en_us:${riva_ngc_model_version}"

### BERT base Named Entity Recognition model fine-tuned on GMB dataset with class labels LOC, PER, ORG etc.

"${riva_ngc_org}/${riva_ngc_team}/rmir_nlp_named_entity_recognition_bert_base:${riva_ngc_model_version}"

### BERT Base Intent Slot model fine-tuned on weather dataset.

"${riva_ngc_org}/${riva_ngc_team}/rmir_nlp_intent_slot_bert_base:${riva_ngc_model_version}"

### BERT Base Question Answering model fine-tuned on Squad v2.

"${riva_ngc_org}/${riva_ngc_team}/rmir_nlp_question_answering_bert_base:${riva_ngc_model_version}"

### Megatron345M Question Answering model fine-tuned on Squad v2.

# "${riva_ngc_org}/${riva_ngc_team}/rmir_nlp_question_answering_megatron:${riva_ngc_model_version}"

### Bert base Text Classification model fine-tuned on 4class (weather, meteorology, personality, nomatch) domain model.

"${riva_ngc_org}/${riva_ngc_team}/rmir_nlp_text_classification_bert_base:${riva_ngc_model_version}"

)

fi

########## TTS MODELS ##########

if [[ $riva_target_gpu_family == "tegra" ]]; then

models_tts=(

"${riva_ngc_org}/${riva_ngc_team}/models_tts_fastpitch_hifigan_en_us:${riva_ngc_model_version}-${riva_target_gpu_family}-${riva_tegra_platform}"

)

else

models_tts=(

"${riva_ngc_org}/${riva_ngc_team}/rmir_tts_fastpitch_hifigan_en_us:${riva_ngc_model_version}"

)

fi

NGC_TARGET=${riva_ngc_org}

if [[ ! -z ${riva_ngc_team} ]]; then

NGC_TARGET="${NGC_TARGET}/${riva_ngc_team}"

else

team="\"\""

fi

# Specify paths to SSL Key and Certificate files to use TLS/SSL Credentials for a secured connection.

# If either are empty, an insecure connection will be used.

# Stored within container at /ssl/servert.crt and /ssl/server.key

# Optional, one can also specify a root certificate, stored within container at /ssl/root_server.crt

ssl_server_cert=""

ssl_server_key=""

ssl_root_cert=""

# define docker images required to run Riva

image_speech_api="nvcr.io/${NGC_TARGET}/riva-speech:${riva_ngc_image_version}-l4t-aarch64"

# define docker images required to setup Riva

image_init_speech="nvcr.io/${NGC_TARGET}/riva-speech:${riva_ngc_image_version}-servicemaker-l4t-aarch64"

# daemon names

riva_daemon_speech="riva-speech"

if [[ $riva_target_gpu_family != "tegra" ]]; then

riva_daemon_client="riva-client"

fi

Author

Title

Language

Your paste - Paste your paste here

# Copyright (c) 2022, NVIDIA CORPORATION.  All rights reserved.
#
# NVIDIA CORPORATION and its licensors retain all intellectual property
# and proprietary rights in and to this software, related documentation
# and any modifications thereto.  Any use, reproduction, disclosure or
# distribution of this software and related documentation without an express
# license agreement from NVIDIA CORPORATION is strictly prohibited.

# GPU family of target platform. Supported values: tegra, non-tegra
riva_target_gpu_family=&quot;tegra&quot;

# Name of tegra platform that is being used. Supported tegra platforms: orin, xavier
riva_tegra_platform=&quot;orin&quot;

# Enable or Disable Riva Services
service_enabled_asr=true
service_enabled_nlp=true
service_enabled_tts=true

# Enable Riva Enterprise
# If enrolled in Enterprise, enable Riva Enterprise by setting configuration
# here. You must explicitly acknowledge you have read and agree to the EULA.
# RIVA_API_KEY=&lt;ngc api key&gt;
# RIVA_API_NGC_ORG=&lt;ngc organization&gt;
# RIVA_EULA=accept

# Language code to fetch models of a specify language
# Currently only ASR supports languages other than English
# Supported language codes: en-US, en-GB, de-DE, es-US, ru-RU, zh-CN, hi-IN, fr-FR, ko-KR, pt-BR
# for any language other than English, set service_enabled_nlp and service_enabled_tts to False
# for multiple languages enter space separated language codes.
language_code=(&quot;en-US&quot;)

# ASR acoustic model architecture
# Supported values are: conformer, citrinet_1024, citrinet_256 (en-US + arm64 only), jasper (en-US + amd64 only), quartznet (en-US + amd64 only)
asr_acoustic_model=(&quot;conformer&quot;)

# Specify one or more GPUs to use
# specifying more than one GPU is currently an experimental feature, and may result in undefined behaviours.
gpus_to_use=&quot;device=0&quot;

# Specify the encryption key to use to deploy models
MODEL_DEPLOY_KEY=&quot;tlt_encode&quot;

# Locations to use for storing models artifacts
#
# If an absolute path is specified, the data will be written to that location
# Otherwise, a docker volume will be used (default).
#
# riva_init.sh will create a `rmir` and `models` directory in the volume or
# path specified.
#
# RMIR ($riva_model_loc/rmir)
# Riva uses an intermediate representation (RMIR) for models
# that are ready to deploy but not yet fully optimized for deployment. Pretrained
# versions can be obtained from NGC (by specifying NGC models below) and will be
# downloaded to $riva_model_loc/rmir by `riva_init.sh`
#
# Custom models produced by NeMo or TLT and prepared using riva-build
# may also be copied manually to this location $(riva_model_loc/rmir).
#
# Models ($riva_model_loc/models)
# During the riva_init process, the RMIR files in $riva_model_loc/rmir
# are inspected and optimized for deployment. The optimized versions are
# stored in $riva_model_loc/models. The riva server exclusively uses these
# optimized versions.
riva_model_loc=&quot;riva-model-repo&quot;

if [[ $riva_target_gpu_family == &quot;tegra&quot; ]]; then
    riva_model_loc=&quot;`pwd`/model_repository&quot;
fi

# The default RMIRs are downloaded from NGC by default in the above $riva_rmir_loc directory
# If you'd like to skip the download from NGC and use the existing RMIRs in the $riva_rmir_loc
# then set the below $use_existing_rmirs flag to true. You can also deploy your set of custom
# RMIRs by keeping them in the riva_rmir_loc dir and use this quickstart script with the
# below flag to deploy them all together.
use_existing_rmirs=false

# Ports to expose for Riva services
riva_speech_api_port=&quot;50051&quot;

# NGC orgs
riva_ngc_org=&quot;nvidia&quot;
riva_ngc_team=&quot;riva&quot;
riva_ngc_image_version=&quot;2.7.0&quot;
riva_ngc_model_version=&quot;2.7.0&quot;

# Pre-built models listed below will be downloaded from NGC. If models already exist in $riva-rmir
# then models can be commented out to skip download from NGC

########## ASR MODELS ##########

models_asr=()

for lang_code in ${language_code[@]}; do
    modified_lang_code=&quot;${lang_code/-/_}&quot;
    modified_lang_code=${modified_lang_code,,}
    if [[ $riva_target_gpu_family  == &quot;tegra&quot; ]]; then

if [[ ${asr_acoustic_model} == &quot;jasper&quot; || \
            ${asr_acoustic_model} == &quot;quartznet&quot; ]]; then
          echo &quot;Jasper and Quartznet models are not available for arm64 architecture&quot;
          exit 1
      fi

if [[ ${asr_acoustic_model} == &quot;citrinet_256&quot; &amp;&amp; ${lang_code} != &quot;en-US&quot; ]]; then
        echo &quot;For arm64 architecture, citrinet_256 acoustic model is only available for language code en-US.&quot;
        exit 1
      fi
      models_asr+=(
          &quot;${riva_ngc_org}/${riva_ngc_team}/models_asr_${asr_acoustic_model}_${modified_lang_code}_str:${riva_ngc_model_version}-${riva_target_gpu_family}-${riva_tegra_platform}&quot;
      )
    else

if [[ ${asr_acoustic_model} != &quot;conformer&quot; &amp;&amp; \
            ${asr_acoustic_model} != &quot;citrinet_1024&quot; &amp;&amp; \
            ${asr_acoustic_model} != &quot;jasper&quot; &amp;&amp; \
            ${asr_acoustic_model} != &quot;quartznet&quot; ]]; then
        echo &quot;For amd64 architecture, valid acoustic models are conformer, citrinet_1024, jasper and quartznet.&quot;
        exit 1
      fi

if [[ (${asr_acoustic_model} == &quot;jasper&quot; || \
            ${asr_acoustic_model} == &quot;quartznet&quot;) &amp;&amp; \
            ${lang_code} != &quot;en-US&quot; ]]; then
        echo &quot;jasper and quartznet acoustic models are only available for language code en-US.&quot;
        exit 1
      fi
      #Setting default Conformer Mandarin models to greedy decoder due to high high latency in os2s.
      decoder=&quot;&quot;
      if [[ ${asr_acoustic_model} == &quot;conformer&quot; &amp;&amp; ${lang_code} == &quot;zh-CN&quot; ]]; then
        decoder=&quot;_gre&quot;
      fi
      models_asr+=(
      ### Streaming w/ CPU decoder, best latency configuration
          &quot;${riva_ngc_org}/${riva_ngc_team}/rmir_asr_${asr_acoustic_model}_${modified_lang_code}_str${decoder}:${riva_ngc_model_version}&quot;

### Streaming w/ CPU decoder, best throughput configuration
      #    &quot;${riva_ngc_org}/${riva_ngc_team}/rmir_asr_${asr_acoustic_model}_${modified_lang_code}_str_thr${decoder}:${riva_ngc_model_version}&quot;

### Offline w/ CPU decoder,
          &quot;${riva_ngc_org}/${riva_ngc_team}/rmir_asr_${asr_acoustic_model}_${modified_lang_code}_ofl${decoder}:${riva_ngc_model_version}&quot;
      )
    fi

### Punctuation model
    if [[ &quot;${lang_code}&quot;  == &quot;en-US&quot; || &quot;${lang_code}&quot; == &quot;de-DE&quot; || &quot;${lang_code}&quot; == &quot;hi-IN&quot; || &quot;${lang_code}&quot; == &quot;fr-FR&quot; || &quot;${lang_code}&quot; == &quot;es-US&quot; || &quot;${lang_code}&quot; == &quot;zh-CN&quot; || &quot;${lang_code}&quot; == &quot;en-GB&quot; ]]; then
      if [[ $riva_target_gpu_family == &quot;tegra&quot; ]]; then
        models_asr+=(
            &quot;${riva_ngc_org}/${riva_ngc_team}/models_nlp_punctuation_bert_base_${modified_lang_code}:${riva_ngc_model_version}-${riva_target_gpu_family}-${riva_tegra_platform}&quot;
        )
      else
        models_asr+=(
            &quot;${riva_ngc_org}/${riva_ngc_team}/rmir_nlp_punctuation_bert_base_${modified_lang_code}:${riva_ngc_model_version}&quot;
        )
      fi
    fi

done
########## NLP MODELS ##########

if [[ $riva_target_gpu_family == &quot;tegra&quot; ]]; then
  models_nlp=(
  ### BERT Base Intent Slot model for misty domain fine-tuned on weather, smalltalk/personality, poi/map datasets.
      &quot;${riva_ngc_org}/${riva_ngc_team}/models_nlp_intent_slot_misty_bert_base:${riva_ngc_model_version}-${riva_target_gpu_family}-${riva_tegra_platform}&quot;

### DistilBERT Intent Slot model for misty domain fine-tuned on weather, smalltalk/personality, poi/map datasets.
  #    &quot;${riva_ngc_org}/${riva_ngc_team}/models_nlp_intent_slot_misty_distilbert:${riva_ngc_model_version}-${riva_target_gpu_family}-${riva_tegra_platform}&quot;
  )
else
  models_nlp=(
  ### Bert base Punctuation model
      &quot;${riva_ngc_org}/${riva_ngc_team}/rmir_nlp_punctuation_bert_base_en_us:${riva_ngc_model_version}&quot;

### BERT base Named Entity Recognition model fine-tuned on GMB dataset with class labels LOC, PER, ORG etc.
      &quot;${riva_ngc_org}/${riva_ngc_team}/rmir_nlp_named_entity_recognition_bert_base:${riva_ngc_model_version}&quot;

### BERT Base Intent Slot model fine-tuned on weather dataset.
      &quot;${riva_ngc_org}/${riva_ngc_team}/rmir_nlp_intent_slot_bert_base:${riva_ngc_model_version}&quot;

### BERT Base Question Answering model fine-tuned on Squad v2.
      &quot;${riva_ngc_org}/${riva_ngc_team}/rmir_nlp_question_answering_bert_base:${riva_ngc_model_version}&quot;

### Megatron345M Question Answering model fine-tuned on Squad v2.
  #    &quot;${riva_ngc_org}/${riva_ngc_team}/rmir_nlp_question_answering_megatron:${riva_ngc_model_version}&quot;

### Bert base Text Classification model fine-tuned on 4class (weather, meteorology, personality, nomatch) domain model.
      &quot;${riva_ngc_org}/${riva_ngc_team}/rmir_nlp_text_classification_bert_base:${riva_ngc_model_version}&quot;
  )
fi

########## TTS MODELS ##########

if [[ $riva_target_gpu_family == &quot;tegra&quot; ]]; then
  models_tts=(
     &quot;${riva_ngc_org}/${riva_ngc_team}/models_tts_fastpitch_hifigan_en_us:${riva_ngc_model_version}-${riva_target_gpu_family}-${riva_tegra_platform}&quot;
  )
else
  models_tts=(
    &quot;${riva_ngc_org}/${riva_ngc_team}/rmir_tts_fastpitch_hifigan_en_us:${riva_ngc_model_version}&quot;
  )
fi

NGC_TARGET=${riva_ngc_org}
if [[ ! -z ${riva_ngc_team} ]]; then
  NGC_TARGET=&quot;${NGC_TARGET}/${riva_ngc_team}&quot;
else
  team=&quot;\&quot;\&quot;&quot;
fi

# Specify paths to SSL Key and Certificate files to use TLS/SSL Credentials for a secured connection.
# If either are empty, an insecure connection will be used.
# Stored within container at /ssl/servert.crt and /ssl/server.key
# Optional, one can also specify a root certificate, stored within container at /ssl/root_server.crt
ssl_server_cert=&quot;&quot;
ssl_server_key=&quot;&quot;
ssl_root_cert=&quot;&quot;

# define docker images required to run Riva
image_speech_api=&quot;nvcr.io/${NGC_TARGET}/riva-speech:${riva_ngc_image_version}-l4t-aarch64&quot;

# define docker images required to setup Riva
image_init_speech=&quot;nvcr.io/${NGC_TARGET}/riva-speech:${riva_ngc_image_version}-servicemaker-l4t-aarch64&quot;

# daemon names
riva_daemon_speech=&quot;riva-speech&quot;
if [[ $riva_target_gpu_family != &quot;tegra&quot; ]]; then
    riva_daemon_client=&quot;riva-client&quot;
fi

Private - Private paste aren't shown in recent listings.

Delete After - When should we delete your paste?

Spam protection -

Reply to "Untitled"