Examples
========

.. toctree::
   :maxdepth: 1
   :caption: Scripts

   api_client
   aqlm_example
   cpu_offload
   gguf_inference
   gradio_openai_chatbot_webserver
   gradio_webserver
   llm_engine_example
   lora_with_quantization_inference
   multilora_inference
   offline_inference
   offline_inference_arctic
   offline_inference_audio_language
   offline_inference_chat
   offline_inference_distributed
   offline_inference_embedding
   offline_inference_encoder_decoder
   offline_inference_mlpspeculator
   offline_inference_neuron
   offline_inference_neuron_int8_quantization
   offline_inference_tpu
   offline_inference_vision_language
   offline_inference_with_prefix
   openai_audio_api_client
   openai_chat_completion_client
   openai_chat_completion_client_with_tools
   openai_completion_client
   openai_embedding_client
   openai_vision_api_client
   save_sharded_state
   tensorize_vllm_model
