Unverified Commit 9593ada3 authored by Aleix Ramírez Baena's avatar Aleix Ramírez Baena Committed by GitHub
Browse files

F #227: First version of Dynamo appliance (#228)

This appliance includes the runtime installation of the Dynamo inference framework. Supported parameters:

- ONEAPP_DYNAMO_API_PORT: Port where the Dynamo API will be exposed.
- ONEAPP_DYNAMO_MODEL_ID: Name of the model on Hugging Face.
- ONEAPP_DYNAMO_MODEL_TOKEN: Hugging Face API token.
- ONEAPP_DYNAMO_ENGINE_NAME: Name of the Dynamo engine to use: mistralrs|sglang|llamacpp|vllm|trtllm|echo_full|echo_core.
- ONEAPP_DYNAMO_ENGINE_EXTRA_ARGS_JSON: Extra engine arguments in JSON format.
- ONEAPP_DYNAMO_ENGINE_EXTRA_ARGS_JSON_BASE64: Extra engine arguments in JSON format, encoded in Base64.
parent 9a63b659
Loading
Loading
Loading
Loading
+4 −0
Original line number Diff line number Diff line
@@ -49,6 +49,10 @@ packer-service_OneKEa: packer-ubuntu2204oneke $(DIR_EXPORT)/service_OneKEa.qcow2
# Convenience target for the Ray service image: requires the packer-ubuntu2404
# target and the exported service_Ray.qcow2 file, then prints a completion
# message through $(INFO) (defined outside this excerpt).
packer-service_Ray: packer-ubuntu2404 $(DIR_EXPORT)/service_Ray.qcow2
	@$(INFO) "Packer service_Ray done"

# Convenience target for the Dynamo service image.
# The first line is a target-specific variable: it is in effect for this target
# and for every prerequisite built on its behalf.
# NOTE(review): a make variable only reaches a recipe's environment when it is
# exported; presumably an export directive elsewhere in this Makefile covers
# PKR_VAR_nvidia_driver_path -- confirm, otherwise packer will not see it.
packer-service_Dynamo: PKR_VAR_nvidia_driver_path := $(NVIDIA_DRIVER_PATH)
# Requires the packer-ubuntu2404 target and the exported service_Dynamo.qcow2
# file, then prints a completion message through $(INFO).
packer-service_Dynamo: packer-ubuntu2404 $(DIR_EXPORT)/service_Dynamo.qcow2
	@$(INFO) "Packer service_Dynamo done"

# run packer build for given distro or service
# Create an empty 10G qcow2 image at the target path.
# The rule has no prerequisites, so the recipe runs only while the file is missing.
# $@ is the rule's target, which keeps the recipe in sync with the rule header.
$(DIR_EXPORT)/service_OneKE_storage.qcow2:
	qemu-img create -f qcow2 $@ 10G
+1 −1
Original line number Diff line number Diff line
@@ -31,7 +31,7 @@ DISTROS_ARM64 := alma8.aarch64 alma9.aarch64 \
                 ubuntu2204.aarch64 ubuntu2404.aarch64

# Service appliance names for AMD64. The list spans two lines via the trailing
# backslash; the second line must be the only continuation, otherwise make sees
# a stray line and stops with "missing separator".
SERVICES_AMD64 := service_Wordpress service_VRouter service_OneKE service_OneKEa \
                  service_Harbor service_MinIO service_Ray service_Dynamo service_example

# Service appliance names for ARM64.
SERVICES_ARM64 := service_VRouter.aarch64

+3 −0
Original line number Diff line number Diff line
# Endpoint URL ending in /v1/chat/completions; presumably where the consumer of
# this file sends its requests -- confirm against the code that loads it.
# Alternative endpoint, currently disabled:
#base_url: "http://172.20.0.4:8000/v1/chat/completions"
base_url: "http://localhost:8999/v1/chat/completions"
# Model name; presumably forwarded with each request -- confirm against the caller.
model: "Qwen2.5-1.5B-Instruct"
 No newline at end of file
+3 −0
Original line number Diff line number Diff line
# Python package requirements; every entry is pinned to one exact version (==).
PyYAML==6.0.2
flask==3.1.0
requests==2.32.3
 No newline at end of file
+23 −0
Original line number Diff line number Diff line
/* fallback */
/* Declares the 'Material Icons' font family (normal style, weight 400),
   loaded as WOFF2 from the relative ../fonts directory. */
@font-face {
  font-family: 'Material Icons';
  font-style: normal;
  font-weight: 400;
  src: url('../fonts/flUhRq6tzZclQEJ-Vdg-IuiaDsNc.woff2') format('woff2');
}

/* Elements carrying this class render their text with the icon font. */
.material-icons {
  font-family: 'Material Icons';
  font-weight: normal;
  font-style: normal;
  font-size: 24px;
  /* Reset text properties so values inherited from the page do not alter the icon. */
  line-height: 1;
  letter-spacing: normal;
  text-transform: none;
  display: inline-block;
  white-space: nowrap;
  word-wrap: normal;
  direction: ltr;
  /* Enable ligatures: prefixed form first, then the standard property so
     browsers that ignore the -webkit- prefix get the same setting. */
  -webkit-font-feature-settings: 'liga';
  font-feature-settings: 'liga';
  -webkit-font-smoothing: antialiased;
}
 No newline at end of file
Loading