Commit c3419f3

Merge branch 'dev' into makefile-fix

Signed-off-by: Shmuel Kallner <kallner@il.ibm.com>
2 parents ba911e0 + c23cdb3

25 files changed: +80 -76 lines

.tekton/README.md (5 additions, 5 deletions)

@@ -2,7 +2,7 @@
 
 <!-- NOTE TO CONTRIBUTORS: every repo in the hc4ai organization is intended to have the same contents in this file. The origin is the copy in https://github.ibm.com/mspreitz/hc4ai-hello-neural/blob/dev/.tekton/README.md; submit PRs against that one -->
 
-This pipeline is designed to support safe, efficient, and traceable development and deployment workflows using [OpenShift Pipelines-as-Code](https://pipelinesascode.com/), [Tekton](https://tekton.dev/), [buildah](https://buildah.io/), GitHub, and Quay.io.
+This pipeline is designed to support safe, efficient, and traceable development and deployment workflows using [OpenShift Pipelines-as-Code](https://pipelinesascode.com/), [Tekton](https://tekton.dev/), [buildah](https://buildah.io/), GitHub, and ghcr.io.
 
 This pipeline is used for CI/CD of the `dev` and `main` branches. This pipeline runs from source through container image build to deployment and testing in the hc4ai cluster.
 
@@ -20,9 +20,9 @@ Each repo includes a `.version.json` file at its root. This file controls:
 ```json
 {
   "dev-version": "0.0.5",
-  "dev-registry": "quay.io/llm-d/<your project name>-dev",
+  "dev-registry": "ghcr.io/llm-d/<your project name>-dev",
   "prod-version": "0.0.4",
-  "prod-registry": "quay.io/llm-d/<your project name>"
+  "prod-registry": "ghcr.io/llm-d/<your project name>"
 }
 ```
 
@@ -43,8 +43,8 @@ The pipeline reads this file to:
 
 This pipeline maintains two container repositories for this GitHub repository, as follows.
 
-- `quay.io/llm-d/<repoName>-dev`. Hold builds from the `dev` branch as described below.
-- `quay.io/llm-d/<repoName>`. Holds promotions to prod, as described below.
+- `ghcr.io/llm-d/<repoName>-dev`. Hold builds from the `dev` branch as described below.
+- `ghcr.io/llm-d/<repoName>`. Holds promotions to prod, as described below.
 
 ---
 
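The two-repository convention described above can be sketched in shell. This is illustrative only: `repoName` here is a made-up value standing in for the actual GitHub repository name.

```shell
# Sketch of the dev/prod image-repository naming convention.
# "repoName" is a hypothetical example value, not read from anywhere.
repoName=my-project

dev_repo="ghcr.io/llm-d/${repoName}-dev"   # dev-branch builds land here
prod_repo="ghcr.io/llm-d/${repoName}"      # prod promotions land here

echo "$dev_repo"    # ghcr.io/llm-d/my-project-dev
echo "$prod_repo"   # ghcr.io/llm-d/my-project
```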

.tekton/buildah-build.yaml (4 additions, 4 deletions)

@@ -41,17 +41,17 @@ spec:
       cp /workspace/registry/.dockerconfigjson /root/.docker/config.json
 
       echo "🔐 Extracting credentials..."
-      USERNAME=$(jq -r '.auths["quay.io"].username' /root/.docker/config.json)
-      PASSWORD=$(jq -r '.auths["quay.io"].password' /root/.docker/config.json)
+      USERNAME=$(jq -r '.auths["ghcr.io"].username' /root/.docker/config.json)
+      PASSWORD=$(jq -r '.auths["ghcr.io"].password' /root/.docker/config.json)
 
       if [ "$USERNAME" = "null" ] || [ "$PASSWORD" = "null" ]; then
        echo "❌ Error: Missing registry credentials"
        exit 1
       fi
 
       echo "🔓 Logging in to registry with Buildah..."
-      buildah logout quay.io || true
-      buildah login --username "$USERNAME" --password "$PASSWORD" quay.io
+      buildah logout ghcr.io || true
+      buildah login --username "$USERNAME" --password "$PASSWORD" ghcr.io
 
       export DOCKER_CONFIG=/root/.docker
       export BUILDER=buildah
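The credential-extraction step in this task can be tried standalone, outside the cluster. The sketch below assumes `jq` is installed; the sample `config.json` contents and the `ci-bot`/`s3cr3t` values are invented for illustration (the real task reads `/workspace/registry/.dockerconfigjson`).

```shell
# Standalone sketch of the jq credential extraction used by the task above.
set -eu

cfg=$(mktemp)
cat > "$cfg" <<'EOF'
{"auths": {"ghcr.io": {"username": "ci-bot", "password": "s3cr3t"}}}
EOF

# jq -r prints the raw string, or the literal word "null" when the key is
# absent -- which is exactly what the task's guard tests for.
USERNAME=$(jq -r '.auths["ghcr.io"].username' "$cfg")
PASSWORD=$(jq -r '.auths["ghcr.io"].password' "$cfg")

if [ "$USERNAME" = "null" ] || [ "$PASSWORD" = "null" ]; then
  echo "Error: Missing registry credentials" >&2
  exit 1
fi
echo "extracted user: $USERNAME"   # extracted user: ci-bot

rm -f "$cfg"
```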

.tekton/pipelinerun.yaml (6 additions, 3 deletions)

@@ -1,7 +1,7 @@
 apiVersion: tekton.dev/v1
 kind: PipelineRun
 metadata:
-  name: vllm-sim
+  name: llm-d-inference-sim
   annotations:
     pipelinesascode.tekton.dev/on-event: "[pull_request, push]"
     pipelinesascode.tekton.dev/on-target-branch: "[main, dev]"
@@ -632,7 +632,10 @@ spec:
         secretName: "{{ git_auth_secret }}"
     - name: git-auth
       secret:
-        secretName: "git-auth-secret-neuralmagic"
+        secretName: "git-auth-secret-llm-d"
+    # - name: registry-secret
+    #   secret:
+    #     secretName: quay-secret-llm-d
     - name: registry-secret
       secret:
-        secretName: quay-secret-llm-d
+        secretName: ghcr-secret-llm-d

.tekton/vuln-scan-trivy.yaml (1 addition, 1 deletion)

@@ -10,7 +10,7 @@ spec:
   params:
     - name: IMAGE_URL
       type: string
-      description: Full image URL (e.g., quay.io/org/image:tag)
+      description: Full image URL (e.g., ghcr.io/org/image:tag)
    - name: SEVERITY
      type: string
      default: "CRITICAL,HIGH,MEDIUM"

.version.json (4 additions, 4 deletions)

@@ -1,6 +1,6 @@
 {
-  "dev-version": "0.0.5",
-  "dev-registry": "quay.io/llm-d/vllm-sim-dev",
-  "prod-version": "0.0.4",
-  "prod-registry": "quay.io/llm-d/vllm-sim"
+  "dev-version": "0.0.6",
+  "dev-registry": "ghcr.io/llm-d/llm-d-inference-sim-dev",
+  "prod-version": "0.0.5",
+  "prod-registry": "ghcr.io/llm-d/llm-d-inference-sim"
 }
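A pipeline step consuming this file might compose the dev image reference from the two `dev-*` fields. A sketch, assuming `jq`; the temp directory only makes the snippet self-contained, and the JSON mirrors the new file contents above.

```shell
# Sketch: derive the dev image reference from .version.json (assumes jq).
set -eu

dir=$(mktemp -d)
cat > "$dir/.version.json" <<'EOF'
{
  "dev-version": "0.0.6",
  "dev-registry": "ghcr.io/llm-d/llm-d-inference-sim-dev",
  "prod-version": "0.0.5",
  "prod-registry": "ghcr.io/llm-d/llm-d-inference-sim"
}
EOF

# Hyphenated keys need jq's quoted ."key" form.
DEV_VERSION=$(jq -r '."dev-version"' "$dir/.version.json")
DEV_REGISTRY=$(jq -r '."dev-registry"' "$dir/.version.json")

echo "${DEV_REGISTRY}:${DEV_VERSION}"
# -> ghcr.io/llm-d/llm-d-inference-sim-dev:0.0.6
```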

Dockerfile (4 additions, 4 deletions)

@@ -12,23 +12,23 @@ COPY go.sum go.sum
 RUN go mod download
 
 # Copy the go source
-COPY cmd/vllm-sim/main.go cmd/cmd.go
+COPY cmd/llm-d-inference-sim/main.go cmd/cmd.go
 COPY . .
 
 # Build
 # the GOARCH has not a default value to allow the binary be built according to the host where the command
 # was called. For example, if we call make image-build in a local env which has the Apple Silicon M1 SO
 # the docker BUILDPLATFORM arg will be linux/arm64 when for Apple x86 it will be linux/amd64. Therefore,
 # by leaving it empty we can ensure that the container and binary shipped on it will have the same platform.
-RUN CGO_ENABLED=0 GOOS=${TARGETOS:-linux} GOARCH=${TARGETARCH} go build -a -o bin/vllm-sim cmd/cmd.go
+RUN CGO_ENABLED=0 GOOS=${TARGETOS:-linux} GOARCH=${TARGETARCH} go build -a -o bin/llm-d-inference-sim cmd/cmd.go
 
 # Use distroless as minimal base image to package the manager binary
 # Refer to https://github.com/GoogleContainerTools/distroless for more details
 FROM registry.access.redhat.com/ubi9/ubi:latest
 WORKDIR /
-COPY --from=builder /workspace/bin/vllm-sim /app/vllm-sim
+COPY --from=builder /workspace/bin/llm-d-inference-sim /app/llm-d-inference-sim
 USER 65532:65532
 
-ENTRYPOINT ["/app/vllm-sim"]
+ENTRYPOINT ["/app/llm-d-inference-sim"]
 
 
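The `RUN go build` line in this Dockerfile rests on POSIX default-value expansion: `${TARGETOS:-linux}` falls back to `linux` when `TARGETOS` is unset or empty, while a bare `${TARGETARCH}` expands to nothing when unset, letting `go build` pick the host architecture (which is the behavior the Dockerfile comment describes). A quick demonstration of the expansion itself, outside Docker:

```shell
# Demonstrate ${VAR:-default} vs bare ${VAR} as used in the RUN line above.
unset TARGETOS TARGETARCH

# Unset: the :-default kicks in, the bare expansion is empty.
echo "GOOS=${TARGETOS:-linux} GOARCH=${TARGETARCH:-}"
# -> GOOS=linux GOARCH=

# Set (e.g. by docker buildx for a linux/arm64 target): values pass through.
TARGETOS=linux TARGETARCH=arm64
echo "GOOS=${TARGETOS:-linux} GOARCH=${TARGETARCH}"
# -> GOOS=linux GOARCH=arm64
```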

Makefile (15 additions, 14 deletions)

@@ -1,4 +1,4 @@
-# Copyright 2025 The vLLM-Sim Authors.
+# Copyright 2025 The llm-d-inference-sim Authors.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
@@ -12,33 +12,34 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 
-# Makefile for the vllm-sim project
+# Makefile for the llm-d-inference-sim project
+
 CONTAINER_RUNTIME ?= docker
 
-PACKAGE_VLLM_SIM = github.com/neuralmagic/vllm-sim/cmd/vllm-sim
-VLLM_SIM_NAME = vllm-sim/vllm-sim
+PACKAGE_VLLM_SIM = github.com/llm-d/llm-d-inference-sim/cmd/llm-d-inference-sim
+VLLM_SIM_NAME = llm-d-inference-sim/llm-d-inference-sim
 VLLM_SIM_TAG ?= 0.0.2
 
-.PHONY: build-vllm-sim
-build-vllm-sim:
+.PHONY: build-llm-d-inference-sim
+build-llm-d-inference-sim:
 	go build -o bin/ ${PACKAGE_VLLM_SIM}
 
-.PHONY: build-vllm-sim-linux
-build-vllm-sim-linux:
+.PHONY: build-llm-d-inference-sim-linux
+build-llm-d-inference-sim-linux:
 	CGO_ENABLED=0 GOOS=linux GOARCH=amd64 go build -o bin/linux/ ${PACKAGE_VLLM_SIM}
 
-.PHONY: build-vllm-sim-image
-build-vllm-sim-image: build-vllm-sim-linux
-	$(CONTAINER_RUNTIME) build --file build/vllm-sim.Dockerfile --tag ${VLLM_SIM_NAME}:${VLLM_SIM_TAG} ./bin/linux
+.PHONY: build-llm-d-inference-sim-image
+build-llm-d-inference-sim-image: build-llm-d-inference-sim-linux
+	$(CONTAINER_RUNTIME) build --file build/llm-d-inference-sim.Dockerfile --tag ${VLLM_SIM_NAME}:${VLLM_SIM_TAG} ./bin/linux
 
 
 SHELL := /usr/bin/env bash
 
 # Defaults
-PROJECT_NAME ?= vllm-sim
+PROJECT_NAME ?= llm-d-inference-sim
 DEV_VERSION ?= 0.0.1
 PROD_VERSION ?= 0.0.0
-IMAGE_TAG_BASE ?= quay.io/llm-d/$(PROJECT_NAME)
+IMAGE_TAG_BASE ?= ghcr.io/llm-d/$(PROJECT_NAME)
 IMG = $(IMAGE_TAG_BASE):$(DEV_VERSION)
 NAMESPACE ?= hc4ai-operator
 
@@ -264,7 +265,7 @@ load-version-json: check-jq
 	export DEV_VERSION; \
 	export PROD_VERSION; \
 	fi && \
-	CURRENT_DEFAULT="quay.io/llm-d/$(PROJECT_NAME)"; \
+	CURRENT_DEFAULT="ghcr.io/llm-d/$(PROJECT_NAME)"; \
 	if [ "$(IMAGE_TAG_BASE)" = "$$CURRENT_DEFAULT" ]; then \
 	IMAGE_TAG_BASE=$$(jq -r '."dev-registry"' .version.json); \
 	echo "✔ Loaded IMAGE_TAG_BASE from .version.json: $$IMAGE_TAG_BASE"; \
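The `load-version-json` recipe above only overrides `IMAGE_TAG_BASE` when it still holds the built-in default, so an explicit `IMAGE_TAG_BASE=...` on the `make` command line wins over `.version.json`. Extracted as a standalone shell sketch (assumes `jq`; the temp file mirrors `.version.json`):

```shell
# Sketch of the override logic in the Makefile's load-version-json target:
# replace IMAGE_TAG_BASE with dev-registry from .version.json only when it
# still equals the default ghcr.io/llm-d/$(PROJECT_NAME).
set -eu

dir=$(mktemp -d)
printf '%s\n' '{"dev-registry": "ghcr.io/llm-d/llm-d-inference-sim-dev"}' \
  > "$dir/.version.json"

PROJECT_NAME=llm-d-inference-sim
IMAGE_TAG_BASE="ghcr.io/llm-d/${PROJECT_NAME}"     # still the default
CURRENT_DEFAULT="ghcr.io/llm-d/${PROJECT_NAME}"

if [ "$IMAGE_TAG_BASE" = "$CURRENT_DEFAULT" ]; then
  IMAGE_TAG_BASE=$(jq -r '."dev-registry"' "$dir/.version.json")
fi

echo "$IMAGE_TAG_BASE"
# -> ghcr.io/llm-d/llm-d-inference-sim-dev
```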

README.md (4 additions, 4 deletions)

@@ -89,13 +89,13 @@ For more details see the <a href="https://docs.vllm.ai/en/stable/getting_started
 ### Building
 To build a Docker image of the vLLM Simulator, run:
 ```bash
-make build-vllm-sim-image
+make build-llm-d-inference-sim-image
 ```
 
 ### Running
 To run the vLLM Simulator image under Docker, run:
 ```bash
-docker run --rm --publish 8000:8000 ai-aware-router/vllm-sim:0.0.1 /ai-aware-router/vllm-sim --port 8000 --model "Qwen/Qwen2.5-1.5B-Instruct" --lora "tweet-summary-0,tweet-summary-1"
+docker run --rm --publish 8000:8000 ai-aware-router/llm-d-inference-sim:0.0.1 /ai-aware-router/llm-d-inference-sim --port 8000 --model "Qwen/Qwen2.5-1.5B-Instruct" --lora "tweet-summary-0,tweet-summary-1"
 ```
 **Note:** The above command exposes the simulator on port 8000, and serves the Qwen/Qwen2.5-1.5B-Instruct model.
 
@@ -104,13 +104,13 @@ docker run --rm --publish 8000:8000 ai-aware-router/vllm-sim:0.0.1 /ai-aware-rou
 ### Building
 To build the vLLM simulator, run:
 ```bash
-make build-vllm-sim
+make build-llm-d-inference-sim
 ```
 
 ### Running
 To run the router in a standalone test environment, run:
 ```bash
-./bin/vllm-sim --model my_model --port 8000
+./bin/llm-d-inference-sim --model my_model --port 8000
 ```
 

build/vllm-sim.Dockerfile (4 additions, 4 deletions)

@@ -1,4 +1,4 @@
-# Copyright 2025 The vLLM-Sim Authors.
+# Copyright 2025 The llm-d-inference-sim Authors.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
@@ -14,8 +14,8 @@
 
 FROM alpine:3.21
 
-ADD --chmod=777 ./vllm-sim /vllm-sim/
+ADD --chmod=777 ./llm-d-inference-sim /llm-d-inference-sim/
 
-WORKDIR /vllm-sim/
+WORKDIR /llm-d-inference-sim/
 
-ENTRYPOINT ["/vllm-sim/vllm-sim"]
+ENTRYPOINT ["/llm-d-inference-sim/llm-d-inference-sim"]

cmd/vllm-sim/main.go renamed to cmd/llm-d-inference-sim/main.go (3 additions, 3 deletions)

@@ -1,5 +1,5 @@
 /*
-Copyright 2025 The vLLM-Sim Authors.
+Copyright 2025 The llm-d-inference-sim Authors.
 
 Licensed under the Apache License, Version 2.0 (the "License");
 you may not use this file except in compliance with the License.
@@ -23,8 +23,8 @@ import (
 
 	"k8s.io/klog/v2"
 
-	"github.com/neuralmagic/vllm-sim/cmd/signals"
-	vllmsim "github.com/neuralmagic/vllm-sim/pkg/vllm-sim"
+	"github.com/llm-d/llm-d-inference-sim/cmd/signals"
+	vllmsim "github.com/llm-d/llm-d-inference-sim/pkg/llm-d-inference-sim"
 )
 
 func main() {
