This repository was archived by the owner on Jul 4, 2025. It is now read-only.

Commit 7e1dd01
Authored by Gabrielle Ong
Merge branch 'dev' into j/add-docs-cors
2 parents ed39e16 + 24bebed
File tree: 102 files changed, +4296 −990 lines


.github/workflows/beta-build.yml

Lines changed: 2 additions & 1 deletion

````diff
@@ -89,7 +89,7 @@ jobs:
       new_version: ${{ needs.get-update-version.outputs.new_version }}
     runs-on: ubuntu-latest
     cmake-extra-flags: "-DCORTEX_VARIANT=prod"
-    tags: "menloltd/cortex:${{ needs.get-update-version.outputs.new_version }}"
+    tags: "menloltd/cortex:beta-${{ needs.get-update-version.outputs.new_version }}"

   update_release:
     needs: [get-update-version, create-draft-release, build-macos, build-windows-x64, build-linux-x64]
@@ -140,4 +140,5 @@ jobs:
       - Network Installer: https://github.com/janhq/cortex.cpp/releases/download/v${{ env.VERSION }}/cortex-${{ env.VERSION }}-linux-amd64-network-installer.deb
       - Local Installer: https://github.com/janhq/cortex.cpp/releases/download/v${{ env.VERSION }}/cortex-${{ env.VERSION }}-linux-amd64-local-installer.deb
       - Binary: https://github.com/janhq/cortex.cpp/releases/download/v${{ env.VERSION }}/cortex-${{ env.VERSION }}-linux-amd64.tar.gz
+      - Docker: menloltd/cortex:beta-${{ env.VERSION }}
      - Github Release: https://github.com/janhq/cortex.cpp/releases/tag/v${{ env.VERSION }}
````

.github/workflows/cortex-cpp-quality-gate.yml

Lines changed: 38 additions & 2 deletions

````diff
@@ -99,7 +99,6 @@ jobs:

       - name: Run setup config
         run: |
-          rm ~/.cortexrc
           cd engine
           echo "huggingFaceToken: ${{ secrets.HUGGINGFACE_TOKEN_READ }}" > ~/.cortexrc
           echo "gitHubToken: ${{ secrets.PAT_SERVICE_ACCOUNT }}" >> ~/.cortexrc
@@ -115,7 +114,6 @@ jobs:

       - name: Run setup config
         run: |
-          rm ~/.cortexrc
           cd engine
           echo "huggingFaceToken: ${{ secrets.HUGGINGFACE_TOKEN_READ }}" > ~/.cortexrc
           echo "gitHubToken: ${{ secrets.PAT_SERVICE_ACCOUNT }}" >> ~/.cortexrc
@@ -189,3 +187,41 @@ jobs:
           AWS_ACCESS_KEY_ID: "${{ secrets.MINIO_ACCESS_KEY_ID }}"
           AWS_SECRET_ACCESS_KEY: "${{ secrets.MINIO_SECRET_ACCESS_KEY }}"
           AWS_DEFAULT_REGION: "${{ secrets.MINIO_REGION }}"
+
+  build-docker-and-test:
+    runs-on: ubuntu-latest
+    steps:
+      - name: Getting the repo
+        uses: actions/checkout@v3
+        with:
+          submodules: 'recursive'
+
+      - name: Set up QEMU
+        uses: docker/setup-qemu-action@v3
+
+      - name: Set up Docker Buildx
+        uses: docker/setup-buildx-action@v3
+
+      - name: Run Docker
+        run: |
+          docker build -t menloltd/cortex:test -f docker/Dockerfile .
+          docker run -it -d -p 3928:39281 --name cortex menloltd/cortex:test
+
+      - name: use python
+        uses: actions/setup-python@v5
+        with:
+          python-version: "3.10"
+
+      - name: Run e2e tests
+        run: |
+          cd engine
+          python -m pip install --upgrade pip
+          python -m pip install -r e2e-test/requirements.txt
+          pytest e2e-test/test_api_docker.py
+
+      - name: Run Docker
+        continue-on-error: true
+        if: always()
+        run: |
+          docker stop cortex
+          docker rm cortex
````
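A note on the new `build-docker-and-test` job: the `-p 3928:39281` flag publishes host port 3928 to the container's port 39281 (the Cortex API port used elsewhere in this commit). A small sketch of how such a `HOST:CONTAINER` mapping string splits, useful when scripting around this workflow; the helper name is mine, not part of the commit:

```python
def parse_port_mapping(flag: str) -> tuple[int, int]:
    """Split a Docker -p style HOST:CONTAINER mapping into a pair of ints."""
    host, container = flag.split(":")
    return int(host), int(container)

# The mapping used by the build-docker-and-test job:
host_port, container_port = parse_port_mapping("3928:39281")
print(host_port, container_port)  # 3928 39281
```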

.github/workflows/template-noti-discord.yaml

Lines changed: 1 addition & 1 deletion

````diff
@@ -42,5 +42,5 @@ jobs:
       - Network Installer: https://delta.jan.ai/cortex/v${{ env.VERSION }}/linux-amd64/cortex-${{ env.VERSION }}-linux-amd64-network-installer.deb
       - Local Installer: https://delta.jan.ai/cortex/v${{ env.VERSION }}/linux-amd64/cortex-${{ env.VERSION }}-linux-amd64-local-installer.deb
       - Binary: https://delta.jan.ai/cortex/v${{ env.VERSION }}/linux-amd64/cortex-nightly.tar.gz
-      - Docker: menloltd/cortex:${{ env.VERSION }}
+      - Docker: menloltd/cortex:nightly-${{ env.VERSION }}
       - Github action run: https://github.com/janhq/cortex.cpp/actions/runs/${{ env.RUNNER_ID }}
````
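The fix above prefixes the Docker tag with the release channel (`nightly-` here, `beta-` in beta-build.yml) so that nightly and beta images no longer collide with stable version tags. A sketch of the tag composition; the helper function is illustrative, not part of the commit:

```python
def docker_tag(version: str, channel: str = "") -> str:
    """Compose the menloltd/cortex image tag, optionally prefixed by a release channel."""
    prefix = f"{channel}-" if channel else ""
    return f"menloltd/cortex:{prefix}{version}"

print(docker_tag("1.0.3", "nightly"))  # menloltd/cortex:nightly-1.0.3
print(docker_tag("1.0.3", "beta"))     # menloltd/cortex:beta-1.0.3
print(docker_tag("1.0.3"))             # menloltd/cortex:1.0.3 (stable, no prefix)
```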

docker/entrypoint.sh

Lines changed: 3 additions & 3 deletions

````diff
@@ -2,13 +2,13 @@

 # Install cortex.llamacpp engine

+echo "apiServerHost: 0.0.0.0" > /root/.cortexrc
+echo "enableCors: true" >> /root/.cortexrc
+
 cortex engines install llama-cpp -s /opt/cortex.llamacpp
-cortex -v

 # Start the cortex server

-sed -i 's/apiServerHost: 127.0.0.1/apiServerHost: 0.0.0.0/' /root/.cortexrc
-
 cortex start

 # Keep the container running by tailing the log files
````
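The entrypoint change seeds `/root/.cortexrc` with the two settings up front instead of patching the file with `sed` after the fact, so the server binds to all interfaces and CORS is enabled from the first start. A Python sketch of the equivalent config write; the keys and values come from the diff, but the function and the temp-directory target (instead of `/root`) are mine:

```python
import pathlib
import tempfile

def write_cortexrc(directory: str) -> pathlib.Path:
    """Write the two settings the Docker entrypoint now seeds before `cortex start`."""
    path = pathlib.Path(directory) / ".cortexrc"
    path.write_text("apiServerHost: 0.0.0.0\nenableCors: true\n")
    return path

with tempfile.TemporaryDirectory() as d:
    rc = write_cortexrc(d)
    print(rc.read_text())
```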
Lines changed: 99 additions & 3 deletions

````diff
@@ -1,7 +1,103 @@
 ---
 title: Embeddings
 ---
-
 :::info
-🚧 Cortex is currently under development, and this page is a stub for future development.
-:::
+🚧 Cortex is currently under development, and this page is a stub for future development.
+:::
+
+cortex.cpp now supports an embeddings endpoint that is fully OpenAI-compatible.
+
+For embeddings API usage, please refer to the [API reference](/api-reference#tag/chat/POST/v1/embeddings). This tutorial shows you how to use embeddings in Cortex with the OpenAI Python SDK.
+
+## Embeddings with the OpenAI-compatible API
+
+### 1. Start the server and run a model
+
+```
+cortex run llama3.1:8b-gguf-q4-km
+```
+
+### 2. Create a script `embeddings.py` with this content
+
+```
+from datetime import datetime
+from openai import OpenAI
+from pydantic import BaseModel
+
+ENDPOINT = "http://localhost:39281/v1"
+MODEL = "llama3.1:8b-gguf-q4-km"
+client = OpenAI(
+    base_url=ENDPOINT,
+    api_key="not-needed"
+)
+```
+
+### 3. Create embeddings
+
+```
+response = client.embeddings.create(input="embedding", model=MODEL, encoding_format="base64")
+print(response)
+```
+
+The response will look like this:
+
+```
+CreateEmbeddingResponse(
+    data=[
+        Embedding(
+            embedding='hjuAPOD8TryuPU8...',
+            index=0,
+            object='embedding'
+        )
+    ],
+    model='meta-llama3.1-8b-instruct',
+    object='list',
+    usage=Usage(
+        prompt_tokens=2,
+        total_tokens=2
+    )
+)
+```
````
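The base64 payload in the response above is, by OpenAI SDK convention, a packed array of little-endian float32 values; I am assuming Cortex follows the same convention. A self-contained round-trip sketch of decoding it, using a made-up three-value vector rather than real model output:

```python
import base64
import struct

def decode_embedding(b64: str) -> list[float]:
    """Decode a base64 embedding payload into a list of float32 values."""
    raw = base64.b64decode(b64)
    # Each float32 is 4 bytes, little-endian ("<f").
    return list(struct.unpack(f"<{len(raw) // 4}f", raw))

# Round-trip a made-up vector to show the encoding.
vector = [0.1, 0.3, 0.4]
payload = base64.b64encode(struct.pack(f"<{len(vector)}f", *vector)).decode()
decoded = decode_embedding(payload)
print([round(x, 4) for x in decoded])  # [0.1, 0.3, 0.4]
```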
````diff
+
+The output embedding is encoded as a base64 string. By default, the model outputs embeddings in float mode:
+
+```
+response = client.embeddings.create(input="embedding", model=MODEL)
+print(response)
+```
+
+The result will be:
+
+```
+CreateEmbeddingResponse(
+    data=[
+        Embedding(
+            embedding=[0.1, 0.3, 0.4, ...],
+            index=0,
+            object='embedding'
+        )
+    ],
+    model='meta-llama3.1-8b-instruct',
+    object='list',
+    usage=Usage(
+        prompt_tokens=2,
+        total_tokens=2
+    )
+)
+```
````
````diff
+
+Cortex also supports all input types supported by [OpenAI](https://platform.openai.com/docs/api-reference/embeddings/create#embeddings-create-input):
+
+```sh
+# input as a string
+response = client.embeddings.create(input="embedding", model=MODEL)
+
+# input as an array of strings
+response = client.embeddings.create(input=["embedding"], model=MODEL)
+
+# input as an array of tokens
+response = client.embeddings.create(input=[12, 44, 123], model=MODEL)
+
+# input as an array of token arrays
+response = client.embeddings.create(input=[[912, 312, 54], [12, 433, 1241]], model=MODEL)
+```
````
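Once float embeddings are back on the client, a common next step is comparing two of them. A minimal cosine-similarity sketch in plain Python; this is an editorial aside, not part of the commit:

```python
import math

def cosine_similarity(a: list[float], b: list[float]) -> float:
    """Cosine similarity between two equal-length embedding vectors."""
    dot = sum(x * y for x, y in zip(a, b))
    norm_a = math.sqrt(sum(x * x for x in a))
    norm_b = math.sqrt(sum(x * x for x in b))
    return dot / (norm_a * norm_b)

# Identical vectors score ~1.0; orthogonal vectors score ~0.0.
print(cosine_similarity([0.1, 0.3, 0.4], [0.1, 0.3, 0.4]))
print(cosine_similarity([1.0, 0.0], [0.0, 1.0]))
```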
Lines changed: 6 additions & 1 deletion

````diff
@@ -1,8 +1,13 @@
 ---
 title: Hardware Awareness
-draft: True
+description: The Hardware Awareness section overview
 ---

+:::warning
+🚧 Cortex.cpp is currently under development. Our documentation outlines the intended behavior of Cortex, which may not yet be fully implemented in the codebase.
+:::
+
 # Hardware Awareness

 Cortex is designed to be hardware aware, meaning it can detect your hardware configuration and automatically set parameters to optimize compatibility and performance, and avoid hardware-related errors.
````

docs/docs/capabilities/models/sources/index.mdx

Lines changed: 1 addition & 1 deletion

````diff
@@ -272,7 +272,7 @@ curl --request POST \
 Clients can abort a downloading task using the task ID. Below is a sample `curl` command to abort a download task:

 ```sh
-curl --location --request DELETE 'http://127.0.0.1:3928/models/pull' \
+curl --location --request DELETE 'http://127.0.0.1:39281/v1/models/pull' \
 --header 'Content-Type: application/json' \
 --data '{
     "taskId": "tinyllama:1b-gguf-q2-k"
````
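The same abort call at the corrected endpoint can be built from Python's standard library. This sketch only constructs the request, it does not send it (sending would require a running Cortex server); to actually issue it you would pass `req` to `urllib.request.urlopen`:

```python
import json
import urllib.request

# Build (but do not send) the abort-download request from the doc above.
body = json.dumps({"taskId": "tinyllama:1b-gguf-q2-k"}).encode()
req = urllib.request.Request(
    "http://127.0.0.1:39281/v1/models/pull",
    data=body,
    method="DELETE",
    headers={"Content-Type": "application/json"},
)
print(req.get_method(), req.full_url)  # DELETE http://127.0.0.1:39281/v1/models/pull
```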

docs/docs/cli/hardware/index.mdx

Lines changed: 116 additions & 0 deletions

````diff
@@ -0,0 +1,116 @@
+---
+title: Cortex Hardware
+---
+
+import Tabs from "@theme/Tabs";
+import TabItem from "@theme/TabItem";
+
+# `cortex hardware`
+
+This command allows you to manage and monitor hardware resources.
+
+**Usage**:
+:::info
+You can use the `--verbose` flag to display more detailed output of the internal processes. To apply this flag, use the following format: `cortex --verbose [subcommand]`.
+:::
+<Tabs>
+  <TabItem value="MacOs/Linux" label="MacOs/Linux">
+  ```sh
+  cortex hardware [options] [subcommand]
+  ```
+  </TabItem>
+  <TabItem value="Windows" label="Windows">
+  ```sh
+  cortex.exe hardware [options]
+  ```
+  </TabItem>
+</Tabs>
+
+**Options**:
+
+| Option         | Description                                | Required | Default value | Example |
+|----------------|--------------------------------------------|----------|---------------|---------|
+| `-h`, `--help` | Display help information for the command.  | No       | -             | `-h`    |
+
+---
+# Subcommands:
+
+## `cortex hardware list`
+:::info
+This CLI command calls the following API endpoint:
+- [List Hardware](/api-reference#tag/hardware/get/v1/hardware)
+:::
+This command lists all the hardware resources.
+
+**Usage**:
+<Tabs>
+  <TabItem value="MacOs/Linux" label="MacOs/Linux">
+  ```sh
+  cortex hardware list [options]
+  ```
+  </TabItem>
+  <TabItem value="Windows" label="Windows">
+  ```sh
+  cortex.exe hardware list [options]
+  ```
+  </TabItem>
+</Tabs>
+
+For example, it returns the following:
+```bash
+OS Information:
++---+----------------------------+--------------------+
+| # | Version                    | Name               |
++---+----------------------------+--------------------+
+| 1 | 24.04.1 LTS (Noble Numbat) | Ubuntu 24.04.1 LTS |
++---+----------------------------+--------------------+
+```
+
+**Options**:
+
+| Option         | Description                  | Required | Default value | Example      |
+|----------------|------------------------------|----------|---------------|--------------|
+| `-h`, `--help` | Display help for command.    | No       | -             | `-h`         |
+| `--cpu`        | Display CPU information.     | No       | -             | `--cpu`      |
+| `--os`         | Display OS information.      | No       | -             | `--os`       |
+| `--ram`        | Display RAM information.     | No       | -             | `--ram`      |
+| `--storage`    | Display storage information. | No       | -             | `--storage`  |
+| `--gpu`        | Display GPU information.     | No       | -             | `--gpu`      |
+| `--power`      | Display power information.   | No       | -             | `--power`    |
+| `--monitors`   | Display monitor information. | No       | -             | `--monitors` |
+
+## `cortex hardware activate`
+
+:::info
+This CLI command calls the following API endpoint:
+- [Activate Hardware](/api-reference#tag/hardware/post/v1/hardware/activate)
+:::
+This command activates Cortex hardware; currently only GPUs are supported.
+
+**Usage**:
+<Tabs>
+  <TabItem value="MacOs/Linux" label="MacOs/Linux">
+  ```sh
+  cortex hardware activate [options]
+  ```
+  </TabItem>
+  <TabItem value="Windows" label="Windows">
+  ```sh
+  cortex.exe hardware activate [options]
+  ```
+  </TabItem>
+</Tabs>
+
+For example, it returns the following:
+```bash
+Activated GPUs: 0
+```
+
+**Options**:
+
+| Option         | Description                | Required | Default value | Example  |
+|----------------|----------------------------|----------|---------------|----------|
+| `-h`, `--help` | Display help for command.  | No       | -             | `-h`     |
+| `--gpus`       | List of GPUs to activate.  | Yes      | -             | `[0, 1]` |
````
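The `--gpus` option in the new docs takes a bracketed list such as `[0, 1]`. A small sketch of parsing that form, purely illustrative; the real parsing lives inside the cortex.cpp CLI, and this helper is my own:

```python
import json

def parse_gpus(arg: str) -> list[int]:
    """Parse a --gpus argument like "[0, 1]" into a list of GPU indices."""
    gpus = json.loads(arg)  # the bracketed form is valid JSON
    if not isinstance(gpus, list) or not all(
        isinstance(g, int) and g >= 0 for g in gpus
    ):
        raise ValueError(f"invalid GPU list: {arg}")
    return gpus

print(parse_gpus("[0, 1]"))  # [0, 1]
```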

docs/docs/cli/models/index.mdx

Lines changed: 1 addition & 0 deletions

````diff
@@ -157,6 +157,7 @@ This command uses a `model_id` from the model that you have downloaded or available
 | Option         | Description                                    | Required | Default value                                | Example   |
 |----------------|------------------------------------------------|----------|----------------------------------------------|-----------|
 | `model_id`     | The identifier of the model you want to start. | Yes      | `Prompt to select from the available models` | `mistral` |
+| `--gpus`       | List of GPUs to use.                           | No       | -                                            | `[0,1]`   |
 | `-h`, `--help` | Display help information for the command.      | No       | -                                            | `-h`      |

 ## `cortex models stop`
````

docs/docs/cli/models/start.md

Lines changed: 5 additions & 11 deletions

````diff
@@ -12,34 +12,28 @@ description: Cortex models subcommands.
 This command starts a model defined by a `model_id`.


-
 ## Usage

 ```bash
 # Start a model
 cortex models start [model_id]

-# Start a model with a preset
-cortex models start [model_id] [options]
-
 # Start with a specified engine
 cortex models start [model_id]:[engine] [options]
 ```


 :::info
 - This command uses a `model_id` from the model that you have downloaded or available in your file system.
-- Model preset is applied only at the start of the model and does not change during the chat session.
 :::

 ## Options

-| Option                    | Description                                    | Required | Default value                                | Example       |
-|---------------------------|------------------------------------------------|----------|----------------------------------------------|---------------|
-| `model_id`                | The identifier of the model you want to start. | No       | `Prompt to select from the available models` | `mistral`     |
-| `-a`, `--attach`          | Attach to an interactive chat session.         | No       | `false`                                      | `-a`          |
-| `-p`, `--preset <preset>` | Apply a chat preset to the chat session.       | No       | `false`                                      | `-p friendly` |
-| `-h`, `--help`            | Display help information for the command.      | No       | -                                            | `-h`          |
+| Option         | Description                                    | Required | Default value                                | Example   |
+|----------------|------------------------------------------------|----------|----------------------------------------------|-----------|
+| `model_id`     | The identifier of the model you want to start. | No       | `Prompt to select from the available models` | `mistral` |
+| `--gpus`       | List of GPUs to use.                           | No       | -                                            | `[0,1]`   |
+| `-h`, `--help` | Display help information for the command.      | No       | -                                            | `-h`      |
````
