Skip to content

Commit e18d204

Browse files
authored
[main] links (#3227)
1 parent 646b76a commit e18d204

File tree

12 files changed

+31
-30
lines changed

12 files changed

+31
-30
lines changed

demos/c_api_minimal_app/Makefile

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -25,13 +25,13 @@ BASE_OS ?= ubuntu24
2525

2626
ifeq ($(BASE_OS),ubuntu24)
2727
BASE_OS_TAG_UBUNTU ?= 24.04
28-
PACKAGE_URL ?="https://github.com/openvinotoolkit/model_server/releases/download/v2025.0/ovms_ubuntu24.tar.gz"
28+
PACKAGE_URL ?="https://github.com/openvinotoolkit/model_server/releases/download/v2025.1/ovms_ubuntu24.tar.gz"
2929
BASE_IMAGE ?= ubuntu:$(BASE_OS_TAG_UBUNTU)
3030
DIST_OS=ubuntu
3131
endif
3232
ifeq ($(BASE_OS),redhat)
3333
BASE_OS_TAG_REDHAT ?= 9.5
34-
PACKAGE_URL ="https://github.com/openvinotoolkit/model_server/releases/download/v2025.0/ovms_redhat.tar.gz"
34+
PACKAGE_URL ="https://github.com/openvinotoolkit/model_server/releases/download/v2025.1/ovms_redhat.tar.gz"
3535
BASE_IMAGE ?= registry.access.redhat.com/ubi9/ubi:$(BASE_OS_TAG_REDHAT)
3636
DIST_OS=redhat
3737
endif

demos/code_local_assistant/README.md

Lines changed: 5 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -33,7 +33,7 @@ Since we do not want to wait for the code to appear, we need to use smaller mode
3333
Code completion works in non-streaming, unary mode. Do not use instruct model, there is no chat involved in the process.
3434

3535
Export `Qwen/Qwen2.5-Coder-1.5B`:
36-
```baconsolesh
36+
```console
3737
python export_model.py text_generation --source_model Qwen/Qwen2.5-Coder-1.5B --weight-format int4 --config_file_path models/config_all.json --model_repository_path models --target_device NPU --overwrite_models
3838
```
3939

@@ -54,7 +54,7 @@ Examine that workspace is set up properly `models/config_all.json`:
5454
}
5555
```
5656

57-
```console
57+
```bash
5858
tree models
5959
models
6060
├── codellama
@@ -100,13 +100,14 @@ Run OpenVINO Model Server with both models loaded at the same time:
100100
### Windows: deploying on bare metal
101101
Please refer to OpenVINO Model Server installation first: [link](../../docs/deploying_server_baremetal.md)
102102

103-
```console
103+
```bat
104104
ovms --rest_port 8000 --config_path ./models/config_all.json
105105
```
106106

107107
### Linux: via Docker
108108
```bash
109-
docker run -d --rm -v $(pwd)/:/workspace/ -p 8000:8000 openvino/model_server:2025.1 --rest_port 8000 --config_path /workspace/models/config_all.json
109+
docker run -d --rm --device /dev/accel --group-add=$(stat -c "%g" /dev/dri/render* | head -n 1) -u $(id -u):$(id -g) \
110+
-p 8000:8000 -v $(pwd)/:/workspace/ openvino/model_server:2025.1 --rest_port 8000 --config_path /workspace/models/config_all.json
110111
```
111112

112113
## Set Up Visual Studio Code

demos/continuous_batching/README.md

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -33,8 +33,8 @@ LLM engine parameters will be defined inside the `graph.pbtxt` file.
3333

3434
Download export script, install its dependencies and create directory for the models:
3535
```console
36-
curl https://raw.githubusercontent.com/openvinotoolkit/model_server/refs/heads/releases/2025/0/demos/common/export_models/export_model.py -o export_model.py
37-
pip3 install -r https://raw.githubusercontent.com/openvinotoolkit/model_server/refs/heads/releases/2025/0/demos/common/export_models/requirements.txt
36+
curl https://raw.githubusercontent.com/openvinotoolkit/model_server/refs/heads/releases/2025/1/demos/common/export_models/export_model.py -o export_model.py
37+
pip3 install -r https://raw.githubusercontent.com/openvinotoolkit/model_server/refs/heads/releases/2025/1/demos/common/export_models/requirements.txt
3838
mkdir models
3939
```
4040

demos/continuous_batching/rag/README.md

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -4,8 +4,8 @@
44
## Creating models repository for all the endpoints
55

66
```console
7-
curl https://raw.githubusercontent.com/openvinotoolkit/model_server/refs/heads/releases/2025/0/demos/common/export_models/export_model.py -o export_model.py
8-
pip3 install -r https://raw.githubusercontent.com/openvinotoolkit/model_server/refs/heads/releases/2025/0/demos/common/export_models/requirements.txt
7+
curl https://raw.githubusercontent.com/openvinotoolkit/model_server/refs/heads/releases/2025/1/demos/common/export_models/export_model.py -o export_model.py
8+
pip3 install -r https://raw.githubusercontent.com/openvinotoolkit/model_server/refs/heads/releases/2025/1/demos/common/export_models/requirements.txt
99

1010
mkdir models
1111
python export_model.py text_generation --source_model meta-llama/Meta-Llama-3-8B-Instruct --weight-format int8 --kv_cache_precision u8 --config_file_path models/config_all.json --model_repository_path models

demos/continuous_batching/speculative_decoding/README.md

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -35,8 +35,8 @@ LLM engine parameters will be defined inside the `graph.pbtxt` file.
3535

3636
Download export script, install its dependencies and create directory for the models:
3737
```console
38-
curl https://raw.githubusercontent.com/openvinotoolkit/model_server/refs/heads/main/demos/common/export_models/export_model.py -o export_model.py
39-
pip3 install -r https://raw.githubusercontent.com/openvinotoolkit/model_server/refs/heads/main/demos/common/export_models/requirements.txt
38+
curl https://raw.githubusercontent.com/openvinotoolkit/model_server/refs/heads/releases/2025/1/demos/common/export_models/export_model.py -o export_model.py
39+
pip3 install -r https://raw.githubusercontent.com/openvinotoolkit/model_server/refs/heads/releases/2025/1/demos/common/export_models/requirements.txt
4040
mkdir models
4141
```
4242

demos/continuous_batching/vlm/README.md

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -24,8 +24,8 @@ Execution parameters will be defined inside the `graph.pbtxt` file.
2424

2525
Download export script, install its dependencies and create directory for the models:
2626
```console
27-
curl https://raw.githubusercontent.com/openvinotoolkit/model_server/main/demos/common/export_models/export_model.py -o export_model.py
28-
pip3 install -r https://raw.githubusercontent.com/openvinotoolkit/model_server/main/demos/common/export_models/requirements.txt
27+
curl https://raw.githubusercontent.com/openvinotoolkit/model_server/refs/heads/releases/2025/1/demos/common/export_models/export_model.py -o export_model.py
28+
pip3 install -r https://raw.githubusercontent.com/openvinotoolkit/model_server/refs/heads/releases/2025/1/demos/common/export_models/requirements.txt
2929
mkdir models
3030
```
3131

demos/embeddings/README.md

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -17,8 +17,8 @@ That ensures faster initialization time, better performance and lower memory con
1717

1818
Download export script, install its dependencies and create directory for the models:
1919
```console
20-
curl https://raw.githubusercontent.com/openvinotoolkit/model_server/refs/heads/releases/2025/0/demos/common/export_models/export_model.py -o export_model.py
21-
pip3 install -r https://raw.githubusercontent.com/openvinotoolkit/model_server/refs/heads/releases/2025/0/demos/common/export_models/requirements.txt
20+
curl https://raw.githubusercontent.com/openvinotoolkit/model_server/refs/heads/releases/2025/1/demos/common/export_models/export_model.py -o export_model.py
21+
pip3 install -r https://raw.githubusercontent.com/openvinotoolkit/model_server/refs/heads/releases/2025/1/demos/common/export_models/requirements.txt
2222
mkdir models
2323
```
2424

demos/llm_npu/README.md

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -27,8 +27,8 @@ LLM engine parameters will be defined inside the `graph.pbtxt` file.
2727

2828
Download export script, install its dependencies and create directory for the models:
2929
```console
30-
curl https://raw.githubusercontent.com/openvinotoolkit/model_server/main/demos/common/export_models/export_model.py -o export_model.py
31-
pip3 install -r https://raw.githubusercontent.com/openvinotoolkit/model_server/main/demos/common/export_models/requirements.txt
30+
curl https://raw.githubusercontent.com/openvinotoolkit/model_server/refs/heads/releases/2025/1/demos/common/export_models/export_model.py -o export_model.py
31+
pip3 install -r https://raw.githubusercontent.com/openvinotoolkit/model_server/refs/heads/releases/2025/1/demos/common/export_models/requirements.txt
3232
mkdir models
3333
```
3434

demos/rerank/README.md

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -15,8 +15,8 @@ That ensures faster initialization time, better performance and lower memory con
1515

1616
Download export script, install its dependencies and create directory for the models:
1717
```console
18-
curl https://raw.githubusercontent.com/openvinotoolkit/model_server/refs/heads/releases/2025/0/demos/common/export_models/export_model.py -o export_model.py
19-
pip3 install -r https://raw.githubusercontent.com/openvinotoolkit/model_server/refs/heads/releases/2025/0/demos/common/export_models/requirements.txt
18+
curl https://raw.githubusercontent.com/openvinotoolkit/model_server/refs/heads/releases/2025/1/demos/common/export_models/export_model.py -o export_model.py
19+
pip3 install -r https://raw.githubusercontent.com/openvinotoolkit/model_server/refs/heads/releases/2025/1/demos/common/export_models/requirements.txt
2020
mkdir models
2121
```
2222

demos/vlm_npu/README.md

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -27,8 +27,8 @@ LLM engine parameters will be defined inside the `graph.pbtxt` file.
2727

2828
Download export script, install its dependencies and create directory for the models:
2929
```console
30-
curl https://raw.githubusercontent.com/openvinotoolkit/model_server/main/demos/common/export_models/export_model.py -o export_model.py
31-
pip3 install -r https://raw.githubusercontent.com/openvinotoolkit/model_server/main/demos/common/export_models/requirements.txt
30+
curl https://raw.githubusercontent.com/openvinotoolkit/model_server/refs/heads/releases/2025/1/demos/common/export_models/export_model.py -o export_model.py
31+
pip3 install -r https://raw.githubusercontent.com/openvinotoolkit/model_server/refs/heads/releases/2025/1/demos/common/export_models/requirements.txt
3232
mkdir models
3333
```
3434

docs/deploying_server_baremetal.md

Lines changed: 7 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -8,12 +8,12 @@ To deploy Model Server on baremetal, use pre-compiled binaries for Ubuntu22, Ubu
88
:sync: ubuntu-22-04
99
Download precompiled package (without python support):
1010
```{code} sh
11-
wget https://github.com/openvinotoolkit/model_server/releases/download/v2025.0/ovms_ubuntu22.tar.gz
11+
wget https://github.com/openvinotoolkit/model_server/releases/download/v2025.1/ovms_ubuntu22.tar.gz
1212
tar -xzvf ovms_ubuntu22.tar.gz
1313
```
1414
or precompiled package (with python and LLM support):
1515
```{code} sh
16-
wget https://github.com/openvinotoolkit/model_server/releases/download/v2025.0/ovms_ubuntu22_python_on.tar.gz
16+
wget https://github.com/openvinotoolkit/model_server/releases/download/v2025.1/ovms_ubuntu22_python_on.tar.gz
1717
tar -xzvf ovms_ubuntu22_python_on.tar.gz
1818
```
1919
Install required libraries:
@@ -36,12 +36,12 @@ pip3 install "Jinja2==3.1.6" "MarkupSafe==3.0.2"
3636
:sync: ubuntu-24-04
3737
Download precompiled package (without python support):
3838
```{code} sh
39-
wget https://github.com/openvinotoolkit/model_server/releases/download/v2025.0/ovms_ubuntu24.tar.gz
39+
wget https://github.com/openvinotoolkit/model_server/releases/download/v2025.1/ovms_ubuntu24.tar.gz
4040
tar -xzvf ovms_ubuntu24.tar.gz
4141
```
4242
or precompiled package (with python and LLM support):
4343
```{code} sh
44-
wget https://github.com/openvinotoolkit/model_server/releases/download/v2025.0/ovms_ubuntu24_python_on.tar.gz
44+
wget https://github.com/openvinotoolkit/model_server/releases/download/v2025.1/ovms_ubuntu24_python_on.tar.gz
4545
tar -xzvf ovms_ubuntu24_python_on.tar.gz
4646
```
4747
Install required libraries:
@@ -64,12 +64,12 @@ pip3 install "Jinja2==3.1.6" "MarkupSafe==3.0.2"
6464
:sync: rhel-9.5
6565
Download precompiled package (without python support):
6666
```{code} sh
67-
wget https://github.com/openvinotoolkit/model_server/releases/download/v2025.0/ovms_redhat.tar.gz
67+
wget https://github.com/openvinotoolkit/model_server/releases/download/v2025.1/ovms_redhat.tar.gz
6868
tar -xzvf ovms_redhat.tar.gz
6969
```
7070
or precompiled package (with python and LLM support):
7171
```{code} sh
72-
wget https://github.com/openvinotoolkit/model_server/releases/download/v2025.0/ovms_redhat_python_on.tar.gz
72+
wget https://github.com/openvinotoolkit/model_server/releases/download/v2025.1/ovms_redhat_python_on.tar.gz
7373
tar -xzvf ovms_redhat_python_on.tar.gz
7474
```
7575
Install required libraries:
@@ -95,7 +95,7 @@ Make sure you have [Microsoft Visual C++ Redistributable](https://aka.ms/vs/17/r
9595
Download and unpack model server archive for Windows:
9696

9797
```bat
98-
curl -L https://github.com/openvinotoolkit/model_server/releases/download/v2025.0/ovms_windows.zip -o ovms.zip
98+
curl -L https://github.com/openvinotoolkit/model_server/releases/download/v2025.1/ovms_windows.zip -o ovms.zip
9999
tar -xf ovms.zip
100100
```
101101

docs/llm/quickstart.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -15,7 +15,7 @@ pip3 install -r https://raw.githubusercontent.com/openvinotoolkit/model_server/r
1515

1616
2. Run optimum-cli to download and quantize the model:
1717
```console
18-
curl https://raw.githubusercontent.com/openvinotoolkit/model_server/refs/heads/main/demos/common/export_models/export_model.py -o export_model.py
18+
curl https://raw.githubusercontent.com/openvinotoolkit/model_server/refs/heads/releases/2025/1/demos/common/export_models/export_model.py -o export_model.py
1919
mkdir models
2020
python export_model.py text_generation --source_model deepseek-ai/DeepSeek-R1-Distill-Qwen-7B --weight-format int4 --config_file_path models/config.json --model_repository_path models --target_device GPU --cache 2
2121
```

0 commit comments

Comments
 (0)