Compare commits

9 Commits
main ... proto

Author SHA1 Message Date
7904a6ab2d prototyping 2026-04-10 15:26:30 +02:00
64b0216c62 ONNX optimisations 2026-04-02 16:28:27 +02:00
809f1a02c4 update deps 2026-03-25 15:32:55 +01:00
a2a8614304 add dep for model 2026-03-24 14:19:10 +01:00
ede9dfdd05 update deps 2026-03-18 18:11:44 +01:00
7c87e44067 change source of llama-cpp-python to local repo 2026-03-12 14:55:46 +01:00
1b421a4813 background preparation of similarity dataset with Llama-CPP 2026-03-12 14:52:15 +01:00
14be0728ff prepared datasets 2026-03-04 12:22:31 +01:00
696459a186 add Polars as dep 2026-03-04 10:21:48 +01:00
3 changed files with 1447 additions and 31 deletions

40
model_management.ps1 Normal file
View File

@@ -0,0 +1,40 @@
# Model management helper: optionally downloads a Hugging Face model into the
# project-local model folder, then exports it to ONNX (with O2 optimisation)
# and quantizes the exported model for AVX2.
#
# Run from a directory whose sibling "..\models" folder exists; all caches and
# export artefacts are placed below that folder.
#
# Exit status: 0 on success, 1 if the model folder is missing, otherwise the
# exit code of the first failing `pdm run` step.

# --- switches ---------------------------------------------------------------
$DOWNLOAD_MODEL = $false   # download $MODEL_NAME via `hf download`
$OPTIMISE = $true          # export $TARGET_PTH to ONNX and quantize the result

# --- model selection ---------------------------------------------------------
# $TARGET_PTH = "B:\projects\MOP-TOM\models\models--BAAI--bge-reranker-v2-m3\snapshots\953dc6f6f85a1b2dbfca4c34a2796e7dde08d41e"
# $MODEL_NAME = 'BAAI/bge-reranker-v2-m3'
# $TARGET_PTH = "B:\projects\MOP-TOM\models\models--jinaai--jina-reranker-v3\snapshots\10fb694fc21f7a710a563ff1eb977a460f3868e4"
# NOTE(review): $TARGET_PTH points at the jina-reranker-v2-base-multilingual
# snapshot while $MODEL_NAME names jina-reranker-v3, so the download step and
# the export step act on different models. Confirm this is intended.
$TARGET_PTH = "B:\projects\MOP-TOM\models\models--jinaai--jina-reranker-v2-base-multilingual\snapshots\9cfeff2df7d40d1b78e75e5e9cebec92a99813c9"
$MODEL_NAME = 'jinaai/jina-reranker-v3'

# --- paths -------------------------------------------------------------------
$base = Get-Location
$model_dir_candidate = Join-Path $base "..\models"

# Validate BEFORE resolving: resolving a non-existent path raises an error,
# which would pre-empt the friendly message below.
if (-not (Test-Path -Path $model_dir_candidate -PathType Container)) {
    Write-Host "Path to base: $base"
    Write-Host "Model directory not found: $model_dir_candidate"
    exit 1   # non-zero so callers can detect the failure
}

$model_path = (Resolve-Path -Path $model_dir_candidate).Path
$MODEL_EXPORT = Join-Path $model_path "onnx_tmp"
$MODEL_EXPORT_QUANT = Join-Path $MODEL_EXPORT "quant"

Write-Host "Path to base: $base"
Write-Host "Path to model folder: $model_path"
Write-Host "Model directory found"

# --- environment -------------------------------------------------------------
# Point every cache location used by the tooling at the project-local folder.
$Env:SENTENCE_TRANSFORMERS_HOME = $model_path
$Env:TRANSFORMERS_CACHE = $model_path
$Env:HF_HOME = $model_path
# NOTE(review): huggingface_hub documents HF_HUB_DISABLE_SYMLINKS_WARNING;
# confirm that this variable name is actually honoured by the installed version.
$Env:HF_HUB_DISABLE_SYMLINKS = 1

# --- download ----------------------------------------------------------------
if ($DOWNLOAD_MODEL) {
    pdm run hf download $MODEL_NAME
    if ($LASTEXITCODE -ne 0) {
        Write-Host "Model download failed with exit code $LASTEXITCODE"
        exit $LASTEXITCODE
    }
}

# --- ONNX export + quantization ----------------------------------------------
if ($OPTIMISE) {
    pdm run optimum-cli export onnx -m $TARGET_PTH --task text-classification --trust-remote-code --optimize O2 $MODEL_EXPORT
    # pdm run optimum-cli export onnx -m $TARGET_PTH --task text-classification $MODEL_EXPORT
    if ($LASTEXITCODE -ne 0) {
        # Do not quantize a missing or partial export.
        Write-Host "ONNX export failed with exit code $LASTEXITCODE"
        exit $LASTEXITCODE
    }

    pdm run optimum-cli onnxruntime quantize --onnx_model $MODEL_EXPORT -o $MODEL_EXPORT_QUANT --avx2
    # pdm run optimum-cli onnxruntime quantize --onnx_model $TARGET_PTH -o $MODEL_EXPORT_QUANT --avx2
    if ($LASTEXITCODE -ne 0) {
        Write-Host "ONNX quantization failed with exit code $LASTEXITCODE"
        exit $LASTEXITCODE
    }
}

1408
pdm.lock generated

File diff suppressed because it is too large Load Diff

View File

@@ -5,8 +5,8 @@ description = "use case for M.O.P. - T.O.M.: search semantically for problems an
authors = [
{name = "d-opt GmbH, resp. Florian Förster", email = "f.foerster@d-opt.com"},
]
dependencies = []
requires-python = ">=3.11"
dependencies = ["torch>=2.10.0", "torchvision>=0.25.0", "dopt-basics>=0.2.4", "llama-cpp-python>=0.3.16", "lancedb>=0.30.0", "pydantic>=2.12.5", "sentence-transformers>=5.3.0", "onnx>=1.20.1", "onnxruntime>=1.24.4", "tantivy>=0.25.1"]
requires-python = "<3.14,>=3.11"
readme = "README.md"
license = {text = "LicenseRef-Proprietary"}
@@ -122,14 +122,28 @@ package-dir = "src"
# Package index configuration for PDM. Three indexes are declared below; the
# include/exclude patterns route torch* to the PyTorch index and
# llama-cpp-python* to the private index, and keep llama-cpp* away from the
# torch and pypi sources.
[tool.pdm.resolution]
# Consult the sources in the order they are declared in this file.
respect-source-order = true
# PyTorch wheel index ("cu128" variant per the URL); restricted to torch* packages.
[[tool.pdm.source]]
name = "torch"
url = "https://download.pytorch.org/whl/cu128"
include_packages = ["torch*"]
exclude_packages = ["llama-cpp*"]
# Disabled alternative: remote wheel index for llama-cpp-python ("cu124" variant
# per the URL). NOTE(review): presumably superseded by the "private" source
# below - confirm before deleting.
# [[tool.pdm.source]]
# name = "llama-cpp-python-cuda"
# url = "https://abetlen.github.io/llama-cpp-python/whl/cu124"
# include_packages = ["llama-cpp-py*"]
# Index served from localhost:8001 over plain HTTP (certificate verification is
# switched off); restricted to llama-cpp-python*. Installing requires that
# server to be reachable on the local machine.
[[tool.pdm.source]]
name = "private"
url = "http://localhost:8001/simple"
verify_ssl = false
include_packages = ["llama-cpp-python*"]
# Public PyPI index; llama-cpp* is excluded here.
[[tool.pdm.source]]
name = "pypi"
url = "https://pypi.org/simple"
exclude_packages = ["llama-cpp*"]
[dependency-groups]
tests = [
"pytest>=8.3.4",
@@ -143,8 +157,20 @@ dev = [
"pdoc3>=0.11.5",
"bump-my-version>=1.1.1",
"nox>=2025.2.9",
"huggingface-hub<1.0",
"tqdm>=4.66.5",
"peft>=0.18.1",
"einops>=0.8.2",
"onnx>=1.20.1",
"triton-windows>=3.6.0.post26",
"xformers>=0.0.34",
"optimum[onnxruntime]>=2.1.0",
]
nb = [
"jupyterlab>=4.3.5",
"ipywidgets>=8.1.5",
]
data = [
"polars>=1.38.1",
"striprtf>=0.0.29",
]