semantic-search/ONNX_quantize.ps1
2026-04-02 16:28:27 +02:00

29 lines
1.1 KiB
PowerShell

# Local snapshot folder of the model; passed to the exporter via -m further down.
$TARGET_PTH = "B:\projects\MOP-TOM\models\models--BAAI--bge-reranker-v2-m3\snapshots\953dc6f6f85a1b2dbfca4c34a2796e7dde08d41e"
# Model identifier; not referenced by any other line visible in this script.
$MODEL_NAME = 'BAAI/bge-reranker-v2-m3'
# All relative paths are anchored at the current working directory.
$base = Get-Location
# Build the candidate path first and resolve it only when it exists.
# Join-Path -Resolve writes an error and returns nothing for a missing folder,
# which would leave $model_path empty and break the existence check that follows.
$model_candidate = Join-Path $base "..\models"
$model_path = if (Test-Path -LiteralPath $model_candidate) {
    (Resolve-Path -LiteralPath $model_candidate).Path
} else {
    $model_candidate
}
# Output folders: the ONNX export, and the quantized model nested inside it.
$MODEL_EXPORT = Join-Path $model_path "onnx_test"
$MODEL_EXPORT_QUANT = Join-Path $MODEL_EXPORT "quant"
Write-Host "Path to base: $base"
Write-Host "Path to model folder: $model_path"
# Abort early when the model folder is unavailable.
# The emptiness guard matters because Test-Path rejects a $null path with a
# binding error instead of returning $false.
if ($model_path -and (Test-Path -LiteralPath $model_path -PathType Container)) {
    Write-Host "Model directory found"
} else {
    Write-Host "Model directory not found: $model_path"
    # Non-zero status so callers and CI can detect the failure
    # (a bare `exit` reports success).
    exit 1
}
# Set the three process environment variables below to the model folder.
# NOTE(review): presumably read by the Python tooling started via pdm — confirm.
foreach ($env_name in 'SENTENCE_TRANSFORMERS_HOME', 'TRANSFORMERS_CACHE', 'HF_HOME') {
    Set-Item -Path "Env:$env_name" -Value $model_path
}
# Step 1: export the model at $TARGET_PTH to ONNX in $MODEL_EXPORT.
# Change the condition to $false to skip this step.
if ($true) {
    # Variant without the optimization flag:
    # pdm run optimum-cli export onnx -m $TARGET_PTH --task text-classification $MODEL_EXPORT
    pdm run optimum-cli export onnx -m $TARGET_PTH --task text-classification --optimize O1 $MODEL_EXPORT
    # $? is $false when the command exited non-zero or could not be started.
    # Stop here so later steps never run against a missing or partial export.
    if (-not $?) {
        Write-Host "ONNX export failed (last exit code: $LASTEXITCODE)"
        exit 1
    }
}
# Step 2: quantize the ONNX model in $MODEL_EXPORT and write it to $MODEL_EXPORT_QUANT.
# Change the condition to $false to skip this step.
if ($true) {
    # Variant that takes $TARGET_PTH as the ONNX model input instead:
    # pdm run optimum-cli onnxruntime quantize --onnx_model $TARGET_PTH -o $MODEL_EXPORT_QUANT --avx2
    pdm run optimum-cli onnxruntime quantize --onnx_model $MODEL_EXPORT -o $MODEL_EXPORT_QUANT --avx2
    # $? is $false when the command exited non-zero or could not be started.
    # Exit non-zero so the script does not report success after a failure.
    if (-not $?) {
        Write-Host "ONNX quantization failed (last exit code: $LASTEXITCODE)"
        exit 1
    }
}