fix: export only required models instead of entire Ollama directory
- Changed export-ollama-models.sh to selectively copy only qwen3:14b and qwen3-embedding:4b - Parses manifest files to identify required blob files - Significantly reduces Docker image size by excluding unrelated models - Added summary showing which models were skipped This prevents accidentally including other models (like deepseek-r1, bge-m3, etc.) that may exist in the user's Ollama directory but are not needed for the project.
This commit is contained in:
@@ -56,28 +56,73 @@ if [ ! -d "$OLLAMA_MODELS_PATH" ]; then
|
|||||||
exit 1
|
exit 1
|
||||||
fi
|
fi
|
||||||
|
|
||||||
# Create export directory
|
# Create export directory structure
|
||||||
echo ""
|
echo ""
|
||||||
echo "Creating export directory: $MODELS_DIR"
|
echo "Creating export directory: $MODELS_DIR"
|
||||||
rm -rf "$MODELS_DIR"
|
rm -rf "$MODELS_DIR"
|
||||||
mkdir -p "$MODELS_DIR"
|
mkdir -p "$MODELS_DIR/models/manifests/registry.ollama.ai/library"
|
||||||
|
mkdir -p "$MODELS_DIR/models/blobs"
|
||||||
|
|
||||||
echo ""
|
echo ""
|
||||||
echo "Copying Ollama data from $OLLAMA_MODELS_PATH to $MODELS_DIR..."
|
echo "Copying only required models (qwen3:14b and qwen3-embedding:4b)..."
|
||||||
echo "This may take several minutes (models are large)..."
|
echo "This may take several minutes (models are large)..."
|
||||||
|
|
||||||
# Copy the entire .ollama directory structure
|
# Function to get blob hashes from manifest
|
||||||
cp -r "$OLLAMA_MODELS_PATH"/* "$MODELS_DIR/"
|
get_blobs_from_manifest() {
|
||||||
|
local manifest_file=$1
|
||||||
|
# Extract all sha256 hashes from the manifest JSON
|
||||||
|
grep -oE 'sha256:[a-f0-9]{64}' "$manifest_file" 2>/dev/null | sed 's/sha256://' | sort -u
|
||||||
|
}
|
||||||
|
|
||||||
|
# Function to copy model files
|
||||||
|
copy_model() {
|
||||||
|
local model_name=$1
|
||||||
|
local model_tag=$2
|
||||||
|
local manifest_dir="$OLLAMA_MODELS_PATH/models/manifests/registry.ollama.ai/library/$model_name"
|
||||||
|
|
||||||
|
if [ ! -d "$manifest_dir" ]; then
|
||||||
|
echo "ERROR: Model manifest not found: $manifest_dir"
|
||||||
|
return 1
|
||||||
|
fi
|
||||||
|
|
||||||
|
echo " Copying $model_name:$model_tag manifest..."
|
||||||
|
mkdir -p "$MODELS_DIR/models/manifests/registry.ollama.ai/library/$model_name"
|
||||||
|
|
||||||
|
# Copy the specific tag manifest
|
||||||
|
if [ -f "$manifest_dir/$model_tag" ]; then
|
||||||
|
cp "$manifest_dir/$model_tag" "$MODELS_DIR/models/manifests/registry.ollama.ai/library/$model_name/"
|
||||||
|
|
||||||
|
# Get all blob hashes referenced in this manifest
|
||||||
|
echo " Finding blob files for $model_name:$model_tag..."
|
||||||
|
local blob_hashes=$(get_blobs_from_manifest "$manifest_dir/$model_tag")
|
||||||
|
local blob_count=0
|
||||||
|
|
||||||
|
for blob_hash in $blob_hashes; do
|
||||||
|
local blob_file="$OLLAMA_MODELS_PATH/models/blobs/sha256-$blob_hash"
|
||||||
|
if [ -f "$blob_file" ]; then
|
||||||
|
cp "$blob_file" "$MODELS_DIR/models/blobs/" 2>/dev/null
|
||||||
|
blob_count=$((blob_count + 1))
|
||||||
|
fi
|
||||||
|
done
|
||||||
|
|
||||||
|
echo " ✓ $model_name:$model_tag copied ($blob_count blobs)"
|
||||||
|
else
|
||||||
|
echo "ERROR: Manifest file not found: $manifest_dir/$model_tag"
|
||||||
|
return 1
|
||||||
|
fi
|
||||||
|
}
|
||||||
|
|
||||||
|
# Copy required models with specific tags
|
||||||
|
copy_model "qwen3" "14b" || exit 1
|
||||||
|
copy_model "qwen3-embedding" "4b" || exit 1
|
||||||
|
|
||||||
echo ""
|
echo ""
|
||||||
echo "=========================================="
|
echo "=========================================="
|
||||||
echo "Models exported successfully!"
|
echo "Models exported successfully!"
|
||||||
echo "=========================================="
|
echo "=========================================="
|
||||||
du -sh "$MODELS_DIR"
|
|
||||||
|
|
||||||
echo ""
|
echo ""
|
||||||
echo "Directory structure:"
|
echo "Total size:"
|
||||||
ls -lh "$MODELS_DIR/"
|
du -sh "$MODELS_DIR"
|
||||||
|
|
||||||
echo ""
|
echo ""
|
||||||
echo "Models included:"
|
echo "Models included:"
|
||||||
@@ -85,6 +130,24 @@ if [ -d "$MODELS_DIR/models/manifests/registry.ollama.ai/library" ]; then
|
|||||||
ls -lh "$MODELS_DIR/models/manifests/registry.ollama.ai/library/"
|
ls -lh "$MODELS_DIR/models/manifests/registry.ollama.ai/library/"
|
||||||
fi
|
fi
|
||||||
|
|
||||||
|
echo ""
|
||||||
|
echo "Blob files:"
|
||||||
|
if [ -d "$MODELS_DIR/models/blobs" ]; then
|
||||||
|
echo " Total blobs: $(ls -1 "$MODELS_DIR/models/blobs" | wc -l)"
|
||||||
|
du -sh "$MODELS_DIR/models/blobs"
|
||||||
|
fi
|
||||||
|
|
||||||
|
echo ""
|
||||||
|
echo "=========================================="
|
||||||
|
echo "Summary"
|
||||||
|
echo "=========================================="
|
||||||
|
echo "✓ Only qwen3:14b and qwen3-embedding:4b were exported"
|
||||||
|
echo ""
|
||||||
|
echo "Models in your Ollama that were NOT copied:"
|
||||||
|
ollama list | grep -v "qwen3:14b" | grep -v "qwen3-embedding:4b" | tail -n +2 || echo " (none)"
|
||||||
|
echo ""
|
||||||
|
echo "This keeps the Docker image size minimal!"
|
||||||
|
|
||||||
echo ""
|
echo ""
|
||||||
echo "=========================================="
|
echo "=========================================="
|
||||||
echo "Next steps:"
|
echo "Next steps:"
|
||||||
|
|||||||
Reference in New Issue
Block a user