| # Script to build vector store locally | |
| # Usage: ./scripts/build-vector-store.sh [--force-recreate] | |
| # | |
| # Environment variables that can be set: | |
| # FORCE_RECREATE - Set to "true" to force recreation of the vector store | |
| # OUTPUT_DIR - Directory to save stats and artifacts (default: ./artifacts) | |
| # USE_CHUNKING - Set to "false" to disable document chunking | |
| # SHOULD_SAVE_STATS - Set to "false" to disable saving document statistics | |
| # Parse command line arguments | |
| FORCE_RECREATE="" | |
| if [[ "$1" == "--force-recreate" ]]; then | |
| FORCE_RECREATE="--force-recreate" | |
| fi | |
| # Set output directory for artifacts (use environment variable if set) | |
| OUTPUT_DIR=${OUTPUT_DIR:-"./artifacts"} | |
| mkdir -p $OUTPUT_DIR | |
| echo "Building vector store with output to $OUTPUT_DIR" | |
| echo "Force recreate: ${FORCE_RECREATE:-false}" | |
| # Run pipeline in CI mode | |
| python py-src/pipeline.py $FORCE_RECREATE --ci --output-dir $OUTPUT_DIR | |
| # Check if successful | |
| if [ $? -eq 0 ]; then | |
| echo "Build successful!" | |
| # Create a zip of the vector store | |
| if [ -d "./db/vector_store_4" ]; then | |
| echo "Creating vector store zip file in $OUTPUT_DIR" | |
| cd db | |
| zip -r ../$OUTPUT_DIR/vector_store.zip vector_store_4 | |
| cd .. | |
| echo "Vector store zip created at $OUTPUT_DIR/vector_store.zip" | |
| fi | |
| echo "Artifacts available in $OUTPUT_DIR:" | |
| ls -la $OUTPUT_DIR | |
| else | |
| echo "Build failed!" | |
| exit 1 | |
| fi | |