Refactor extraction system and reorganize project structure

- Remove obsolete documentation files (DEPLOYMENT.md, PLAN_IMPLEMENTARE_S8_DETALIAT.md, README.md)
- Add comprehensive extraction pipeline with multiple format support (PDF, HTML, text)
- Implement Claude-based activity extraction with structured templates
- Update dependencies and Docker configuration
- Reorganize scripts directory with modular extraction components
- Move example documentation to appropriate location

🤖 Generated with [Claude Code](https://claude.ai/code)

Co-Authored-By: Claude <noreply@anthropic.com>
This commit is contained in:
2025-09-11 23:32:37 +03:00
parent 1b6b7e06ad
commit a19ddf0b71
119 changed files with 91074 additions and 1859 deletions

View File

@@ -1,18 +1,4 @@
services:
# Data indexing service (runs once on startup)
indexer:
build: .
command: python scripts/index_data.py
volumes:
- ./data:/app/data:rw
- ./docs/INDEX_MASTER_JOCURI_ACTIVITATI.md:/app/data/INDEX_MASTER_JOCURI_ACTIVITATI.md:ro
environment:
- DATABASE_URL=/app/data/activities.db
- INDEX_MASTER_FILE=/app/data/INDEX_MASTER_JOCURI_ACTIVITATI.md
restart: "no"
networks:
- app-network
# Main web application
web:
build: .
@@ -26,8 +12,6 @@ services:
- FLASK_PORT=5000
- DATABASE_URL=/app/data/activities.db
- SECRET_KEY=${SECRET_KEY:-production-secret-key-change-me}
depends_on:
- indexer
restart: unless-stopped
healthcheck:
test: ["CMD", "curl", "-f", "http://localhost:5000/health"]