Compare commits: production ... master (5 commits)

| Author | SHA1 | Date |
|---|---|---|
|  | adc002b38d |  |
|  | 5994d8ae7b |  |
|  | f68ada7204 |  |
|  | 2217bd5855 |  |
|  | fa5d59b069 |  |

.dockerignore (new file, 5 lines)
@@ -0,0 +1,5 @@
fly.toml
.git/
__pycache__/
.envrc
.venv/

Dockerfile (new file, 15 lines)
@@ -0,0 +1,15 @@
FROM python:3.13.1 AS builder

ENV PYTHONUNBUFFERED=1 \
    PYTHONDONTWRITEBYTECODE=1
WORKDIR /app


RUN python -m venv .venv
COPY requirements.txt ./
RUN .venv/bin/pip install -r requirements.txt
FROM python:3.13.1-slim
WORKDIR /app
COPY --from=builder /app/.venv .venv/
COPY . .
CMD ["/app/.venv/bin/flask", "run", "--host=0.0.0.0", "--port=8080"]

README.md (25 changed lines)
@@ -1,18 +1,22 @@
# Torn User Activity Scraper
# Torn User Activity Tracker

> [!WARNING]
> **Development is still in its early stages; do not put it to productive use!**

## Features

- Start and stop scraping user activity data
- View real-time logs
- Download data and log files
- View scraping results and statistics
- View scraping results
- Plugin-based analysis system
- Toggle between light and dark mode

**Note:** Many features are not fully implemented yet, but the activity tracker/grabber works as intended.

## Planned Features

- Additional analyses
- Additional analyses plugins
- Selector for Torn API data to choose which data shall be tracked
- Improved / fixed log viewer

@@ -24,6 +28,21 @@
- Flask-WTF
- Pandas
- Requests
- Redis
- Celery

Redis currently has to run locally, but this will change in the future. To point the app at a different Redis instance, edit tasks.py:

```python
# tasks.py
def get_redis():
    return redis.StrictRedis(
        host='localhost',
        port=6379,
        db=0,
        decode_responses=True
    )
```

## Installation

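The hard-coded `localhost` connection quoted above is straightforward to parameterize. A minimal sketch of one way to do it — the `REDIS_HOST`/`REDIS_PORT` environment variable names are illustrative, not part of the repository:

```python
# Sketch: the same get_redis(), reading the connection from the environment.
# REDIS_HOST / REDIS_PORT are hypothetical variable names.
import os
import redis

def get_redis():
    return redis.StrictRedis(
        host=os.environ.get("REDIS_HOST", "localhost"),
        port=int(os.environ.get("REDIS_PORT", "6379")),
        db=0,
        decode_responses=True,
    )
```
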
app/__init__.py
@@ -7,15 +7,18 @@ from app.views import register_views
from app.api import register_api
from app.config import load_config
from app.filters import register_filters
from app.tasks import celery

from app.logging_config import init_logger

def create_app():
def create_app(config=None):
    app = Flask(__name__)

    os.environ['TZ'] = 'UTC'

    if config is None:
        config = load_config()
    app.config.update(config)

    os.environ['TZ'] = 'UTC'

    app.config['SECRET_KEY'] = config['DEFAULT']['SECRET_KEY']

@@ -23,6 +26,9 @@ def create_app():
    for key, value in config.get('BOOTSTRAP', {}).items():
        app.config[key.upper()] = value

    # Initialize Celery
    celery.conf.update(app.config)

    bootstrap = Bootstrap5(app)

    # Store the entire config in Flask app

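The new `config=None` parameter makes the factory testable without a config file on disk. A hedged usage sketch — the keys mirror those read in `create_app` above, the values are illustrative:

```python
# Sketch: building the app with an injected config, e.g. in a test.
from app import create_app

test_config = {
    'DEFAULT': {'SECRET_KEY': 'test-secret', 'API_KEY': 'test-key'},  # illustrative values
    'BOOTSTRAP': {},
}
app = create_app(config=test_config)
```
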
app/api.py (85 changed lines)
@@ -1,4 +1,3 @@
# filepath: /home/michaelb/Dokumente/TornActivityTracker/app/api.py
from flask import jsonify, request, Response, send_from_directory, current_app
import threading
import os
@@ -10,6 +9,7 @@ from app.models import Scraper
from app.util import create_zip, delete_old_zips, tail
from app.config import load_config
from app.forms import ScrapingForm
from app.tasks import start_scraping_task, stop_scraping_task, get_redis

scraping_thread = None
scraper = None
@@ -18,42 +18,40 @@ scrape_lock = threading.Lock()
def register_api(app):
    @app.route('/start_scraping', methods=['POST'])
    def start_scraping():
        global scraping_thread, scraper
        with scrape_lock:
            scraper = current_app.config.get('SCRAPER')
            if scraper is not None and scraper.scraping_active:
                current_app.logger.warning("Can't start scraping process: scraping already in progress")
                return jsonify({"status": "Scraping already in progress"})

            form = ScrapingForm()
            if form.validate_on_submit():
                redis_client = get_redis()
                faction_id = form.faction_id.data
                fetch_interval = form.fetch_interval.data
                run_interval = form.run_interval.data

                scraper = Scraper(faction_id, fetch_interval, run_interval, app)
                scraper.scraping_active = True
                # Check if scraping is already active
                if redis_client.hget(f"scraper:{faction_id}", "scraping_active") == "1":
                    return jsonify({"status": "Scraping already in progress"})

                scraping_thread = threading.Thread(target=scraper.start_scraping, args=(app,))
                scraping_thread.daemon = True
                scraping_thread.start()

                current_app.config['SCRAPER'] = scraper
                current_app.config['SCRAPING_THREAD'] = scraping_thread
                # Convert config to a serializable dict with only needed values
                config_dict = {
                    'DATA': {'DATA_DIR': current_app.config['DATA']['DATA_DIR']},
                    'DEFAULT': {'API_KEY': current_app.config['DEFAULT']['API_KEY']}
                }

                start_scraping_task.delay(
                    faction_id,
                    int(form.fetch_interval.data),  # Ensure this is an int
                    int(form.run_interval.data),  # Ensure this is an int
                    config_dict
                )
                return jsonify({"status": "Scraping started"})
        return jsonify({"status": "Invalid form data"})

    @app.route('/stop_scraping', methods=['POST'])
    def stop_scraping():
        scraper = current_app.config.get('SCRAPER')
        if scraper is None or not scraper.scraping_active:
            return jsonify({"status": "Scraping is not running"})
        redis_client = get_redis()
        faction_id = redis_client.get("current_faction_id")
        if not faction_id:
            return jsonify({"status": "No active scraping session"})

        stop_scraping_task.delay(faction_id)
        return jsonify({"status": "Stopping scraping"})

        scraper.stop_scraping()
        current_app.config['SCRAPING_ACTIVE'] = False
        current_app.logger.debug("Scraping stopped by user")
        return jsonify({"status": "Scraping stopped"})
    @app.route('/logfile', methods=['GET'])
    def logfile():
        log_file_name = current_app.logger.handlers[0].baseFilename
@@ -196,20 +194,37 @@ def register_api(app):

    @app.route('/scraping_status', methods=['GET'])
    def scraping_status():
        if scraper is None:
            current_app.logger.debug("Scraper is not initialized.")
        redis_client = get_redis()
        current_faction_id = redis_client.get("current_faction_id")

        if not current_faction_id:
            return jsonify({"scraping_active": False})

        if scraper.scraping_active:
            current_app.logger.debug("Scraping is active.")
            return jsonify({"scraping_active": True})
        else:
            current_app.logger.debug("Scraping is not active.")
        scraping_active = redis_client.hget(f"scraper:{current_faction_id}", "scraping_active")

        # If we have a faction_id but scraping is not active, clean up the stale state
        if not scraping_active or scraping_active == "0":
            redis_client.delete("current_faction_id")
            return jsonify({"scraping_active": False})

        return jsonify({
            "scraping_active": True,
            "faction_id": current_faction_id
        })

    @app.route('/scraping_get_end_time')
    def scraping_get_end_time():
        if scraper is None:
            current_app.logger.debug("Scraper is not initialized.")
        redis_client = get_redis()
        current_faction_id = redis_client.get("current_faction_id")

        if not current_faction_id:
            return jsonify({"scraping_active": False})
        return jsonify({"end_time": scraper.end_time})

        end_time = redis_client.hget(f"scraper:{current_faction_id}", "end_time")
        if not end_time:
            return jsonify({"scraping_active": False})

        return jsonify({
            "end_time": end_time,
            "faction_id": current_faction_id
        })

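For reference, a quick smoke test of the reworked status endpoint — a sketch that assumes the app is reachable locally; the port depends on how the app is run (8080 in the Dockerfile, Flask's default 5000 under run.py):

```python
# Sketch: polling the status endpoint from outside the app.
import requests

resp = requests.get("http://localhost:8080/scraping_status", timeout=5)
print(resp.json())  # e.g. {"scraping_active": false} while idle
```
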
app/filters.py
@@ -4,4 +4,12 @@ from datetime import datetime
def register_filters(app):
    @app.template_filter('datetimeformat')
    def datetimeformat(value):
        return datetime.fromtimestamp(value).strftime('%Y-%m-%d %H:%M:%S')
        """Convert datetime or timestamp to formatted string"""
        if isinstance(value, datetime):
            dt = value
        else:
            try:
                dt = datetime.fromtimestamp(float(value))
            except (ValueError, TypeError):
                return str(value)
        return dt.strftime('%Y-%m-%d %H:%M:%S')

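The reworked filter now accepts both `datetime` objects and raw timestamps, and falls back to `str()` for anything else. A standalone check of the same logic outside Flask (sketch):

```python
# Sketch: exercising the datetimeformat logic with the three input kinds it handles.
from datetime import datetime

for value in (1739232000, datetime(2025, 2, 11), "not-a-timestamp"):
    if isinstance(value, datetime):
        dt = value
    else:
        try:
            dt = datetime.fromtimestamp(float(value))
        except (ValueError, TypeError):
            print(str(value))  # fallback: returned unchanged as a string
            continue
    print(dt.strftime('%Y-%m-%d %H:%M:%S'))
```
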
app/models.py
@@ -5,21 +5,60 @@ import os
import time
from datetime import datetime, timedelta
from requests.exceptions import ConnectionError, Timeout, RequestException
import redis
import threading

from flask import current_app

class Scraper:
    def __init__(self, faction_id, fetch_interval, run_interval, app):
    _instances = {}  # Track all instances by faction_id
    _lock = threading.Lock()

    def __new__(cls, faction_id, *args, **kwargs):
        with cls._lock:
            # Stop any existing instance for this faction
            if faction_id in cls._instances:
                old_instance = cls._instances[faction_id]
                old_instance.stop_scraping()

            instance = super().__new__(cls)
            cls._instances[faction_id] = instance
            return instance

    def __init__(self, faction_id, fetch_interval, run_interval, config):
        # Only initialize if not already initialized
        if not hasattr(self, 'faction_id'):
            self.redis_client = redis.StrictRedis(
                host='localhost', port=6379, db=0, decode_responses=True
            )
            self.faction_id = faction_id
            self.fetch_interval = fetch_interval
            self.run_interval = run_interval
            self.end_time = datetime.now() + timedelta(days=run_interval)
            self.data_file_name = os.path.join(app.config['DATA']['DATA_DIR'], f"{self.faction_id}-{datetime.now().strftime('%Y-%m-%d-%H-%M')}.csv")
            self.scraping_active = False
            self.API_KEY = app.config['DEFAULT']['API_KEY']
            self.logger = app.logger
            self.API_KEY = config['DEFAULT']['API_KEY']
            self.data_file_name = os.path.join(
                config['DATA']['DATA_DIR'],
                f"{faction_id}-{datetime.now().strftime('%Y-%m-%d-%H-%M')}.csv"
            )
            self.end_time = datetime.now() + timedelta(days=int(run_interval))

            print(self.data_file_name)
            # Store scraper state in Redis
            self.redis_client.hmset(f"scraper:{faction_id}", {
                "faction_id": faction_id,
                "fetch_interval": fetch_interval,
                "run_interval": run_interval,
                "end_time": self.end_time.isoformat(),
                "data_file_name": self.data_file_name,
                "scraping_active": "0",
                "api_key": self.API_KEY
            })

    @property
    def scraping_active(self):
        return bool(int(self.redis_client.hget(f"scraper:{self.faction_id}", "scraping_active")))

    @scraping_active.setter
    def scraping_active(self, value):
        self.redis_client.hset(f"scraper:{self.faction_id}", "scraping_active", "1" if value else "0")

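The `scraping_active` property above persists a boolean as `"0"`/`"1"` in a Redis hash, so every worker process sees the same flag. A generic sketch of the same pattern — note the getter here also guards against a missing key, which the property above would trip over via `int(None)`:

```python
# Sketch: a reusable Redis-backed boolean flag.
import redis

class RedisFlag:
    def __init__(self, client, key, field):
        self.client = client
        self.key = key
        self.field = field

    def get(self) -> bool:
        raw = self.client.hget(self.key, self.field)
        return raw is not None and bool(int(raw))

    def set(self, value: bool) -> None:
        self.client.hset(self.key, self.field, "1" if value else "0")

flag = RedisFlag(redis.StrictRedis(decode_responses=True), "scraper:12345", "scraping_active")
```
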
    def fetch_faction_data(self):
        url = f"https://api.torn.com/faction/{self.faction_id}?selections=&key={self.API_KEY}"
@@ -48,16 +87,14 @@ class Scraper:
                time.sleep(2 ** attempt)  # Exponential backoff
        return None

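The retry loop above sleeps `2 ** attempt` seconds between attempts. The general shape of that pattern, as a self-contained sketch (`max_attempts` and the URL handling are illustrative, not the repository's exact code):

```python
# Sketch: fetch with exponential backoff, mirroring the pattern above.
import time
import requests

def fetch_with_backoff(url, max_attempts=5):
    for attempt in range(max_attempts):
        try:
            response = requests.get(url, timeout=10)
            response.raise_for_status()
            return response.json()
        except requests.RequestException:
            time.sleep(2 ** attempt)  # 1s, 2s, 4s, ... between attempts
    return None
```
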

    def start_scraping(self, app) -> None:
    def start_scraping(self) -> None:
        """Starts the scraping process until the end time is reached or stopped manually."""
        self.scraping_active = True

        # Explicitly set the application context
        with app.app_context():
        current_app.logger.info(f"Starting scraping for faction ID {self.faction_id}")
        current_app.logger.debug(f"Fetch interval: {self.fetch_interval}s, Run interval: {self.run_interval} days, End time: {self.end_time}")

        MAX_FAILURES = 5  # Stop after 5 consecutive failures
        MAX_FAILURES = 5
        failure_count = 0

        while datetime.now() < self.end_time and self.scraping_active:
@@ -122,6 +159,18 @@ class Scraper:
        except Exception as e:
            current_app.logger.error(f"Error saving data to {self.data_file_name}: {e}")

    def cleanup_redis_state(self):
        """Clean up all Redis state for this scraper instance"""
        if hasattr(self, 'faction_id'):
            self.redis_client.delete(f"scraper:{self.faction_id}")
            current_id = self.redis_client.get("current_faction_id")
            if current_id and current_id == str(self.faction_id):
                self.redis_client.delete("current_faction_id")
            # Remove from instances tracking
            with self._lock:
                if self.faction_id in self._instances:
                    del self._instances[self.faction_id]

    def handle_scraping_end(self) -> None:
        """Handles cleanup and logging when scraping ends."""
        if not self.scraping_active:
@@ -133,7 +182,13 @@ class Scraper:

        current_app.logger.info("Scraping completed.")
        self.scraping_active = False
        self.cleanup_redis_state()

    def stop_scraping(self):
        self.scraping_active = False
        current_app.logger.debug("Scraping stopped by user")
        self.cleanup_redis_state()
        current_app.logger.debug(f"Scraping stopped for faction {self.faction_id}")

    def __del__(self):
        """Ensure Redis cleanup on object destruction"""
        self.cleanup_redis_state()

@@ -12,6 +12,7 @@ export class ScraperUtils {

        this.serverTime = null;
        this.endTime = null;
        this.pollInterval = null; // Add this line

        this.init();
    }
@@ -20,7 +21,6 @@ export class ScraperUtils {
        this.showLoadingIndicator();

        try {
            // Ensure each function runs only once
            await Promise.all([
                this.updateServerTime(),
                this.checkScrapingStatus()
@@ -29,8 +29,12 @@ export class ScraperUtils {
            console.error("Error during initialization:", error);
        }

        // Ensure end time is fetched only if scraping is active
        if (this.endTime === null) {
        // Start polling for status updates
        this.startPolling();

        // Only start the clock and wait for end time if scraping is active
        if (this.activityIndicator.textContent === 'Active') {
            if (!this.endTime) {
                try {
                    await this.fetchEndTime();
                } catch (error) {
@@ -38,22 +42,28 @@ export class ScraperUtils {
                }
            }

            // Ensure UI is only updated once everything is ready
            if (this.serverTime && this.endTime) {
                this.startClock();
                this.hideLoadingIndicator();
            } else {
                console.warn("Delaying hiding the loading indicator due to missing data...");
                const checkDataInterval = setInterval(() => {
                    if (this.serverTime && this.endTime) {
                        clearInterval(checkDataInterval);
                        this.startClock();
                        this.hideLoadingIndicator();
                    }
                }, 500);
            }
        }

        // Hide loading indicator regardless of scraping status
        this.hideLoadingIndicator();
    }

    startPolling() {
        // Poll every 2 seconds
        this.pollInterval = setInterval(async () => {
            await this.checkScrapingStatus();
        }, 2000);
    }

    stopPolling() {
        if (this.pollInterval) {
            clearInterval(this.pollInterval);
            this.pollInterval = null;
        }
    }

    showLoadingIndicator() {
        this.statusContainer.classList.remove('d-none');
@@ -79,9 +89,7 @@ export class ScraperUtils {
        this.activityIndicator.classList.add('text-bg-success');
        this.activityIndicator.textContent = 'Active';

        console.log(`Scraping is active until ${data.end_time} TCT`);

        // Only call fetchEndTime() if endTime is not already set
        // Fetch end time if we don't have it yet
        if (!this.endTime) {
            await this.fetchEndTime();
        }
@@ -98,6 +106,9 @@ export class ScraperUtils {

        this.endTimeElement.classList.add('d-none');
        this.timeLeftElement.classList.add('d-none');

        // Reset end time when inactive
        this.endTime = null;
    }
    } catch (error) {
        console.error('Error checking scraping status:', error);
@@ -177,4 +188,16 @@ export class ScraperUtils {
        const seconds = totalSeconds % 60;
        return `${String(hours).padStart(2, '0')}:${String(minutes).padStart(2, '0')}:${String(seconds).padStart(2, '0')}`;
    }

    // Add cleanup method
    cleanup() {
        this.stopPolling();
    }
}

// Add event listener for page unload
window.addEventListener('unload', () => {
    if (window.scraperUtils) {
        window.scraperUtils.cleanup();
    }
});

app/tasks.py (new file, 93 lines)
@@ -0,0 +1,93 @@
from celery import Celery
from app.models import Scraper
import redis
from datetime import timedelta
from flask import current_app

def create_celery():
    celery = Celery('tasks', broker='redis://localhost:6379/0')
    celery.conf.update(
        task_serializer='json',
        accept_content=['json'],
        result_serializer='json',
        timezone='UTC'
    )
    return celery

def init_celery(app):
    """Initialize Celery with Flask app context"""
    celery = create_celery()
    celery.conf.update(app.config)

    class ContextTask(celery.Task):
        def __call__(self, *args, **kwargs):
            with app.app_context():
                return self.run(*args, **kwargs)

    celery.Task = ContextTask
    return celery

celery = create_celery()  # This will be initialized properly in app/__init__.py

def get_redis():
    return redis.StrictRedis(
        host='localhost',
        port=6379,
        db=0,
        decode_responses=True
    )

@celery.task
def start_scraping_task(faction_id, fetch_interval, run_interval, config_dict):
    """
    Start scraping task with serializable parameters
    Args:
        faction_id: ID of the faction to scrape
        fetch_interval: Interval between fetches in seconds
        run_interval: How long to run the scraper in days
        config_dict: Dictionary containing configuration
    """
    try:
        redis_client = get_redis()
        # Set current faction ID at task start
        redis_client.set("current_faction_id", str(faction_id))

        scraper = Scraper(
            faction_id=faction_id,
            fetch_interval=int(fetch_interval),
            run_interval=int(run_interval),
            config=config_dict
        )
        scraper.start_scraping()
        return {"status": "success"}
    except Exception as e:
        # Clean up Redis state on error
        redis_client = get_redis()
        redis_client.delete("current_faction_id")
        return {"status": "error", "message": str(e)}

@celery.task
def stop_scraping_task(faction_id):
    """Stop scraping task and clean up Redis state"""
    try:
        redis_client = get_redis()

        # Clean up Redis state
        redis_client.hset(f"scraper:{faction_id}", "scraping_active", "0")
        redis_client.delete(f"scraper:{faction_id}")

        # Clean up current_faction_id if it matches
        current_id = redis_client.get("current_faction_id")
        if current_id and current_id == str(faction_id):
            redis_client.delete("current_faction_id")

        # Revoke any running tasks for this faction
        celery.control.revoke(
            celery.current_task.request.id,
            terminate=True,
            signal='SIGTERM'
        )

        return {"status": "success", "message": f"Stopped scraping for faction {faction_id}"}
    except Exception as e:
        return {"status": "error", "message": str(e)}

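A hedged invocation sketch for the task above — it requires a running Redis broker and a Celery worker consuming the `tasks` app, and all concrete values are illustrative:

```python
# Sketch: enqueueing the scraping task from application code.
from app.tasks import start_scraping_task

config_dict = {
    "DATA": {"DATA_DIR": "/tmp/data"},            # illustrative path
    "DEFAULT": {"API_KEY": "your-torn-api-key"},  # illustrative key
}
result = start_scraping_task.delay(12345, 60, 7, config_dict)
print(result.id)  # AsyncResult id; check progress with result.ready()
```
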
app/views.py (86 changed lines)
@@ -2,6 +2,8 @@ import os
import glob
from flask import render_template, Blueprint, current_app, request

from app.tasks import get_redis

from app.forms import ScrapingForm
from app.util import get_size
from app.config import load_config
@@ -13,6 +15,14 @@ from datetime import datetime

views_bp = Blueprint("views", __name__)

def sizeof_fmt(num, suffix="B"):
    """Convert bytes to human readable format"""
    for unit in ["", "Ki", "Mi", "Gi", "Ti", "Pi", "Ei", "Zi"]:
        if abs(num) < 1024.0:
            return f"{num:3.1f} {unit}{suffix}"
        num /= 1024.0
    return f"{num:.1f} Yi{suffix}"

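A quick check of `sizeof_fmt` (sketch; expected outputs follow from the definition above):

```python
# Sketch: sizeof_fmt on a few sizes.
print(sizeof_fmt(0))           # '0.0 B'
print(sizeof_fmt(123456789))   # '117.7 MiB'
print(sizeof_fmt(10**15))      # '909.5 TiB'
```
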
def register_views(app):
    @app.route('/')
    def index():
@@ -29,49 +39,59 @@ def register_views(app):

    @app.route('/download_results')
    def download_results():
        log_file_name = os.path.abspath(app.config['LOG_FILE_NAME'])
        scraper = app.config.get('SCRAPER')
        # Get the current active log file and data file from Redis and app config
        redis_client = get_redis()
        current_faction_id = redis_client.get("current_faction_id")

        if scraper:
            print(scraper.data_file_name)
        if not scraper:
            print("Scraper not initialized")
        active_data_file = None
        if current_faction_id:
            active_data_file = redis_client.hget(f"scraper:{current_faction_id}", "data_file_name")

        data_dir = os.path.abspath(current_app.config['DATA']['DATA_DIR'])
        log_dir = os.path.abspath(current_app.config['LOGGING']['LOG_DIR'])
        active_log_file = app.config['LOG_FILE_NAME']

        data_files = glob.glob(os.path.join(data_dir, "*.csv"))
        log_files = glob.glob(os.path.join(log_dir, "*.log"))
        def get_file_info(file_path, file_type='data'):
            stats = os.stat(file_path)
            name = os.path.basename(file_path)

            # Determine if file is active
            is_active = False
            if file_type == 'data' and active_data_file:
                is_active = os.path.abspath(file_path) == os.path.abspath(active_data_file)
            elif file_type == 'log' and active_log_file:
                is_active = os.path.basename(file_path) == os.path.basename(active_log_file)

        def get_file_info(file_path):
            return {
                "name": file_path,
                "name_display": os.path.basename(file_path),
                "last_modified": os.path.getmtime(file_path),
                "created": os.path.getctime(file_path),
                "size": get_size(file_path)
                'name': file_path,  # Full path for internal use
                'name_display': name,  # Just filename for display
                'last_modified': stats.st_mtime,  # Send timestamp instead of datetime
                'created': stats.st_ctime,  # Send timestamp instead of datetime
                'size': sizeof_fmt(stats.st_size),
                'active': is_active
            }

        data_files_info = [get_file_info(file) for file in data_files]
        log_files_info = [get_file_info(file) for file in log_files]
        data_files = []
        log_files = []

        if scraper and scraper.scraping_active:
            for data_file in data_files_info:
                if os.path.abspath(scraper.data_file_name) == data_file['name']:
                    data_file['active'] = True
                else:
                    data_file['active'] = False
        # Get data files
        data_dir = os.path.abspath(app.config['DATA']['DATA_DIR'])
        if os.path.exists(data_dir):
            for file in glob.glob(os.path.join(data_dir, "*.csv")):
                data_files.append(get_file_info(file, 'data'))

            for log_file in log_files_info:
                if log_file_name == os.path.abspath(log_file['name']):
                    log_file['active'] = True
                else:
                    log_file['active'] = False
        # Get log files
        log_dir = os.path.abspath(app.config['LOGGING']['LOG_DIR'])
        if os.path.exists(log_dir):
            for file in glob.glob(os.path.join(log_dir, "*.log")):
                log_files.append(get_file_info(file, 'log'))

        data_files_info.sort(key=lambda x: x['last_modified'], reverse=True)
        log_files_info.sort(key=lambda x: x['last_modified'], reverse=True)
        # Sort files by modification time, newest first
        data_files.sort(key=lambda x: x['last_modified'], reverse=True)
        log_files.sort(key=lambda x: x['last_modified'], reverse=True)

        files = {"data": data_files_info, "log": log_files_info}
        files = {
            'data': data_files,
            'log': log_files
        }

        return render_template('download_results.html', files=files)

@@ -120,7 +140,7 @@ def register_views(app):

    @views_bp.route('/server_time')
    def server_time():
        current_time = datetime.utcnow().strftime('%Y-%m-%d %H:%M:%S')
        current_time = datetime.now(datetime.timezone.utc).strftime('%Y-%m-%d %H:%M:%S')
        return {'server_time': current_time}

    app.register_blueprint(views_bp)

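One caveat on the last hunk: with `from datetime import datetime` (the import visible in the hunk context above), the new expression `datetime.now(datetime.timezone.utc)` appears to raise `AttributeError`, since `timezone` lives in the `datetime` module, not on the class. A working variant (sketch):

```python
# Sketch: timezone-aware UTC "now", formatted like the original.
from datetime import datetime, timezone

current_time = datetime.now(timezone.utc).strftime('%Y-%m-%d %H:%M:%S')
```
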
fly.toml (new file, 20 lines)
@@ -0,0 +1,20 @@
# fly.toml app configuration file generated for tornactivitytracker on 2025-02-11T02:59:23+01:00
#
# See https://fly.io/docs/reference/configuration/ for information about how to use this file.
#

app = 'tornactivitytracker'
primary_region = 'fra'

[build]

[http_service]
  internal_port = 8080
  force_https = true
  auto_stop_machines = 'stop'
  auto_start_machines = true
  min_machines_running = 0
  processes = ['app']

[[vm]]
  size = 'shared-cpu-2x'

requirements.in
@@ -9,3 +9,5 @@ seaborn
configparser
plotly
configobj
redis
celery

requirements.txt
@@ -4,16 +4,33 @@
#
# pip-compile requirements.in
#
amqp==5.3.1
    # via kombu
billiard==4.2.1
    # via celery
blinker==1.9.0
    # via flask
bootstrap-flask==2.4.1
    # via -r requirements.in
celery==5.4.0
    # via -r requirements.in
certifi==2025.1.31
    # via requests
charset-normalizer==3.4.1
    # via requests
click==8.1.8
    # via flask
    # via
    #   celery
    #   click-didyoumean
    #   click-plugins
    #   click-repl
    #   flask
click-didyoumean==0.3.1
    # via celery
click-plugins==1.1.1
    # via celery
click-repl==0.3.0
    # via celery
configobj==5.0.9
    # via -r requirements.in
configparser==7.1.0
@@ -41,6 +58,8 @@ jinja2==3.1.5
    # via flask
kiwisolver==1.4.8
    # via matplotlib
kombu==5.4.2
    # via celery
markupsafe==3.0.2
    # via
    #   jinja2
@@ -50,9 +69,9 @@ matplotlib==3.10.0
    # via
    #   -r requirements.in
    #   seaborn
narwhals==1.26.0
narwhals==1.27.1
    # via plotly
numpy==2.2.2
numpy==2.2.3
    # via
    #   contourpy
    #   matplotlib
@@ -70,14 +89,19 @@ pillow==11.1.0
    # via matplotlib
plotly==6.0.0
    # via -r requirements.in
prompt-toolkit==3.0.50
    # via click-repl
pyparsing==3.2.1
    # via matplotlib
python-dateutil==2.9.0.post0
    # via
    #   celery
    #   matplotlib
    #   pandas
pytz==2025.1
    # via pandas
redis==5.2.1
    # via -r requirements.in
requests==2.32.3
    # via -r requirements.in
seaborn==0.13.2
@@ -85,9 +109,19 @@ seaborn==0.13.2
six==1.17.0
    # via python-dateutil
tzdata==2025.1
    # via pandas
    # via
    #   celery
    #   kombu
    #   pandas
urllib3==2.3.0
    # via requests
vine==5.1.0
    # via
    #   amqp
    #   celery
    #   kombu
wcwidth==0.2.13
    # via prompt-toolkit
werkzeug==3.1.3
    # via flask
wtforms==3.2.1

run.py (5 changed lines)
@@ -1,5 +1,6 @@
from app import create_app

if __name__ == '__main__':
    app = create_app()
    app.run(debug=True, threaded=True)

if __name__ == '__main__':
    app.run(debug=True)

stop_scraping.py (new file, 50 lines)
@@ -0,0 +1,50 @@
import redis
import argparse

def get_redis():
    return redis.StrictRedis(
        host='localhost',
        port=6379,
        db=0,
        decode_responses=True
    )

def stop_scraping(flush=False, force=False):
    redis_client = get_redis()

    if flush:
        redis_client.flushall()
        print("Flushed all Redis data")
        return True

    current_faction_id = redis_client.get("current_faction_id")

    if not current_faction_id:
        print("No active scraping session found.")
        return False if not force else True

    redis_client.hset(f"scraper:{current_faction_id}", "scraping_active", "0")
    print(f"Sent stop signal to scraping process for faction {current_faction_id}")
    return True

if __name__ == "__main__":
    parser = argparse.ArgumentParser(description='Stop the Torn Activity Tracker scraping process.')
    parser.add_argument('--force', action='store_true', help='Force stop even if no active session is found')
    parser.add_argument('--flush', action='store_true', help='Flush all Redis data (WARNING: This will clear ALL Redis data)')

    args = parser.parse_args()

    if args.flush:
        if input("WARNING: This will delete ALL Redis data. Are you sure? (y/N) ").lower() != 'y':
            print("Operation cancelled.")
            exit(0)

    success = stop_scraping(flush=args.flush, force=args.force)

    if not success and args.force:
        print("Forcing stop for all potential scraping processes...")
        redis_client = get_redis()
        # Get all scraper keys
        for key in redis_client.keys("scraper:*"):
            redis_client.hset(key, "scraping_active", "0")
        print("Sent stop signal to all potential scraping processes.")

File diff suppressed because one or more lines are too long