diff --git a/pytest.ini b/pytest.ini
new file mode 100644
index 0000000..6e4f236
--- /dev/null
+++ b/pytest.ini
@@ -0,0 +1,2 @@
+[pytest]
+pythonpath = server
\ No newline at end of file
diff --git a/server/audio_processing.py b/server/audio_processing.py
index 16c73af..e80b340 100644
--- a/server/audio_processing.py
+++ b/server/audio_processing.py
@@ -104,7 +104,7 @@ def detect_ads(transcript):
         raise
 
 
-def remove_ads(audio, ad_segments):
+def remove_ads(audio, ad_segments, flag=None):
     """Removes ad segments from the audio file with optimized processing."""
     if not ad_segments:
         print("No ads to remove.")
@@ -121,7 +121,7 @@ def remove_ads(audio, ad_segments):
         start, end = segment["start"] * 1000, segment["end"] * 1000  # Convert to milliseconds
 
         # Edge Case 1: Adjust ads in the first 5 seconds
-        if start <= 5000:
+        if start <= 5000 and flag in ("first", "only"):  # only for the episode's opening chunk
             start = max(0, start - 1000)
 
         # Edge Case 2: Merge close ads
@@ -131,7 +131,7 @@ def remove_ads(audio, ad_segments):
             merged_ads.append({"start": start, "end": end})
 
     # Edge Case 3: Remove everything from the last ad if it's near the end
-    if merged_ads and merged_ads[-1]["end"] >= total_duration - 10000:
+    if merged_ads and merged_ads[-1]["end"] >= total_duration - 10000 and flag in ("last", "only"):
         merged_ads[-1]["end"] = total_duration
 
     # Extract non-ad sections with proper updating of previous_end
@@ -189,10 +189,14 @@ def process_audio(audio_segment, url, streaming):
             logger.info(f"Transcription complete for chunk {i + 1}/{len(chunks)}: {url}")
 
             ad_segments = detect_ads(transcription)
-            logger.info(f"Ad-analysis complete for chunk {i + 1}/{len(chunks)}: {url}")
-
-            processed_chunk = remove_ads(chunk, ad_segments)
-            logger.info(f"Processing complete for chunk {i + 1}/{len(chunks)}: {url}")
+            logger.info(f"Ad-analysis complete for chunk {i+1}/{len(chunks)}: {url}")
+            # Tell remove_ads where this chunk sits so edge cases 1 and 3 only fire at the episode's ends.
+            flag = "first" if i == 0 else None
+            if i == len(chunks) - 1:
+                # A single-chunk episode is both first and last, so it needs both adjustments.
+                flag = "only" if i == 0 else "last"
+            processed_chunk = remove_ads(chunk, ad_segments, flag=flag)
+            logger.info(f"Processing complete for chunk {i+1}/{len(chunks)}: {url}")
 
             if i == 0 and not streaming:
                 processed_chunk = intro + processed_chunk
diff --git a/server/tests/__init__.py b/server/enums/__init__.py
similarity index 100%
rename from server/tests/__init__.py
rename to server/enums/__init__.py
diff --git a/server/tests/helpers/__init__.py b/server/helpers/__init__.py
similarity index 100%
rename from server/tests/helpers/__init__.py
rename to server/helpers/__init__.py
diff --git a/server/pytest.ini b/server/pytest.ini
deleted file mode 100644
index 03f586d..0000000
--- a/server/pytest.ini
+++ /dev/null
@@ -1,2 +0,0 @@
-[pytest]
-pythonpath = .
\ No newline at end of file
diff --git a/server/tests/helpers/test_cache_helpers.py b/server/tests/helpers/test_cache_helpers.py
deleted file mode 100644
index 55c2fef..0000000
--- a/server/tests/helpers/test_cache_helpers.py
+++ /dev/null
@@ -1,85 +0,0 @@
-import pytest
-import logging
-from unittest.mock import MagicMock, patch
-from flask import Flask
-
-from server.helpers.cache_helpers import (
-    setup_cache, initiate_key, cache_audio,
-    retrieve_audio, cached_rss_url, cached_source_url
-)
-
-@pytest.fixture
-def mock_redis():
-    """Creates a mock Redis client."""
-    mock = MagicMock()
-    mock.scan_iter.return_value = iter([])  # Default: No cached data
-    return mock
-
-
-@pytest.fixture
-def mock_app():
-    """Creates a mock Flask app."""
-    app = Flask(__name__)
-    return app
-
-def test_setup_cache(mock_app, mock_redis):
-    """Test that cache is properly set up."""
-    with patch("helpers.cache_helpers.redis_client", mock_redis):
-        mock_app.config["CACHE_TYPE"] = "simple"  # ✅ Use in-memory cache for testing
-        setup_cache(mock_app, mock_redis)
-        assert mock_redis is not None  # Ensure redis_client is set
-
-
-def test_initiate_key(mock_redis, caplog):
-    """Test that initiate_key sets a value in Redis."""
-    with patch("helpers.cache_helpers.redis_client", mock_redis):
-        with caplog.at_level(logging.ERROR):
-            initiate_key("test_key")
-            mock_redis.set.assert_called_with("test_key", "INIT")  # Fix: Ensure this call actually happens
-            assert "Error initializing key in cache" not in caplog.text
-
-
-def test_cache_audio(mock_redis):
-    """Test that cache_audio stores the file path in Redis."""
-    with patch("helpers.cache_helpers.redis_client", mock_redis):
-        cache_audio("audio_key", "/path/to/audio.mp3")
-        mock_redis.set.assert_called_with("audio_key", "/path/to/audio.mp3")
-
-
-def test_retrieve_audio_found(mock_redis):
-    """Test that retrieve_audio returns the correct path if found."""
-    with patch("helpers.cache_helpers.redis_client", mock_redis):
-        mock_redis.scan_iter.side_effect = lambda pattern: iter(["audio_key"])
-        mock_redis.get.return_value = b"/path/to/audio.mp3"
-
-        result = retrieve_audio("audio.mp3")
-        assert result == b"/path/to/audio.mp3"
-
-
-def test_retrieve_audio_not_found(mock_redis):
-    """Test that retrieve_audio returns None if not found."""
-    with patch("helpers.cache_helpers.redis_client", mock_redis):
-        mock_redis.scan_iter.return_value = iter([])
-
-        result = retrieve_audio("audio.mp3")
-        assert result is None
-
-
-def test_cached_rss_url(mock_redis):
-    """Test that cached_rss_url checks if an RSS URL is cached."""
-    with patch("helpers.cache_helpers.redis_client", mock_redis):
-        mock_redis.scan_iter.return_value = iter(["rss_url::source_url"])
-        assert cached_rss_url("rss_url") is True  # rss_url should be found
-
-        mock_redis.scan_iter.return_value = iter([])
-        assert cached_rss_url("rss_url") is False
-
-
-def test_cached_source_url(mock_redis):
-    """Test that cached_source_url checks if a source URL is cached."""
-    with patch("helpers.cache_helpers.redis_client", mock_redis):
-        mock_redis.scan_iter.return_value = iter(["rss_url::source_url"])
-        assert cached_source_url("source_url") is True  # source_url should be found
-
-        mock_redis.scan_iter.return_value = iter([])
-        assert cached_source_url("source_url") is False
\ No newline at end of file
diff --git a/server/tests/helpers/test_file_helpers.py b/server/tests/helpers/test_file_helpers.py
deleted file mode 100644
index 9754c1c..0000000
--- a/server/tests/helpers/test_file_helpers.py
+++ /dev/null
@@ -1,42 +0,0 @@
-import os
-import pytest
-from server.helpers.file_helpers import allowed_file, save_file, sanitize_filename  # Bytt ut "your_module" med riktig filnavn
-
-
-def test_allowed_file():
-    """Test allowed_file function with valid and invalid file extensions."""
-    allowed_extensions = {"wav", "flacc", "mp3"}
-
-    #  Valid file-types
-    assert allowed_file("image.wav", allowed_extensions) is True
-    assert allowed_file("audio.mp3", allowed_extensions) is True
-
-    # invalid file-types
-    assert allowed_file("document.pdf", allowed_extensions) is False
-    assert allowed_file("script.exe", allowed_extensions) is False
-
-    # files with no extension
-    assert allowed_file("nofileextension", allowed_extensions) is False
-
-
-def test_save_file():
-    """Test that save_file returns the correct file path."""
-    upload_folder = "/uploads"
-
-    expected_path = os.path.abspath(os.path.normpath("/uploads/testfile.txt"))
-    result_path = os.path.abspath(save_file("testfile.txt", upload_folder))
-    assert result_path == expected_path
-
-    expected_path = os.path.abspath(os.path.normpath("/uploads/audio.mp3"))
-    result_path = os.path.abspath(save_file("audio.mp3", upload_folder))
-    assert result_path == expected_path
-def test_sanitize_filename():
-    """Test sanitize_filename function to ensure invalid characters are removed."""
-
-    # Remove invalid char in files
-    assert sanitize_filename('test<>file.txt') == 'test__file.txt'
-    assert sanitize_filename('my|file?.mp3') == 'my_file_.mp3'
-
-    # Not change anything if file name is normal
-    assert sanitize_filename('normal_file.txt') == 'normal_file.txt'
-    assert sanitize_filename('audio.mp3') == 'audio.mp3'
\ No newline at end of file
diff --git a/server/tests/helpers/test_url_helpers.py b/server/tests/helpers/test_url_helpers.py
deleted file mode 100644
index 9c37197..0000000
--- a/server/tests/helpers/test_url_helpers.py
+++ /dev/null
@@ -1,35 +0,0 @@
-from server.helpers.url_helpers import (
-    normalize_url, generate_cache_url,
-    extract_name, extract_title, extract_extension
-)
-
-
-def test_normalize_url():
-    """Ensures that URLs are normalized to end with .mp3."""
-    assert normalize_url("https://example.com/audio.mp3?param=value") == "https://example.com/audio.mp3"
-
-
-def test_generate_cache_url():
-    """Tests that the cache URL is generated correctly."""
-    assert generate_cache_url("rss_url", "source_url") == "rss_url::source_url"
-
-
-def test_extract_name():
-    """Tests that the file extension is extracted correctly from the URL."""
-    assert extract_name("https://example.com/audio.mp3") == "mp3"
-    assert extract_name("https://example.com/path/to/song.wav") == "wav"
-    assert extract_name("https://example.com/no-extension") == ""
-
-
-def test_extract_title():
-    """Tests that the title (filename without extension) is correctly extracted."""
-    assert extract_title("./uploads/audio.mp3") == "./uploads/audio"
-    assert extract_title("./uploads/song.wav") == "./uploads/song"
-    assert extract_title("./uploads/no-extension") == "./uploads/no-extension"
-
-
-def test_extract_extension():
-    """Tests that the file extension is extracted correctly."""
-    assert extract_extension("https://example.com/audio.mp3") == ".mp3"
-    assert extract_extension("https://example.com/song.WAV") == ".wav"
-    assert extract_extension("https://example.com/no-extension") == ""
\ No newline at end of file
diff --git a/server/tests/whisper/podblock_test.py b/server/tests/whisper/podblock_test.py
index 4ef6d31..95c356d 100644
--- a/server/tests/whisper/podblock_test.py
+++ b/server/tests/whisper/podblock_test.py
@@ -1,241 +1,242 @@
-import os
-import re
-import logging
-import json
-
-import time
-import openai
-import pytest
-import textwrap
-
-from pathlib import Path
-from dotenv import load_dotenv
-from time import perf_counter
-from io import BytesIO
-
-from pydub import AudioSegment
-from faster_whisper import WhisperModel, BatchedInferencePipeline
-
-env_path = Path(__file__).parents[2] / "api.env"
-load_dotenv(dotenv_path=env_path)
-
-client = openai.OpenAI(api_key=os.environ["OPENAI_API_KEY"])
-
-logging.basicConfig(level=logging.INFO, format="%(asctime)s %(levelname)s %(name)s: %(message)s")
-logger = logging.getLogger(__name__)
-
-NORWEGIAN_AUDIO_PATH = Path(__file__).parent / "resources" / "norwegian.mp3"
-ENGLISH_AUDIO_PATH = Path(__file__).parent / "resources" / "english.mp3"
-
-WHISPER_MODELS = ["tiny", "base", "small"]
-GPT_MODELS = ["gpt-4o-mini", "gpt-4o"]
-
-RESULTS_DIR = Path(__file__).parent / "results"
-RESULTS_DIR.mkdir(exist_ok=True, parents=True)
-
-
-def test_transcribe_and_save():
-    if not NORWEGIAN_AUDIO_PATH.exists():
-        pytest.skip(f"Audio file not found: {NORWEGIAN_AUDIO_PATH}")
-
-    if not ENGLISH_AUDIO_PATH.exists():
-        pytest.skip(f"Audio file not found: {ENGLISH_AUDIO_PATH}")
-
-    audio_segment_norwegian = AudioSegment.from_mp3(NORWEGIAN_AUDIO_PATH)
-    chunks_norwegian = chunk_audio(audio_segment_norwegian)
-
-    audio_segment_english = AudioSegment.from_mp3(ENGLISH_AUDIO_PATH)
-    chunks_english = chunk_audio(audio_segment_english)
-
-    if not chunks_norwegian:
-        pytest.skip(f"Audio could not be chunked: {NORWEGIAN_AUDIO_PATH}")
-
-    if not chunks_english:
-        pytest.skip(f"Audio could not be chunked: {ENGLISH_AUDIO_PATH}")
-
-    process_chunks(chunks_norwegian, audio_segment_norwegian, NORWEGIAN_AUDIO_PATH, 'norwegian')
-    process_chunks(chunks_english, audio_segment_english, ENGLISH_AUDIO_PATH, 'english')
-
-
-def process_chunks(chunks, audio_segment, audio_path, language):
-    for whisper_name in WHISPER_MODELS:
-        try:
-            logger.info("Loading model %s", whisper_name)
-            whisper_model = WhisperModel(whisper_name, device="cpu", compute_type="int8")
-            batched_model = BatchedInferencePipeline(model=whisper_model)
-
-            times = []
-            ads_results = []
-            transcripts = []
-
-            logger.info(f"Transcribing {audio_path} with {whisper_name}!")
-            for i, chunk in enumerate(chunks):
-                logger.info(f'Processing chunk {i + 1}/{len(chunks)} with model: {whisper_name}')
-                duration = chunk.duration_seconds
-                chunk_start = perf_counter()
-                transcription = transcribe_audio(chunk, batched_model)
-                chunk_end = perf_counter()
-
-                transcription_time = chunk_end - chunk_start
-                times.append({
-                    "chunk_id": i,
-                    "duration": duration,
-                    "transcription_time": transcription_time
-                })
-
-                transcripts.append({
-                    "chunk_id": i,
-                    "transcription": transcription
-                })
-
-                for gpt_name in GPT_MODELS:
-                    logger.info(f'Detecting ads with {gpt_name}')
-                    ad_detection, usage = detect_ads(transcription, gpt_name)
-                    ads_results.append({
-                        "model": gpt_name,
-                        "usage": usage,
-                        "ads": {
-                            "chunk_id": i,
-                            "ads": ad_detection
-                        }
-                    })
-                logger.info(
-                    f'Processed chunk {i + 1}/{len(chunks)} with model: {whisper_name} in {transcription_time:.2f} seconds')
-
-            save_result(language, whisper_name, times, ads_results, transcripts, RESULTS_DIR)
-            logger.info(f"Completed benchmark for model {whisper_name}")
-            time_file = RESULTS_DIR / language / whisper_name / "time.json"
-            assert time_file.exists(), f"{whisper_name} did not produce time.json"
-
-        except Exception as e:
-            logger.error(f"Error processing model {whisper_name}: {str(e)}")
-
-
-def save_result(language, model_name, times, ads, transcripts, output_dir):
-    model_dir = output_dir / language /model_name
-    model_dir.mkdir(exist_ok=True, parents=True)
-
-    # Save  timing information
-    time_file = model_dir / "time.json"
-    with open(time_file, "w") as f:
-        time_data = {
-            "model": model_name,
-            "total_time": sum(item["transcription_time"] for item in times),
-            "chunk_times": times
-        }
-        json.dump(time_data, f, indent=2)
-
-    # Save ad detection results
-    ads_file = model_dir / "ads.json"
-    with open(ads_file, "w") as f:
-        ads_data = {
-            "model": model_name,
-            "ads": ads
-        }
-        json.dump(ads_data, f, indent=2)
-
-    # Save plain text transcription
-    text_file = model_dir / "transcription.txt"
-    with open(text_file, "w") as f:
-        for chunk in transcripts:
-            f.write(f"--- Chunk {chunk['chunk_id']} ---\n")
-            # Extract all words and join them
-            if chunk["transcription"]:
-                if isinstance(chunk["transcription"], str):
-                    # Handle already formatted string
-                    f.write(f"{chunk['transcription']}\n\n")
-                else:
-                    # Handle structured transcription
-                    full_text = " ".join(item["text"] for item in chunk["transcription"])
-                    f.write(f"{full_text}\n\n")
-
-    no_ts_file = model_dir / "transcript_plain.txt"
-    with open(no_ts_file, "w") as f_plain:
-        for chunk in transcripts:
-            raw = chunk["transcription"]
-            cleaned = re.sub(r"\[\d+\.\d+-\d+\.\d+\]\s*", "", raw)
-            paragraph = " ".join(cleaned.split())
-            wrapped = textwrap.fill(paragraph, width=80)
-            f_plain.write(f"--- Chunk {chunk['chunk_id']} ---\n")
-            f_plain.write(wrapped + "\n\n")
-
-    logger.info(f"Results for model {model_name} saved to {model_dir}")
-
-
-def chunk_audio(audio, chunk_duration_seconds=240, chunk_duration_ms=240000):
-    duration_seconds = audio.duration_seconds
-    if duration_seconds <= chunk_duration_seconds:
-        chunks = [audio]
-    else:
-        chunks = [audio[i:i + chunk_duration_ms] for i in range(0, len(audio), chunk_duration_ms)]
-    return chunks
-
-
-def detect_ads(transcript, llm_model):
-    try:
-        completion = \
-            client.chat.completions.create(
-                model=llm_model,
-                messages=[
-                    {
-                        "role": "system",
-                        "content": "You are a system that detects ads in audio transcriptions from podcasts. "
-                                   "Based on the word-level timestamps provided, determine the start and end times of any ad segments. "
-                                   "For each ad segment, provide a 5-word summary of the ad. "
-                                   "Provide ad segments in the format: start: <time>, end: <time>, summary: '<summary>'. "
-                                   "If no ad is found, return 'No ad detected.'"
-                    },
-                    {
-                        "role": "user",
-                        "content": f"Here is the transcription with word-level timestamps:\n{transcript}"
-                    }
-                ]
-            )
-        usage = completion.usage
-        usage_dict = {
-            "prompt_tokens": usage.prompt_tokens,
-            "completion_tokens": usage.completion_tokens,
-            "total_tokens": usage.total_tokens
-        }
-
-        classification = completion.choices[0].message.content.strip()
-        logger.info(classification)
-        pattern = r"start:\s*([\d.]+).*?end:\s*([\d.]+).*?summary:\s*['\"]?([^'\"]+)['\"]?"
-        ad_segments = [{"start": float(m[0]), "end": float(m[1]), "summary": m[2].strip()} for m in
-                       re.findall(pattern, classification)]
-        logger.info(f"Detected ad-segments: {ad_segments}")
-        return ad_segments, usage_dict
-
-    except Exception as e:
-        raise
-
-
-def transcribe_audio(audio_segment, batched_model):
-    try:
-        buffer = BytesIO()
-        audio_segment.export(buffer, format="wav")
-        buffer.seek(0)
-
-        segments, _ = batched_model.transcribe(buffer, word_timestamps=True)
-
-        # Convert generator to list to avoid issues with it being consumed
-        segments_list = list(segments)
-
-        # Create structured transcription
-        transcription = [
-            {
-                "start": word.start,
-                "end": word.end,
-                "text": word.word
-            }
-            for segment in segments_list
-            for word in segment.words
-        ]
-
-        formatted_transcription = "\n".join(
-            [f"[{w['start']:.2f}-{w['end']:.2f}] {w['text']}" for w in transcription]
-        )
-        return formatted_transcription
-    except Exception as e:
-        logger.error(f"Error during transcription: {str(e)}")
-        return None
+# Performance test measuring the system's speed and accuracy. Uncomment the code below if you want to run it.
+# import os
+# import re
+# import logging
+# import json
+#
+# import time
+# import openai
+# import pytest
+# import textwrap
+#
+# from pathlib import Path
+# from dotenv import load_dotenv
+# from time import perf_counter
+# from io import BytesIO
+#
+# from pydub import AudioSegment
+# from faster_whisper import WhisperModel, BatchedInferencePipeline
+#
+# env_path = Path(__file__).parents[2] / "api.env"
+# load_dotenv(dotenv_path=env_path)
+#
+# client = openai.OpenAI(api_key=os.environ["OPENAI_API_KEY"])
+#
+# logging.basicConfig(level=logging.INFO, format="%(asctime)s %(levelname)s %(name)s: %(message)s")
+# logger = logging.getLogger(__name__)
+#
+# NORWEGIAN_AUDIO_PATH = Path(__file__).parent / "resources" / "norwegian.mp3"
+# ENGLISH_AUDIO_PATH = Path(__file__).parent / "resources" / "english.mp3"
+#
+# WHISPER_MODELS = ["tiny", "base", "small"]
+# GPT_MODELS = ["gpt-4o-mini", "gpt-4o"]
+#
+# RESULTS_DIR = Path(__file__).parent / "results"
+# RESULTS_DIR.mkdir(exist_ok=True, parents=True)
+#
+#
+# def test_transcribe_and_save():
+#     if not NORWEGIAN_AUDIO_PATH.exists():
+#         pytest.skip(f"Audio file not found: {NORWEGIAN_AUDIO_PATH}")
+#
+#     if not ENGLISH_AUDIO_PATH.exists():
+#         pytest.skip(f"Audio file not found: {ENGLISH_AUDIO_PATH}")
+#
+#     audio_segment_norwegian = AudioSegment.from_mp3(NORWEGIAN_AUDIO_PATH)
+#     chunks_norwegian = chunk_audio(audio_segment_norwegian)
+#
+#     audio_segment_english = AudioSegment.from_mp3(ENGLISH_AUDIO_PATH)
+#     chunks_english = chunk_audio(audio_segment_english)
+#
+#     if not chunks_norwegian:
+#         pytest.skip(f"Audio could not be chunked: {NORWEGIAN_AUDIO_PATH}")
+#
+#     if not chunks_english:
+#         pytest.skip(f"Audio could not be chunked: {ENGLISH_AUDIO_PATH}")
+#
+#     process_chunks(chunks_norwegian, audio_segment_norwegian, NORWEGIAN_AUDIO_PATH, 'norwegian')
+#     process_chunks(chunks_english, audio_segment_english, ENGLISH_AUDIO_PATH, 'english')
+#
+#
+# def process_chunks(chunks, audio_segment, audio_path, language):
+#     for whisper_name in WHISPER_MODELS:
+#         try:
+#             logger.info("Loading model %s", whisper_name)
+#             whisper_model = WhisperModel(whisper_name, device="cpu", compute_type="int8")
+#             batched_model = BatchedInferencePipeline(model=whisper_model)
+#
+#             times = []
+#             ads_results = []
+#             transcripts = []
+#
+#             logger.info(f"Transcribing {audio_path} with {whisper_name}!")
+#             for i, chunk in enumerate(chunks):
+#                 logger.info(f'Processing chunk {i + 1}/{len(chunks)} with model: {whisper_name}')
+#                 duration = chunk.duration_seconds
+#                 chunk_start = perf_counter()
+#                 transcription = transcribe_audio(chunk, batched_model)
+#                 chunk_end = perf_counter()
+#
+#                 transcription_time = chunk_end - chunk_start
+#                 times.append({
+#                     "chunk_id": i,
+#                     "duration": duration,
+#                     "transcription_time": transcription_time
+#                 })
+#
+#                 transcripts.append({
+#                     "chunk_id": i,
+#                     "transcription": transcription
+#                 })
+#
+#                 for gpt_name in GPT_MODELS:
+#                     logger.info(f'Detecting ads with {gpt_name}')
+#                     ad_detection, usage = detect_ads(transcription, gpt_name)
+#                     ads_results.append({
+#                         "model": gpt_name,
+#                         "usage": usage,
+#                         "ads": {
+#                             "chunk_id": i,
+#                             "ads": ad_detection
+#                         }
+#                     })
+#                 logger.info(
+#                     f'Processed chunk {i + 1}/{len(chunks)} with model: {whisper_name} in {transcription_time:.2f} seconds')
+#
+#             save_result(language, whisper_name, times, ads_results, transcripts, RESULTS_DIR)
+#             logger.info(f"Completed benchmark for model {whisper_name}")
+#             time_file = RESULTS_DIR / language / whisper_name / "time.json"
+#             assert time_file.exists(), f"{whisper_name} did not produce time.json"
+#
+#         except Exception as e:
+#             logger.error(f"Error processing model {whisper_name}: {str(e)}")
+#
+#
+# def save_result(language, model_name, times, ads, transcripts, output_dir):
+#     model_dir = output_dir / language /model_name
+#     model_dir.mkdir(exist_ok=True, parents=True)
+#
+#     # Save  timing information
+#     time_file = model_dir / "time.json"
+#     with open(time_file, "w") as f:
+#         time_data = {
+#             "model": model_name,
+#             "total_time": sum(item["transcription_time"] for item in times),
+#             "chunk_times": times
+#         }
+#         json.dump(time_data, f, indent=2)
+#
+#     # Save ad detection results
+#     ads_file = model_dir / "ads.json"
+#     with open(ads_file, "w") as f:
+#         ads_data = {
+#             "model": model_name,
+#             "ads": ads
+#         }
+#         json.dump(ads_data, f, indent=2)
+#
+#     # Save plain text transcription
+#     text_file = model_dir / "transcription.txt"
+#     with open(text_file, "w") as f:
+#         for chunk in transcripts:
+#             f.write(f"--- Chunk {chunk['chunk_id']} ---\n")
+#             # Extract all words and join them
+#             if chunk["transcription"]:
+#                 if isinstance(chunk["transcription"], str):
+#                     # Handle already formatted string
+#                     f.write(f"{chunk['transcription']}\n\n")
+#                 else:
+#                     # Handle structured transcription
+#                     full_text = " ".join(item["text"] for item in chunk["transcription"])
+#                     f.write(f"{full_text}\n\n")
+#
+#     no_ts_file = model_dir / "transcript_plain.txt"
+#     with open(no_ts_file, "w") as f_plain:
+#         for chunk in transcripts:
+#             raw = chunk["transcription"]
+#             cleaned = re.sub(r"\[\d+\.\d+-\d+\.\d+\]\s*", "", raw)
+#             paragraph = " ".join(cleaned.split())
+#             wrapped = textwrap.fill(paragraph, width=80)
+#             f_plain.write(f"--- Chunk {chunk['chunk_id']} ---\n")
+#             f_plain.write(wrapped + "\n\n")
+#
+#     logger.info(f"Results for model {model_name} saved to {model_dir}")
+#
+#
+# def chunk_audio(audio, chunk_duration_seconds=240, chunk_duration_ms=240000):
+#     duration_seconds = audio.duration_seconds
+#     if duration_seconds <= chunk_duration_seconds:
+#         chunks = [audio]
+#     else:
+#         chunks = [audio[i:i + chunk_duration_ms] for i in range(0, len(audio), chunk_duration_ms)]
+#     return chunks
+#
+#
+# def detect_ads(transcript, llm_model):
+#     try:
+#         completion = \
+#             client.chat.completions.create(
+#                 model=llm_model,
+#                 messages=[
+#                     {
+#                         "role": "system",
+#                         "content": "You are a system that detects ads in audio transcriptions from podcasts. "
+#                                    "Based on the word-level timestamps provided, determine the start and end times of any ad segments. "
+#                                    "For each ad segment, provide a 5-word summary of the ad. "
+#                                    "Provide ad segments in the format: start: <time>, end: <time>, summary: '<summary>'. "
+#                                    "If no ad is found, return 'No ad detected.'"
+#                     },
+#                     {
+#                         "role": "user",
+#                         "content": f"Here is the transcription with word-level timestamps:\n{transcript}"
+#                     }
+#                 ]
+#             )
+#         usage = completion.usage
+#         usage_dict = {
+#             "prompt_tokens": usage.prompt_tokens,
+#             "completion_tokens": usage.completion_tokens,
+#             "total_tokens": usage.total_tokens
+#         }
+#
+#         classification = completion.choices[0].message.content.strip()
+#         logger.info(classification)
+#         pattern = r"start:\s*([\d.]+).*?end:\s*([\d.]+).*?summary:\s*['\"]?([^'\"]+)['\"]?"
+#         ad_segments = [{"start": float(m[0]), "end": float(m[1]), "summary": m[2].strip()} for m in
+#                        re.findall(pattern, classification)]
+#         logger.info(f"Detected ad-segments: {ad_segments}")
+#         return ad_segments, usage_dict
+#
+#     except Exception as e:
+#         raise
+#
+#
+# def transcribe_audio(audio_segment, batched_model):
+#     try:
+#         buffer = BytesIO()
+#         audio_segment.export(buffer, format="wav")
+#         buffer.seek(0)
+#
+#         segments, _ = batched_model.transcribe(buffer, word_timestamps=True)
+#
+#         # Convert generator to list to avoid issues with it being consumed
+#         segments_list = list(segments)
+#
+#         # Create structured transcription
+#         transcription = [
+#             {
+#                 "start": word.start,
+#                 "end": word.end,
+#                 "text": word.word
+#             }
+#             for segment in segments_list
+#             for word in segment.words
+#         ]
+#
+#         formatted_transcription = "\n".join(
+#             [f"[{w['start']:.2f}-{w['end']:.2f}] {w['text']}" for w in transcription]
+#         )
+#         return formatted_transcription
+#     except Exception as e:
+#         logger.error(f"Error during transcription: {str(e)}")
+#         return None
diff --git a/tests/__init__.py b/tests/__init__.py
new file mode 100644
index 0000000..e69de29
diff --git a/tests/pytest.ini.py b/tests/pytest.ini.py
new file mode 100644
index 0000000..9288be6
--- /dev/null
+++ b/tests/pytest.ini.py
@@ -0,0 +1,3 @@
+[pytest]
+log_cli = true
+log_cli_level = INFO
\ No newline at end of file
diff --git a/tests/unit/__init__.py b/tests/unit/__init__.py
new file mode 100644
index 0000000..e69de29
diff --git a/tests/unit/helpers/__init__.py b/tests/unit/helpers/__init__.py
new file mode 100644
index 0000000..e69de29
diff --git a/tests/unit/helpers/test_cache_helpers.py b/tests/unit/helpers/test_cache_helpers.py
new file mode 100644
index 0000000..fca017f
--- /dev/null
+++ b/tests/unit/helpers/test_cache_helpers.py
@@ -0,0 +1,46 @@
+import pytest
+from unittest.mock import MagicMock
+
+@pytest.fixture
+def fake_redis(monkeypatch):  # swaps cache_helpers.r for a MagicMock and returns that mock
+    import server.helpers.cache_helpers as cache_helpers
+    mock_redis = MagicMock()
+    monkeypatch.setattr(cache_helpers, "r", mock_redis)  # presumably "r" is the module's Redis client -- confirm
+    return mock_redis
+
+def test_initiate_key_success(fake_redis):  # lock acquired -> returns True and calls hset once
+    from server.helpers.cache_helpers import initiate_key
+    lock = MagicMock()
+    lock.acquire.return_value = True
+    fake_redis.lock.return_value = lock
+
+    assert initiate_key("test123") is True
+    fake_redis.hset.assert_called_once()
+
+def test_initiate_key_locked(fake_redis):  # lock not acquired -> initiate_key returns False
+    from server.helpers.cache_helpers import initiate_key
+    lock = MagicMock()
+    lock.acquire.return_value = False
+    fake_redis.lock.return_value = lock
+
+    assert initiate_key("test123") is False
+
+def test_update_total_number_of_chunks(fake_redis):  # expects one hincrby on the "meta::<key>" hash
+    from server.helpers.cache_helpers import update_total_number_of_chunks
+    update_total_number_of_chunks("episode42", 3)
+    fake_redis.hincrby.assert_called_once_with("meta::episode42", "chunks", 3)
+
+def test_update_status_to_complete(fake_redis):  # expects one hset of status=COMPLETE on "meta::<key>"
+    from server.helpers.cache_helpers import update_status_to_complete
+    update_status_to_complete("episode42")
+    fake_redis.hset.assert_called_once_with("meta::episode42", "status", "COMPLETE")
+
+def test_cached_url_true(fake_redis):  # exists() returning 1 -> cached_url returns True
+    from server.helpers.cache_helpers import cached_url
+    fake_redis.exists.return_value = 1
+    assert cached_url("url-key") is True
+
+def test_cached_url_false(fake_redis):  # exists() returning 0 -> cached_url returns False
+    from server.helpers.cache_helpers import cached_url
+    fake_redis.exists.return_value = 0
+    assert cached_url("url-key") is False
diff --git a/tests/unit/helpers/test_file_helpers.py b/tests/unit/helpers/test_file_helpers.py
new file mode 100644
index 0000000..12e58bb
--- /dev/null
+++ b/tests/unit/helpers/test_file_helpers.py
@@ -0,0 +1,22 @@
+"""Unit tests for ``server.helpers.file_helpers``."""
+import os
+from server.helpers.file_helpers import allowed_file, sanitize_filename, save_file
+
+
+def test_allowed_file():
+    """``test.mp3`` is allowed and ``test.txt`` is not for the {mp3, wav} extension set."""
+    for filename, expected in (("test.mp3", True), ("test.txt", False)):
+        assert allowed_file(filename, {"mp3", "wav"}) is expected
+
+
+def test_sanitize_filename():
+    """The characters ``<``, ``>``, ``|`` and ``?`` are each expected to become ``_``."""
+    assert sanitize_filename('file<name>|wrong?.mp3') == 'file_name__wrong_.mp3'
+
+
+def test_save_file(tmp_path):
+    """``save_file`` is expected to return the target directory joined with the file name."""
+    target_dir = str(tmp_path)
+    expected_path = os.path.join(target_dir, "audio.mp3")
+
+    assert save_file("audio.mp3", target_dir) == expected_path
diff --git a/tests/unit/helpers/test_rss_helpers.py b/tests/unit/helpers/test_rss_helpers.py
new file mode 100644
index 0000000..f56046c
--- /dev/null
+++ b/tests/unit/helpers/test_rss_helpers.py
@@ -0,0 +1,34 @@
+"""Unit tests for ``server.helpers.rss_helpers``."""
+import pytest
+import requests
+from unittest.mock import patch
+from server.helpers.rss_helpers import fetch_rss, extract_rss_urls
+
+
+def test_extract_rss_urls_valid():
+    """A feed with a single ``<enclosure>`` yields a one-element list holding its URL."""
+    rss_content = b"""
+    <rss><channel>
+    <item><enclosure url="http://test.com/audio.mp3" type="audio/mpeg"/></item>
+    </channel></rss>
+    """
+
+    assert extract_rss_urls(rss_content) == ["http://test.com/audio.mp3"]
+
+
+def test_extract_rss_urls_empty():
+    """Empty bytes make ``extract_rss_urls`` raise ``ValueError``."""
+    empty_feed = b""
+    with pytest.raises(ValueError):
+        extract_rss_urls(empty_feed)
+
+
+def test_fetch_rss_success():
+    """``fetch_rss`` returns the body of a mocked 200 response with an XML content type."""
+    with patch("server.helpers.rss_helpers.requests.get") as mock_get:
+        fake_response = mock_get.return_value
+        fake_response.status_code = 200
+        fake_response.headers = {"Content-Type": "application/xml"}
+        fake_response.content = b"<rss></rss>"
+
+        assert fetch_rss("http://example.com/feed.xml") == b"<rss></rss>"
\ No newline at end of file
diff --git a/tests/unit/helpers/test_url_helpers.py b/tests/unit/helpers/test_url_helpers.py
new file mode 100644
index 0000000..b358b67
--- /dev/null
+++ b/tests/unit/helpers/test_url_helpers.py
@@ -0,0 +1,17 @@
+"""Unit tests for ``server.helpers.url_helpers``."""
+from server.helpers.url_helpers import extract_name, extract_title, extract_extension
+
+
+def test_extract_name():
+    """``extract_name`` is expected to return ``"mp3"`` for a URL ending in ``audiofile.mp3``."""
+    assert extract_name("https://example.com/podcast/audiofile.mp3") == "mp3"
+
+
+def test_extract_title():
+    """``extract_title`` is expected to return ``episode001`` for ``episode001.mp3``."""
+    assert extract_title("episode001.mp3") == "episode001"
+
+
+def test_extract_extension():
+    """``extract_extension`` is expected to return the suffix including its leading dot."""
+    assert extract_extension("https://example.com/audio.wav") == ".wav"
diff --git a/tests/unit/test_audio_processing.py b/tests/unit/test_audio_processing.py
new file mode 100644
index 0000000..429467f
--- /dev/null
+++ b/tests/unit/test_audio_processing.py
@@ -0,0 +1,130 @@
+"""Unit tests for ``server.audio_processing`` with pydub and its external clients mocked."""
+import pytest
+from unittest.mock import patch, MagicMock
+import sys
+import os
+
+os.environ["OPENAI_API_KEY"] = "fake-key-for-tests"
+
+
+def _silent_segment(duration):
+    """Stand-in for ``AudioSegment.silent``: a mock whose ``len()`` equals ``duration``."""
+    return MagicMock(duration=duration, __len__=lambda self: duration)
+
+
+# Patch pydub to avoid FileNotFoundError during import
+mock_audio_segment = MagicMock()
+mock_audio_segment.from_file.return_value = MagicMock(name="AudioSegment")
+mock_audio_segment.silent = MagicMock(side_effect=_silent_segment)
+
+sys.modules.update(
+    {
+        "pydub": MagicMock(AudioSegment=mock_audio_segment),
+        "pydub.audio_segment": MagicMock(AudioSegment=mock_audio_segment),
+    }
+)
+
+# Now safe to import audio_processing
+from server.audio_processing import (
+    chunk_audio,
+    remove_ads,
+    detect_ads,
+    transcribe_audio,
+    process_audio,
+)
+
+
+@pytest.fixture
+def dummy_audio_segment():
+    """Mock audio segment with ``duration_seconds`` of 10 and a length of 10000."""
+    segment = MagicMock(duration_seconds=10, __len__=lambda self: 10000)
+    return segment
+
+
+def test_chunk_audio_short_segment(dummy_audio_segment):
+    """The 10 s dummy segment with a 15 s chunk duration comes back as exactly one chunk."""
+    assert len(chunk_audio(dummy_audio_segment, chunk_duration_seconds=15)) == 1
+
+
+def test_chunk_audio_multiple_chunks():
+    """A 500 s mock split with 240 s chunks yields at least two chunks."""
+    long_audio = MagicMock(duration_seconds=500)
+    long_audio.__len__.return_value = 500000  # 500 seconds in ms
+
+    chunk_count = len(chunk_audio(long_audio, chunk_duration_seconds=240))
+
+    assert chunk_count >= 2
+
+
+def test_remove_ads_merges_and_cuts():
+    """``remove_ads`` returns a non-None result for two adjacent ads plus one near the end."""
+    audio = MagicMock()
+    audio.__len__.return_value = 30000  # 30s in ms
+    audio.__getitem__.side_effect = lambda _span: MagicMock()
+    audio.empty.return_value = MagicMock()
+    ad_segments = [
+        {"start": 2.0, "end": 5.0, "summary": "First Ad"},
+        {"start": 5.1, "end": 8.0, "summary": "Second Ad"},
+        {"start": 25.0, "end": 29.5, "summary": "Final Ad"},
+    ]
+
+    assert remove_ads(audio, ad_segments) is not None
+
+
+@patch("server.audio_processing.batched_model.transcribe")
+def test_transcribe_audio(mock_transcribe, dummy_audio_segment):
+    """Each mocked word appears in the transcript as ``[start-end] word``."""
+    words = [
+        MagicMock(start=0.0, end=0.5, word="Hello"),
+        MagicMock(start=0.6, end=1.0, word="world"),
+    ]
+    # The mocked call returns a 2-tuple: a list holding one segment mock, and None.
+    mock_transcribe.return_value = ([MagicMock(words=words)], None)
+
+    transcript = transcribe_audio(dummy_audio_segment)
+
+    for expected_entry in ("[0.0-0.5] Hello", "[0.6-1.0] world"):
+        assert expected_entry in transcript
+
+
+@patch("server.audio_processing.client.chat.completions.create")
+def test_detect_ads_parsing(mock_create):
+    """Two ``start/end/summary`` lines in the mocked reply are parsed into two ad dicts."""
+    completion = mock_create.return_value
+    completion.choices[0].message.content = (
+        "start: 10.0, end: 15.0, summary: 'Buy now!'\n"
+        "start: 20.0, end: 22.0, summary: 'Limited offer'"
+    )
+
+    expected = [
+        {"start": 10.0, "end": 15.0, "summary": "Buy now!"},
+        {"start": 20.0, "end": 22.0, "summary": "Limited offer"},
+    ]
+    assert detect_ads("some fake transcript") == expected
+
+
+@patch("server.audio_processing.transcribe_audio", return_value="fake transcript")
+@patch("server.audio_processing.detect_ads", return_value=[])
+@patch("server.audio_processing.remove_ads", side_effect=lambda audio, ads, flag=None: audio)
+@patch("server.audio_processing.cache_chunk")
+@patch("server.audio_processing.update_total_number_of_chunks")
+@patch("server.audio_processing.update_status_to_complete")
+def test_process_audio_simple(
+    mock_status,
+    mock_total,
+    mock_cache,
+    mock_remove,
+    mock_detect,
+    mock_transcribe,
+):
+    """Non-streaming ``process_audio`` sets total and status once and calls ``cache_chunk``."""
+    # Mocks are injected bottom-up: the last ``@patch`` supplies the first argument.
+    audio = MagicMock(frame_rate=44100, duration_seconds=10)
+    audio.__len__.return_value = 10000
+    audio.__getitem__.side_effect = lambda _span: audio  # every slice is the same mock
+
+    process_audio(audio, url="test-key", streaming=False)
+
+    mock_total.assert_called_once()
+    mock_cache.assert_called()
+    mock_status.assert_called_once()
diff --git a/tests/unit/test_router.py b/tests/unit/test_router.py
new file mode 100644
index 0000000..23b61fe
--- /dev/null
+++ b/tests/unit/test_router.py
@@ -0,0 +1,82 @@
+"""Unit tests for the ``/rss`` and ``/podcast`` routes of ``server.router.audio_bp``."""
+import pytest
+from unittest.mock import MagicMock, patch
+import sys
+import os
+
+# Stand-in for pydub's AudioSegment, installed below before the router is imported.
+mock_audio_segment = MagicMock()
+mock_audio_segment.from_file.return_value = MagicMock(name="AudioSegment")
+
+os.environ["OPENAI_API_KEY"] = "fake-key-for-tests"
+
+sys.modules.update(
+    {
+        "pydub": MagicMock(AudioSegment=mock_audio_segment),
+        "pydub.audio_segment": MagicMock(AudioSegment=mock_audio_segment),
+    }
+)
+
+from flask import Flask
+from server.router import audio_bp
+
+EPISODE_REQUEST = "/podcast?url=https://example.com/ep.mp3"
+
+
+@pytest.fixture
+def client():
+    """Flask test client for a fresh app with only ``audio_bp`` registered."""
+    flask_app = Flask(__name__)
+    flask_app.register_blueprint(audio_bp)
+    return flask_app.test_client()
+
+
+@patch("server.router.fetch_rss")
+@patch("server.router.extract_rss_urls")
+@patch("server.router.process_url_task.delay")
+def test_process_rss_success(mock_delay, mock_extract, mock_fetch, client):
+    """POST ``/rss`` with a URL answers 200 ``retrieved`` and calls ``delay`` once per URL."""
+    mock_fetch.return_value = b"<rss>...</rss>"
+    mock_extract.return_value = ["https://audio1.mp3", "https://audio2.mp3"]
+
+    resp = client.post("/rss?url=https://example.com/feed.xml")
+
+    assert (resp.status_code, resp.data) == (200, b"retrieved")
+    assert mock_delay.call_count == 2
+
+
+def test_process_rss_missing_url(client):
+    """POST ``/rss`` without a ``url`` query parameter answers 400 ``No url provided``."""
+    resp = client.post("/rss")
+
+    assert resp.status_code == 400
+    assert b"No url provided" in resp.data
+
+
+@patch("server.router.cached_url", return_value=False)
+@patch("server.router.initiate_key", return_value=True)
+@patch("server.router.initiate_streaming_task.delay")
+@patch("server.router.retrieve_audio", return_value=b"audio-bytes")
+def test_request_podcast_new(mock_retrieve, mock_stream, mock_key, mock_cached, client):
+    """An uncached episode starts the streaming task once and returns the retrieved bytes."""
+    resp = client.get(EPISODE_REQUEST)
+
+    assert (resp.status_code, resp.data) == (200, b"audio-bytes")
+    mock_stream.assert_called_once()
+
+
+@patch("server.router.cached_url", return_value=True)
+@patch("server.router.retrieve_audio", return_value=b"cached-audio")
+def test_request_podcast_cached(mock_retrieve, mock_cached, client):
+    """A cached episode request answers 200 with the bytes from ``retrieve_audio``."""
+    resp = client.get(EPISODE_REQUEST)
+
+    assert (resp.status_code, resp.data) == (200, b"cached-audio")
+
+
+def test_request_podcast_missing_url(client):
+    """GET ``/podcast`` without a ``url`` query parameter answers 400 ``No url provided``."""
+    resp = client.get("/podcast")
+
+    assert resp.status_code == 400
+    assert b"No url provided" in resp.data
\ No newline at end of file
diff --git a/tests/unit/test_tasks.py b/tests/unit/test_tasks.py
new file mode 100644
index 0000000..d7e8c3d
--- /dev/null
+++ b/tests/unit/test_tasks.py
@@ -0,0 +1,71 @@
+"""Unit tests for ``process_url_task`` and ``initiate_streaming_task`` in ``server.tasks``."""
+import pytest
+import os
+from unittest.mock import patch, MagicMock
+
+os.environ["OPENAI_API_KEY"] = "fake-key-for-tests"
+
+# ``AudioSegment.from_file`` is patched before ``server.tasks`` is imported and stays
+# patched until ``teardown_module`` stops the patcher.
+patcher = patch("server.audio_processing.AudioSegment.from_file", return_value=MagicMock(name="AudioSegment"))
+patcher.start()
+from server.tasks import process_url_task, initiate_streaming_task
+
+
+def teardown_module(module):
+    """Stop the module-level ``AudioSegment.from_file`` patch (pytest module teardown hook)."""
+    patcher.stop()
+
+
+@patch("server.tasks.fetch_audio")
+@patch("server.tasks.initiate_key")
+@patch("server.tasks.cached_url", return_value=False)
+@patch("server.tasks.process_audio")
+def test_process_url_task_uncached(mock_process, mock_cached, mock_initiate, mock_fetch):
+    """An uncached URL is initiated and processed once, and the result reports completion."""
+    dummy_audio = MagicMock()
+    mock_fetch.return_value = dummy_audio
+
+    result = process_url_task.run("http://test.com/audio.mp3")
+
+    assert "Processing complete" in result
+    mock_initiate.assert_called_once()
+    mock_process.assert_called_once()
+
+
+@patch("server.tasks.cached_url", return_value=True)
+def test_process_url_task_cached(mock_cached):
+    """A URL reported as cached makes the task result contain ``already cached``."""
+    result = process_url_task.run("http://test.com/already.mp3")
+
+    assert "already cached" in result
+
+
+# The ``remove_ads`` stub accepts the optional ``flag`` argument so it stays call-compatible
+# with ``remove_ads(audio, ad_segments, flag=None)`` whether or not the task passes a flag.
+@patch("server.tasks.fetch_audio")
+@patch("server.tasks.transcribe_audio", return_value="transcript")
+@patch("server.tasks.detect_ads", return_value=[])
+@patch("server.tasks.remove_ads", side_effect=lambda audio, ads, flag=None: audio)
+@patch("server.tasks.cache_chunk")
+@patch("server.tasks.update_total_number_of_chunks")
+@patch("server.tasks.process_audio")
+def test_initiate_streaming_task(
+    mock_process,
+    mock_chunks,
+    mock_cache,
+    mock_remove,
+    mock_detect,
+    mock_transcribe,
+    mock_fetch,
+):
+    """The streaming task calls ``cache_chunk`` and ``process_audio`` once each and completes."""
+    audio = MagicMock()
+    audio.__getitem__.side_effect = lambda s: audio  # every slice is the same mock
+    mock_fetch.return_value = audio
+
+    result = initiate_streaming_task.run("http://test.com/streaming.mp3")
+
+    assert "Processing complete" in result
+    mock_cache.assert_called_once()
+    mock_process.assert_called_once()