vicinaehq
diff --git a/‎tests/CMakeLists.txt‎
Lines changed: 11 additions & 0 deletions b/‎tests/CMakeLists.txt‎
Lines changed: 11 additions & 0 deletions
diff --git a/‎tests/lib/file-indexer/regex-utils.cpp‎
Lines changed: 155 additions & 0 deletions b/‎tests/lib/file-indexer/regex-utils.cpp‎
Lines changed: 155 additions & 0 deletions
diff --git a/‎vicinae/CMakeLists.txt‎
Lines changed: 3 additions & 1 deletion b/‎vicinae/CMakeLists.txt‎
Lines changed: 3 additions & 1 deletion
diff --git a/‎vicinae/database/file-indexer/migrations.qrc‎
Lines changed: 1 addition & 0 deletions b/‎vicinae/database/file-indexer/migrations.qrc‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎vicinae/database/file-indexer/migrations/002_tri_idx.sql‎
Lines changed: 13 additions & 0 deletions b/‎vicinae/database/file-indexer/migrations/002_tri_idx.sql‎
Lines changed: 13 additions & 0 deletions
diff --git a/‎vicinae/include/search-files-view.hpp‎
Lines changed: 22 additions & 3 deletions b/‎vicinae/include/search-files-view.hpp‎
Lines changed: 22 additions & 3 deletions
diff --git a/‎vicinae/src/extensions/file/file-extension.hpp‎
Lines changed: 6 additions & 1 deletion b/‎vicinae/src/extensions/file/file-extension.hpp‎
Lines changed: 6 additions & 1 deletion
diff --git a/‎vicinae/src/services/extension-registry/extension-registry.hpp‎
Lines changed: 1 addition & 0 deletions b/‎vicinae/src/services/extension-registry/extension-registry.hpp‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎vicinae/src/services/files-service/abstract-file-indexer.hpp‎
Lines changed: 6 additions & 3 deletions b/‎vicinae/src/services/files-service/abstract-file-indexer.hpp‎
Lines changed: 6 additions & 3 deletions
@@ -5,8 +5,14 @@ file(GLOB_RECURSE TEST_SOURCES
     "lib/**/*.cpp"
 )
 
+# Production sources under test. They live in the application tree rather than under tests/,
+# so they are listed explicitly and compiled straight into the test executable.
+set(REGEX_UTILS_SRC
+    ${CMAKE_SOURCE_DIR}/vicinae/src/services/files-service/file-indexer/regex-utils.cpp
+)
+
 add_executable(all_tests
     ${TEST_SOURCES}
+    ${REGEX_UTILS_SRC}
 )
 
 set(FIXTURE_DIR ${CMAKE_CURRENT_SOURCE_DIR}/fixtures)
@@ -17,6 +23,11 @@ target_compile_definitions(all_tests PRIVATE
 	XDGPP_FIXTURE_DIR="${FIXTURE_DIR}/xdgpp"
 )
 
+# Lets test sources include application headers by their in-tree path,
+# e.g. "services/files-service/file-indexer/regex-utils.hpp".
+target_include_directories(all_tests PRIVATE
+    ${CMAKE_SOURCE_DIR}/vicinae/src
+    ${CMAKE_SOURCE_DIR}/vicinae/include
+)
+
 target_link_libraries(all_tests 
     PRIVATE 
     xdgpp
 
@@ -0,0 +1,155 @@
+#include "services/files-service/file-indexer/regex-utils.hpp"
+#include <catch2/catch_test_macros.hpp>
+
+// Smoke tests that mix wildcards, character classes, groups and anchors in a single pattern.
+// NOTE(review): "(test)k" is expected to produce "test k" here, whereas the "brackets" test case
+// expects "(abc)def" to produce "abcdef" (no separator after a group). Confirm both expectations
+// against the implementation.
+TEST_CASE("extractStaticCharsFromRegex - basic patterns", "[file-indexer]") {
+  SECTION(".*config.*db^") {
+    const auto extracted = extractStaticCharsFromRegex(".*config.*db^");
+    REQUIRE(extracted == "config db");
+  }
+
+  SECTION("^[ab]cd") {
+    const auto extracted = extractStaticCharsFromRegex("^[ab]cd");
+    REQUIRE(extracted == "cd");
+  }
+
+  SECTION("^ab[cd](test)k") {
+    const auto extracted = extractStaticCharsFromRegex("^ab[cd](test)k");
+    REQUIRE(extracted == "^ab test k");
+  }
+}
+
+// Expectations for single metacharacters: '.', '*' and '+' split the output into separate words,
+// an optional atom ('?') is dropped, alternation yields nothing, and a trailing '$' is removed.
+TEST_CASE("extractStaticCharsFromRegex - special regex characters", "[file-indexer]") {
+  SECTION("handles dot wildcard") {
+    const auto extracted = extractStaticCharsFromRegex("a.b");
+    REQUIRE(extracted == "a b");
+  }
+
+  SECTION("handles asterisk") {
+    const auto extracted = extractStaticCharsFromRegex("a*b");
+    REQUIRE(extracted == "a b");
+  }
+
+  SECTION("handles plus") {
+    const auto extracted = extractStaticCharsFromRegex("a+b");
+    REQUIRE(extracted == "a b");
+  }
+
+  SECTION("handles question mark") {
+    const auto extracted = extractStaticCharsFromRegex("a?b");
+    REQUIRE(extracted == "b");
+  }
+
+  SECTION("handles pipe") {
+    const auto extracted = extractStaticCharsFromRegex("a|b");
+    REQUIRE(extracted == "");
+  }
+
+  SECTION("handles dollar sign") {
+    const auto extracted = extractStaticCharsFromRegex("abc$");
+    REQUIRE(extracted == "abc");
+  }
+}
+
+// Characters outside the kept set never reach the output: an escaped dot is dropped, leading
+// escapes/punctuation are dropped, and a hyphen between two words acts as a separator.
+// Each section has its own descriptive name so a failure report identifies the failing input.
+TEST_CASE("extractStaticCharsFromRegex - keeps only alphanumeric, space, tab, newline", "[file-indexer]") {
+  SECTION("strips trailing escaped dot") { REQUIRE(extractStaticCharsFromRegex("abc\\.") == "abc"); }
+  SECTION("strips leading escapes and punctuation") {
+    REQUIRE(extractStaticCharsFromRegex("\\\\-$@#abc\\.") == "abc");
+  }
+  SECTION("treats hyphen as a word separator") { REQUIRE(extractStaticCharsFromRegex("abc-def") == "abc def"); }
+}
+
+// Character classes ([...]) contribute nothing, while the contents of a group ((...)) are kept.
+TEST_CASE("extractStaticCharsFromRegex - brackets", "[file-indexer]") {
+  SECTION("ignores content in square brackets") {
+    const auto extracted = extractStaticCharsFromRegex("[abc]def");
+    REQUIRE(extracted == "def");
+  }
+
+  SECTION("keeps content in parentheses (groups)") {
+    const auto extracted = extractStaticCharsFromRegex("(abc)def");
+    REQUIRE(extracted == "abcdef");
+  }
+}
+
+// A '^' survives only when it is immediately followed by a literal character.
+TEST_CASE("extractStaticCharsFromRegex - caret handling", "[file-indexer]") {
+  SECTION("keeps caret followed by regular character") {
+    const auto extracted = extractStaticCharsFromRegex("^abc");
+    REQUIRE(extracted == "^abc");
+  }
+
+  SECTION("removes caret not followed by character") {
+    const auto extracted = extractStaticCharsFromRegex("^[abc]");
+    REQUIRE(extracted == "");
+  }
+
+  SECTION("removes caret followed by special char") {
+    const auto extracted = extractStaticCharsFromRegex("^.abc");
+    REQUIRE(extracted == "abc");
+  }
+
+  SECTION("caret in middle without following char") {
+    const auto extracted = extractStaticCharsFromRegex("abc^");
+    REQUIRE(extracted == "abc");
+  }
+}
+
+// Backslash-escaped metacharacters are not emitted; between two words they leave a separator.
+TEST_CASE("extractStaticCharsFromRegex - escaping", "[file-indexer]") {
+  SECTION("escaped special characters become static") {
+    const auto extracted = extractStaticCharsFromRegex("a\\.b");
+    REQUIRE(extracted == "a b");
+  }
+
+  SECTION("escaped bracket") {
+    const auto extracted = extractStaticCharsFromRegex("a\\[b");
+    REQUIRE(extracted == "a b");
+  }
+
+  SECTION("escaped backslash") {
+    const auto extracted = extractStaticCharsFromRegex("a\\\\b");
+    REQUIRE(extracted == "a b");
+  }
+
+  SECTION("caret with escaped character") {
+    const auto extracted = extractStaticCharsFromRegex("^\\[test");
+    REQUIRE(extracted == "test");
+  }
+}
+
+// Degenerate inputs: nothing to extract, metacharacters only, and a single literal.
+TEST_CASE("extractStaticCharsFromRegex - empty and edge cases", "[file-indexer]") {
+  SECTION("empty string") {
+    const auto extracted = extractStaticCharsFromRegex("");
+    REQUIRE(extracted == "");
+  }
+
+  SECTION("only special characters") {
+    const auto extracted = extractStaticCharsFromRegex(".*+?|$");
+    REQUIRE(extracted == "");
+  }
+
+  SECTION("only brackets") {
+    const auto extracted = extractStaticCharsFromRegex("[abc](def)");
+    REQUIRE(extracted == "def");
+  }
+
+  SECTION("single character") {
+    const auto extracted = extractStaticCharsFromRegex("a");
+    REQUIRE(extracted == "a");
+  }
+}
+
+// Quantifiers: counted ({n}, {n,}, {m,n}), lazy (??, *?, +?) and combinations of them.
+// An atom made optional by '?' is dropped from the output; other quantified atoms are kept.
+TEST_CASE("extractStaticCharsFromRegex - quantifiers", "[file-indexer]") {
+  SECTION("exactly n - {3}") {
+    const auto extracted = extractStaticCharsFromRegex("a{3}b");
+    REQUIRE(extracted == "a b");
+  }
+
+  SECTION("n or more - {3,}") {
+    const auto extracted = extractStaticCharsFromRegex("a{3,}b");
+    REQUIRE(extracted == "a b");
+  }
+
+  SECTION("between m and n - {3,5}") {
+    const auto extracted = extractStaticCharsFromRegex("a{3,5}b");
+    REQUIRE(extracted == "a b");
+  }
+
+  SECTION("lazy quantifiers - ?? *? +?") {
+    const auto lazyOptional = extractStaticCharsFromRegex("a??b");
+    REQUIRE(lazyOptional == "b");
+
+    const auto lazyStar = extractStaticCharsFromRegex("a*?b");
+    REQUIRE(lazyStar == "a b");
+
+    const auto lazyPlus = extractStaticCharsFromRegex("a+?b");
+    REQUIRE(lazyPlus == "a b");
+  }
+
+  SECTION("multiple wildcards") {
+    const auto extracted = extractStaticCharsFromRegex("a.*b.*c");
+    REQUIRE(extracted == "a b c");
+  }
+
+  SECTION("combined quantifiers") {
+    const auto extracted = extractStaticCharsFromRegex("a+b*c?d");
+    REQUIRE(extracted == "a b d");
+  }
+}
+
+// Word-boundary assertions (\b, \B, \<, \>) add nothing to the extracted text.
+TEST_CASE("extractStaticCharsFromRegex - word boundaries", "[file-indexer]") {
+  SECTION("word boundary \\b") {
+    const auto extracted = extractStaticCharsFromRegex("\\btest\\b");
+    REQUIRE(extracted == "test");
+  }
+
+  SECTION("not word boundary \\B") {
+    const auto extracted = extractStaticCharsFromRegex("\\Btest\\B");
+    REQUIRE(extracted == "test");
+  }
+
+  SECTION("start of word \\<") {
+    const auto extracted = extractStaticCharsFromRegex("\\<test");
+    REQUIRE(extracted == "test");
+  }
+
+  SECTION("end of word \\>") {
+    const auto extracted = extractStaticCharsFromRegex("test\\>");
+    REQUIRE(extracted == "test");
+  }
+}
+
+// Shorthand classes (\d, \D, \s, \S, \w, \W) yield no static text; the hex escape \x41 is
+// expected to come out as the character it encodes ("A").
+TEST_CASE("extractStaticCharsFromRegex - character classes", "[file-indexer]") {
+  SECTION("digit \\d") {
+    const auto extracted = extractStaticCharsFromRegex("\\d");
+    REQUIRE(extracted == "");
+  }
+
+  SECTION("not digit \\D") {
+    const auto extracted = extractStaticCharsFromRegex("\\D");
+    REQUIRE(extracted == "");
+  }
+
+  SECTION("whitespace \\s") {
+    const auto extracted = extractStaticCharsFromRegex("\\s");
+    REQUIRE(extracted == "");
+  }
+
+  SECTION("not whitespace \\S") {
+    const auto extracted = extractStaticCharsFromRegex("\\S");
+    REQUIRE(extracted == "");
+  }
+
+  SECTION("word character \\w") {
+    const auto extracted = extractStaticCharsFromRegex("\\w");
+    REQUIRE(extracted == "");
+  }
+
+  SECTION("not word character \\W") {
+    const auto extracted = extractStaticCharsFromRegex("\\W");
+    REQUIRE(extracted == "");
+  }
+
+  SECTION("hex digit \\x") {
+    const auto extracted = extractStaticCharsFromRegex("\\x41");
+    REQUIRE(extracted == "A");
+  }
+}
+
+// Combinations of groups, nested groups, alternation, character classes and quantifiers.
+TEST_CASE("extractStaticCharsFromRegex - complex patterns", "[file-indexer]") {
+  SECTION("multiple groups") {
+    const auto extracted = extractStaticCharsFromRegex("(abc)(def)(ghi)");
+    REQUIRE(extracted == "abcdefghi");
+  }
+
+  SECTION("nested groups") {
+    const auto extracted = extractStaticCharsFromRegex("((ab)c)def");
+    REQUIRE(extracted == "abcdef");
+  }
+
+  SECTION("alternation in group") {
+    const auto extracted = extractStaticCharsFromRegex("(a|b)cd");
+    REQUIRE(extracted == "cd");
+  }
+
+  SECTION("mixed brackets and groups") {
+    const auto extracted = extractStaticCharsFromRegex("[abc](def)[ghi]jkl");
+    REQUIRE(extracted == "def jkl");
+  }
+
+  SECTION("quantifiers with groups") {
+    const auto extracted = extractStaticCharsFromRegex("(abc)+def");
+    REQUIRE(extracted == "abc def");
+  }
+}
+
+// \A, \Z and '$' are removed; a leading '^' directly before a literal is kept.
+TEST_CASE("extractStaticCharsFromRegex - anchors", "[file-indexer]") {
+  SECTION("\\A start of string") {
+    const auto extracted = extractStaticCharsFromRegex("\\Atest");
+    REQUIRE(extracted == "test");
+  }
+
+  SECTION("\\Z end of string") {
+    const auto extracted = extractStaticCharsFromRegex("test\\Z");
+    REQUIRE(extracted == "test");
+  }
+
+  SECTION("combined anchors") {
+    const auto extracted = extractStaticCharsFromRegex("^test$");
+    REQUIRE(extracted == "^test");
+  }
+}
+
+// Whitespace escapes (\t, \n, \r, \v, \f) are expected to be decoded into the control
+// character they denote and kept in the output.
+TEST_CASE("extractStaticCharsFromRegex - special escapes", "[file-indexer]") {
+  SECTION("tab \\t") {
+    const auto extracted = extractStaticCharsFromRegex("a\\tb");
+    REQUIRE(extracted == "a\tb");
+  }
+
+  SECTION("newline \\n") {
+    const auto extracted = extractStaticCharsFromRegex("a\\nb");
+    REQUIRE(extracted == "a\nb");
+  }
+
+  SECTION("carriage return \\r") {
+    const auto extracted = extractStaticCharsFromRegex("a\\rb");
+    REQUIRE(extracted == "a\rb");
+  }
+
+  SECTION("vertical tab \\v") {
+    const auto extracted = extractStaticCharsFromRegex("a\\vb");
+    REQUIRE(extracted == "a\vb");
+  }
+
+  SECTION("form feed \\f") {
+    const auto extracted = extractStaticCharsFromRegex("a\\fb");
+    REQUIRE(extracted == "a\fb");
+  }
+}
+
+// The optional second argument is a minimum word length: words shorter than it are dropped
+// from the result, and 0 keeps every word.
+TEST_CASE("extractStaticCharsFromRegex - minWordLength", "[file-indexer]") {
+  SECTION("filters single character words") {
+    const auto allTooShort = extractStaticCharsFromRegex("a b c", 2);
+    REQUIRE(allTooShort == "");
+
+    const auto allLongEnough = extractStaticCharsFromRegex("ab cd ef", 2);
+    REQUIRE(allLongEnough == "ab cd ef");
+
+    const auto onlyMiddleKept = extractStaticCharsFromRegex("a bc d", 2);
+    REQUIRE(onlyMiddleKept == "bc");
+  }
+
+  SECTION("filters with minimum length 3") {
+    const auto lastWordKept = extractStaticCharsFromRegex("a bc def", 3);
+    REQUIRE(lastWordKept == "def");
+
+    const auto trailingWordDropped = extractStaticCharsFromRegex("foo bar ab", 3);
+    REQUIRE(trailingWordDropped == "foo bar");
+
+    const auto firstWordKept = extractStaticCharsFromRegex("test a b", 3);
+    REQUIRE(firstWordKept == "test");
+  }
+
+  SECTION("keeps all words when min is 0") {
+    const auto singleLetters = extractStaticCharsFromRegex("a b c", 0);
+    REQUIRE(singleLetters == "a b c");
+
+    const auto mixedLengths = extractStaticCharsFromRegex("test a bc", 0);
+    REQUIRE(mixedLengths == "test a bc");
+  }
+
+  SECTION("regex patterns with minWordLength") {
+    const auto wildcardPattern = extractStaticCharsFromRegex(".*config.*db^", 3);
+    REQUIRE(wildcardPattern == "config");
+
+    const auto groupedPattern = extractStaticCharsFromRegex("^ab[cd](test)k", 3);
+    REQUIRE(groupedPattern == "test");
+
+    const auto singleLetterPattern = extractStaticCharsFromRegex("a.*b.*c", 2);
+    REQUIRE(singleLetterPattern == "");
+  }
+
+  SECTION("empty result when all words too short") {
+    const auto singleLetters = extractStaticCharsFromRegex("a b c d e", 3);
+    REQUIRE(singleLetters == "");
+
+    const auto twoLetterWords = extractStaticCharsFromRegex("ab cd", 3);
+    REQUIRE(twoLetterWords == "");
+  }
+
+  SECTION("preserves word boundaries") {
+    const auto shortWordsInMiddle = extractStaticCharsFromRegex("test a b config", 4);
+    REQUIRE(shortWordsInMiddle == "test config");
+
+    const auto shortWordAtStart = extractStaticCharsFromRegex("a very long test", 4);
+    REQUIRE(shortWordAtStart == "very long test");
+  }
+}
@@ -6,7 +6,7 @@ set(TARGET vicinae)
 find_package(Qt6 REQUIRED COMPONENTS Core Widgets Sql Network Svg DBus)
 find_package(OpenSSL REQUIRED)
 
-list(APPEND LIBS  Qt6::Widgets Qt6::Sql Qt6::Network Qt6::Svg Qt6::DBus ${CMARK_LIBRARY} protobuf::libprotobuf minizip OpenSSL::Crypto wayland-client xdgpp qt6keychain)
+# sqlite3 is linked directly in addition to Qt6::Sql.
+# NOTE(review): presumably needed for direct SQLite C API use by the file indexer - confirm.
+list(APPEND LIBS  Qt6::Widgets Qt6::Sql Qt6::Network Qt6::Svg Qt6::DBus ${CMARK_LIBRARY} protobuf::libprotobuf minizip OpenSSL::Crypto wayland-client xdgpp qt6keychain sqlite3)
 
 set(WLR_CLIP_BIN ${CMAKE_BINARY_DIR}/wlr-clip/wlr-clip${CMAKE_EXECUTABLE_SUFFIX})
 set(ASSET_PATH ${CMAKE_CURRENT_SOURCE_DIR}/assets)
@@ -478,6 +478,8 @@ set(SRCS
 	src/services/files-service/file-indexer/writer-worker.cpp
 	src/services/files-service/file-indexer/scan-dispatcher.cpp
 	src/services/files-service/file-indexer/abstract-scanner.hpp
+	src/services/files-service/file-indexer/regex-utils.hpp
+	src/services/files-service/file-indexer/regex-utils.cpp
 
 	src/services/extension-registry/extension-registry.hpp
 	src/services/extension-registry/extension-registry.cpp
 
@@ -1,5 +1,6 @@
 <RCC>
     <qresource prefix="database/file-indexer">
         <file>migrations/001_init.sql</file>
+        <file>migrations/002_tri_idx.sql</file>
     </qresource>
 </RCC>
@@ -0,0 +1,13 @@
+
+-- Trigram full-text index over indexed_file.name, declared as an FTS5 external-content
+-- table (content='indexed_file').
+-- NOTE(review): no content_rowid is given, so FTS5 uses the rowid of indexed_file. The triggers
+-- below pass indexed_file.id as rowid, which assumes id is the rowid alias - confirm.
+CREATE VIRTUAL TABLE IF NOT EXISTS tri_idx USING fts5(name, content='indexed_file',
+  tokenize='trigram');
+
+-- Build the index from the rows already present in indexed_file.
+INSERT INTO tri_idx(tri_idx) VALUES('rebuild');
+
+-- Triggers to keep the FTS index up to date.
+-- NOTE(review): END sits on the same line as the last statement of each trigger body,
+-- presumably because the migration runner splits statements at line-ending semicolons.
+-- Confirm before reformatting.
+
+CREATE TRIGGER tri_idx_ai AFTER INSERT ON indexed_file BEGIN
+  INSERT INTO tri_idx(rowid, name) VALUES (new.id, new.name);END;
+
+-- Removes a deleted file from the trigram index. The FTS5 'delete' command is addressed through
+-- the special column named after the FTS table itself (tri_idx) and must be given the rowid and
+-- the indexed values of the row being removed.
+CREATE TRIGGER tri_idx_ad AFTER DELETE ON indexed_file BEGIN
+  INSERT INTO tri_idx(tri_idx, rowid, name) VALUES('delete', old.id, old.name);END;
@@ -7,12 +7,14 @@
 #include "ui/image/url.hpp"
 #include "service-registry.hpp"
 #include "services/files-service/abstract-file-indexer.hpp"
+#include "services/files-service/file-indexer/file-indexer.hpp"
 #include "ui/omni-list/omni-list.hpp"
 #include "utils/utils.hpp"
 #include <filesystem>
 #include <qfuturewatcher.h>
 #include <qlocale.h>
 #include <qmimedatabase.h>
+#include <qtimer.h>
 #include "ui/text-file-viewer/text-file-viewer.hpp"
 
 class FileListItemMetadata : public DetailWithMetadataWidget {
@@ -111,6 +113,7 @@ class SearchFilesView : public ListView {
   Watcher m_pendingFileResults;
   QString m_lastSearchText;
   QString currentQuery;
+  QTimer m_debounceTimer;
 
   void initialize() override {
     setSearchPlaceholderText("Search for files...");
@@ -133,13 +136,24 @@ class SearchFilesView : public ListView {
     });
   }
 
-  void generateFilteredList(const QString &query) {
+  /**
+   * Starts an asynchronous file query for the text stored in `currentQuery`.
+   *
+   * Cancels the watched future if it is still running, records the query in
+   * `m_lastSearchText`, switches the loading indicator on and hands the new future to
+   * `m_pendingFileResults`. Takes no arguments, so `currentQuery` must already hold the
+   * text to search for when this runs.
+   */
+  void executeSearch() {
     auto fileService = context()->services->fileService();
 
     if (m_pendingFileResults.isRunning()) { m_pendingFileResults.cancel(); }
-    m_lastSearchText = query;
+    m_lastSearchText = currentQuery;
     setLoading(true);
-    m_pendingFileResults.setFuture(fileService->queryAsync(query.toStdString()));
+    m_pendingFileResults.setFuture(fileService->queryAsync(currentQuery.toStdString()));
+  }
+
+  /**
+   * Schedules a file search for `query`.
+   *
+   * With regex search enabled on the indexer the search is debounced: the timer is (re)started
+   * and executeSearch() runs when it fires. Otherwise the search runs immediately.
+   *
+   * @param query text to search for; stored in `currentQuery`, which executeSearch() reads.
+   */
+  void generateFilteredList(const QString &query) {
+    // executeSearch() takes no argument and reads currentQuery, so record the requested text
+    // here instead of relying on the caller having done it.
+    currentQuery = query;
+
+    auto fileService = context()->services->fileService();
+    auto indexer = dynamic_cast<FileIndexer *>(fileService->indexer());
+
+    if (indexer && indexer->useRegex()) {
+      m_debounceTimer.start();
+      return;
+    }
+
+    // A debounced search may still be pending (e.g. the regex option was just switched off);
+    // drop it so it cannot fire after the immediate search below.
+    m_debounceTimer.stop();
+    executeSearch();
+  }
 
   void renderRecentFiles() {
@@ -161,6 +175,11 @@ class SearchFilesView : public ListView {
 
 public:
   SearchFilesView() {
+    // debounce is important for regex searches to avoid excessive computation, could be removed or reduced
+    // for simple searches
+    m_debounceTimer.setSingleShot(true);
+    m_debounceTimer.setInterval(std::chrono::milliseconds(500));
+    connect(&m_debounceTimer, &QTimer::timeout, this, &SearchFilesView::executeSearch);
     connect(&m_pendingFileResults, &Watcher::finished, this, &SearchFilesView::handleSearchResults);
   }
 };
@@ -75,7 +75,12 @@ class FileExtension : public BuiltinCommandRepository {
     watcherPaths.setDescription("Semicolon-separated list of paths watched by experimental watcher");
     watcherPaths.setDefaultValue("");
 
-    return {paths, watcherPaths};
+    auto useRegex = Preference::makeCheckbox("useRegex");
+    useRegex.setTitle("Use regex search");
+    useRegex.setDescription("Enable regular expression matching for file searches");
+    useRegex.setDefaultValue(false);
+
+    return {paths, watcherPaths, useRegex};
   }
 
   void preferenceValuesChanged(const QJsonObject &preferences) const override {
 
@@ -7,6 +7,7 @@
 #include <qfilesystemwatcher.h>
 #include <qjsonobject.h>
 #include <qobject.h>
+#include <qtimer.h>
 #include <qtmetamacros.h>
 #include <vector>
 #include <QString>
 
@@ -38,11 +38,14 @@ struct Pagination {
   int limit = 50;
 };
 
+/**
+ * Options passed along with a file indexer query.
+ * Declared at namespace scope; AbstractFileIndexer::QueryParams is an alias for it.
+ */
+struct FileIndexerQueryParams {
+  /// Pagination settings for the query.
+  Pagination pagination;
+  /// Regex flag, off by default. NOTE(review): presumably selects regex matching - confirm.
+  bool useRegex{false};
+};
+
 class AbstractFileIndexer : public QObject {
 public:
-  struct QueryParams {
-    Pagination pagination;
-  };
+  using QueryParams = FileIndexerQueryParams;
 
 public:
   virtual void start() = 0;