add regex for insertions/patterns

2025-09-25 23:03:57 +02:00
parent 8d57c3d97e
commit cc92f432fd
1 changed files with 96 additions and 28 deletions
--- a/customize-WebUI.py
+++ b/customize-WebUI.py
@@ -146,6 +146,16 @@ def copySources(config, destinationDirectory):
 # MARK: Modify files
 def _is_regex(marker: str) -> bool:
    """Return True if the marker is flagged as regex (prefix 're:')."""
    return isinstance(marker, str) and marker.startswith('re:')
 def _extract_pattern(marker: str) -> str:
    """Strip the 're:' prefix and return the regex pattern."""
    return marker[3:]
 def modifyFiles(config, destinationDirectory):
    """Modify files according to modification rules."""
    print(f"{Colors.YELLOW}Starting file modification process...{Colors.RESET}")
@@ -165,45 +175,103 @@ def modifyFiles(config, destinationDirectory):
                        with open(filePath, 'r', encoding='utf-8') as f:
                            content = f.read()
-                        # Perform text replacements
+                        # Perform text replacements / insertions
                        for insertRule in rule.get('insert_rules', []):
                            # AFTER TEXT INSERTION
                            if 'after_text' in insertRule:
-                                after_text = insertRule['after_text']
+                                raw_after = insertRule['after_text']
-                                insert_text = insertRule['insert_text']
+                                insert_text = insertRule['insert_text'].replace('\n', '')
-                                if after_text not in content:           #if not re.search(after_text, content):     # for use of * wildcard in text
+                                if _is_regex(raw_after):
-                                    raise ValueError(f"Text '{after_text}' not found in file: {filePath}")
+                                    pattern = _extract_pattern(raw_after)
-                                elif insert_text not in content:
+                                    # search first occurrence
-                                    print(f"  {Colors.GREEN}Inserting text after: {after_text} {Colors.YELLOW}+ ->{Colors.GREEN} {insert_text}{Colors.RESET}")
+                                    match = re.search(pattern, content, re.DOTALL)
-                                    content = content.replace(after_text, after_text + insert_text.replace('\n', ''))
+                                    if not match:
                                        raise ValueError(f"Regex after_text pattern '{pattern}' not found in file: {filePath}")
                                    anchor = match.group(0)
                                    # idempotency check
                                    if anchor + insert_text in content[match.start():match.start()+len(anchor)+len(insert_text)+5]:
                                        print(f"  {Colors.YELLOW}Regex after_text already has insertion after anchor.{Colors.RESET}")
                                        errorList['modWarnings'] += 1
                                    else:
                                        print(f"  {Colors.GREEN}Regex inserting after anchor: /{pattern}/ -> {insert_text[:60]}...{Colors.RESET}")
                                        content = content[:match.end()] + insert_text + content[match.end():]
                                else:
-                                    print(f"  {Colors.YELLOW}Text already present after: {after_text}{Colors.RESET}")
+                                    # Plain (substring) variant – use first occurrence only (consistent with replace count=1)
-                                    errorList['modWarnings'] += 1
+                                    anchor = raw_after
-
+                                    idx = content.find(anchor)
                                    if idx == -1:
                                        raise ValueError(f"Text '{anchor}' not found in file: {filePath}")
                                    after_pos = idx + len(anchor)
                                    # Precise idempotency: is insert_text already directly after anchor?
                                    if content.startswith(insert_text, after_pos):
                                        print(f"  {Colors.YELLOW}Plain after_text already directly followed by insertion (idempotent).{Colors.RESET}")
                                        errorList['modWarnings'] += 1
                                    else:
                                        print(f"  {Colors.GREEN}Inserting text after (plain): {anchor[:40]} -> {insert_text[:60]}...{Colors.RESET}")
                                        content = content[:after_pos] + insert_text + content[after_pos:]
                            # BEFORE TEXT INSERTION
                            if 'before_text' in insertRule:
-                                before_text = insertRule['before_text']
+                                raw_before = insertRule['before_text']
-                                insert_text = insertRule['insert_text']
+                                insert_text = insertRule['insert_text'].replace('\n', '')
-                                if before_text not in content:
+                                if _is_regex(raw_before):
-                                    raise ValueError(f"Text '{before_text}' not found in file: {filePath}")
+                                    pattern = _extract_pattern(raw_before)
-                                elif insert_text not in content:
+                                    match = re.search(pattern, content, re.DOTALL)
-                                    print(f"  {Colors.GREEN}Inserting text before: {insert_text} {Colors.YELLOW}+ <-{Colors.GREEN} {before_text}{Colors.RESET}")
+                                    if not match:
-                                    content = content.replace(before_text, insert_text.replace('\n', '') + before_text)
+                                        raise ValueError(f"Regex before_text pattern '{pattern}' not found in file: {filePath}")
                                    anchor = match.group(0)
                                    segment_start = max(0, match.start() - len(insert_text) - 5)
                                    if insert_text + anchor in content[segment_start:match.end()+len(insert_text)]:
                                        print(f"  {Colors.YELLOW}Regex before_text already has insertion before anchor.{Colors.RESET}")
                                        errorList['modWarnings'] += 1
                                    else:
                                        print(f"  {Colors.GREEN}Regex inserting before anchor: /{pattern}/ <- {insert_text[:60]}...{Colors.RESET}")
                                        content = content[:match.start()] + insert_text + content[match.start():]
                                else:
-                                    print(f"  {Colors.YELLOW}Text already present before: {before_text}{Colors.RESET}")
+                                    # Plain (substring) variant – first occurrence logic
-                                    errorList['modWarnings'] += 1
+                                    anchor = raw_before
                                    idx = content.find(anchor)
                                    if idx == -1:
                                        raise ValueError(f"Text '{anchor}' not found in file: {filePath}")
                                    before_pos = idx
                                    # Precise idempotency: does insert_text already sit immediately before anchor?
                                    if before_pos >= len(insert_text) and content[before_pos - len(insert_text): before_pos] == insert_text:
                                        print(f"  {Colors.YELLOW}Plain before_text already directly preceded by insertion (idempotent).{Colors.RESET}")
                                        errorList['modWarnings'] += 1
                                    else:
                                        print(f"  {Colors.GREEN}Inserting text before (plain): {insert_text[:60]}... <- {anchor[:40]}{Colors.RESET}")
                                        content = content[:before_pos] + insert_text + content[before_pos:]
                        # REPLACE RULES
                        for replaceRules in rule.get('replace_rules', []):
                            if 'old_text' in replaceRules:
-                                old_text = replaceRules['old_text']
+                                raw_old = replaceRules['old_text']
                                new_text = replaceRules['new_text']
-                                if old_text not in content and new_text not in content:
+                                if _is_regex(raw_old):
-                                    raise ValueError(f"Text '{old_text}' not found in file: {filePath}")
+                                    pattern = _extract_pattern(raw_old)
-                                elif new_text not in content:
+                                    if re.search(re.escape(new_text), content):
-                                    print(f"  {Colors.GREEN}Replacing text: {old_text} {Colors.YELLOW}->{Colors.GREEN} {new_text}{Colors.RESET}")
+                                        print(f"  {Colors.YELLOW}Regex replacement already applied -> {new_text[:60]}...{Colors.RESET}")
-                                    content = content.replace(old_text, new_text)
+                                        errorList['modWarnings'] += 1
                                        continue
                                    if not re.search(pattern, content, re.DOTALL):
                                        raise ValueError(f"Regex old_text pattern '{pattern}' not found in file: {filePath}")
                                    content_new, count = re.subn(pattern, new_text, content, count=1)
                                    if count:
                                        print(f"  {Colors.GREEN}Regex replacing pattern /{pattern}/ -> {new_text[:60]}...{Colors.RESET}")
                                        content = content_new
                                    else:
                                        print(f"  {Colors.YELLOW}Regex replacement produced no change for /{pattern}/.{Colors.RESET}")
                                        errorList['modWarnings'] += 1
                                else:
-                                    print(f"  {Colors.YELLOW}Text already replaced: {old_text} -> {new_text}{Colors.RESET}")
+                                    old_text = raw_old
-                                    errorList['modWarnings'] += 1
+                                    if old_text not in content and new_text not in content:
                                        raise ValueError(f"Text '{old_text}' not found in file: {filePath}")
                                    elif new_text not in content:
                                        print(f"  {Colors.GREEN}Replacing text: {old_text[:60]}... -> {new_text[:60]}...{Colors.RESET}")
                                        content = content.replace(old_text, new_text, 1)
                                    else:
                                        print(f"  {Colors.YELLOW}Text already replaced: {old_text[:40]} -> {new_text[:40]}{Colors.RESET}")
                                        errorList['modWarnings'] += 1
                        # Write modified contents