vinkius-labs
diff --git a/‎src/Middleware/RemoveComments.php‎
Lines changed: 202 additions & 67 deletions b/‎src/Middleware/RemoveComments.php‎
Lines changed: 202 additions & 67 deletions
@@ -92,15 +92,9 @@ protected function removeCommentsFromTag($tag)
             $content = $matches[2];
             $closingTag = $matches[3];
 
-            // Split content by lines and process each line
-            $lines = preg_split('/\r\n|\r|\n/', $content);
-            $processedLines = [];
-
-            foreach ($lines as $line) {
-                $processedLines[] = $this->removeSingleLineCommentFromLine($line);
-            }
-
-            $processedContent = implode($lineEnding, $processedLines);
+            // Process the whole content at once (supports multi-line template
+            // literals and complex regex literals) for correctness and performance.
+            $processedContent = $this->removeSingleLineCommentsFromContent($content);
 
             // Reconstruct the tag with processed content
             return $openingTag . $processedContent . $closingTag;
@@ -120,82 +114,223 @@ protected function removeCommentsFromTag($tag)
      */
     protected function removeSingleLineCommentFromLine($line)
     {
-        // Early return for lines without //
+        // Fast path: a line without "//" cannot contain a line comment.
         if (strpos($line, '//') === false) {
             return $line;
         }
 
-        $result = '';
-        $length = strlen($line);
-        $inSingleQuote = false;
-        $inDoubleQuote = false;
-        $inRegex = false;
-        $escaped = false;
-
-        for ($i = 0; $i < $length; $i++) {
-            $char = $line[$i];
-            $nextChar = $i + 1 < $length ? $line[$i + 1] : '';
-            $prevChar = $i > 0 ? $line[$i - 1] : '';
-
-            // Handle escape sequences
-            if ($escaped) {
-                $result .= $char;
-                $escaped = false;
-                continue;
-            }
+        // Cheap path for the common case (e.g. `var x = 1; // Comment`): when the
+        // line has no quote or backtick characters and no escaped slash (`\/`),
+        // locate `//` with plain strpos() instead of running the heavier PCRE.
+        // An escaped slash is used as the signal that a regex literal such as
+        // /http:\/\/\// may be present; `//` inside one cannot be told apart
+        // from a comment by this simple search, so those lines are left to the
+        // PCRE step further down.
+        $hasEscapedSlash = strpos($line, '\\/') !== false;
+        if (strpos($line, '"') === false && strpos($line, "'") === false && strpos($line, '`') === false && !$hasEscapedSlash) {
+            $offset = 0;
+            while (($pos = strpos($line, '//', $offset)) !== false) {
+                $prevChar = $pos > 0 ? $line[$pos - 1] : '';
 
-            if ($char === '\\' && ($inSingleQuote || $inDoubleQuote || $inRegex)) {
-                $result .= $char;
-                $escaped = true;
-                continue;
-            }
+                // A "//" directly after ":" is treated as a URL scheme (http://), not a comment
+                if ($prevChar === ':') {
+                    // Resume the search just past this "//" occurrence
+                    $offset = $pos + 2;
+                    continue;
+                }
 
-            // Toggle quote states
-            if ($char === '"' && !$inSingleQuote && !$inRegex) {
-                $inDoubleQuote = !$inDoubleQuote;
-                $result .= $char;
-                continue;
+                // First real comment start: drop it together with the rest of the line
+                return substr($line, 0, $pos);
             }
 
-            if ($char === "'" && !$inDoubleQuote && !$inRegex) {
-                $inSingleQuote = !$inSingleQuote;
-                $result .= $char;
-                continue;
-            }
+            return $line;
+        }
 
-            // Handle regex literals (basic detection)
-            if ($char === '/' && !$inSingleQuote && !$inDoubleQuote) {
-                // Check if this might be a regex literal
-                // Simple heuristic: regex usually comes after =, (, [, ,, return, or at start
-                if ($prevChar === '=' || $prevChar === '(' || $prevChar === '[' || $prevChar === ',' || $prevChar === ' ') {
-                    // Look ahead to see if this looks like a regex (not a comment)
-                    if ($nextChar !== '/' && $nextChar !== '*') {
-                        $inRegex = true;
-                        $result .= $char;
-                        continue;
+        // Otherwise use one PCRE pass: quoted strings, backtick literals and
+        // slash-delimited regex literals are matched and skipped via (*SKIP)(*F);
+        // the remaining alternative removes any `//...` not directly preceded by ":".
+                    $pattern = <<<'PATTERN'
+                /(?:(?:"(?:\\.|[^"\\])*")|(?:'(?:\\.|[^'\\])*')|(?:`[^`]*`)|(?:\/(?:\\.|[^\/\\])+\/[a-zA-Z]*))(*SKIP)(*F)|(?<!:)\/\/[^\r\n]*/su
+                PATTERN;
+
+        // Only the comment alternative can produce a match, so only comments are replaced.
+        $result = preg_replace($pattern, '', $line);
+
+        // preg_replace() returns null on failure; in that case return the line unchanged.
+        return $result === null ? $line : $result;
+    }
+
+    /**
+     * Strip `//` line comments from a (possibly multi-line) chunk of script
+     * content using a single-pass, character-by-character scanner.
+     *
+     * The scanner tracks whether it is inside a single-quoted string, a
+     * double-quoted string, a backtick template literal or a regex literal and
+     * copies those regions through untouched, so a `//` inside them is never
+     * treated as a comment. The content is not split into lines, which is what
+     * allows template literals to span several lines.
+     *
+     * Heuristics and known limits:
+     *  - a `//` directly preceded by `:` is assumed to be a URL (`http://`)
+     *    and is kept;
+     *  - a lone `/` opens a regex literal only when the previous non-space
+     *    output character is one of a fixed list of operators/punctuators (or
+     *    there is none); otherwise it is treated as a division operator;
+     *  - `${...}` expressions inside template literals are not parsed;
+     *  - slash-star block comments get no special handling here;
+     *  - a backslash escapes the following character in every state,
+     *    including outside strings.
+     *
+     * The line terminator that ends a removed comment is kept, so the line
+     * structure of the content is preserved.
+     *
+     * @param string $content Raw text to scan.
+     * @return string The content with `//` comments removed.
+     */
+    protected function removeSingleLineCommentsFromContent($content)
+    {
+            // Linear scanner: easier to reason about than one large PCRE, and able
+            // to follow multi-line template literals and regex character classes.
+            $length = strlen($content);
+            $out = '';
+
+            // Scanner state. The string/backtick/regex flags are mutually
+            // exclusive; $inRegexCharClass only refines $inRegex.
+            $inSingle = false;
+            $inDouble = false;
+            $inBacktick = false;
+            $inRegex = false;
+            $inRegexCharClass = false;
+            $escaped = false;
+
+            for ($i = 0; $i < $length; $i++) {
+                $char = $content[$i];
+                $next = $i + 1 < $length ? $content[$i + 1] : '';
+
+                // The character after a backslash is copied verbatim, whatever it is.
+                if ($escaped) {
+                    $out .= $char;
+                    $escaped = false;
+                    continue;
+                }
+
+                if ($char === '\\') {
+                    $out .= $char;
+                    $escaped = true;
+                    continue;
+                }
+
+                if ($inSingle) {
+                    if ($char === "'") {
+                        $inSingle = false;
                     }
+                    $out .= $char;
+                    continue;
+                }
+
+                if ($inDouble) {
+                    if ($char === '"') {
+                        $inDouble = false;
+                    }
+                    $out .= $char;
+                    continue;
+                }
+
+                if ($inBacktick) {
+                    if ($char === '`') {
+                        $inBacktick = false;
+                    }
+                    $out .= $char;
+                    continue;
                 }
 
-                // End of regex literal
                 if ($inRegex) {
-                    $inRegex = false;
-                    $result .= $char;
+                    // Inside [...] a "/" does not terminate the regex literal.
+                    // ($escaped is always false here: escapes are consumed above.)
+                    if ($inRegexCharClass) {
+                        if ($char === ']' && !$escaped) {
+                            $inRegexCharClass = false;
+                        }
+                        $out .= $char;
+                        continue;
+                    }
+
+                    if ($char === '[') {
+                        $inRegexCharClass = true;
+                        $out .= $char;
+                        continue;
+                    }
+
+                    if ($char === '/' && !$escaped) {
+                        $inRegex = false;
+                        $out .= $char;
+                        // Copy any trailing regex flags (ASCII letters) in one go
+                        $j = $i + 1;
+                        while ($j < $length && preg_match('/[a-zA-Z]/', $content[$j])) {
+                            $out .= $content[$j];
+                            $j++;
+                        }
+                        // Leave $i on the last flag; the loop's $i++ moves past it.
+                        $i = $j - 1;
+                        continue;
+                    }
+
+                    $out .= $char;
                     continue;
                 }
-            }
 
-            // Check for // comment outside of strings
-            if (!$inSingleQuote && !$inDoubleQuote && !$inRegex && $char === '/' && $nextChar === '/') {
-                // Check if this is not part of a URL (preceded by :)
-                if ($prevChar !== ':') {
-                    // Found a comment, remove everything from here to end of line
-                    break;
+                // From here on we are outside any string, template literal or regex.
+                // Start single-quoted string
+                if ($char === "'") {
+                    $inSingle = true;
+                    $out .= $char;
+                    continue;
                 }
-            }
 
-            $result .= $char;
-        }
+                // Start double-quoted string
+                if ($char === '"') {
+                    $inDouble = true;
+                    $out .= $char;
+                    continue;
+                }
+
+                // Start backtick template literal
+                if ($char === '`') {
+                    $inBacktick = true;
+                    $out .= $char;
+                    continue;
+                }
+
+                // Detect start of comment
+                if ($char === '/' && $next === '/') {
+                    // A "//" glued to a preceding ":" is assumed to be a URL (http://)
+                    $prevIndex = strlen($out) - 1;
+                    $prevChar = $prevIndex >= 0 ? $out[$prevIndex] : '';
+                    if ($prevChar === ':') {
+                        // Keep BOTH slashes and step past the second one. If the
+                        // second slash were re-scanned, the "/" just emitted would
+                        // make it look like the start of a regex literal and the
+                        // following text (including real comments) would be skipped.
+                        $out .= '//';
+                        $i++;
+                        continue;
+                    }
+
+                    // Skip until end of line
+                    $i += 2; // skip the //
+                    while ($i < $length && $content[$i] !== "\n" && $content[$i] !== "\r") {
+                        $i++;
+                    }
+                    // Re-emit the terminator (\r, \r\n or \n) so line structure is kept
+                    if ($i < $length && $content[$i] === "\r") {
+                        $out .= "\r";
+                        if ($i + 1 < $length && $content[$i + 1] === "\n") {
+                            $out .= "\n";
+                            $i++;
+                        }
+                    } elseif ($i < $length && $content[$i] === "\n") {
+                        $out .= "\n";
+                    }
+                    continue;
+                }
+
+                // Potential start of regex literal
+                if ($char === '/') {
+                    // Heuristic: look at the last non-whitespace character already
+                    // emitted; after an operator/punctuator (or at the very start)
+                    // a "/" is taken to open a regex literal.
+                    $prevNonSpaceIndex = strlen($out) - 1;
+                    while ($prevNonSpaceIndex >= 0 && ctype_space($out[$prevNonSpaceIndex])) {
+                        $prevNonSpaceIndex--;
+                    }
+                    $prevNonSpaceChar = $prevNonSpaceIndex >= 0 ? $out[$prevNonSpaceIndex] : '';
+
+                    if ($prevNonSpaceChar === '' || in_array($prevNonSpaceChar, ['=', '(', '[', ',', ':', '?', '!', '{', '}', ';', '+', '-', '*', '/', '%'], true)) {
+                        // This is likely a regex
+                        $inRegex = true;
+                        $out .= $char;
+                        continue;
+                    }
+                    // Otherwise it's a division operator
+                }
+
+                // Default: append char
+                $out .= $char;
+            }
 
-        return $result;
+            return $out;
     }
 }