feat: Add comprehensive tests for contentPattern and glob pattern matching

- Implemented final verification tests for contentPattern to validate behavior with empty strings, dangerous patterns, and normal patterns.
- Created glob pattern matching tests to verify regex conversion and matching functionality.
- Developed infinite loop risk tests using Worker threads to isolate potential blocking operations.
- Introduced optimized contentPattern tests to validate improvements in the findMatches function.
- Added verification tests to assess the effectiveness of contentPattern optimizations.
- Conducted safety tests for contentPattern to identify edge cases and potential vulnerabilities.
- Implemented unrestricted loop tests to analyze infinite loop risks without match limits.
- Developed tests for zero-width pattern detection logic to ensure proper handling of dangerous regex patterns.
2026-02-10 02:24:35 +08:00 · 2026-02-09 11:13:01 +08:00
parent dfe153778c
commit 964292ebdb
62 changed files with 7588 additions and 374 deletions
--- a/test-zero-width-fixed.js
+++ b/test-zero-width-fixed.js
@@ -0,0 +1,88 @@
+/**
+ * 测试零宽度模式的检测逻辑
+ */
+
+console.log('=== 零宽度模式检测测试 ===\n');
+
+const testPatterns = [
+  { pattern: '', desc: '空字符串' },
+  { pattern: 'x*', desc: '零宽量词' },
+  { pattern: 'a|', desc: '或空匹配' },
+  { pattern: '.*', desc: '点星' },
+  { pattern: 'CCW', desc: '正常模式' },
+  { pattern: 'TODO', desc: '正常模式2' }
+];
+
+for (const test of testPatterns) {
+  console.log(`\n测试: ${test.desc}`);
+  console.log(`模式: "${test.pattern}"`);
+
+  try {
+    const regex = new RegExp(test.pattern, 'gm');
+    const emptyTest = regex.exec('');
+
+    console.log('第1次匹配:', emptyTest ? {
+      match: emptyTest[0],
+      index: emptyTest.index,
+      length: emptyTest[0].length
+    } : 'null');
+
+    if (emptyTest && emptyTest[0] === '' && emptyTest.index === 0) {
+      const secondMatch = regex.exec('');
+      console.log('第2次匹配:', secondMatch ? {
+        match: secondMatch[0],
+        index: secondMatch.index,
+        length: secondMatch[0].length
+      } : 'null');
+
+      if (secondMatch && secondMatch.index === 0) {
+        console.log('❌ 危险: 卡在位置 0');
+      } else {
+        console.log(`✅ 安全: 第2次匹配在位置 ${secondMatch?.index || '(end)'}`);
+      }
+    } else {
+      console.log(`✅ 安全: 第1次匹配后位置 = ${emptyTest?.index || '(end)'}`);
+    }
+  } catch (error) {
+    console.log(`❌ 错误: ${error.message}`);
+  }
+}
+
+// Summary of the findings above, printed as fixed text.
+console.log(`\n${'='.repeat(60)}`);
+console.log('\n结论:');
+console.log('问题分析:');
+console.log('- 空字符串 "" 应该被 pattern === \'\' 检查捕获');
+// A zero-length match on a global regex leaves lastIndex unchanged, so a second
+// exec('') matches at index 0 again instead of returning null. The three
+// patterns below therefore DO get stuck on the empty string; the messages say so.
+console.log('- "x*" 在空字符串上第2次仍匹配位置 0，会卡住');
+console.log('- "a|" 在空字符串上第2次仍匹配位置 0，会卡住');
+console.log('- ".*" 在空字符串上第2次仍匹配位置 0，会卡住');
+
+console.log('\n真正的危险是:');
+console.log('- 在**非空内容**上反复匹配空字符串');
+// A bare exec() loop never leaves index 0 for "x*"; only iteration helpers that
+// advance past empty matches (such as matchAll) visit each of the 4 positions.
+console.log('- 例如: "x*" 在 "abc" 上用 exec 循环会停在位置 0（matchAll 才会在每个位置各匹配一次，共 4 次）');
+
+console.log('\n真正的危险测试:');
+console.log('模式 "x*" 在内容 "abc" 上的行为:');
+
+const regex = new RegExp('x*', 'gm');
+const content = 'abc';
+let match;
+let count = 0;
+let lastIndex = -1;
+
+while ((match = regex.exec(content)) !== null && count < 10) {
+  count++;
+  console.log(`  匹配 #${count}: "${match[0]}" at index ${match.index}`);
+
+  if (match.index === lastIndex) {
+    console.log(`  ❌ 卡住! 停留在 index ${match.index}`);
+    break;
+  }
+  lastIndex = match.index;
+}
+
+if (count >= 10) {
+  console.log('  ⚠️ 达到 10 次迭代限制');
+}
+
+console.log('\n结论: "x*" 会在每个字符位置匹配空字符串!');
+console.log('这就是为什么需要位置前进检查 (match.index === lastIndex)');