fix(actions): don't swallow HTML entities into linkified URLs (#38239)

In the Actions log viewer, a double-quoted URL renders with a stray extra `;` after it. Reported in `gitea/runner#1046` Remove the buggy AI slop `linkifyURLs` and use new approach to process URLs in text --------- Signed-off-by: wxiaoguang <wxiaoguang@gmail.com> Co-authored-by: wxiaoguang <wxiaoguang@gmail.com>
2026-06-29 22:31:28 +00:00 · 2026-06-28 13:37:16 +02:00
parent 5b9251150c
commit ce8cf22af9
7 changed files with 104 additions and 117 deletions
--- a/web_src/js/modules/codeeditor/utils.test.ts
+++ b/web_src/js/modules/codeeditor/utils.test.ts
@@ -1,41 +1,4 @@
-import {findUrlAtPosition, trimUrlPunctuation, urlRawRegex} from './utils.ts';
-
-function matchUrls(text: string): string[] {
-  return Array.from(text.matchAll(urlRawRegex), (m) => trimUrlPunctuation(m[0]));
-}
-
-test('matchUrls', () => {
-  expect(matchUrls('visit https://example.com for info')).toEqual(['https://example.com']);
-  expect(matchUrls('see https://example.com.')).toEqual(['https://example.com']);
-  expect(matchUrls('see https://example.com, and')).toEqual(['https://example.com']);
-  expect(matchUrls('see https://example.com; and')).toEqual(['https://example.com']);
-  expect(matchUrls('(https://example.com)')).toEqual(['https://example.com']);
-  expect(matchUrls('"https://example.com"')).toEqual(['https://example.com']);
-  expect(matchUrls('https://example.com/path?q=1&b=2#hash')).toEqual(['https://example.com/path?q=1&b=2#hash']);
-  expect(matchUrls('https://example.com/path?q=1&b=2#hash.')).toEqual(['https://example.com/path?q=1&b=2#hash']);
-  expect(matchUrls('https://x.co')).toEqual(['https://x.co']);
-  expect(matchUrls('https://example.com/path_(wiki)')).toEqual(['https://example.com/path_(wiki)']);
-  expect(matchUrls('https://en.wikipedia.org/wiki/Rust_(programming_language)')).toEqual(['https://en.wikipedia.org/wiki/Rust_(programming_language)']);
-  expect(matchUrls('(https://en.wikipedia.org/wiki/Rust_(programming_language))')).toEqual(['https://en.wikipedia.org/wiki/Rust_(programming_language)']);
-  expect(matchUrls('http://example.com')).toEqual(['http://example.com']);
-  expect(matchUrls('no url here')).toEqual([]);
-  expect(matchUrls('https://a.com and https://b.com')).toEqual(['https://a.com', 'https://b.com']);
-  expect(matchUrls('[![](https://img.shields.io/npm/v/pkg.svg?style=flat)](https://www.npmjs.org/package/pkg)')).toEqual(['https://img.shields.io/npm/v/pkg.svg?style=flat', 'https://www.npmjs.org/package/pkg']);
-});
-
-test('trimUrlPunctuation', () => {
-  expect(trimUrlPunctuation('https://example.com.')).toEqual('https://example.com');
-  expect(trimUrlPunctuation('https://example.com,')).toEqual('https://example.com');
-  expect(trimUrlPunctuation('https://example.com;')).toEqual('https://example.com');
-  expect(trimUrlPunctuation('https://example.com:')).toEqual('https://example.com');
-  expect(trimUrlPunctuation("https://example.com'")).toEqual('https://example.com');
-  expect(trimUrlPunctuation('https://example.com"')).toEqual('https://example.com');
-  expect(trimUrlPunctuation('https://example.com.,;')).toEqual('https://example.com');
-  expect(trimUrlPunctuation('https://example.com/path')).toEqual('https://example.com/path');
-  expect(trimUrlPunctuation('https://example.com/path_(wiki)')).toEqual('https://example.com/path_(wiki)');
-  expect(trimUrlPunctuation('https://example.com)')).toEqual('https://example.com');
-  expect(trimUrlPunctuation('https://en.wikipedia.org/wiki/Rust_(lang))')).toEqual('https://en.wikipedia.org/wiki/Rust_(lang)');
-});
+import {findUrlAtPosition} from './utils.ts';

 test('findUrlAtPosition', () => {
  const doc = 'visit https://example.com for info';
--- a/web_src/js/modules/codeeditor/utils.ts
+++ b/web_src/js/modules/codeeditor/utils.ts
@@ -1,5 +1,6 @@
 import type {EditorView, ViewUpdate} from '@codemirror/view';
 import type {CodemirrorModules} from './main.ts';
+import {trimUrlPunctuation, urlRawRegex} from '../../utils/url.ts';

 /** Remove trailing whitespace from all lines in the editor. */
 export function trimTrailingWhitespaceFromView(view: EditorView): void {
@@ -15,22 +16,9 @@ export function trimTrailingWhitespaceFromView(view: EditorView): void {
  if (changes.length) view.dispatch({changes});
 }

-/** Matches URLs, excluding characters that are never valid unencoded in URLs per RFC 3986. */
-export const urlRawRegex = /\bhttps?:\/\/[^\s<>[\]]+/gi;
-
-/** Strip trailing punctuation that is likely not part of the URL. */
-export function trimUrlPunctuation(url: string): string {
-  url = url.replace(/[.,;:'"]+$/, '');
-  // Strip trailing closing parens only if unbalanced (not part of the URL like Wikipedia links)
-  while (url.endsWith(')') && (url.match(/\(/g) || []).length < (url.match(/\)/g) || []).length) {
-    url = url.slice(0, -1);
-  }
-  return url;
-}
-
 /** Find the URL at the given character position in a document string, or null if none. */
 export function findUrlAtPosition(doc: string, pos: number): string | null {
-  for (const match of doc.matchAll(urlRawRegex)) {
+  for (const match of doc.matchAll(urlRawRegex())) {
    const url = trimUrlPunctuation(match[0]);
    if (match.index !== undefined && pos >= match.index && pos < match.index + url.length) {
      return url;
@@ -67,7 +55,7 @@ export function goToDefinitionAt(cm: CodemirrorModules, view: EditorView, pos: n
 export function clickableUrls(cm: CodemirrorModules) {
  const urlMark = cm.view.Decoration.mark({class: 'cm-url'});
  const urlDecorator = new cm.view.MatchDecorator({
-    regexp: urlRawRegex,
+    regexp: urlRawRegex(),
    decorate: (add, from, _to, match) => {
      const trimmed = trimUrlPunctuation(match[0]);
      add(from, from + trimmed.length, urlMark);