Feature/post media translations (#42)

* chore: updated todo with translation ideas

* feat: first take at the implementation of translations

* fix: small addition for the translation feature

* feat: support language switching in the editor and preview

* feat: better handling of long bodies by not running them through a json envelope

* fix: unknown macros have better fallback

* feat: api for python to get translations

* fix: strip dumb prefix of content in translation

* feat: extend meta diff for translations

* feat: hook up translations to rebuild-from-disk

* feat: generation of the website prefers project language, falling back to canonical language

* fix: crashes during rendering

* feat: translation validation report

* fix: made the translation validation actually work

* chore: reorganization of menu

* fix: some topics cleanup

* chore: updated doc

* feat: translations for media

* feat: more aligned in UI/UX

* feat: edit translations possible

* chore: added full multi-language todo

* chore: updated todo for clarity

* feat: implementation of full multi-linguality

* fix: page creation creates pages

* fix: flags on every page

* fix: better prompt

* feat: made MCP server aware of language content

* feat: python tools for translations

* fix: better fill-in-translations

* fix: better prompt for translation. maybe.

* fix: losing posts from search due to translation process

* fix: translation validation handles in-db content and fill-in of missing translations fixed to flush

* fix: faster scanning for infilling of missing translations

* chore: updated agent instructions

* feat: calendar and tag cloud respect current language now

* fix: retries going up

* fix: got metadata-diff and rebuild into sync

* fix: extended meta-diff for timestamps

* fix: made website validation look at translated content, too

* fix: multi-lingual search

* chore: refactor Editor.tsx into two separate editors

* feat: do language detection when no explicit language given

---------

Co-authored-by: hugo <hugoms@me.com>
This commit is contained in:
Georg Bauer
2026-03-09 14:43:18 +01:00
committed by GitHub
parent f1c9038803
commit b855d61524
116 changed files with 19954 additions and 2094 deletions

View File

@@ -43,6 +43,7 @@ function createMockDeps() {
const postEngine = {
getPost: vi.fn(),
upsertPostTranslation: vi.fn(),
} as any;
return { chatEngine, providers, mediaEngine, postEngine };
@@ -182,3 +183,283 @@ describe('OneShotTasks.analyzePost', () => {
expect(deps.providers.resolveModel).toHaveBeenCalledWith('custom-model-id');
});
});
describe('OneShotTasks.translatePost', () => {
let deps: ReturnType<typeof createMockDeps>;
let tasks: OneShotTasks;
beforeEach(() => {
vi.clearAllMocks();
deps = createMockDeps();
tasks = new OneShotTasks(deps.providers, deps.chatEngine, deps.mediaEngine, deps.postEngine);
});
it('instructs the AI to leave fenced code blocks untranslated', async () => {
deps.postEngine.getPost.mockResolvedValue({
id: 'post-1',
title: 'My Post',
excerpt: 'Summary',
content: 'Intro\n\n```ts\nconst label = "Hello";\n```',
language: 'en',
status: 'draft',
});
deps.postEngine.upsertPostTranslation.mockResolvedValue({
id: 'translation-1',
translationFor: 'post-1',
language: 'fr',
title: 'Mon Post',
excerpt: 'Resume',
content: 'Intro\n\n```ts\nconst label = "Hello";\n```',
});
mockGenerateText
.mockResolvedValueOnce({
text: '{"title":"Mon Post","excerpt":"Resume"}',
} as any)
.mockResolvedValueOnce({
text: 'Intro\n\n```ts\nconst label = "Hello";\n```',
} as any);
await tasks.translatePost('post-1', 'fr');
expect(mockGenerateText).toHaveBeenNthCalledWith(2, expect.objectContaining({
system: expect.stringContaining('Leave text inside fenced code blocks untranslated.'),
}));
});
it('translates markdown body outside a JSON envelope', async () => {
deps.postEngine.getPost.mockResolvedValue({
id: 'post-1',
title: 'My Post',
excerpt: 'Summary',
content: 'Intro\n\n```ts\nconst config = { hello: "world" };\n```\n\nEnd.',
language: 'en',
status: 'draft',
});
deps.postEngine.upsertPostTranslation.mockResolvedValue({
id: 'translation-1',
translationFor: 'post-1',
language: 'fr',
title: 'Mon Post',
excerpt: 'Resume',
content: 'Bonjour',
});
mockGenerateText
.mockResolvedValueOnce({
text: '{"title":"Mon Post","excerpt":"Resume"}',
} as any)
.mockResolvedValueOnce({
text: 'Introduction\n\n```ts\nconst config = { hello: "world" };\n```\n\nFin.',
} as any);
const result = await tasks.translatePost('post-1', 'fr');
expect(result.success).toBe(true);
expect(mockGenerateText).toHaveBeenCalledTimes(2);
expect(mockGenerateText).toHaveBeenNthCalledWith(1, expect.objectContaining({
system: expect.stringContaining('keys title and excerpt'),
}));
expect(mockGenerateText).toHaveBeenNthCalledWith(2, expect.objectContaining({
system: expect.stringContaining('Return ONLY the translated Markdown body'),
}));
expect(deps.postEngine.upsertPostTranslation).toHaveBeenCalledWith('post-1', 'fr', {
title: 'Mon Post',
excerpt: 'Resume',
content: 'Introduction\n\n```ts\nconst config = { hello: "world" };\n```\n\nFin.',
});
});
it('passes the raw markdown body without a leading content label', async () => {
deps.postEngine.getPost.mockResolvedValue({
id: 'post-1',
title: 'My Post',
excerpt: 'Summary',
content: '# Heading\n\nBody text',
language: 'en',
status: 'draft',
});
deps.postEngine.upsertPostTranslation.mockResolvedValue({
id: 'translation-1',
translationFor: 'post-1',
language: 'fr',
title: 'Mon Post',
excerpt: 'Resume',
content: '# Titre\n\nTexte',
});
mockGenerateText
.mockResolvedValueOnce({
text: '{"title":"Mon Post","excerpt":"Resume"}',
} as any)
.mockResolvedValueOnce({
text: '# Titre\n\nTexte',
} as any);
await tasks.translatePost('post-1', 'fr');
expect(mockGenerateText).toHaveBeenNthCalledWith(2, expect.objectContaining({
prompt: '# Heading\n\nBody text',
}));
});
it('strips an accidental leading content label from translated markdown', async () => {
deps.postEngine.getPost.mockResolvedValue({
id: 'post-1',
title: 'Mein Beitrag',
excerpt: 'Zusammenfassung',
content: '# Uberschrift\n\nText',
language: 'de',
status: 'draft',
});
deps.postEngine.upsertPostTranslation.mockResolvedValue({
id: 'translation-1',
translationFor: 'post-1',
language: 'en',
title: 'My Post',
excerpt: 'Summary',
content: '# Heading\n\nText',
});
mockGenerateText
.mockResolvedValueOnce({
text: '{"title":"My Post","excerpt":"Summary"}',
} as any)
.mockResolvedValueOnce({
text: 'content:\n\n# Heading\n\nText',
} as any);
await tasks.translatePost('post-1', 'en');
expect(deps.postEngine.upsertPostTranslation).toHaveBeenCalledWith('post-1', 'en', {
title: 'My Post',
excerpt: 'Summary',
content: '# Heading\n\nText',
});
});
it('instructs the AI to translate only — never invent or add content', async () => {
deps.postEngine.getPost.mockResolvedValue({
id: 'post-1',
title: 'My Post',
excerpt: 'Summary',
content: '# Hello\n\nWorld',
language: 'en',
status: 'draft',
});
deps.postEngine.upsertPostTranslation.mockResolvedValue({
id: 'translation-1',
translationFor: 'post-1',
language: 'fr',
title: 'Mon Post',
excerpt: 'Resume',
content: '# Bonjour\n\nMonde',
});
mockGenerateText
.mockResolvedValueOnce({ text: '{"title":"Mon Post","excerpt":"Resume"}' } as any)
.mockResolvedValueOnce({ text: '# Bonjour\n\nMonde' } as any);
await tasks.translatePost('post-1', 'fr');
const contentSystemPrompt = mockGenerateText.mock.calls[1][0].system as string;
expect(contentSystemPrompt).toMatch(/do not invent|do not add|only translate/i);
expect(contentSystemPrompt).toMatch(/macro|shortcode|non-translatable/i);
});
it('instructs the AI to keep markdown link text unchanged and translate surrounding prose', async () => {
deps.postEngine.getPost.mockResolvedValue({
id: 'post-1',
title: 'USearch Library',
excerpt: '',
content: '[unum-cloud/USearch: Fast Search](https://github.com/unum-cloud/USearch) - drin was drauf steht. Eine Library.',
language: 'de',
status: 'draft',
});
deps.postEngine.upsertPostTranslation.mockResolvedValue({
id: 'translation-1',
translationFor: 'post-1',
language: 'en',
title: 'USearch Library',
excerpt: '',
content: '[unum-cloud/USearch: Fast Search](https://github.com/unum-cloud/USearch) - what it says on the tin. A library.',
});
mockGenerateText
.mockResolvedValueOnce({ text: '{"title":"USearch Library","excerpt":""}' } as any)
.mockResolvedValueOnce({
text: '[unum-cloud/USearch: Fast Search](https://github.com/unum-cloud/USearch) - what it says on the tin. A library.',
} as any);
await tasks.translatePost('post-1', 'en');
const contentSystemPrompt = mockGenerateText.mock.calls[1][0].system as string;
expect(contentSystemPrompt).toMatch(/link text/i);
expect(contentSystemPrompt).toMatch(/url/i);
});
it('falls back to source title and excerpt when metadata JSON is invalid', async () => {
deps.postEngine.getPost.mockResolvedValue({
id: 'post-1',
title: 'My Post',
excerpt: 'Summary',
content: 'Intro',
language: 'en',
status: 'draft',
});
deps.postEngine.upsertPostTranslation.mockResolvedValue({
id: 'translation-1',
translationFor: 'post-1',
language: 'fr',
title: 'My Post',
excerpt: 'Summary',
content: 'Bonjour',
});
mockGenerateText
.mockResolvedValueOnce({
text: 'not valid json',
} as any)
.mockResolvedValueOnce({
text: 'Bonjour',
} as any);
const result = await tasks.translatePost('post-1', 'fr');
expect(result.success).toBe(true);
expect(deps.postEngine.upsertPostTranslation).toHaveBeenCalledWith('post-1', 'fr', {
title: 'My Post',
excerpt: 'Summary',
content: 'Bonjour',
});
});
it('passes status published when autoPublish is set', async () => {
deps.postEngine.getPost.mockResolvedValue({
id: 'post-1',
title: 'My Post',
excerpt: 'Summary',
content: 'Hello world',
language: 'en',
status: 'published',
});
deps.postEngine.upsertPostTranslation.mockResolvedValue({
id: 'translation-1',
translationFor: 'post-1',
language: 'fr',
title: 'Mon Post',
excerpt: 'Résumé',
content: 'Bonjour le monde',
});
mockGenerateText
.mockResolvedValueOnce({
text: '{"title":"Mon Post","excerpt":"Résumé"}',
} as any)
.mockResolvedValueOnce({
text: 'Bonjour le monde',
} as any);
const result = await tasks.translatePost('post-1', 'fr', { autoPublish: true });
expect(result.success).toBe(true);
expect(deps.postEngine.upsertPostTranslation).toHaveBeenCalledWith('post-1', 'fr', {
title: 'Mon Post',
excerpt: 'Résumé',
content: 'Bonjour le monde',
status: 'published',
});
});
});