committed by
GitHub
3 changed files with 311 additions and 0 deletions
@ -0,0 +1,148 @@ |
|||||
|
Translate to Spanish (español). |
||||
|
|
||||
|
Use the informal grammar (use "tú" instead of "usted"). |
||||
|
|
||||
|
For instructions or titles in imperative, keep them in imperative, for example "Edit it" to "Edítalo". |
||||
|
|
||||
|
There are special blocks of notes, tips and others that look like: |
||||
|
|
||||
|
/// note |
||||
|
|
||||
|
To translate it, keep the same line and add the translation after a vertical bar: |
||||
|
|
||||
|
/// note | Nota |
||||
|
|
||||
|
Some examples: |
||||
|
|
||||
|
Source: |
||||
|
|
||||
|
/// tip |
||||
|
|
||||
|
Result: |
||||
|
|
||||
|
/// tip | Consejo |
||||
|
|
||||
|
Source: |
||||
|
|
||||
|
/// details | Preview |
||||
|
|
||||
|
Result: |
||||
|
|
||||
|
/// details | Vista previa |
||||
|
|
||||
|
Source: |
||||
|
|
||||
|
/// warning |
||||
|
|
||||
|
Result: |
||||
|
|
||||
|
/// warning | Advertencia |
||||
|
|
||||
|
Source: |
||||
|
|
||||
|
/// info |
||||
|
|
||||
|
Result: |
||||
|
|
||||
|
/// info | Información |
||||
|
|
||||
|
Source: |
||||
|
|
||||
|
/// note | Technical Details |
||||
|
|
||||
|
Result: |
||||
|
|
||||
|
/// note | Detalles Técnicos |
||||
|
|
||||
|
--- |
||||
|
|
||||
|
For the next terms, use the following translations: |
||||
|
|
||||
|
* framework: framework (do not translate to "marco") |
||||
|
* performance: rendimiento |
||||
|
* program (verb): programar |
||||
|
* code (verb): programar |
||||
|
* type hints: anotaciones de tipos |
||||
|
* type annotations: anotaciones de tipos |
||||
|
* autocomplete: autocompletado |
||||
|
* completion (in the context of autocompletion): autocompletado |
||||
|
* feature: funcionalidad |
||||
|
* sponsor: sponsor |
||||
|
* host (in a podcast): host |
||||
|
* request (as in HTTP request): request |
||||
|
* response (as in HTTP response): response |
||||
|
* path operation function: path operation function (do not translate to "función de operación de ruta") |
||||
|
* path operation: path operation (do not translate to "operación de ruta") |
||||
|
* path (as in URL path): path (do not translate to "ruta") |
||||
|
* query (as in URL query): query (do not translate to "consulta") |
||||
|
* cookie (as in HTTP cookie): cookie |
||||
|
* header (as in HTTP header): header |
||||
|
* form (as in HTML form): formulario |
||||
|
* type checks: chequeo de tipos |
||||
|
* parse: parse |
||||
|
* parsing: parsing |
||||
|
* marshall: marshall |
||||
|
* library: paquete (do not translate to "biblioteca" or "librería") |
||||
|
* instance: instance (do not translate to "instancia") |
||||
|
* scratch the surface: tocar los conceptos básicos |
||||
|
* string: string |
||||
|
* bug: bug |
||||
|
* docs: documentación (do not translate to "documentos") |
||||
|
* cheat sheet: cheat sheet (do not translate to "chuleta") |
||||
|
* key (as in key-value pair, dictionary key): clave |
||||
|
* array (as in JSON array): array |
||||
|
* API key: API key (do not translate to "clave API") |
||||
|
* 100% test coverage: cobertura de tests del 100% |
||||
|
* back and forth: de un lado a otro |
||||
|
* I/O (as in "input and output"): I/O (do not translate to "E/S") |
||||
|
* Machine Learning: Machine Learning (do not translate to "Aprendizaje Automático") |
||||
|
* Deep Learning: Deep Learning (do not translate to "Aprendizaje Profundo") |
||||
|
* callback hell: callback hell (do not translate to "infierno de callbacks") |
||||
|
* tip: Consejo (do not translate to "tip") |
||||
|
* check: Revisa (do not translate to "chequea" or "comprobación) |
||||
|
* Cross-Origin Resource Sharing: Cross-Origin Resource Sharing (do not translate to "Compartición de Recursos de Origen Cruzado") |
||||
|
* Release Notes: Release Notes (do not translate to "Notas de la Versión") |
||||
|
* Semantic Versioning: Semantic Versioning (do not translate to "Versionado Semántico") |
||||
|
* dependable: dependable (do not translate to "confiable" or "fiable") |
||||
|
* list (as in Python list): list |
||||
|
* context manager: context manager (do not translate to "gestor de contexto" or "administrador de contexto") |
||||
|
* a little bit: un poquito |
||||
|
* graph (data structure, as in "dependency graph"): grafo (do not translate to "gráfico") |
||||
|
* form data: form data (do not translate to "datos de formulario" or "datos de form") |
||||
|
* import (as in code import): import (do not translate to "importación") |
||||
|
* JSON Schema: JSON Schema (do not translate to "Esquema JSON") |
||||
|
* embed: embeber (do not translate to "incrustar") |
||||
|
* request body: request body (do not translate to "cuerpo de la petición") |
||||
|
* response body: response body (do not translate to "cuerpo de la respuesta") |
||||
|
* cross domain: cross domain (do not translate to "dominio cruzado") |
||||
|
* cross origin: cross origin (do not translate to "origen cruzado") |
||||
|
* plugin: plugin (do not translate to "complemento" or "extensión") |
||||
|
* plug-in: plug-in (do not translate to "complemento" or "extensión") |
||||
|
* plug-ins: plug-ins (do not translate to "complementos" or "extensiones") |
||||
|
* full stack: full stack (do not translate to "pila completa") |
||||
|
* full-stack: full-stack (do not translate to "de pila completa") |
||||
|
* stack: stack (do not translate to "pila") |
||||
|
* loop (as in async loop): loop (do not translate to "bucle" or "ciclo") |
||||
|
* hard dependencies: dependencias obligatorias (do not translate to "dependencias duras") |
||||
|
* locking: locking (do not translate to "bloqueo") |
||||
|
* testing (as in software testing): escribir pruebas (do not translate to "probar") |
||||
|
* code base: code base (do not translate to "base de código") |
||||
|
* default: por defecto (do not translate to "predeterminado") |
||||
|
* default values: valores por defecto (do not translate to "valores predeterminados") |
||||
|
* media type: media type (do not translate to "tipo de medio") |
||||
|
* instantiate: crear un instance (do not translate to "instanciar") |
||||
|
* OAuth2 Scopes: Scopes de OAuth2 (do not translate to "Alcances de OAuth2") |
||||
|
* on the fly: sobre la marcha (do not translate to "al vuelo") |
||||
|
* terminal: terminal (femenine, as in "la terminal") |
||||
|
* terminals: terminales (plural femenine, as in "las terminales") |
||||
|
* lifespan: lifespan (do not translate to "vida útil" or "tiempo de vida") |
||||
|
* unload: quitar de memoria (do not translate to "descargar") |
||||
|
* mount (noun): mount (do not translate to "montura") |
||||
|
* mount (verb): montar |
||||
|
* statement (as in code statement): statement (do not translate to "declaración" or "sentencia") |
||||
|
* worker process: worker process (do not translate to "proceso trabajador" or "proceso de trabajo") |
||||
|
* worker processes: worker processes (do not translate to "procesos trabajadores" or "procesos de trabajo") |
||||
|
* worker: worker (do not translate to "trabajador") |
||||
|
* load balancer: load balancer (do not translate to "balanceador de carga") |
||||
|
* load balance: load balance (do not translate to "balancear carga") |
||||
|
* self hosting: self hosting (do not translate to "auto alojamiento") |
@ -0,0 +1 @@ |
|||||
|
pydantic-ai==0.0.15 |
@ -0,0 +1,162 @@ |
|||||
|
from functools import lru_cache |
||||
|
from pathlib import Path |
||||
|
from typing import Iterable |
||||
|
|
||||
|
import typer |
||||
|
import yaml |
||||
|
from pydantic_ai import Agent |
||||
|
|
||||
|
non_translated_sections = ( |
||||
|
"reference/", |
||||
|
"release-notes.md", |
||||
|
"fastapi-people.md", |
||||
|
"external-links.md", |
||||
|
"newsletter.md", |
||||
|
"management-tasks.md", |
||||
|
"management.md", |
||||
|
"contributing.md", |
||||
|
) |
||||
|
|
||||
|
|
||||
|
general_prompt = """ |
||||
|
For technical terms in English that don't have a common translation term use the original term in English. |
||||
|
|
||||
|
For code snippets or fragments, surrounded by backticks (`), don't translate the content, keep the original in English. For example, `list`, `dict`, keep them as is. |
||||
|
|
||||
|
The content is written in markdown, write the translation in markdown as well. Don't add triple backticks (`) around the generated translation content. |
||||
|
|
||||
|
When there's an example of code, the console or a terminal, normally surrounded by triple backticks and a keyword like "console" or "bash" (e.g. ```console), do not translate the content, keep the original in English. |
||||
|
|
||||
|
The original content will be surrounded by triple percentage signs (%) and you should translate it to the target language. Do not include the triple percentage signs in the translation. |
||||
|
""" |
||||
|
|
||||
|
|
||||
|
@lru_cache |
||||
|
def get_langs() -> dict[str, str]: |
||||
|
return yaml.safe_load(Path("docs/language_names.yml").read_text()) |
||||
|
|
||||
|
|
||||
|
def generate_lang_path(*, lang: str, path: Path) -> Path: |
||||
|
en_docs_path = Path("docs/en/docs") |
||||
|
assert str(path).startswith( |
||||
|
str(en_docs_path) |
||||
|
), f"Path must be inside {en_docs_path}" |
||||
|
lang_docs_path = Path(f"docs/{lang}/docs") |
||||
|
out_path = Path(str(path).replace(str(en_docs_path), str(lang_docs_path))) |
||||
|
return out_path |
||||
|
|
||||
|
|
||||
|
def translate_page(*, lang: str, path: Path) -> None: |
||||
|
langs = get_langs() |
||||
|
language = langs[lang] |
||||
|
lang_path = Path(f"docs/{lang}") |
||||
|
lang_path.mkdir(exist_ok=True) |
||||
|
lang_prompt_path = lang_path / "llm-prompt.md" |
||||
|
assert lang_prompt_path.exists(), f"Prompt file not found: {lang_prompt_path}" |
||||
|
lang_prompt_content = lang_prompt_path.read_text() |
||||
|
|
||||
|
en_docs_path = Path("docs/en/docs") |
||||
|
assert str(path).startswith( |
||||
|
str(en_docs_path) |
||||
|
), f"Path must be inside {en_docs_path}" |
||||
|
out_path = generate_lang_path(lang=lang, path=path) |
||||
|
out_path.parent.mkdir(parents=True, exist_ok=True) |
||||
|
original_content = path.read_text() |
||||
|
old_translation: str | None = None |
||||
|
if out_path.exists(): |
||||
|
old_translation = out_path.read_text() |
||||
|
agent = Agent("openai:gpt-4o") |
||||
|
|
||||
|
prompt_segments = [ |
||||
|
lang_prompt_content, |
||||
|
general_prompt, |
||||
|
] |
||||
|
if old_translation: |
||||
|
prompt_segments.extend( |
||||
|
[ |
||||
|
"There's an existing previous translation for this content that is probably outdated with old content or old instructions.", |
||||
|
"Update the translation given your current instructions and the original content.", |
||||
|
"If you have instructions to translate specific terms or phrases in a specific way, please follow those instructions instead of keeping the old and outdated content.", |
||||
|
"Previous translation:", |
||||
|
f"%%%\n{old_translation}%%%", |
||||
|
] |
||||
|
) |
||||
|
prompt_segments.extend( |
||||
|
[ |
||||
|
f"Translate to {language} ({lang}).", |
||||
|
"Original content:", |
||||
|
f"%%%\n{original_content}%%%", |
||||
|
] |
||||
|
) |
||||
|
prompt = "\n\n".join(prompt_segments) |
||||
|
|
||||
|
result = agent.run_sync(prompt) |
||||
|
out_content = f"{result.data.strip()}\n" |
||||
|
out_path.write_text(out_content) |
||||
|
|
||||
|
|
||||
|
def iter_paths_to_translate() -> Iterable[Path]: |
||||
|
""" |
||||
|
Iterate on the markdown files to translate in order of priority. |
||||
|
""" |
||||
|
first_dirs = [ |
||||
|
Path("docs/en/docs/learn"), |
||||
|
Path("docs/en/docs/tutorial"), |
||||
|
Path("docs/en/docs/advanced"), |
||||
|
Path("docs/en/docs/about"), |
||||
|
Path("docs/en/docs/how-to"), |
||||
|
] |
||||
|
first_parent = Path("docs/en/docs") |
||||
|
yield from first_parent.glob("*.md") |
||||
|
for dir_path in first_dirs: |
||||
|
yield from dir_path.rglob("*.md") |
||||
|
first_dirs_str = tuple(str(d) for d in first_dirs) |
||||
|
for path in Path("docs/en/docs").rglob("*.md"): |
||||
|
if str(path).startswith(first_dirs_str): |
||||
|
continue |
||||
|
if path.parent == first_parent: |
||||
|
continue |
||||
|
yield path |
||||
|
|
||||
|
|
||||
|
def translate_all(lang: str) -> None: |
||||
|
paths_to_process: list[Path] = [] |
||||
|
for path in iter_paths_to_translate(): |
||||
|
if str(path).replace("docs/en/docs/", "").startswith(non_translated_sections): |
||||
|
continue |
||||
|
paths_to_process.append(path) |
||||
|
print("Original paths:") |
||||
|
for p in paths_to_process: |
||||
|
print(f" - {p}") |
||||
|
print(f"Total original paths: {len(paths_to_process)}") |
||||
|
missing_paths: list[Path] = [] |
||||
|
skipped_paths: list[Path] = [] |
||||
|
for p in paths_to_process: |
||||
|
lang_path = generate_lang_path(lang=lang, path=p) |
||||
|
if lang_path.exists(): |
||||
|
skipped_paths.append(p) |
||||
|
continue |
||||
|
missing_paths.append(p) |
||||
|
print("Paths to skip:") |
||||
|
for p in skipped_paths: |
||||
|
print(f" - {p}") |
||||
|
print(f"Total paths to skip: {len(skipped_paths)}") |
||||
|
print("Paths to process:") |
||||
|
for p in missing_paths: |
||||
|
print(f" - {p}") |
||||
|
print(f"Total paths to process: {len(missing_paths)}") |
||||
|
for p in missing_paths: |
||||
|
print(f"Translating: {p}") |
||||
|
translate_page(lang="es", path=p) |
||||
|
print(f"Done translating: {p}") |
||||
|
|
||||
|
|
||||
|
def main(*, lang: str, path: Path = None) -> None: |
||||
|
if path: |
||||
|
translate_page(lang=lang, path=path) |
||||
|
else: |
||||
|
translate_all(lang=lang) |
||||
|
|
||||
|
|
||||
|
if __name__ == "__main__": |
||||
|
typer.run(main) |
Loading…
Reference in new issue