diff --git a/.dockerignore b/.dockerignore new file mode 100644 index 0000000..0629895 --- /dev/null +++ b/.dockerignore @@ -0,0 +1,42 @@ +# Python +__pycache__/ +*.py[cod] +*$py.class +*.so +.Python +*.egg-info/ +dist/ +build/ + +# Virtual environments +venv/ +env/ +ENV/ + +# Models cache (will be mounted as volume) +models/ + +# IDE +.vscode/ +.idea/ +*.swp +*.swo + +# Git +.git/ +.gitignore + +# Documentation +README.md +CLAUDE.md +*.md + +# Environment +.env +.env.local +.env.*.local + +# Docker +.dockerignore +Dockerfile +docker-compose.yml diff --git a/app/translator.py b/app/translator.py index 2c3e515..78c4274 100644 --- a/app/translator.py +++ b/app/translator.py @@ -473,7 +473,8 @@ class TranslationService: ).to(self.device) # Generate translation - NLLB uses forced_bos_token_id - forced_bos_token_id = tokenizer.lang_code_to_id[tgt_code] + # Convert language code to token ID + forced_bos_token_id = tokenizer.convert_tokens_to_ids(tgt_code) with torch.no_grad(): translated = model.generate(