{"id":27319,"library":"pyvi","title":"PyVi","description":"PyVi is a Python toolkit for Vietnamese language processing, providing tokenization (word segmentation), part-of-speech tagging, and named entity recognition. Currently at version 0.1.1, the project appears to be in maintenance mode with no recent updates.","status":"maintenance","version":"0.1.1","language":"python","source_language":"en","source_url":"https://github.com/trungtv/pyvi","tags":["vietnamese","nlp","tokenization","pos-tagger"],"install":[{"cmd":"pip install pyvi","lang":"bash","label":"pip"}],"dependencies":[],"imports":[{"note":"Wrong import; correct class is ViTokenizer.","wrong":"from pyvi import tokenize","symbol":"Tokenizer","correct":"from pyvi import ViTokenizer"},{"note":"Wrong import; correct class is ViPosTagger.","wrong":"from pyvi import pos_tag","symbol":"POSTagger","correct":"from pyvi import ViPosTagger"}],"quickstart":{"code":"from pyvi import ViTokenizer, ViPosTagger\n\ntext = 'Học sinh học sinh học'\ntokens = ViTokenizer.tokenize(text)\nprint(tokens)\n# Output: Học_sinh học_sinh học\n\n# POS tagging (postagging takes the tokenized string, not a list)\ntags = ViPosTagger.postagging(tokens)\nprint(tags)\n# Output: (['Học_sinh', 'học_sinh', 'học'], ['N', 'N', 'V'])","lang":"python","description":"Tokenize Vietnamese text and perform POS tagging."},"warnings":[{"fix":"Use tokenizer output directly or replace underscores with spaces as needed.","message":"The tokenizer combines syllables with underscores (e.g., 'Học_sinh'). Do not split on spaces before feeding to downstream tasks without handling underscores.","severity":"gotcha","affected_versions":"all versions"},{"fix":"Consider alternatives like underthesea or VnCoreNLP for better accuracy.","message":"The package has not been updated since 2020. Models may be outdated compared to newer approaches.","severity":"deprecated","affected_versions":"0.1.1"}],"env_vars":null,"last_verified":"2026-04-27T00:00:00.000Z","next_check":"2026-07-26T00:00:00.000Z","problems":[{"fix":"Run: pip install pyvi","cause":"PyVi is not installed.","error":"ModuleNotFoundError: No module named 'pyvi'"},{"fix":"Use: from pyvi import ViTokenizer","cause":"Incorrect import statement.","error":"AttributeError: module 'pyvi' has no attribute 'ViTokenizer'"},{"fix":"Reinstall pyvi: pip install --force-reinstall pyvi","cause":"Package data files missing; likely a broken installation.","error":"FileNotFoundError: [Errno 2] No such file or directory: 'pyvi/ViTokenizer/data/tokenized_data.pkl'"}],"ecosystem":"pypi","meta_description":null,"install_score":null,"install_tag":null,"quickstart_score":null,"quickstart_tag":null}