Source code for pythainlp.tools

# -*- coding: utf-8 -*-
"""
PyThaiNLP data tools

For text processing and text conversion, see pythainlp.util
"""
import os

import pythainlp

PYTHAINLP_DATA_DIR = "pythainlp-data"


[docs]def get_full_data_path(path: str) -> str: """ This function joins path of :mod:`pythainlp` data directory and the given path, and returns the full path. :return: full path given the name of dataset :rtype: str :Example: :: from pythainlp.tools import get_full_data_path get_full_data_path('ttc_freq.txt') # output: '/root/pythainlp-data/ttc_freq.txt' """ return os.path.join(get_pythainlp_data_path(), path)
[docs]def get_pythainlp_data_path() -> str: """ Returns the full path where PyThaiNLP keeps its (downloaded) data. If the directory does not yet exist, it will be created. The path can be specified through the environment variable :envvar:`PYTHAINLP_DATA_DIR`. By default, `~/pythainlp-data` will be used. :return: full path of directory for :mod:`pythainlp` downloaded data :rtype: str :Example: :: from pythainlp.tools import get_pythainlp_data_path get_pythainlp_data_path() # output: '/root/pythainlp-data' """ path = os.getenv('PYTHAINLP_DATA_DIR', os.path.join("~", PYTHAINLP_DATA_DIR)) path = os.path.expanduser(path) os.makedirs(path, exist_ok=True) return path
[docs]def get_pythainlp_path() -> str: """ This function returns full path of PyThaiNLP code :return: full path of :mod:`pythainlp` code :rtype: str :Example: :: from pythainlp.tools import get_pythainlp_path get_pythainlp_path() # output: '/usr/local/lib/python3.6/dist-packages/pythainlp' """ return os.path.dirname(pythainlp.__file__)