# Improve: [newmm tokenizer] Change regular expression of "non-thai-characters" #1292
# This file contains bidirectional Unicode text that may be interpreted or compiled
# differently than what appears below. To review, open the file in an editor that
# reveals hidden Unicode characters.
# Learn more about bidirectional Unicode characters
# Workflow name as displayed in the GitHub Actions UI.
name: Lint

# Triggers: pushes to `dev` and pull requests targeting `dev`.
# `paths-ignore` lists Markdown files, YAML files, and everything under docs/
# as paths that should not trigger this workflow.
on:
  push:
    branches:
      - dev
    paths-ignore:
      - '**.md'
      - '**.yml'
      - 'docs/**'
  pull_request:
    branches:
      - dev
    paths-ignore:
      - '**.md'
      - '**.yml'
      - 'docs/**'
jobs:
  # Single job: check formatting with Black, install the package and its
  # dependencies, then lint the repository with flake8.
  build:
    runs-on: ubuntu-20.04
    strategy:
      matrix:
        # Quoted so the version is a string rather than a YAML float
        # (an unquoted 3.10 would silently become 3.1).
        python-version: ["3.8"]
    steps:
      - uses: actions/checkout@v2
      - name: Set up Python ${{ matrix.python-version }}
        uses: actions/setup-python@v4
        with:
          python-version: ${{ matrix.python-version }}
      # Formatting check only (--check): reports differences, rewrites nothing.
      - name: Check Code Format with Black
        uses: psf/black@stable
        with:
          options: "--check --verbose --line-length=79"
          src: "./pythainlp"
          version: "~= 22.0"
      - name: Install dependencies
        run: |
          python -m pip install --upgrade pip
          if [ -f requirements.txt ]; then pip install -r requirements.txt; fi
          pip install "h5py>=2.10.0,<3" "tensorflow>=2.3.1,<3"
          pip install torch==1.7.0+cpu -f https://download.pytorch.org/whl/torch_stable.html
          pip install deepcut
          pip install ".[full]"
          pip install flake8 flake8-commas flake8-comprehensions flake8-tidy-imports
      # Two passes: the first fails the build on the selected error codes,
      # the second only reports (--exit-zero) and never fails the build.
      - name: Lint with flake8
        run: |
          # stop the build if there are Python syntax errors or undefined names
          flake8 . --count --select=E9,F63,F7,F82 --show-source --statistics
          # exit-zero treats all errors as warnings. The GitHub editor is 127 chars wide
          flake8 . --count --exit-zero --max-complexity=10 --max-line-length=127 --statistics