.dockerignore
Dockerfile
Makefile
README.md
pyproject.toml
ldnoobw/de
ldnoobw/en
ldnoobw/es
ldnoobw/fr
ldnoobw/ja
ldnoobw/pt
src/cc_net_prepro.py
src/doc_Gopher_statistics.py
src/doc_c4_statistics.py
src/doc_quality_local.py
src/doc_quality_local_python.py
src/doc_quality_transform.py
src/doc_quality_transform_python.py
src/doc_quality_utils.py
src/dpk_doc_quality_transform_python.egg-info/PKG-INFO
src/dpk_doc_quality_transform_python.egg-info/SOURCES.txt
src/dpk_doc_quality_transform_python.egg-info/dependency_links.txt
src/dpk_doc_quality_transform_python.egg-info/requires.txt
src/dpk_doc_quality_transform_python.egg-info/top_level.txt
test/test_doc_quality.py
test/test_doc_quality_python.py
test-data/expected/metadata.json
test-data/expected/test1.parquet
test-data/input/test1.parquet