Path |
Digest |
Size |
clean_text_my/__init__.py |
sha256=_CN5C9fJHDzdAC8zNpeA6UFJfH3DCg8VYd2QO3q2anY
|
179 |
clean_text_my/deduplication.py |
sha256=KyTwx1lSQBUXXOS-_oXKs-RmAS9Z6gzNB0fcstdnBCs
|
3719 |
clean_text_my/download_dataset.py |
sha256=Jd5DiftsYUHynoaM7fumBDzG9iqOdqHbsErCh9e94As
|
631 |
clean_text_my/logging.py |
sha256=S3Qu35aeYpJt9orM3kUFpxomma-yHhLVM0d_Sd9LEeo
|
973 |
clean_text_my/manipulation.py |
sha256=CtBdME0231ZGMn6vTag2lH5QJ7zJVYUDiqX7XKYqQ-8
|
2528 |
clean_text_my/postprocessing.py |
sha256=2S_YTPoIILKH_nRt_iJUtz0BNKQ00RZkLDcmjO_I9aU
|
4114 |
clean_text_my/utils.py |
sha256=2JrQH4OjoCmbbEI6wZyKqr-VlvVnqusyrJFLu9jNywI
|
1127 |
clean_text_my/text_dedup/__init__.py |
sha256=vNpo7t6C_3ycPlRzHgGEc6JLyFmSpoRis7IYbIsu7VQ
|
240 |
clean_text_my/text_dedup/minhash.py |
sha256=Lr-n5FpnxvpBTI_EcqKY7vK7npH93lPnfmTF2o5SnBo
|
13281 |
clean_text_my/text_dedup/utils/__init__.py |
sha256=tqMsTWpCx14W6_68Rvids_9o82a8O_PdaXB0f64s1iY
|
1680 |
clean_text_my/text_dedup/utils/add_args.py |
sha256=dvecgcuZzRyTuCa8f0OS8N7begFAJQZ2XZ0xLhRsbCQ
|
7981 |
clean_text_my/text_dedup/utils/analysis.py |
sha256=MGZDr2tJ1yYVTXwD2flRZHI61E9ZCzn5rkBdAraCbyc
|
3143 |
clean_text_my/text_dedup/utils/hashfunc.py |
sha256=p2iz_mtvEsfexnT5EWBKUu1rX0eUWn4KPM0NCH1EOGs
|
5012 |
clean_text_my/text_dedup/utils/preprocess.py |
sha256=EPrcQ894ZB_TL6kuzZcxjKhhmx1fXY_cBwsdFnXi4ZM
|
809 |
clean_text_my/text_dedup/utils/timer.py |
sha256=N2Bh139jGNfCn-lDJtm3jHJ4TtABm9EuU68WdgjEK_A
|
1489 |
clean_text_my/text_dedup/utils/tokenization.py |
sha256=ZMuwB_NSk_gMyTOQAkkPm0Zxv-031oxZcN-q9zd85Y8
|
1112 |
clean_text_my/text_dedup/utils/union_find.py |
sha256=-iNlVsENozOJP3-lIWOlz_4u0gAEaJdnYGhczbtsStg
|
809 |
clean_text_my-0.1.1.dist-info/METADATA |
sha256=fxUYnFnACFIHTN1sXT2vtX9ticIpwkzC2JxSNpyznOI
|
1655 |
clean_text_my-0.1.1.dist-info/WHEEL |
sha256=iYlv5fX357PQyRT2o6tw1bN-YcKFFHKqB_LwHO5wP-g
|
110 |
clean_text_my-0.1.1.dist-info/top_level.txt |
sha256=coFM29PeLMPTcg-uoh29vCDpoEXY0Za_gJjfOL4nNsA
|
14 |
clean_text_my-0.1.1.dist-info/RECORD |
— |
— |