File size: 351 Bytes
456f698
246f918
 
456f698
246f918
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
from pycccedict.cccedict import CcCedict
import json
from pathlib import Path

# Single CcCedict instance (from pycccedict), built once at import time.
CC_DICT = CcCedict()

# ChID idiom reference file, located in the "data" directory one level above
# the directory that contains this module.
# Source: https://github.com/chujiezheng/ChID-Dataset
CHID_FILE = Path(__file__).parent.parent.joinpath("data/chid_idiom_reference.json")
with CHID_FILE.open(mode="r", encoding="utf-8") as f:
    chid_data = json.loads(f.read())

# Set built from the loaded JSON so membership tests are constant-time.
CHID_SET = set(chid_data)