From 3f2919e05c79eafe81f9412a0a0663a319fe6402 Mon Sep 17 00:00:00 2001 From: jacksonllee Date: Thu, 18 Mar 2021 07:12:00 -0500 Subject: [PATCH] MAINT update readme for acknowledgments --- README.rst | 1 + docs/index.html | 1 + docs/searchindex.js | 2 +- 3 files changed, 3 insertions(+), 1 deletion(-) diff --git a/README.rst b/README.rst index b600844..002df0e 100644 --- a/README.rst +++ b/README.rst @@ -170,6 +170,7 @@ Individuals who have contributed feedback, bug reports, etc. - @rylanchiu - Stephan Stiller - Tsz-Him Tsui +- Robin Yuen .. end-sphinx-website-index-page diff --git a/docs/index.html b/docs/index.html index 68e48a0..478a97b 100644 --- a/docs/index.html +++ b/docs/index.html @@ -417,6 +417,7 @@

Acknowledgments diff --git a/docs/searchindex.js b/docs/searchindex.js index 29879d5..aad664c 100644 --- a/docs/searchindex.js +++ b/docs/searchindex.js @@ -1 +1 @@ -Search.setIndex({docnames:["api","changelog","data","generated/pycantonese.characters_to_jyutping","generated/pycantonese.corpus.CantoneseCHATReader","generated/pycantonese.corpus.CantoneseCHATReader.search","generated/pycantonese.hkcancor","generated/pycantonese.jyutping_to_tipa","generated/pycantonese.jyutping_to_yale","generated/pycantonese.parse_jyutping","generated/pycantonese.pos_tag","generated/pycantonese.pos_tagging.hkcancor_to_ud","generated/pycantonese.read_chat","generated/pycantonese.segment","generated/pycantonese.stop_words","generated/pycantonese.word_segmentation.Segmenter","index","jyutping","papers","pos_tagging","reader","searches","stop_words","word_segmentation"],envversion:{"sphinx.domains.c":2,"sphinx.domains.changeset":1,"sphinx.domains.citation":1,"sphinx.domains.cpp":3,"sphinx.domains.index":1,"sphinx.domains.javascript":2,"sphinx.domains.math":2,"sphinx.domains.python":2,"sphinx.domains.rst":2,"sphinx.domains.std":1,"sphinx.ext.viewcode":1,sphinx:56},filenames:["api.rst","changelog.rst","data.rst","generated/pycantonese.characters_to_jyutping.rst","generated/pycantonese.corpus.CantoneseCHATReader.rst","generated/pycantonese.corpus.CantoneseCHATReader.search.rst","generated/pycantonese.hkcancor.rst","generated/pycantonese.jyutping_to_tipa.rst","generated/pycantonese.jyutping_to_yale.rst","generated/pycantonese.parse_jyutping.rst","generated/pycantonese.pos_tag.rst","generated/pycantonese.pos_tagging.hkcancor_to_ud.rst","generated/pycantonese.read_chat.rst","generated/pycantonese.segment.rst","generated/pycantonese.stop_words.rst","generated/pycantonese.word_segmentation.Segmenter.rst","index.rst","jyutping.rst","papers.rst","pos_tagging.rst","reader.rst","searches.rst","stop_words.rst","word_segmentation.rst"],objects:{"pycantonese.corpus":{CantoneseCHATReader:[20,1,1,""]},"pycantonese.corpus.CantoneseCHATReader":{IPSyn:[20,2,1,""],MLU:[20,2,1,""],MLUm:[20,2,1,""],MLUw:[20,2,1,""],TTR:[20,2,1,""],__init__:[4,2,1,""],abspath:[20,2,1,""],add:[20,2,1,""],age:[20,2,1,""],character_sents:[20,2,1,""],characters:[20,2,1,""],clear:[20,2,1,""],concordance:[20,2,1,""],date_of_birth:[20,2,1,""],dates_of_recording:[20,2,1,""],filenames:[20,2,1,""],from_chat_files:[20,2,1,""],from_chat_str:[20,2,1,""],headers:[20,2,1,""],index_to_tiers:[20,2,1,""],jyutping_sents:[20,2,1,""],jyutpings:[20,2,1,""],languages:[20,2,1,""],number_of_files:[20,2,1,""],number_of_utterances:[20,2,1,""],part_of_speech_tags:[20,2,1,""],participant_codes:[20,2,1,""],participants:[20,2,1,""],remove:[20,2,1,""],search:[20,2,1,""],sents:[20,2,1,""],tagged_sents:[20,2,1,""],tagged_words:[20,2,1,""],update:[20,2,1,""],utterances:[20,2,1,""],word_frequency:[20,2,1,""],word_ngrams:[20,2,1,""],words:[20,2,1,""]},"pycantonese.pos_tagging":{hkcancor_to_ud:[11,0,1,""]},"pycantonese.word_segmentation":{Segmenter:[15,1,1,""]},"pycantonese.word_segmentation.Segmenter":{__init__:[15,2,1,""]},pycantonese:{characters_to_jyutping:[3,0,1,""],hkcancor:[6,0,1,""],jyutping_to_tipa:[7,0,1,""],jyutping_to_yale:[8,0,1,""],parse_jyutping:[9,0,1,""],pos_tag:[10,0,1,""],read_chat:[12,0,1,""],segment:[13,0,1,""],stop_words:[14,0,1,""]}},objnames:{"0":["py","function","Python function"],"1":["py","class","Python class"],"2":["py","method","Python method"]},objtypes:{"0":"py:function","1":"py:class","2":"py:method"},terms:{"000":[2,19],"0dev":16,"100":[10,11,19,22],"104":[1,14,22],"105":[14,22],"107":22,"112":[],"12409":21,"149781":21,"150":[2,19],"1583":[],"1601":21,"184":21,"186888":21,"197":17,"1st":21,"2014":16,"2015":[2,16,18],"2016":[16,18],"2018":16,"2020":[16,17,23],"2021":16,"20579":21,"21830":21,"23768":[],"29012":[16,21],"29229":21,"2nd":[],"3rd":18,"679":21,"\u4e00\u5572":[14,22],"\u4e00\u5b9a":[14,22],"\u4e03":21,"\u4e0d\u5982":[14,22],"\u4e0d\u904e":[14,21,22],"\u4e5d\u9f8d":22,"\u4f4f":21,"\u4f60":21,"\u4fc2":[16,21],"\u505c\u7528\u8a5e":16,"\u505c\u7528\u8bcd":16,"\u516b\u6708":21,"\u5187\u5f97":[16,21],"\u5206\u8a5e":16,"\u5206\u8bcd":16,"\u53bb":[16,20,21],"\u53ef\u4ee5":21,"\u54aa":21,"\u5514":[13,20,23],"\u5514\u4fc2":21,"\u5514\u5bb9\u6613":[],"\u5514\u8a72":17,"\u554a":[20,21],"\u5572":20,"\u5582":20,"\u5587":21,"\u55f0":[10,19],"\u55f0\u500b":21,"\u55f0\u908a":21,"\u55f1":21,"\u565a\u65e5":[10,19],"\u56d6":21,"\u597d":[16,17,21],"\u5b78":[13,16,23],"\u5bb9":[13,23],"\u5bb9\u5514\u5bb9\u6613":[13,23],"\u5bb9\u6613":[13,23],"\u5c0d":[10,19],"\u5e7e":21,"\u5e7f\u4e1c\u8bdd":16,"\u5ee3\u6771":23,"\u5ee3\u6771\u8a71":[3,7,8,9,13,16,17,23],"\u5ee3\u6771\u8a71\u597d\u96e3\u5b78":16,"\u5ee3\u6771\u8a71\u5bb9\u5514\u5bb9\u6613\u5b78":[13,23],"\u6211":[10,19],"\u6211\u565a\u65e5\u8cb7\u55f0\u5c0d\u978b":19,"\u62b5":21,"\u65b0\u754c":22,"\u65c5\u884c":[16,20,21],"\u65e5":21,"\u6709\u5187":[16,21],"\u6709\u5f97":[16,21],"\u6a5f":21,"\u6a5f\u7968":21,"\u6c23\u5019":[8,17],"\u6de1\u5b63":21,"\u73a9":21,"\u76f4\u7a0b":21,"\u771f\u4fc2":21,"\u7793\u89ba":21,"\u789f":21,"\u789f\u5f62":21,"\u7ca4\u62fc":16,"\u7ca4\u8bed":16,"\u7cb5":16,"\u7cb5\u62fc":16,"\u7cb5\u8a9e":16,"\u7da0":21,"\u8072\u6bcd":21,"\u807d":21,"\u81ea\u7136\u8a9e\u8a00\u8655\u7406":16,"\u81ea\u7136\u8bed\u8a00\u5904\u7406":16,"\u86cb":17,"\u86cb\u7cd5":17,"\u8981":[16,21],"\u8a5e\u6027\u6a19\u6ce8":16,"\u8a71":[21,23],"\u8a9e\u8a00\u5b78":16,"\u8b1b":[3,16,17,21],"\u8b8a\u97f3":17,"\u8bcd\u6027\u6807\u6ce8":16,"\u8bed\u8a00\u5b66":16,"\u8cb7":[10,19],"\u8ddf":21,"\u8fea\u58eb\u5c3c":21,"\u904e":21,"\u9072":20,"\u90fd":21,"\u96c0":21,"\u96e3":16,"\u978b":[10,19],"\u97fb\u6bcd":21,"\u98db\u6a5f":21,"\u9999\u6e2f":[14,22],"\u9999\u6e2f\u4eba":[3,16,17],"\u9999\u6e2f\u4eba\u8b1b\u5ee3\u6771\u8a71":[3,16,17],"\u9999\u6e2f\u5cf6":22,"\ud844\udcc9":21,"\ud844\udcc9":[],"break":[],"case":[4,17,20,22],"char":3,"class":[4,13,15,20,23],"computational linguist":16,"d\u016bng":[8,17],"default":[1,2,4,5,8,10,12,13,19,20,21,22,23],"final":[1,5,20,21],"float":20,"function":[1,2,3,7,8,11,17,19,20,21,22,23],"g\u014di":17,"gw\u00f3ng":[8,17],"gw\u00f3ngd\u016bngw\u00e1":[8,17],"hg\u014di":[],"import":[2,13,16,17,19,20,21,22,23],"int":[5,15,20,21],"natural language process":16,"new":[1,3,7,8,10,11,13,14,15,17,19,20,22,23],"null":1,"part-of-speech tag":16,"return":[1,3,5,6,7,8,9,10,11,12,13,14,17,20,21,22,23],"stop word":16,"super":[7,17],"switch":[1,8],"true":[1,5,8,14,20,21,22],"while":[17,20,21],"word segment":16,Added:13,Eve:[],For:[2,5,11,20,21],Its:19,LFS:[],One:[5,20],POS:10,PoS:20,Such:[],The:[1,3,5,10,13,16,17,18,19,21,22,23],There:10,These:[],Used:1,Uses:2,With:[16,21],__init__:[4,15],__version__:16,aa3:[20,21],abil:17,abl:17,about:[19,22],abov:[1,16,20,21],absolut:20,abspath:20,accept:19,access:[1,16,21],accur:[],acquisit:[2,4,20],activ:[],adam:[],add:[14,17,20,22],added:[],adjust:21,adopt:[1,2],adp:[],adv:[10,19],after:[5,20],age:[16,18,20],ages:[],albino:16,algorithm:23,align:20,all:[1,2,5,16,20,21,22],all_verb:[16,21],allow:[1,10,13,15,21,23],allow_remot:[],alon:21,alphabet:16,alreadi:19,also:[17,19,21,22],altern:[],altogeth:20,alwai:21,ambigu:[8,17],american:[],among:17,analysi:21,analyt:[],ani:[3,11,17,20,21],annot:[1,2,11,16,19,20,21],anoth:[2,17,20],anywai:21,api:16,appear:[2,20],append:[],append_left:[],appli:10,applic:[4,11,20],approach:[13,19],appropri:[],arbitrari:[],aren:[],arg:[],argument:[1,4,10,12,13,17,19,22,23],aris:17,around:21,arrai:[20,21],artist:16,as_list:[1,8,17],ask:21,assum:[2,21],attempt:[],author:16,automat:[17,20,21],avail:[1,2],averag:[10,19],avoid:[20,21],awai:20,awar:2,baat3jyut6:21,back:1,background:[],ban:23,bare:2,base:[3,17,20,21],basenam:20,basic:[1,19],bat1gwo3:21,bear:21,becaus:[20,23],becom:[],been:[1,19,21],befor:[1,5,20],begin:[16,21],behav:[],behavior:[13,17],being:8,below:[],benefit:11,between:[8,17],big:[16,18],bilingu:[16,18],binari:[],birth:20,blah:[],bool:[5,8,20],both:1,bought:[10,19],boundari:[8,21,23],brown:[],bug:[1,16],build:1,built:16,by_fil:[5,20],by_utter:[],cake:17,call:[17,21],can:[2,11,17,20,21,22,23],cannot:[],cantones:[1,2,3,4,5,6,7,8,9,10,12,13,14,17,18,19,20,21,22,23],cantonesechatread:[6,12,20],cantons:[],cap:1,capabl:21,capit:[],cat1:21,cathug:16,centr:[16,18],certain:23,cha:[2,20],chang:[3,8,13,17,21],changelog:16,chao:17,charact:[1,3,5,7,8,9,10,13,16,20,23],character_s:20,characters2jyutp:[1,3],characters_to_jyutp:[1,16,17],charl:16,chat:[1,4,12,16,20],chat_str:20,chen:[16,18],chi:20,child:[2,20],childhood:[16,18],children:[],chim:16,chines:[2,5,16,17,18,20],choic:2,chosen:[],ci4:20,circleci:1,cite:2,classmethod:20,clean:20,clear:20,climat:[8,17],cls:[13,23],coda:[1,5,16,17,20,21],codas_ptk:21,code:[1,9,16,20],collaps:[],collect:[],colloc:21,com:16,combin:[19,20,21],come:[1,2,16,19,20],common:[17,21],commonli:17,compl:[10,11,19],complet:21,compon:17,comput:18,concord:20,concurr:23,conflict:21,confus:[17,20],consid:20,conson:[8,17],constrain:23,consult:2,contact:[2,16],contain:[5,13,17,20,21,23],context:20,contextu:17,contribut:16,control:23,conveni:20,convent:[1,23],convers:[1,3,16,21],convert:[1,3,7,8,10,17],corpora:2,corpu:[1,3,6,13,16,17,19,23],correct:17,correspond:[],could:2,counter:20,counterpart:1,cover:1,creat:[6,20,21],criteria:[5,16,20],criterion:1,cross:[11,19,21],current:[2,4,12,16,17,19,20,23],custom:[1,13,16],customiz:[1,15],daam6gwai3:21,daan2:17,daan6gou1:17,dai2:21,dai:20,data:[1,3,4,5,10,11,12,13,16,17,18,19,20,22,23],data_method:[],databas:2,dataset:[1,2,16,20],date:20,date_of_birth:20,dates_of_record:20,datetim:[],defin:[1,20],depend:[1,10,11,17,19,20,22,23],deprec:[3,7,8],describ:[10,11,19,21],design:[2,16],desir:20,detail:16,detect:17,determin:22,dev2:[],develop:18,di1:20,dict:[11,20],dictioari:11,dictionari:[11,17],differ:21,difficult:16,dik6si6nei4:21,dip2:21,dip2jing4:21,direct:1,directli:17,directori:2,disabl:[1,5,20],disallow:[1,13,15,23],disambigu:[8,17],discours:21,disk:20,dist:17,distinct:20,doc:1,docstr:1,document:[1,2,20],doe:13,domain:1,domin:[],don:[],done:[],dou1:21,download:[],drive:2,drop:1,due:[17,19],duplic:[],dut2:21,each:[1,3,10,21],earli:[],easi:[13,23],edu:[10,11,19],effect:20,egg:17,either:[20,22],element:[1,7,8,9,16],email:16,empti:20,enabl:[],encod:[1,2,4,12,20],encompass:[],end:[17,23],eng:[],english:[22,23],enough:17,entir:[11,23],equival:[1,3,5,7,8,17,20,21],error:[1,17],especi:19,etc:[16,20,21],european:[],eve01:20,eve02:20,eve:20,even:[],everyth:20,evolv:[],exactli:20,exampl:[3,5,7,8,9,10,11,13,14,17,20,21,22],exclud:[1,5,20],exist:23,expand:[],expect:19,explicitli:23,expos:[1,17,19],express:[16,21],extend:[],extend_left:[],extens:2,facebook:16,fact:[2,19],fals:[1,5,8,14,17,20,21],fan3gaau3:21,favor:1,featur:16,feedback:16,fei1gei1:21,fetch:[],few:20,file:[1,2,4,5,12,17,20],file_path:[],filenam:[2,4,12,20],filter:[20,22],find:16,first:21,five:[13,23],fix:[],flag:[],flavor:20,flexibl:21,folder:1,follow:[1,2,20,21,23],foobar:20,forc:[1,20],form:[1,5,20,23],format:[1,16,20],forth:20,found:[21,23],frequenc:20,from:[1,4,8,10,11,13,16,17,19,20,21,22,23],from_chat_fil:20,from_chat_str:20,from_dir:[],from_fil:[],from_str:[],from_zip:[],full:[16,21],func:[],further:[17,19],futur:17,gaa3:21,gan1:21,gei1:21,gei1piu3:21,gei2:21,gener:[1,21],get:[16,17,19],git:[],github:[1,16],given:[1,5,11,20,21],glob:[4,12,20],go2bin1:21,go2go3:21,goal:[],going:[],gong2:[3,16,17,21],good:17,gra:20,grab:21,gradual:[],gram:20,grammat:20,granular:11,grow:[],gwo3:21,gwong2dung1waa2:[3,7,8,9,16,17],hai6:[16,21],han:16,handl:[2,16,17],handout:18,has:[1,2,8,16,17,19,20,21,22,23],hasn:[],hauh:[8,17],have:[1,2,16,17,19,20],haven:[],header:20,hei3hau6:[8,17],hei6au6:[8,17],hei:[8,17],heihauh:[8,17],help:[],helper:19,heoi3:[16,20,21],here:[2,20,21,23],hesit:[],high:[17,21],hill:16,him:[16,18],hkcancor:[1,2,3,10,11,13,16,17,19,20,21,23],hkcancor_to_ud:[1,10,19],ho2ji5:21,hoeng1gong2jan4:[3,16,17],hong:[1,2,6,16,18,22],hongkong:[3,16,17],host:[],hou2:[17,21],hou7:17,how:21,howev:[21,23],hss:[10,11,19],html:[5,10,11,19,20],http:[1,5,10,11,16,19,20],ident:20,identifi:[],ids:[],ignor:[5,20,21],iii:[],illeg:[7,8,9],illustr:20,implement:[1,16,23],impos:21,improv:1,includ:[1,5,13,16,17,20,21,22,23],inconveni:17,incorpor:[2,16],index:[10,11,19,20],index_to_ti:20,indic:[],individu:[1,3,5,16,17,20],inflect:20,info:20,inform:20,inherit:[4,20],initi:[1,4,5,15,20,21],innov:18,input:[1,10,11,13,19],instagram:16,instal:[],instanc:[20,21,23],instanti:[],instead:[1,17,20,21],integ:23,intellig:17,intention:[],interest:[17,20,21],intern:[1,10],internet:[],interpret:16,introduc:[16,18],inv:[],invalid:17,investig:19,involv:17,ipsyn:20,island:22,issu:[1,16],issubset:22,iter:[4,5,12,14,15,20,22,23],its:[1,8,10,16,17,20,21],jackson:[2,16,18],jacksonlle:16,jat6:21,jau5dak1:[16,21],jau5mou5:[16,21],jenni:16,jiu3:[16,21],journal:2,jp_str:[7,8,9],json:23,just:[5,20,21],jyutp:[1,3,5,7,8,9,16,20],jyutping2tipa:[1,7],jyutping2yal:[1,8],jyutping_s:20,jyutping_to_tipa:[1,17],jyutping_to_x:[1,8],jyutping_to_yal:[1,17],jyytp:[],kang:2,keep_cas:20,kept:20,keyword:[1,4,12,13,17,19,20,23],kind:21,known:[16,20],kong:[1,2,6,16,18,22],kowloon:22,koy55:17,kwarg:[4,12,20,23],kwong:2,laa1:21,laa4:21,lai:16,lam:16,languag:[2,4,11,16,17,19,20,22,23],last:[16,17],latex:[7,17],learn:[13,16,23],leav:[],lee:[2,16,18],left:[5,20,21],lemma:20,len:[14,16,21,22],length:[1,13,15,20,23],leoi5hang4:[16,20,21],less:11,let:20,letter:[17,21],level:[17,20,21],lib:17,librari:[2,13,16,17,20,23],licens:[1,2,17,19,23],like:[2,19,20,22,23],likewis:21,limit:19,line:[1,8,17,20],linguist:[2,11,18,19,21],link:1,list:[1,3,5,7,8,9,10,13,17,20,21],liter:[],litong:[16,18],lo1:21,load:23,local:[2,17],logo:[],longer:13,longest:[13,23],look:[],low:[8,17],lowercas:20,luk2:21,luke:2,m4goi1:17,m4hai6:21,machin:21,made:20,mai6:21,mai:[2,4,17,20,21,22],maintain:[],maintein:16,major:19,make:2,mani:[20,22,23],map:[1,11,19,20],march:18,mark:[3,17],marker:[8,17],master:[],match:[2,4,5,12,13,20,21,23],match_entire_word:20,matter:[3,17],max_word_length:[15,23],maxim:13,maximum:[1,13,15,23],mean:[16,19,20],media:16,memori:20,metadata:[],metadata_method:[],methdo:[],method:[1,4,15,16,21],might:[17,19],minim:[],minimum:2,mit:16,mix:21,mlu:20,mlum:20,mluw:20,model:[1,3,10,13,15,17,19,23],modifi:16,modul:17,month:20,mor:20,more:[1,5,16,19,20,21,23],morphem:20,most:[16,17,20],mot:20,mother:20,motiv:2,mou5dak1:[16,21],much:[],multipl:[7,8,9,16,17,20],n_file:[],name:[1,2,16],nasal:[1,17],natur:[11,16,19,22,23],necessari:[2,17,20,22,23],necessit:17,need:17,nei5:21,neighbor:21,neither:21,ngram:[],nlp:[],nltk:[1,20],non:[],none:[3,5,11,13,14,15,17,20],nor:21,note:[16,18,21],notic:[],noun:[10,19],novemb:[],now:[1,3],ntu:[10,11,19],nuclei:17,nucleu:[1,5,9,16,17,20,21],number:[16,17,20,21],number_of_charact:1,number_of_fil:20,number_of_utter:20,number_of_word:1,numer:17,numpydoc:1,object:[1,6,12,13,15,20,21,23],occurr:19,odd:19,off:19,offer:17,often:[22,23],ohio:18,on25:[7,17],onc:[],one:[1,2,5,7,8,9,10,20],ones:22,onli:[1,4,5,12,19,20,21],onset:[1,5,8,9,16,17,20,21],onward:1,open:[1,2],option:[2,5,8,10,11,13,14,15,20,22],orb:1,order:[16,21],org:[1,5,10,11,19,20],organ:[5,20],origin:[1,10,11,16,19,20],orthograph:[],other:[1,2,8,17,21],otherwis:[5,20,21],our:[],output:[3,5,8,16,17,20],over:[10,11,19],overal:1,overridden:2,owner:2,packag:[1,17],pad:20,page:[],pair:[10,19,20],paramet:[1,2,3,4,5,7,8,9,10,11,12,13,14,15,20,21],parent:[4,20],pars:[1,2,9,16,21],parse_jyutp:[1,16,17],part:[1,5,8,10,11,16,17,20],part_of_speech_tag:20,particip:[1,5,20],participant_cod:20,particularli:17,pass:[4,12,21,23],path:[1,2,4,5,12,20],pattern:[2,20],per:[],perceptron:[10,19],perform:[20,21],perhap:19,permiss:19,phonolog:[5,17,20],phrase:[1,10,19],pick:1,piggyback:1,pin:1,pinjam:[17,21],pip:16,pleas:[2,5,16,17,19,20],plu:[1,5,20,21],point:1,pop:[],pop_left:[],pos:[5,10,11,16,19,20,21],pos_tag:[1,19],possibl:[1,21],post:[],potenti:[17,19,23],power:21,pprint:[16,21],pre:[],preced:21,predict:10,prefix:[],preprocess:[],pretti:21,preval:[5,20],previou:[8,17],previous:[1,3],print:[16,21],process:[11,16,17,19,22,23],product:20,programmat:20,pron:[10,19],pronoun:22,pronunci:17,proper:[],prove:17,provid:[11,13,17,19,20,21,22,23],ptk:21,ptk_tone2:21,punct:[10,19],punctuat:[3,17],purpos:[1,2,11,21],pycantones:[1,2,17,18,19,20,21,22,23],pylangacq:[1,2,4,20],pypi:1,python3:17,python:[1,2,21],qualiti:[1,19],queri:16,question:[],quot:[8,17],rachel:16,rais:[1,5,7,8,9,10,17,20],random:[],rang:[1,5,16,20],rather:1,ratio:20,read:[1,12,17],read_chat:[2,20],reader:[1,4,12,16],readm:[2,16],readthedoc:1,recent:[16,17],recogn:20,record:20,recurs:[],refer:[16,20],reflect:[],regex:[5,20],regular:[16,21],rel:[19,20,21],relat:[20,21],releas:[2,16,17,23],relev:17,remark:20,remot:[],remov:[14,20,22],render:20,replac:[1,3,7,8],report:16,repositori:[],repr:17,repres:[3,17,21],represent:16,request:16,requir:[1,16],research:[2,16,20,21],reset:20,resourc:17,respect:21,restrict:21,restructur:1,result:[1,16,19,20,23],revis:1,rich:2,richielo:16,right:[5,20,21],rime:[1,3,13,16,17,23],rime_cantones:16,rise:[17,21],roman:[1,3,5,7,8,9,16,20,21],rst:1,run:[],ryan:16,rylanchiu:16,safe:20,same:[21,23],sarah:[],satisfi:[],scheme:17,search:[1,16,20],search_item:20,second:21,section:[],secur:[],see:[2,5,10,16,17,20,21],seem:17,segment:[1,3,5,10,16,17,19,20],select:[],self:[],semant:21,sens:[],sent:[5,20,21],sent_rang:[5,20,21],sent_str:[],sentenc:[1,5,10,13,16,19,20],separ:17,septemb:[16,18],set:[13,14,17,20,21,22],shoe:[10,19],should:2,show:[16,21],shown:20,signatur:[],similar:20,similarli:22,simpl:[20,23],simpli:[],sinc:19,singl:[2,8,20,21],situat:23,size:19,slide:[16,18],small:19,smaller:[],snippet:1,snowman:16,social:16,soek2:21,some:[4,20],sophist:19,sort:20,sorted_by_ag:20,sourc:[1,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,20],space:[20,23],span:[5,20,21],speak:[3,16,17,21],specif:[1,19,21],specifi:[2,20,21,23],speech:[1,5,10,11,16,20],split:20,stabl:16,standalon:17,standard:[2,19],start:20,state:18,statist:19,stdin:17,step:[],stephan:16,still:[17,19,23],stiller:16,stop:[1,14,16],stop_wds1:[],stop_wds2:[],stop_word:22,stop_words_1:[14,22],stop_words_2:[14,22],store:[],str:[3,4,5,7,8,9,10,11,12,13,14,15,20,21],string:[1,3,5,8,10,13,16,20,21,22,23],strip:1,structur:20,studi:[],style:1,subclass:[],subject:[],substanti:16,substr:20,suffici:[],suffix:17,suggest:[],suit:1,suppli:1,support:[1,4,5,10,12,20],syllab:[1,17],syllabl:[8,17],syntax:[20,21],system:17,tag:[1,5,10,11,16,20],tagged_s:20,tagged_word:20,tagger:[10,19],tagset:[1,10,11,19,21],take:[1,17,19,20,21,22,23],talk:[16,18],talkbank:[],target:20,task:[11,17,21,22,23],teach:17,teng1:21,term:[5,16,20],territori:22,test:[1,16],tester:[],text:1,than:[1,5,13,19,20,21,23],thank:17,thei:1,them:[],theme:1,thi:[1,2,3,7,8,10,11,13,15,16,17,20,21,23],think:[19,23],those:17,though:23,through:2,thrown:19,tier:20,time:21,tip:[],tipa:[1,7,16],todai:17,togeth:20,token:[5,17,20,21],tone2:21,tone:[5,8,9,16,17,20,21],tool:[16,17,18],top:20,total:21,touch:19,traceback:17,tracker:16,tradit:[5,20],train:[10,13,17,19,23],transcript:[16,20],transpar:1,travel:16,treat:[17,20,22,23],trivial:17,tsui:[16,18],tsz:[16,18],ttr:20,tun55:[7,17],tupl:[1,3,5,9,10,17,20,21],turn:[1,17],twitter:16,two:[17,20],txt:16,type:20,typeerror:10,typic:20,unclear:8,under:2,underli:[1,23],underlyingli:2,unicod:[],union:[],univers:[1,10,11,16,18,19],universaldepend:[10,11,19],unless:[],unrecogn:[7,8,9,11],unreleas:16,unseen:[3,17],unseg:[1,10,13,19,23],unspecifi:[5,20],unstabl:[],unzip:[],upcom:[],updat:20,upgrad:16,uppercas:20,url:[],use:[2,4,17,20,21,22],used:[2,5,10,13,17,20,21,23],useful:21,usefulness:17,user:[1,17],uses:[2,10,11,19],using:21,usr:17,utf8:[2,4,12,20],utf:[1,2],utter:[20,21],uuid:[],valid:17,valu:[1,3,8,17,21],valueerror:[5,7,8,9,10,17,20],varieti:21,variou:[1,17,21],verb:[10,11,16,19,21],version:[1,3,7,8,10,11,13,14,15,16,17,19,20,22,23],versu:[],via:2,wa25:[7,17],waa6:21,waan2:21,wai3:20,wai:23,welcom:[],well:2,what:20,whatev:20,when:[1,17,20,21],where:[1,3,10,23],whether:[17,20,23],which:[2,4,8,10,11,17,19,20,21,22],whitespac:1,who:16,whose:16,wide:[2,21],wildcard:20,window:1,within:[5,20,21],without:20,wong:2,word:[1,2,3,5,10,13,14,15,16,17,19],word_frequ:20,word_ngram:20,word_rang:[5,20,21],word_segment:[13,23],wordlist:1,wordseg:1,work:[19,21,23],workshop:18,worth:19,would:[2,8,11,17,19,20,23],wouldn:19,wrap:[],written:23,x2y:1,x_to_i:1,xxa:20,xxb:20,xxx:[],yale:[1,8,16],year:20,yesterdai:[10,19],yet:20,you:[2,17,19,20,22,23],your:[2,4,16,19,20,22],zan1hai6:21,zero:20,zik6cing4:21,zip:[],zoek2:21,zyu6:21},titles:["API Reference","Changelog","Corpus Data","pycantonese.characters_to_jyutping","pycantonese.corpus.CantoneseCHATReader","pycantonese.corpus.CantoneseCHATReader.search","pycantonese.hkcancor","pycantonese.jyutping_to_tipa","pycantonese.jyutping_to_yale","pycantonese.parse_jyutping","pycantonese.pos_tag","pycantonese.pos_tagging.hkcancor_to_ud","pycantonese.read_chat","pycantonese.segment","pycantonese.stop_words","pycantonese.word_segmentation.Segmenter","PyCantonese: Cantonese Linguistics and NLP in Python","Jyutping Romanization","Research Outputs","Part-of-Speech Tagging","Corpus Reader Methods","Corpus Search Queries","Stop Words","Word Segmentation"],titleterms:{"0dev":1,"2014":1,"2015":1,"2016":1,"2018":1,"2020":1,"2021":1,"break":1,Added:1,The:[2,20],access:[2,20],acknowledg:16,api:[0,1,20],built:2,cantones:16,cantonesechatread:[4,5],chang:1,changelog:1,charact:[17,21],characters2jyutp:[],characters_to_jyutp:3,chat:2,chines:21,cite:16,content:16,convers:17,corpu:[0,2,4,5,20,21],criteria:21,custom:[2,23],data:[0,2],deprec:1,develop:[],download:16,element:21,etc:[],exampl:16,fix:1,format:[2,21],full:20,handl:[],hkcancor:6,hkcancor_to_ud:11,how:16,instal:16,introduct:[],jyutp:[0,17,21],jyutping2tipa:[],jyutping2yal:[],jyutping_to_tipa:7,jyutping_to_yal:8,languag:0,librari:[],licens:16,linguist:16,link:16,logo:16,metadata:[],method:20,multipl:21,natur:0,nlp:16,non:1,note:20,output:[18,21],pars:17,parse_jyutp:9,part:[19,21],perform:[],pos_tag:[10,11],process:0,pycantones:[3,4,5,6,7,8,9,10,11,12,13,14,15,16],python:16,queri:21,quick:16,rang:21,read:[],read_chat:12,reader:20,refer:0,remov:1,represent:20,research:18,result:21,roman:[0,17],search:[5,21],secur:1,segment:[13,15,23],sentenc:21,speech:[19,21],stop:22,stop_word:14,string:17,support:[],tabl:16,tag:[19,21],task:[],technic:[],tipa:17,transcript:2,unreleas:1,word:[20,21,22,23],word_segment:15,yale:17}}) \ No newline at end of file +Search.setIndex({docnames:["api","changelog","data","generated/pycantonese.characters_to_jyutping","generated/pycantonese.corpus.CantoneseCHATReader","generated/pycantonese.corpus.CantoneseCHATReader.search","generated/pycantonese.hkcancor","generated/pycantonese.jyutping_to_tipa","generated/pycantonese.jyutping_to_yale","generated/pycantonese.parse_jyutping","generated/pycantonese.pos_tag","generated/pycantonese.pos_tagging.hkcancor_to_ud","generated/pycantonese.read_chat","generated/pycantonese.segment","generated/pycantonese.stop_words","generated/pycantonese.word_segmentation.Segmenter","index","jyutping","papers","pos_tagging","reader","searches","stop_words","word_segmentation"],envversion:{"sphinx.domains.c":2,"sphinx.domains.changeset":1,"sphinx.domains.citation":1,"sphinx.domains.cpp":3,"sphinx.domains.index":1,"sphinx.domains.javascript":2,"sphinx.domains.math":2,"sphinx.domains.python":2,"sphinx.domains.rst":2,"sphinx.domains.std":1,"sphinx.ext.viewcode":1,sphinx:56},filenames:["api.rst","changelog.rst","data.rst","generated/pycantonese.characters_to_jyutping.rst","generated/pycantonese.corpus.CantoneseCHATReader.rst","generated/pycantonese.corpus.CantoneseCHATReader.search.rst","generated/pycantonese.hkcancor.rst","generated/pycantonese.jyutping_to_tipa.rst","generated/pycantonese.jyutping_to_yale.rst","generated/pycantonese.parse_jyutping.rst","generated/pycantonese.pos_tag.rst","generated/pycantonese.pos_tagging.hkcancor_to_ud.rst","generated/pycantonese.read_chat.rst","generated/pycantonese.segment.rst","generated/pycantonese.stop_words.rst","generated/pycantonese.word_segmentation.Segmenter.rst","index.rst","jyutping.rst","papers.rst","pos_tagging.rst","reader.rst","searches.rst","stop_words.rst","word_segmentation.rst"],objects:{"pycantonese.corpus":{CantoneseCHATReader:[20,1,1,""]},"pycantonese.corpus.CantoneseCHATReader":{IPSyn:[20,2,1,""],MLU:[20,2,1,""],MLUm:[20,2,1,""],MLUw:[20,2,1,""],TTR:[20,2,1,""],__init__:[4,2,1,""],abspath:[20,2,1,""],add:[20,2,1,""],age:[20,2,1,""],character_sents:[20,2,1,""],characters:[20,2,1,""],clear:[20,2,1,""],concordance:[20,2,1,""],date_of_birth:[20,2,1,""],dates_of_recording:[20,2,1,""],filenames:[20,2,1,""],from_chat_files:[20,2,1,""],from_chat_str:[20,2,1,""],headers:[20,2,1,""],index_to_tiers:[20,2,1,""],jyutping_sents:[20,2,1,""],jyutpings:[20,2,1,""],languages:[20,2,1,""],number_of_files:[20,2,1,""],number_of_utterances:[20,2,1,""],part_of_speech_tags:[20,2,1,""],participant_codes:[20,2,1,""],participants:[20,2,1,""],remove:[20,2,1,""],search:[20,2,1,""],sents:[20,2,1,""],tagged_sents:[20,2,1,""],tagged_words:[20,2,1,""],update:[20,2,1,""],utterances:[20,2,1,""],word_frequency:[20,2,1,""],word_ngrams:[20,2,1,""],words:[20,2,1,""]},"pycantonese.pos_tagging":{hkcancor_to_ud:[11,0,1,""]},"pycantonese.word_segmentation":{Segmenter:[15,1,1,""]},"pycantonese.word_segmentation.Segmenter":{__init__:[15,2,1,""]},pycantonese:{characters_to_jyutping:[3,0,1,""],hkcancor:[6,0,1,""],jyutping_to_tipa:[7,0,1,""],jyutping_to_yale:[8,0,1,""],parse_jyutping:[9,0,1,""],pos_tag:[10,0,1,""],read_chat:[12,0,1,""],segment:[13,0,1,""],stop_words:[14,0,1,""]}},objnames:{"0":["py","function","Python function"],"1":["py","class","Python class"],"2":["py","method","Python method"]},objtypes:{"0":"py:function","1":"py:class","2":"py:method"},terms:{"000":[2,19],"0dev":16,"100":[10,11,19,22],"104":[1,14,22],"105":[14,22],"107":22,"112":[],"12409":21,"149781":21,"150":[2,19],"1583":[],"1601":21,"184":21,"186888":21,"197":17,"1st":21,"2014":16,"2015":[2,16,18],"2016":[16,18],"2018":16,"2020":[16,17,23],"2021":16,"20579":21,"21830":21,"23768":[],"29012":[16,21],"29229":21,"2nd":[],"3rd":18,"679":21,"\u4e00\u5572":[14,22],"\u4e00\u5b9a":[14,22],"\u4e03":21,"\u4e0d\u5982":[14,22],"\u4e0d\u904e":[14,21,22],"\u4e5d\u9f8d":22,"\u4f4f":21,"\u4f60":21,"\u4fc2":[16,21],"\u505c\u7528\u8a5e":16,"\u505c\u7528\u8bcd":16,"\u516b\u6708":21,"\u5187\u5f97":[16,21],"\u5206\u8a5e":16,"\u5206\u8bcd":16,"\u53bb":[16,20,21],"\u53ef\u4ee5":21,"\u54aa":21,"\u5514":[13,20,23],"\u5514\u4fc2":21,"\u5514\u5bb9\u6613":[],"\u5514\u8a72":17,"\u554a":[20,21],"\u5572":20,"\u5582":20,"\u5587":21,"\u55f0":[10,19],"\u55f0\u500b":21,"\u55f0\u908a":21,"\u55f1":21,"\u565a\u65e5":[10,19],"\u56d6":21,"\u597d":[16,17,21],"\u5b78":[13,16,23],"\u5bb9":[13,23],"\u5bb9\u5514\u5bb9\u6613":[13,23],"\u5bb9\u6613":[13,23],"\u5c0d":[10,19],"\u5e7e":21,"\u5e7f\u4e1c\u8bdd":16,"\u5ee3\u6771":23,"\u5ee3\u6771\u8a71":[3,7,8,9,13,16,17,23],"\u5ee3\u6771\u8a71\u597d\u96e3\u5b78":16,"\u5ee3\u6771\u8a71\u5bb9\u5514\u5bb9\u6613\u5b78":[13,23],"\u6211":[10,19],"\u6211\u565a\u65e5\u8cb7\u55f0\u5c0d\u978b":19,"\u62b5":21,"\u65b0\u754c":22,"\u65c5\u884c":[16,20,21],"\u65e5":21,"\u6709\u5187":[16,21],"\u6709\u5f97":[16,21],"\u6a5f":21,"\u6a5f\u7968":21,"\u6c23\u5019":[8,17],"\u6de1\u5b63":21,"\u73a9":21,"\u76f4\u7a0b":21,"\u771f\u4fc2":21,"\u7793\u89ba":21,"\u789f":21,"\u789f\u5f62":21,"\u7ca4\u62fc":16,"\u7ca4\u8bed":16,"\u7cb5":16,"\u7cb5\u62fc":16,"\u7cb5\u8a9e":16,"\u7da0":21,"\u8072\u6bcd":21,"\u807d":21,"\u81ea\u7136\u8a9e\u8a00\u8655\u7406":16,"\u81ea\u7136\u8bed\u8a00\u5904\u7406":16,"\u86cb":17,"\u86cb\u7cd5":17,"\u8981":[16,21],"\u8a5e\u6027\u6a19\u6ce8":16,"\u8a71":[21,23],"\u8a9e\u8a00\u5b78":16,"\u8b1b":[3,16,17,21],"\u8b8a\u97f3":17,"\u8bcd\u6027\u6807\u6ce8":16,"\u8bed\u8a00\u5b66":16,"\u8cb7":[10,19],"\u8ddf":21,"\u8fea\u58eb\u5c3c":21,"\u904e":21,"\u9072":20,"\u90fd":21,"\u96c0":21,"\u96e3":16,"\u978b":[10,19],"\u97fb\u6bcd":21,"\u98db\u6a5f":21,"\u9999\u6e2f":[14,22],"\u9999\u6e2f\u4eba":[3,16,17],"\u9999\u6e2f\u4eba\u8b1b\u5ee3\u6771\u8a71":[3,16,17],"\u9999\u6e2f\u5cf6":22,"\ud844\udcc9":21,"\ud844\udcc9":[],"break":[],"case":[4,17,20,22],"char":3,"class":[4,13,15,20,23],"computational linguist":16,"d\u016bng":[8,17],"default":[1,2,4,5,8,10,12,13,19,20,21,22,23],"final":[1,5,20,21],"float":20,"function":[1,2,3,7,8,11,17,19,20,21,22,23],"g\u014di":17,"gw\u00f3ng":[8,17],"gw\u00f3ngd\u016bngw\u00e1":[8,17],"hg\u014di":[],"import":[2,13,16,17,19,20,21,22,23],"int":[5,15,20,21],"natural language process":16,"new":[1,3,7,8,10,11,13,14,15,17,19,20,22,23],"null":1,"part-of-speech tag":16,"return":[1,3,5,6,7,8,9,10,11,12,13,14,17,20,21,22,23],"stop word":16,"super":[7,17],"switch":[1,8],"true":[1,5,8,14,20,21,22],"while":[17,20,21],"word segment":16,Added:13,Eve:[],For:[2,5,11,20,21],Its:19,LFS:[],One:[5,20],POS:10,PoS:20,Such:[],The:[1,3,5,10,13,16,17,18,19,21,22,23],There:10,These:[],Used:1,Uses:2,With:[16,21],__init__:[4,15],__version__:16,aa3:[20,21],abil:17,abl:17,about:[19,22],abov:[1,16,20,21],absolut:20,abspath:20,accept:19,access:[1,16,21],accur:[],acquisit:[2,4,20],activ:[],adam:[],add:[14,17,20,22],added:[],adjust:21,adopt:[1,2],adp:[],adv:[10,19],after:[5,20],age:[16,18,20],ages:[],albino:16,algorithm:23,align:20,all:[1,2,5,16,20,21,22],all_verb:[16,21],allow:[1,10,13,15,21,23],allow_remot:[],alon:21,alphabet:16,alreadi:19,also:[17,19,21,22],altern:[],altogeth:20,alwai:21,ambigu:[8,17],american:[],among:17,analysi:21,analyt:[],ani:[3,11,17,20,21],annot:[1,2,11,16,19,20,21],anoth:[2,17,20],anywai:21,api:16,appear:[2,20],append:[],append_left:[],appli:10,applic:[4,11,20],approach:[13,19],appropri:[],arbitrari:[],aren:[],arg:[],argument:[1,4,10,12,13,17,19,22,23],aris:17,around:21,arrai:[20,21],artist:16,as_list:[1,8,17],ask:21,assum:[2,21],attempt:[],author:16,automat:[17,20,21],avail:[1,2],averag:[10,19],avoid:[20,21],awai:20,awar:2,baat3jyut6:21,back:1,background:[],ban:23,bare:2,base:[3,17,20,21],basenam:20,basic:[1,19],bat1gwo3:21,bear:21,becaus:[20,23],becom:[],been:[1,19,21],befor:[1,5,20],begin:[16,21],behav:[],behavior:[13,17],being:8,below:[],benefit:11,between:[8,17],big:[16,18],bilingu:[16,18],binari:[],birth:20,blah:[],bool:[5,8,20],both:1,bought:[10,19],boundari:[8,21,23],brown:[],bug:[1,16],build:1,built:16,by_fil:[5,20],by_utter:[],cake:17,call:[17,21],can:[2,11,17,20,21,22,23],cannot:[],cantones:[1,2,3,4,5,6,7,8,9,10,12,13,14,17,18,19,20,21,22,23],cantonesechatread:[6,12,20],cantons:[],cap:1,capabl:21,capit:[],cat1:21,cathug:16,centr:[16,18],certain:23,cha:[2,20],chang:[3,8,13,17,21],changelog:16,chao:17,charact:[1,3,5,7,8,9,10,13,16,20,23],character_s:20,characters2jyutp:[1,3],characters_to_jyutp:[1,16,17],charl:16,chat:[1,4,12,16,20],chat_str:20,chen:[16,18],chi:20,child:[2,20],childhood:[16,18],children:[],chim:16,chines:[2,5,16,17,18,20],choic:2,chosen:[],ci4:20,circleci:1,cite:2,classmethod:20,clean:20,clear:20,climat:[8,17],cls:[13,23],coda:[1,5,16,17,20,21],codas_ptk:21,code:[1,9,16,20],collaps:[],collect:[],colloc:21,com:16,combin:[19,20,21],come:[1,2,16,19,20],common:[17,21],commonli:17,compl:[10,11,19],complet:21,compon:17,comput:18,concord:20,concurr:23,conflict:21,confus:[17,20],consid:20,conson:[8,17],constrain:23,consult:2,contact:[2,16],contain:[5,13,17,20,21,23],context:20,contextu:17,contribut:16,control:23,conveni:20,convent:[1,23],convers:[1,3,16,21],convert:[1,3,7,8,10,17],corpora:2,corpu:[1,3,6,13,16,17,19,23],correct:17,correspond:[],could:2,counter:20,counterpart:1,cover:1,creat:[6,20,21],criteria:[5,16,20],criterion:1,cross:[11,19,21],current:[2,4,12,16,17,19,20,23],custom:[1,13,16],customiz:[1,15],daam6gwai3:21,daan2:17,daan6gou1:17,dai2:21,dai:20,data:[1,3,4,5,10,11,12,13,16,17,18,19,20,22,23],data_method:[],databas:2,dataset:[1,2,16,20],date:20,date_of_birth:20,dates_of_record:20,datetim:[],defin:[1,20],depend:[1,10,11,17,19,20,22,23],deprec:[3,7,8],describ:[10,11,19,21],design:[2,16],desir:20,detail:16,detect:17,determin:22,dev2:[],develop:18,di1:20,dict:[11,20],dictioari:11,dictionari:[11,17],differ:21,difficult:16,dik6si6nei4:21,dip2:21,dip2jing4:21,direct:1,directli:17,directori:2,disabl:[1,5,20],disallow:[1,13,15,23],disambigu:[8,17],discours:21,disk:20,dist:17,distinct:20,doc:1,docstr:1,document:[1,2,20],doe:13,domain:1,domin:[],don:[],done:[],dou1:21,download:[],drive:2,drop:1,due:[17,19],duplic:[],dut2:21,each:[1,3,10,21],earli:[],easi:[13,23],edu:[10,11,19],effect:20,egg:17,either:[20,22],element:[1,7,8,9,16],email:16,empti:20,enabl:[],encod:[1,2,4,12,20],encompass:[],end:[17,23],eng:[],english:[22,23],enough:17,entir:[11,23],equival:[1,3,5,7,8,17,20,21],error:[1,17],especi:19,etc:[16,20,21],european:[],eve01:20,eve02:20,eve:20,even:[],everyth:20,evolv:[],exactli:20,exampl:[3,5,7,8,9,10,11,13,14,17,20,21,22],exclud:[1,5,20],exist:23,expand:[],expect:19,explicitli:23,expos:[1,17,19],express:[16,21],extend:[],extend_left:[],extens:2,facebook:16,fact:[2,19],fals:[1,5,8,14,17,20,21],fan3gaau3:21,favor:1,featur:16,feedback:16,fei1gei1:21,fetch:[],few:20,file:[1,2,4,5,12,17,20],file_path:[],filenam:[2,4,12,20],filter:[20,22],find:16,first:21,five:[13,23],fix:[],flag:[],flavor:20,flexibl:21,folder:1,follow:[1,2,20,21,23],foobar:20,forc:[1,20],form:[1,5,20,23],format:[1,16,20],forth:20,found:[21,23],frequenc:20,from:[1,4,8,10,11,13,16,17,19,20,21,22,23],from_chat_fil:20,from_chat_str:20,from_dir:[],from_fil:[],from_str:[],from_zip:[],full:[16,21],func:[],further:[17,19],futur:17,gaa3:21,gan1:21,gei1:21,gei1piu3:21,gei2:21,gener:[1,21],get:[16,17,19],git:[],github:[1,16],given:[1,5,11,20,21],glob:[4,12,20],go2bin1:21,go2go3:21,goal:[],going:[],gong2:[3,16,17,21],good:17,gra:20,grab:21,gradual:[],gram:20,grammat:20,granular:11,grow:[],gwo3:21,gwong2dung1waa2:[3,7,8,9,16,17],hai6:[16,21],han:16,handl:[2,16,17],handout:18,has:[1,2,8,16,17,19,20,21,22,23],hasn:[],hauh:[8,17],have:[1,2,16,17,19,20],haven:[],header:20,hei3hau6:[8,17],hei6au6:[8,17],hei:[8,17],heihauh:[8,17],help:[],helper:19,heoi3:[16,20,21],here:[2,20,21,23],hesit:[],high:[17,21],hill:16,him:[16,18],hkcancor:[1,2,3,10,11,13,16,17,19,20,21,23],hkcancor_to_ud:[1,10,19],ho2ji5:21,hoeng1gong2jan4:[3,16,17],hong:[1,2,6,16,18,22],hongkong:[3,16,17],host:[],hou2:[17,21],hou7:17,how:21,howev:[21,23],hss:[10,11,19],html:[5,10,11,19,20],http:[1,5,10,11,16,19,20],ident:20,identifi:[],ids:[],ignor:[5,20,21],iii:[],illeg:[7,8,9],illustr:20,implement:[1,16,23],impos:21,improv:1,includ:[1,5,13,16,17,20,21,22,23],inconveni:17,incorpor:[2,16],index:[10,11,19,20],index_to_ti:20,indic:[],individu:[1,3,5,16,17,20],inflect:20,info:20,inform:20,inherit:[4,20],initi:[1,4,5,15,20,21],innov:18,input:[1,10,11,13,19],instagram:16,instal:[],instanc:[20,21,23],instanti:[],instead:[1,17,20,21],integ:23,intellig:17,intention:[],interest:[17,20,21],intern:[1,10],internet:[],interpret:16,introduc:[16,18],inv:[],invalid:17,investig:19,involv:17,ipsyn:20,island:22,issu:[1,16],issubset:22,iter:[4,5,12,14,15,20,22,23],its:[1,8,10,16,17,20,21],jackson:[2,16,18],jacksonlle:16,jat6:21,jau5dak1:[16,21],jau5mou5:[16,21],jenni:16,jiu3:[16,21],journal:2,jp_str:[7,8,9],json:23,just:[5,20,21],jyutp:[1,3,5,7,8,9,16,20],jyutping2tipa:[1,7],jyutping2yal:[1,8],jyutping_s:20,jyutping_to_tipa:[1,17],jyutping_to_x:[1,8],jyutping_to_yal:[1,17],jyytp:[],kang:2,keep_cas:20,kept:20,keyword:[1,4,12,13,17,19,20,23],kind:21,known:[16,20],kong:[1,2,6,16,18,22],kowloon:22,koy55:17,kwarg:[4,12,20,23],kwong:2,laa1:21,laa4:21,lai:16,lam:16,languag:[2,4,11,16,17,19,20,22,23],last:[16,17],latex:[7,17],learn:[13,16,23],leav:[],lee:[2,16,18],left:[5,20,21],lemma:20,len:[14,16,21,22],length:[1,13,15,20,23],leoi5hang4:[16,20,21],less:11,let:20,letter:[17,21],level:[17,20,21],lib:17,librari:[2,13,16,17,20,23],licens:[1,2,17,19,23],like:[2,19,20,22,23],likewis:21,limit:19,line:[1,8,17,20],linguist:[2,11,18,19,21],link:1,list:[1,3,5,7,8,9,10,13,17,20,21],liter:[],litong:[16,18],lo1:21,load:23,local:[2,17],logo:[],longer:13,longest:[13,23],look:[],low:[8,17],lowercas:20,luk2:21,luke:2,m4goi1:17,m4hai6:21,machin:21,made:20,mai6:21,mai:[2,4,17,20,21,22],maintain:[],maintein:16,major:19,make:2,mani:[20,22,23],map:[1,11,19,20],march:18,mark:[3,17],marker:[8,17],master:[],match:[2,4,5,12,13,20,21,23],match_entire_word:20,matter:[3,17],max_word_length:[15,23],maxim:13,maximum:[1,13,15,23],mean:[16,19,20],media:16,memori:20,metadata:[],metadata_method:[],methdo:[],method:[1,4,15,16,21],might:[17,19],minim:[],minimum:2,mit:16,mix:21,mlu:20,mlum:20,mluw:20,model:[1,3,10,13,15,17,19,23],modifi:16,modul:17,month:20,mor:20,more:[1,5,16,19,20,21,23],morphem:20,most:[16,17,20],mot:20,mother:20,motiv:2,mou5dak1:[16,21],much:[],multipl:[7,8,9,16,17,20],n_file:[],name:[1,2,16],nasal:[1,17],natur:[11,16,19,22,23],necessari:[2,17,20,22,23],necessit:17,need:17,nei5:21,neighbor:21,neither:21,ngram:[],nlp:[],nltk:[1,20],non:[],none:[3,5,11,13,14,15,17,20],nor:21,note:[16,18,21],notic:[],noun:[10,19],novemb:[],now:[1,3],ntu:[10,11,19],nuclei:17,nucleu:[1,5,9,16,17,20,21],number:[16,17,20,21],number_of_charact:1,number_of_fil:20,number_of_utter:20,number_of_word:1,numer:17,numpydoc:1,object:[1,6,12,13,15,20,21,23],occurr:19,odd:19,off:19,offer:17,often:[22,23],ohio:18,on25:[7,17],onc:[],one:[1,2,5,7,8,9,10,20],ones:22,onli:[1,4,5,12,19,20,21],onset:[1,5,8,9,16,17,20,21],onward:1,open:[1,2],option:[2,5,8,10,11,13,14,15,20,22],orb:1,order:[16,21],org:[1,5,10,11,19,20],organ:[5,20],origin:[1,10,11,16,19,20],orthograph:[],other:[1,2,8,17,21],otherwis:[5,20,21],our:[],output:[3,5,8,16,17,20],over:[10,11,19],overal:1,overridden:2,owner:2,packag:[1,17],pad:20,page:[],pair:[10,19,20],paramet:[1,2,3,4,5,7,8,9,10,11,12,13,14,15,20,21],parent:[4,20],pars:[1,2,9,16,21],parse_jyutp:[1,16,17],part:[1,5,8,10,11,16,17,20],part_of_speech_tag:20,particip:[1,5,20],participant_cod:20,particularli:17,pass:[4,12,21,23],path:[1,2,4,5,12,20],pattern:[2,20],per:[],perceptron:[10,19],perform:[20,21],perhap:19,permiss:19,phonolog:[5,17,20],phrase:[1,10,19],pick:1,piggyback:1,pin:1,pinjam:[17,21],pip:16,pleas:[2,5,16,17,19,20],plu:[1,5,20,21],point:1,pop:[],pop_left:[],pos:[5,10,11,16,19,20,21],pos_tag:[1,19],possibl:[1,21],post:[],potenti:[17,19,23],power:21,pprint:[16,21],pre:[],preced:21,predict:10,prefix:[],preprocess:[],pretti:21,preval:[5,20],previou:[8,17],previous:[1,3],print:[16,21],process:[11,16,17,19,22,23],product:20,programmat:20,pron:[10,19],pronoun:22,pronunci:17,proper:[],prove:17,provid:[11,13,17,19,20,21,22,23],ptk:21,ptk_tone2:21,punct:[10,19],punctuat:[3,17],purpos:[1,2,11,21],pycantones:[1,2,17,18,19,20,21,22,23],pylangacq:[1,2,4,20],pypi:1,python3:17,python:[1,2,21],qualiti:[1,19],queri:16,question:[],quot:[8,17],rachel:16,rais:[1,5,7,8,9,10,17,20],random:[],rang:[1,5,16,20],rather:1,ratio:20,read:[1,12,17],read_chat:[2,20],reader:[1,4,12,16],readm:[2,16],readthedoc:1,recent:[16,17],recogn:20,record:20,recurs:[],refer:[16,20],reflect:[],regex:[5,20],regular:[16,21],rel:[19,20,21],relat:[20,21],releas:[2,16,17,23],relev:17,remark:20,remot:[],remov:[14,20,22],render:20,replac:[1,3,7,8],report:16,repositori:[],repr:17,repres:[3,17,21],represent:16,request:16,requir:[1,16],research:[2,16,20,21],reset:20,resourc:17,respect:21,restrict:21,restructur:1,result:[1,16,19,20,23],revis:1,rich:2,richielo:16,right:[5,20,21],rime:[1,3,13,16,17,23],rime_cantones:16,rise:[17,21],robin:16,roman:[1,3,5,7,8,9,16,20,21],rst:1,run:[],ryan:16,rylanchiu:16,safe:20,same:[21,23],sarah:[],satisfi:[],scheme:17,search:[1,16,20],search_item:20,second:21,section:[],secur:[],see:[2,5,10,16,17,20,21],seem:17,segment:[1,3,5,10,16,17,19,20],select:[],self:[],semant:21,sens:[],sent:[5,20,21],sent_rang:[5,20,21],sent_str:[],sentenc:[1,5,10,13,16,19,20],separ:17,septemb:[16,18],set:[13,14,17,20,21,22],shoe:[10,19],should:2,show:[16,21],shown:20,signatur:[],similar:20,similarli:22,simpl:[20,23],simpli:[],sinc:19,singl:[2,8,20,21],situat:23,size:19,slide:[16,18],small:19,smaller:[],snippet:1,snowman:16,social:16,soek2:21,some:[4,20],sophist:19,sort:20,sorted_by_ag:20,sourc:[1,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,20],space:[20,23],span:[5,20,21],speak:[3,16,17,21],specif:[1,19,21],specifi:[2,20,21,23],speech:[1,5,10,11,16,20],split:20,stabl:16,standalon:17,standard:[2,19],start:20,state:18,statist:19,stdin:17,step:[],stephan:16,still:[17,19,23],stiller:16,stop:[1,14,16],stop_wds1:[],stop_wds2:[],stop_word:22,stop_words_1:[14,22],stop_words_2:[14,22],store:[],str:[3,4,5,7,8,9,10,11,12,13,14,15,20,21],string:[1,3,5,8,10,13,16,20,21,22,23],strip:1,structur:20,studi:[],style:1,subclass:[],subject:[],substanti:16,substr:20,suffici:[],suffix:17,suggest:[],suit:1,suppli:1,support:[1,4,5,10,12,20],syllab:[1,17],syllabl:[8,17],syntax:[20,21],system:17,tag:[1,5,10,11,16,20],tagged_s:20,tagged_word:20,tagger:[10,19],tagset:[1,10,11,19,21],take:[1,17,19,20,21,22,23],talk:[16,18],talkbank:[],target:20,task:[11,17,21,22,23],teach:17,teng1:21,term:[5,16,20],territori:22,test:[1,16],tester:[],text:1,than:[1,5,13,19,20,21,23],thank:17,thei:1,them:[],theme:1,thi:[1,2,3,7,8,10,11,13,15,16,17,20,21,23],think:[19,23],those:17,though:23,through:2,thrown:19,tier:20,time:21,tip:[],tipa:[1,7,16],todai:17,togeth:20,token:[5,17,20,21],tone2:21,tone:[5,8,9,16,17,20,21],tool:[16,17,18],top:20,total:21,touch:19,traceback:17,tracker:16,tradit:[5,20],train:[10,13,17,19,23],transcript:[16,20],transpar:1,travel:16,treat:[17,20,22,23],trivial:17,tsui:[16,18],tsz:[16,18],ttr:20,tun55:[7,17],tupl:[1,3,5,9,10,17,20,21],turn:[1,17],twitter:16,two:[17,20],txt:16,type:20,typeerror:10,typic:20,unclear:8,under:2,underli:[1,23],underlyingli:2,unicod:[],union:[],univers:[1,10,11,16,18,19],universaldepend:[10,11,19],unless:[],unrecogn:[7,8,9,11],unreleas:16,unseen:[3,17],unseg:[1,10,13,19,23],unspecifi:[5,20],unstabl:[],unzip:[],upcom:[],updat:20,upgrad:16,uppercas:20,url:[],use:[2,4,17,20,21,22],used:[2,5,10,13,17,20,21,23],useful:21,usefulness:17,user:[1,17],uses:[2,10,11,19],using:21,usr:17,utf8:[2,4,12,20],utf:[1,2],utter:[20,21],uuid:[],valid:17,valu:[1,3,8,17,21],valueerror:[5,7,8,9,10,17,20],varieti:21,variou:[1,17,21],verb:[10,11,16,19,21],version:[1,3,7,8,10,11,13,14,15,16,17,19,20,22,23],versu:[],via:2,wa25:[7,17],waa6:21,waan2:21,wai3:20,wai:23,welcom:[],well:2,what:20,whatev:20,when:[1,17,20,21],where:[1,3,10,23],whether:[17,20,23],which:[2,4,8,10,11,17,19,20,21,22],whitespac:1,who:16,whose:16,wide:[2,21],wildcard:20,window:1,within:[5,20,21],without:20,wong:2,word:[1,2,3,5,10,13,14,15,16,17,19],word_frequ:20,word_ngram:20,word_rang:[5,20,21],word_segment:[13,23],wordlist:1,wordseg:1,work:[19,21,23],workshop:18,worth:19,would:[2,8,11,17,19,20,23],wouldn:19,wrap:[],written:23,x2y:1,x_to_i:1,xxa:20,xxb:20,xxx:[],yale:[1,8,16],year:20,yesterdai:[10,19],yet:20,you:[2,17,19,20,22,23],your:[2,4,16,19,20,22],yuen:16,zan1hai6:21,zero:20,zik6cing4:21,zip:[],zoek2:21,zyu6:21},titles:["API Reference","Changelog","Corpus Data","pycantonese.characters_to_jyutping","pycantonese.corpus.CantoneseCHATReader","pycantonese.corpus.CantoneseCHATReader.search","pycantonese.hkcancor","pycantonese.jyutping_to_tipa","pycantonese.jyutping_to_yale","pycantonese.parse_jyutping","pycantonese.pos_tag","pycantonese.pos_tagging.hkcancor_to_ud","pycantonese.read_chat","pycantonese.segment","pycantonese.stop_words","pycantonese.word_segmentation.Segmenter","PyCantonese: Cantonese Linguistics and NLP in Python","Jyutping Romanization","Research Outputs","Part-of-Speech Tagging","Corpus Reader Methods","Corpus Search Queries","Stop Words","Word Segmentation"],titleterms:{"0dev":1,"2014":1,"2015":1,"2016":1,"2018":1,"2020":1,"2021":1,"break":1,Added:1,The:[2,20],access:[2,20],acknowledg:16,api:[0,1,20],built:2,cantones:16,cantonesechatread:[4,5],chang:1,changelog:1,charact:[17,21],characters2jyutp:[],characters_to_jyutp:3,chat:2,chines:21,cite:16,content:16,convers:17,corpu:[0,2,4,5,20,21],criteria:21,custom:[2,23],data:[0,2],deprec:1,develop:[],download:16,element:21,etc:[],exampl:16,fix:1,format:[2,21],full:20,handl:[],hkcancor:6,hkcancor_to_ud:11,how:16,instal:16,introduct:[],jyutp:[0,17,21],jyutping2tipa:[],jyutping2yal:[],jyutping_to_tipa:7,jyutping_to_yal:8,languag:0,librari:[],licens:16,linguist:16,link:16,logo:16,metadata:[],method:20,multipl:21,natur:0,nlp:16,non:1,note:20,output:[18,21],pars:17,parse_jyutp:9,part:[19,21],perform:[],pos_tag:[10,11],process:0,pycantones:[3,4,5,6,7,8,9,10,11,12,13,14,15,16],python:16,queri:21,quick:16,rang:21,read:[],read_chat:12,reader:20,refer:0,remov:1,represent:20,research:18,result:21,roman:[0,17],search:[5,21],secur:1,segment:[13,15,23],sentenc:21,speech:[19,21],stop:22,stop_word:14,string:17,support:[],tabl:16,tag:[19,21],task:[],technic:[],tipa:17,transcript:2,unreleas:1,word:[20,21,22,23],word_segment:15,yale:17}}) \ No newline at end of file