Overview
Comment: | [build] lex_build.py: main() + options |
---|---|
Downloads: | Tarball | ZIP archive | SQL archive |
Timelines: | family | ancestors | descendants | both | trunk | build |
Files: | files | file ages | folders |
SHA3-256: |
e091821b507aa481b740f7a561b0bd3e |
User & Date: | olr on 2017-06-23 13:19:32 |
Other Links: | manifest | tags |
Context
2017-06-23
| ||
14:43 | [core] dawg: accept personal lexicon check-in: 3916c538b5 user: olr tags: trunk, core, new_feature | |
13:19 | [build] lex_build.py: main() + options check-in: e091821b50 user: olr tags: trunk, build | |
12:55 | [build] change arguments order for dictionary building check-in: 4bc364b3ac user: olr tags: trunk, build | |
Changes
Modified lex_build.py from [17cde37b09] to [a7e2785f63].
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 | #!python3 # Lexicon builder from distutils import dir_util import grammalecte.dawg as fsa from grammalecte.ibdawg import IBDAWG def build (spfSrc, sLangName, sDicName, bJSON=False, cStemmingMethod="S", nCompressMethod=1): "transform a text lexicon as a binary indexable dictionary" oDAWG = fsa.DAWG(spfSrc, sLangName, cStemmingMethod) dir_util.mkpath("grammalecte/_dictionaries") oDAWG.writeInfo("grammalecte/_dictionaries/" + sDicName + ".info.txt") oDAWG.createBinary("grammalecte/_dictionaries/" + sDicName + ".bdic", int(nCompressMethod)) if bJSON: dir_util.mkpath("grammalecte-js/_dictionaries") oDic = IBDAWG(sDicName + ".bdic") | > < > > | > > > > > > | | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 | #!python3 # Lexicon builder import argparse from distutils import dir_util import grammalecte.dawg as fsa from grammalecte.ibdawg import IBDAWG def build (spfSrc, sLangName, sDicName, bJSON=False, cStemmingMethod="S", nCompressMethod=1): "transform a text lexicon as a binary indexable dictionary" oDAWG = fsa.DAWG(spfSrc, sLangName, cStemmingMethod) dir_util.mkpath("grammalecte/_dictionaries") oDAWG.writeInfo("grammalecte/_dictionaries/" + sDicName + ".info.txt") oDAWG.createBinary("grammalecte/_dictionaries/" + sDicName + ".bdic", int(nCompressMethod)) if bJSON: dir_util.mkpath("grammalecte-js/_dictionaries") oDic = IBDAWG(sDicName + ".bdic") oDic.writeAsJSObject("grammalecte-js/_dictionaries/" + sDicName + ".json") def main (): xParser = argparse.ArgumentParser() xParser.add_argument("src_lexicon", type=str, help="path and file name of the source lexicon") xParser.add_argument("lang_name", type=str, help="language name") xParser.add_argument("dic_name", type=str, help="dictionary file name (without extension)") xParser.add_argument("-js", "--json", help="Build dictionary in JSON", action="store_true") xParser.add_argument("-s", "--stemming", help="stemming method: S=suffixes, A=affixes, N=no stemming", type=str, choices=["S", "A", "N"], default="S") xParser.add_argument("-c", "--compress", help="compression method: 1, 2 (beta), 3, (beta)", type=int, choices=[1, 2, 3], default=1) xArgs = xParser.parse_args() build(xArgs.src_lexicon, xArgs.lang_name, xArgs.dic_name, xArgs.json) if __name__ == '__main__': main() |