Overview
Comment: | [graphspell][core] tokenizer: rename ELPFX tokens to WORD_ELIDED |
---|---|
Downloads: | Tarball | ZIP archive | SQL archive |
Timelines: | family | ancestors | descendants | both | core | graphspell | rg |
Files: | files | file ages | folders |
SHA3-256: | a1b165e27617202e63311b572053dbd7 |
User & Date: | olr on 2018-06-28 07:53:20 |
Original Comment: | [graphspell][core] rename ELPFX tokens to WORD_ELIDED |
Other Links: | branch diff | manifest | tags |
Context
2018-06-28
| ||
08:00 | [graphspell] tokenizer: rename ORDINAL tokens to WORD_ORDINAL check-in: 20dbc28ded user: olr tags: graphspell, rg | |
07:53 | [graphspell][core] tokenizer: rename ELPFX tokens to WORD_ELIDED check-in: a1b165e276 user: olr tags: core, graphspell, rg | |
2018-06-27
| ||
23:39 | [build][fix] check regexes: memorize checked regexes check-in: 74d9c8e099 user: olr tags: build, rg | |
Changes
Modified gc_lang/fr/modules-js/lexicographe.js from [823f277d47] to [6f858d6849].
︙ | ︙ | |||
83 84 85 86 87 88 89 | [':O2', [" 2ᵉ pers.,", "Pronom : 2ᵉ personne"]], [':O3', [" 3ᵉ pers.,", "Pronom : 3ᵉ personne"]], [':C', [" conjonction,", "Conjonction"]], [':Ĉ', [" conjonction (él.),", "Conjonction (élément)"]], [':Cc', [" conjonction de coordination,", "Conjonction de coordination"]], [':Cs', [" conjonction de subordination,", "Conjonction de subordination"]], [':Ĉs', [" conjonction de subordination (él.),", "Conjonction de subordination (élément)"]], | | | 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 | [':O2', [" 2ᵉ pers.,", "Pronom : 2ᵉ personne"]], [':O3', [" 3ᵉ pers.,", "Pronom : 3ᵉ personne"]], [':C', [" conjonction,", "Conjonction"]], [':Ĉ', [" conjonction (él.),", "Conjonction (élément)"]], [':Cc', [" conjonction de coordination,", "Conjonction de coordination"]], [':Cs', [" conjonction de subordination,", "Conjonction de subordination"]], [':Ĉs', [" conjonction de subordination (él.),", "Conjonction de subordination (élément)"]], [':Ñ', [" locution nominale (él.),", "Locution nominale (élément)"]], [':Â', [" locution adjectivale (él.),", "Locution adjectivale (élément)"]], [':Ṽ', [" locution verbale (él.),", "Locution verbale (élément)"]], [':Ŵ', [" locution adverbiale (él.),", "Locution adverbiale (élément)"]], [':Ŕ', [" locution prépositive (él.),", "Locution prépositive (élément)"]], [':Ĵ', [" locution interjective (él.),", "Locution interjective (élément)"]], |
︙ | ︙ | |||
261 262 263 264 265 266 267 | case 'LINK': return { sType: oToken.sType, sValue: oToken.sValue.slice(0, 40) + "…", aLabel: ["hyperlien"] }; break; | | | 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 | case 'LINK': return { sType: oToken.sType, sValue: oToken.sValue.slice(0, 40) + "…", aLabel: ["hyperlien"] }; break; case 'WORD_ELIDED': let sTemp = oToken.sValue.replace("’", "").replace("'", "").replace("`", "").toLowerCase(); return { sType: oToken.sType, sValue: oToken.sValue, aLabel: [_dElidedPrefix.gl_get(sTemp, "préfixe élidé inconnu")] }; break; |
︙ | ︙ | |||
452 453 454 455 456 457 458 | let aTokenList = this.getListOfTokens(sText.replace("'", "’").trim(), false); let iKey = 0; let aElem = []; do { let oToken = aTokenList[iKey]; let sMorphLoc = ''; let aTokenTempList = [oToken]; | | | 452 453 454 455 456 457 458 459 460 461 462 463 464 465 466 | let aTokenList = this.getListOfTokens(sText.replace("'", "’").trim(), false); let iKey = 0; let aElem = []; do { let oToken = aTokenList[iKey]; let sMorphLoc = ''; let aTokenTempList = [oToken]; if (oToken.sType == "WORD" || oToken.sType == "WORD_ELIDED"){ let iKeyTree = iKey + 1; let oLocNode = this.oLocGraph[oToken.sValue.toLowerCase()]; while (oLocNode) { let oTokenNext = aTokenList[iKeyTree]; iKeyTree++; if (oTokenNext) { oLocNode = oLocNode[oTokenNext.sValue.toLowerCase()]; |
︙ | ︙ |
Modified gc_lang/fr/webext/content_scripts/panel_lxg.css from [60aef30035] to [83fe0f37d1].
︙ | ︙ | |||
86 87 88 89 90 91 92 | } div.grammalecte_lxg_token_LOC { background-color: hsla(150, 50%, 30%, 1); } div.grammalecte_lxg_token_WORD { background-color: hsla(150, 50%, 50%, 1); } | | | 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 | } div.grammalecte_lxg_token_LOC { background-color: hsla(150, 50%, 30%, 1); } div.grammalecte_lxg_token_WORD { background-color: hsla(150, 50%, 50%, 1); } div.grammalecte_lxg_token_WORD_ELIDED { background-color: hsla(150, 30%, 50%, 1); } div.grammalecte_lxg_token_UNKNOWN { background-color: hsla(0, 50%, 50%, 1); } div.grammalecte_lxg_token_NUM { background-color: hsla(180, 50%, 50%, 1); |
︙ | ︙ |
Modified gc_lang/fr/xpi/data/lxg_panel.css from [3d666aa76c] to [0f0ad23b15].
︙ | ︙ | |||
54 55 56 57 58 59 60 | padding: 2px 5px; border-radius: 2px; text-decoration: none; } #wordlist b.WORD { background-color: hsla(150, 50%, 50%, 1); } | | | 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 | padding: 2px 5px; border-radius: 2px; text-decoration: none; } #wordlist b.WORD { background-color: hsla(150, 50%, 50%, 1); } #wordlist b.WORD_ELIDED { background-color: hsla(150, 30%, 50%, 1); } #wordlist b.UNKNOWN { background-color: hsla(0, 50%, 50%, 1); } #wordlist b.NUM { background-color: hsla(180, 50%, 50%, 1); |
︙ | ︙ |
Modified graphspell-js/tokenizer.js from [5f94dc04ea] to [8dd855b1b3].
︙ | ︙ | |||
38 39 40 41 42 43 44 | [/^[,.;:!?…«»“”‘’"(){}\[\]·–—]/, 'SEPARATOR'], [/^[A-Z][.][A-Z][.](?:[A-Z][.])*/, 'ACRONYM'], [/^(?:https?:\/\/|www[.]|[a-zA-Zà-öÀ-Ö0-9ø-ÿØ-ßĀ-ʯfi-st_-]+[@.][a-zA-Zà-öÀ-Ö0-9ø-ÿØ-ßĀ-ʯfi-st_-]{2,}[@.])[a-zA-Z0-9][a-zA-Zà-öÀ-Ö0-9ø-ÿØ-ßĀ-ʯfi-st_.\/?&!%=+*"'@$#-]+/, 'LINK'], [/^[#@][a-zA-Zà-öÀ-Ö0-9ø-ÿØ-ßĀ-ʯfi-st_-]+/, 'TAG'], [/^<[a-zA-Zà-öÀ-Ö0-9ø-ÿØ-ßĀ-ʯfi-st]+.*?>|<\/[a-zA-Zà-öÀ-Ö0-9ø-ÿØ-ßĀ-ʯfi-st]+ *>/, 'HTML'], [/^\[\/?[a-zA-Zà-öÀ-Ö0-9ø-ÿØ-ßĀ-ʯfi-st]+\]/, 'PSEUDOHTML'], [/^&\w+;(?:\w+;|)/, 'HTMLENTITY'], | | | 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 | [/^[,.;:!?…«»“”‘’"(){}\[\]·–—]/, 'SEPARATOR'], [/^[A-Z][.][A-Z][.](?:[A-Z][.])*/, 'ACRONYM'], [/^(?:https?:\/\/|www[.]|[a-zA-Zà-öÀ-Ö0-9ø-ÿØ-ßĀ-ʯfi-st_-]+[@.][a-zA-Zà-öÀ-Ö0-9ø-ÿØ-ßĀ-ʯfi-st_-]{2,}[@.])[a-zA-Z0-9][a-zA-Zà-öÀ-Ö0-9ø-ÿØ-ßĀ-ʯfi-st_.\/?&!%=+*"'@$#-]+/, 'LINK'], [/^[#@][a-zA-Zà-öÀ-Ö0-9ø-ÿØ-ßĀ-ʯfi-st_-]+/, 'TAG'], [/^<[a-zA-Zà-öÀ-Ö0-9ø-ÿØ-ßĀ-ʯfi-st]+.*?>|<\/[a-zA-Zà-öÀ-Ö0-9ø-ÿØ-ßĀ-ʯfi-st]+ *>/, 'HTML'], [/^\[\/?[a-zA-Zà-öÀ-Ö0-9ø-ÿØ-ßĀ-ʯfi-st]+\]/, 'PSEUDOHTML'], [/^&\w+;(?:\w+;|)/, 'HTMLENTITY'], [/^(?:l|d|n|m|t|s|j|c|ç|lorsqu|puisqu|jusqu|quoiqu|qu)['’`]/i, 'WORD_ELIDED'], [/^\d\d?[hm]\d\d\b/, 'HOUR'], [/^\d+(?:ers?|nds?|es?|des?|ièmes?|èmes?|emes?|ᵉʳˢ?|ⁿᵈˢ?|ᵉˢ?|ᵈᵉˢ?)\b/, 'ORDINAL'], [/^-?\d+(?:[.,]\d+|)/, 'NUM'], [/^[%‰+=*/<>⩾⩽-]/, 'SIGN'], [/^[a-zA-Zà-öÀ-Ö0-9ø-ÿØ-ßĀ-ʯfi-st]+(?:[’'`-][a-zA-Zà-öÀ-Ö0-9ø-ÿØ-ßĀ-ʯfi-st]+)*/, 'WORD'] ] }; |
︙ | ︙ |
Modified graphspell/tokenizer.py from [7c766445e1] to [8cf6a6bb2e].
︙ | ︙ | |||
27 28 29 30 31 32 33 | r'(?P<FOLDERWIN>[a-zA-Z]:\\(?:Program Files(?: [(]x86[)]|)|[\w.()]+)(?:\\[\w.()-]+)*)', r'(?P<PUNC>[][,.;:!?…«»“”‘’"(){}·–—])', r'(?P<ACRONYM>[A-Z][.][A-Z][.](?:[A-Z][.])*)', r'(?P<LINK>(?:https?://|www[.]|\w+[@.]\w\w+[@.])\w[\w./?&!%=+*"\'@$#-]+)', r'(?P<HASHTAG>[#@][\w-]+)', r'(?P<HTML><\w+.*?>|</\w+ *>)', r'(?P<PSEUDOHTML>\[/?\w+\])', | | | 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 | r'(?P<FOLDERWIN>[a-zA-Z]:\\(?:Program Files(?: [(]x86[)]|)|[\w.()]+)(?:\\[\w.()-]+)*)', r'(?P<PUNC>[][,.;:!?…«»“”‘’"(){}·–—])', r'(?P<ACRONYM>[A-Z][.][A-Z][.](?:[A-Z][.])*)', r'(?P<LINK>(?:https?://|www[.]|\w+[@.]\w\w+[@.])\w[\w./?&!%=+*"\'@$#-]+)', r'(?P<HASHTAG>[#@][\w-]+)', r'(?P<HTML><\w+.*?>|</\w+ *>)', r'(?P<PSEUDOHTML>\[/?\w+\])', r"(?P<WORD_ELIDED>(?:l|d|n|m|t|s|j|c|ç|lorsqu|puisqu|jusqu|quoiqu|qu)['’`])", r'(?P<ORDINAL>\d+(?:ers?|nds?|es?|des?|ièmes?|èmes?|emes?|ᵉʳˢ?|ⁿᵈˢ?|ᵉˢ?|ᵈᵉˢ?)\b)', r'(?P<HOUR>\d\d?h\d\d\b)', r'(?P<NUM>-?\d+(?:[.,]\d+|))', r'(?P<SIGN>[%‰+=*/<>⩾⩽-])', r"(?P<WORD>\w+(?:[’'`-]\w+)*)" ) } |
︙ | ︙ |