feat(options): add 読点 and 句点 as options

azu · azu · commit d62518749786 · 2021-04-08T18:10:56.000+09:00
diff --git a/package.json b/package.json
@@ -30,9 +30,13 @@
     "build": "textlint-scripts build",
     "watch": "textlint-scripts build --watch",
     "prepublish": "npm run --if-present build",
-    "test": "textlint-scripts test"
+    "test": "textlint-scripts test",
+    "prettier": "prettier --write \"**/*.{js,jsx,ts,tsx,css}\"",
+    "prepare": "git config --local core.hooksPath .githook"
   },
   "devDependencies": {
+    "lint-staged": "^10.5.4",
+    "prettier": "^2.2.1",
     "textlint-scripts": "^3.0.0"
   },
   "dependencies": {
@@ -41,5 +45,16 @@
     "structured-source": "^3.0.2",
     "textlint-rule-helper": "^2.0.0",
     "textlint-util-to-string": "^3.1.1"
+  },
+  "prettier": {
+    "singleQuote": false,
+    "printWidth": 120,
+    "tabWidth": 4,
+    "trailingComma": "none"
+  },
+  "lint-staged": {
+    "*.{js,jsx,ts,tsx,css}": [
+      "prettier --write"
+    ]
   }
 }
diff --git a/src/max-ten.js b/src/max-ten.js
@@ -1,20 +1,25 @@
 // LICENSE : MIT
 "use strict";
-import { RuleHelper } from "textlint-rule-helper"
+import { RuleHelper } from "textlint-rule-helper";
 import { getTokenizer } from "kuromojin";
 import { splitAST, Syntax as SentenceSyntax } from "sentence-splitter";
 import { StringSource } from "textlint-util-to-string";
+import { SeparatorParser } from "sentence-splitter/lib/parser/SeparatorParser";
 
 const defaultOptions = {
-    max: 3, // 1文に利用できる最大の、の数
-    strict: false // 例外ルールを適応するかどうか
+    // 1文に利用できる最大の、の数
+    max: 3,
+    // 例外ルールを適用するかどうか
+    strict: false,
+    // 読点として扱う文字
+    // https://ja.wikipedia.org/wiki/%E8%AA%AD%E7%82%B9
+    touten: "、",
+    // 句点として扱う文字
+    // https://ja.wikipedia.org/wiki/%E5%8F%A5%E7%82%B9
+    kuten: "。"
 };
 
-function isSandwichedMeishi({
-                                before,
-                                token,
-                                after
-                            }) {
+function isSandwichedMeishi({ before, token, after }) {
     if (before === undefined || after === undefined || token === undefined) {
         return false;
     }
@@ -23,20 +28,31 @@ function isSandwichedMeishi({
 
 /**
  * @param {RuleContext} context
- * @param {object} [options]
+ * @param {typeof defaultOptions} [options]
  */
 module.exports = function (context, options = {}) {
-    const maxLen = options.max || defaultOptions.max;
-    const isStrict = options.strict || defaultOptions.strict;
+    const maxLen = options.max ?? defaultOptions.max;
+    const isStrict = options.strict ?? defaultOptions.strict;
+    const touten = options.touten ?? defaultOptions.touten;
+    const kuten = options.kuten ?? defaultOptions.kuten;
     const helper = new RuleHelper(context);
     const { Syntax, RuleError, report, getSource } = context;
     return {
         [Syntax.Paragraph](node) {
             if (helper.isChildNode(node, [Syntax.BlockQuote])) {
                 return;
             }
-            const resultNode = splitAST(node);
-            const sentences = resultNode.children.filter(childNode => childNode.type === SentenceSyntax.Sentence);
+            const resultNode = splitAST(node, {
+                SeparatorParser: {
+                    separatorCharacters: [
+                        "?", // question mark
+                        "!", // exclamation mark
+                        "？", // (ja) zenkaku question mark
+                        "！" // (ja) zenkaku exclamation mark
+                    ].concat(kuten)
+                }
+            });
+            const sentences = resultNode.children.filter((childNode) => childNode.type === SentenceSyntax.Sentence);
             /*
              <p>
              <str><code><img><str>
@@ -49,18 +65,18 @@ module.exports = function (context, options = {}) {
              2. sentence to tokens
              3. check tokens
              */
-            return getTokenizer().then(tokenizer => {
-                sentences.forEach(sentence => {
+            return getTokenizer().then((tokenizer) => {
+                sentences.forEach((sentence) => {
                     const source = new StringSource(sentence);
                     const text = source.toString();
                     const tokens = tokenizer.tokenizeForSentence(text);
                     let currentTenCount = 0;
                     let lastToken = null;
                     tokens.forEach((token, index) => {
-                        let surface = token.surface_form;
-                        if (surface === "、") {
+                        const surface = token.surface_form;
+                        if (surface === touten) {
                             // 名詞に囲まわれている場合は例外とする
-                            let isSandwiched = isSandwichedMeishi({
+                            const isSandwiched = isSandwichedMeishi({
                                 before: tokens[index - 1],
                                 token: token,
                                 after: tokens[index + 1]
@@ -80,15 +96,18 @@ module.exports = function (context, options = {}) {
                         if (currentTenCount >= maxLen) {
                             const positionInSentence = source.originalIndexFromIndex(lastToken.word_position - 1);
                             const index = sentence.range[0] + positionInSentence;
-                            const ruleError = new context.RuleError(`一つの文で"、"を${maxLen}つ以上使用しています`, {
-                                index
-                            });
+                            const ruleError = new context.RuleError(
+                                `一つの文で"${touten}"を${maxLen}つ以上使用しています`,
+                                {
+                                    index
+                                }
+                            );
                             report(node, ruleError);
                             currentTenCount = 0;
                         }
                     });
                 });
             });
         }
-    }
-}
+    };
+};
diff --git a/test/max-ten-test.js b/test/max-ten-test.js
@@ -1,9 +1,11 @@
-const rule = require("../src/max-ten");
+import TextLintTester from "textlint-tester";
+import rule from "../src/max-ten";
+
 function textIncludeTen(count) {
-    return (new Array(count + 1)).join("テスト文章において、") + "です";
+    return new Array(count + 1).join("テスト文章において、") + "です";
 }
-var TextLintTester = require("textlint-tester");
-var tester = new TextLintTester();
+
+const tester = new TextLintTester();
 // ruleName, rule, expected[]
 tester.run("max-ten", rule, {
     // default max:3
@@ -17,19 +19,31 @@ tester.run("max-ten", rule, {
         {
             text: textIncludeTen(5 - 1),
             options: {
-                "max": 5
+                max: 5
             }
         },
         {
             text: "これは、テストです。"
+        },
+        {
+            text: "これは、これは、これは、これは、オプションでカウントされないのでOK",
+            options: {
+                touten: "，",
+                kuten: "．"
+            }
+        },
+        {
+            text: `これは，これは．これは，これは．`,
+            options: {
+                touten: "，",
+                kuten: "．"
+            }
         }
-
     ],
     invalid: [
         {
             text: `これは、これは、これは
-、d`
-            ,
+、d`,
             errors: [
                 {
                     message: `一つの文で"、"を3つ以上使用しています`,
@@ -38,10 +52,23 @@ tester.run("max-ten", rule, {
                 }
             ]
         },
+        {
+            text: `これは，これは，これは，これは。`,
+            errors: [
+                {
+                    message: `一つの文で"，"を3つ以上使用しています`,
+                    index: 11
+                }
+            ],
+            options: {
+                touten: "，",
+                kuten: "．"
+            }
+        },
         {
             text: textIncludeTen(5),
             options: {
-                "max": 5
+                max: 5
             },
             errors: [
                 {
@@ -52,7 +79,7 @@ tester.run("max-ten", rule, {
         {
             text: `これは、長文の例ですが、columnがちゃんと計算、されてるはずです。`,
             options: {
-                "max": 3
+                max: 3
             },
             errors: [
                 {
@@ -65,7 +92,7 @@ tester.run("max-ten", rule, {
         {
             text: "間に、Str以外の`code`Nodeが、あっても、OK",
             options: {
-                "max": 3
+                max: 3
             },
             errors: [
                 {
@@ -78,7 +105,7 @@ tester.run("max-ten", rule, {
         {
             text: `複数のセンテンスがある場合。これでも、columnが、ちゃんと計算、されているはずです。`,
             options: {
-                "max": 3
+                max: 3
             },
             errors: [
                 {
@@ -91,7 +118,7 @@ tester.run("max-ten", rule, {
         {
             text: `複数のセンテンスがあって、改行されている場合でも\n大丈夫です。これでも、lineとcolumnが、ちゃんと計算、されているはずです。`,
             options: {
-                "max": 3
+                max: 3
             },
             errors: [
                 {
@@ -102,4 +129,4 @@ tester.run("max-ten", rule, {
             ]
         }
     ]
-});
+});
diff --git a/yarn.lock b/yarn.lock

Original file line number	Diff line number	Diff line change
`@@ -1,9 +1,11 @@`
`1`		`-const rule = require("../src/max-ten");`
	`1`	`+import TextLintTester from "textlint-tester";`
	`2`	`+import rule from "../src/max-ten";`
	`3`	`+`
`2`	`4`	`function textIncludeTen(count) {`
`3`		`- return (new Array(count + 1)).join("テスト文章において、") + "です";`
	`5`	`+ return new Array(count + 1).join("テスト文章において、") + "です";`
`4`	`6`	`}`
`5`		`-var TextLintTester = require("textlint-tester");`
`6`		`-var tester = new TextLintTester();`
	`7`	`+`
	`8`	`+const tester = new TextLintTester();`
`7`	`9`	`// ruleName, rule, expected[]`
`8`	`10`	`tester.run("max-ten", rule, {`
`9`	`11`	`// default max:3`
`@@ -17,19 +19,31 @@ tester.run("max-ten", rule, {`
`17`	`19`	`{`
`18`	`20`	`text: textIncludeTen(5 - 1),`
`19`	`21`	`options: {`
`20`		`- "max": 5`
	`22`	`+ max: 5`
`21`	`23`	`}`
`22`	`24`	`},`
`23`	`25`	`{`
`24`	`26`	`text: "これは、テストです。"`
	`27`	`+ },`
	`28`	`+ {`
	`29`	`+ text: "これは、これは、これは、これは、オプションでカウントされないのでOK",`
	`30`	`+ options: {`
	`31`	`+ touten: "，",`
	`32`	`+ kuten: "．"`
	`33`	`+ }`
	`34`	`+ },`
	`35`	`+ {`
	`36`	+ text: `これは，これは．これは，これは．`,
	`37`	`+ options: {`
	`38`	`+ touten: "，",`
	`39`	`+ kuten: "．"`
	`40`	`+ }`
`25`	`41`	`}`
`26`		`-`
`27`	`42`	`],`
`28`	`43`	`invalid: [`
`29`	`44`	`{`
`30`	`45`	text: `これは、これは、これは
`31`		-、d`
`32`		`- ,`
	`46`	+、d`,
`33`	`47`	`errors: [`
`34`	`48`	`{`
`35`	`49`	message: `一つの文で"、"を3つ以上使用しています`,
`@@ -38,10 +52,23 @@ tester.run("max-ten", rule, {`
`38`	`52`	`}`
`39`	`53`	`]`
`40`	`54`	`},`
	`55`	`+ {`
	`56`	+ text: `これは，これは，これは，これは。`,
	`57`	`+ errors: [`
	`58`	`+ {`
	`59`	+ message: `一つの文で"，"を3つ以上使用しています`,
	`60`	`+ index: 11`
	`61`	`+ }`
	`62`	`+ ],`
	`63`	`+ options: {`
	`64`	`+ touten: "，",`
	`65`	`+ kuten: "．"`
	`66`	`+ }`
	`67`	`+ },`
`41`	`68`	`{`
`42`	`69`	`text: textIncludeTen(5),`
`43`	`70`	`options: {`
`44`		`- "max": 5`
	`71`	`+ max: 5`
`45`	`72`	`},`
`46`	`73`	`errors: [`
`47`	`74`	`{`
`@@ -52,7 +79,7 @@ tester.run("max-ten", rule, {`
`52`	`79`	`{`
`53`	`80`	text: `これは、長文の例ですが、columnがちゃんと計算、されてるはずです。`,
`54`	`81`	`options: {`
`55`		`- "max": 3`
	`82`	`+ max: 3`
`56`	`83`	`},`
`57`	`84`	`errors: [`
`58`	`85`	`{`
`@@ -65,7 +92,7 @@ tester.run("max-ten", rule, {`
`65`	`92`	`{`
`66`	`93`	text: "間に、Str以外の`code`Nodeが、あっても、OK",
`67`	`94`	`options: {`
`68`		`- "max": 3`
	`95`	`+ max: 3`
`69`	`96`	`},`
`70`	`97`	`errors: [`
`71`	`98`	`{`
`@@ -78,7 +105,7 @@ tester.run("max-ten", rule, {`
`78`	`105`	`{`
`79`	`106`	text: `複数のセンテンスがある場合。これでも、columnが、ちゃんと計算、されているはずです。`,
`80`	`107`	`options: {`
`81`		`- "max": 3`
	`108`	`+ max: 3`
`82`	`109`	`},`
`83`	`110`	`errors: [`
`84`	`111`	`{`
`@@ -91,7 +118,7 @@ tester.run("max-ten", rule, {`
`91`	`118`	`{`
`92`	`119`	text: `複数のセンテンスがあって、改行されている場合でも\n大丈夫です。これでも、lineとcolumnが、ちゃんと計算、されているはずです。`,
`93`	`120`	`options: {`
`94`		`- "max": 3`
	`121`	`+ max: 3`
`95`	`122`	`},`
`96`	`123`	`errors: [`
`97`	`124`	`{`
`@@ -102,4 +129,4 @@ tester.run("max-ten", rule, {`
`102`	`129`	`]`
`103`	`130`	`}`
`104`	`131`	`]`
`105`		`-});`
	`132`	`+});`