Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Cb changes 20241203 #11081

Merged
merged 4 commits into from
Dec 4, 2024
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Original file line number Diff line number Diff line change
Expand Up @@ -26865,6 +26865,17 @@ Apostolos Tzitzikostas
Christophe Hansen
Glenn Micallef
Pam Bondi
Standard Oil
Oxford Circus
Oxford Street
Vinci Autoroutes
VINCI Autoroutes
Jardine Matheson
Dagens Nyheter
Opel Grandland
Vauxhall Grandland
Ko Samui
Koh Samui
Qeshm Air
Santiago Posteguillo
Portia de Rossi
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -80,17 +80,68 @@ public class CompoundInfinitivRule extends Rule {
token("an"),
token("zu")
),
Arrays.asList( // "Hab keine Lust, mir Gedanken darüber zu machen."
token("Gedanken"),
Arrays.asList(
tokenRegex("dazu|darüber"),
token("zu"),
token("machen")
),
Arrays.asList( // "um dort die Nacht über zu stehen."
tokenRegex("Spiel|Tag|Nacht|Morgen|Nachmittag|Abend|Zeit|.+zeit"),
Arrays.asList(
token("kurz"),
token("davor"),
token("zu")
),
Arrays.asList(
tokenRegex("Jahr|Monat|Zeit"),
token("über"),
token("zu")
),
Arrays.asList(
token("endlich"),
token("wieder"),
token("zu")
),
Arrays.asList(
token("bis"),
token("hin"),
token("zu")
),
Arrays.asList(
token("von"),
tokenRegex(".*[a-z].*"),
token("her"),
token("zu")
),
Arrays.asList(
tokenRegex("sehr|ganz|äu(ss|ß)erst|zu|nicht|absolut|total|wirklich|möglichst"),
posRegex("ADJ.*"),
token("zu")
),
Arrays.asList(
token("Schritt"),
token("weiter"),
token("zu")
),
Arrays.asList(
token("und"),
token("so"),
token("weiter")
),
Arrays.asList(
token("darauf"),
token("zu"),
posRegex("VER.*"),
token("dass")
),
Arrays.asList(
token("darauf"),
token("zu"),
token("stehen")
posRegex("VER.*"),
token(",")
),
Arrays.asList( // "um dort die Nacht über zu stehen."
tokenRegex("Spiel|Tag|Nacht|Morgen|Nachmittag|Abend|Zeit|.+zeit|Jahr(zehnt)?|Monat|.+tag|Mittwoch|Januar|Februar|März|April|Mai|Juni|Juli|August|September|Oktober|November|Dezember"),
token("über"),
token("zu")
),
Arrays.asList(
token("kurz"),
Expand All @@ -117,6 +168,11 @@ public class CompoundInfinitivRule extends Rule {
token("ab"),
token("zu")
),
Arrays.asList(
token("zu"),
posRegex("ADJ.*"),
token("zu")
),
Arrays.asList(
// "Hin und her zu laufen"
token("hin"),
Expand Down Expand Up @@ -163,8 +219,8 @@ private static PatternToken token(String s) {
public CompoundInfinitivRule(ResourceBundle messages, Language lang, UserConfig userConfig) throws IOException {
super.setCategory(Categories.COMPOUNDING.getCategory(messages));
setLocQualityIssueType(ITSIssueType.Misspelling);
addExamplePair(Example.wrong("Er überprüfte die Rechnungen noch einmal, um ganz <marker>sicher zu gehen</marker>."),
Example.fixed("Er überprüfte die Rechnungen noch einmal, um ganz <marker>sicherzugehen</marker>."));
addExamplePair(Example.wrong("Er überprüfte die Rechnungen noch einmal, um <marker>sicher zu gehen</marker>."),
Example.fixed("Er überprüfte die Rechnungen noch einmal, um <marker>sicherzugehen</marker>."));
this.lang = lang;
if (userConfig != null) {
linguServices = userConfig.getLinguServices();
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -17573,7 +17573,7 @@ Fixierungsprozess
Fixierungsprozesse/NS
Friedrichssegen/S #name
gelingsicher/A
Granola #name
Granola/S #name
Häkeltechnik
Häkeltechniken
Haeckel #name
Expand Down Expand Up @@ -65357,6 +65357,32 @@ Prävalenzfehler/NS
Kondensatwannenheizung
Kondensatwannenheizungen
Drehmomentschrauber/NS
rumkippeln
rumkippel
rumkippelst
rumkippelt
rumkippelte
rumkippelten
rumgekippelt
herumkippeln
herumkippel
herumkippelst
herumkippelt
herumkippelte
herumkippelten
herumgekippelt
purinreich/A
urinreich/A
Erzählcafé/S
Sprachmodell/S
Sprachmodelle/N
mit_meinen
verfassungsimmanent/A
wettbewerbsübergreifend/A
störungsresistent/A
Fasziitis
pronordkoreanisch/A
standortfeindlich/A
Gymnastin
Gymnastinnen
Gewahrsamsbruch/S
Expand Down Expand Up @@ -65405,6 +65431,7 @@ Längerfristigkeit
straßenbündig/A
Durchfahrtssperre/N
Bøgseth/S
AnnenMayKantereit/S
ein_trainieren
eintrainiert/P
Mittelblockerposition
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -3117,6 +3117,8 @@ Pete Hegseth/S #name
Elise Stefanik/S #name
Red Sweep/S
Blue Sweep/S
Ko Samui/S
Koh Samui/S
Ko Lanta/S
Koh Lanta/S
Ko Phangan/S
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -27273,6 +27273,57 @@ Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
<token>nach</token>
<token>zu</token>
</antipattern>
<!-- Antipatterns added below list token sequences ending in (or containing) "zu"
     that should not be reported by the rules of this group. The German example
     readings in the comments are the reviewer's interpretation; confirm against
     the rule's test sentences. -->
<antipattern>
<!-- any form of "reichen", up to 10 tokens skipped, then "aus zu"
     (presumably the separated particle of "ausreichen") -->
<token inflected="yes" skip="10">reichen</token>
<token>aus</token>
<token>zu</token>
</antipattern>
<antipattern>
<!-- any form of "kommen", up to 5 tokens skipped, then "komisch vor zu"
     (presumably "jmdm. komisch vorkommen") -->
<token inflected="yes" skip="5">kommen</token>
<token>komisch</token>
<token>vor</token>
<token>zu</token>
</antipattern>
<antipattern>
<!-- degree/negation word + any token tagged ADJ.* + "zu" -->
<token regexp="yes">sehr|ganz|äu(ß|ss)erst|zu|nicht|total|wirklich|absolut|möglichst</token>
<token postag="ADJ.*" postag_regexp="yes" />
<token>zu</token>
</antipattern>
<antipattern>
<!-- literal "mit zu tun" -->
<token>mit</token>
<token>zu</token>
<token>tun</token>
</antipattern>
<antipattern>
<!-- "von", up to 3 tokens skipped, then "aus zu" (presumably "von … aus") -->
<token skip="3">von</token>
<token>aus</token>
<token>zu</token>
</antipattern>
<antipattern>
<!-- any form of "ziehen", up to 5 tokens skipped, then "vor zu"
     (presumably the separated particle of "vorziehen") -->
<token inflected="yes" skip="5">ziehen</token>
<token>vor</token>
<token>zu</token>
</antipattern>
<antipattern>
<!-- any form of "machen", up to 2 tokens skipped, then "auf zu" -->
<token inflected="yes" skip="2">machen</token>
<token>auf</token>
<token>zu</token>
</antipattern>
<antipattern>
<!-- literal "Angst vor zu" (presumably "Angst vor zu viel …") -->
<token>Angst</token>
<token>vor</token>
<token>zu</token>
</antipattern>
<antipattern>
<!-- literal "vor zu haben"; "haben" is matched only in this exact form -->
<token>vor</token>
<token>zu</token>
<token>haben</token>
</antipattern>
<antipattern>
<!-- any form of "halten" (hält, hielt, …), up to 4 tokens skipped, then "ab zu"
     (presumably the separated particle of "abhalten", e.g. "hält ihn davon ab zu …").
     inflected="yes" matches the sibling verb antipatterns (reichen, kommen, ziehen,
     machen); without it only the literal form "halten" is covered. -->
<token inflected="yes" skip="4">halten</token>
<token>ab</token>
<token>zu</token>
</antipattern>
<rule>
<pattern>
<token postag=".*PRP:.*" postag_regexp="yes">
Expand Down Expand Up @@ -27318,6 +27369,9 @@ Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
<exception>fürs</exception>
<exception>ans</exception>
<exception>mithilfe</exception>
<exception>kraft</exception>
<exception>oberhalb</exception>
<exception>unterhalb</exception>
<exception regexp="yes">.*zeit</exception>
</token>
<token>zu</token>
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -17151,4 +17151,23 @@ Incorrectly touched. <example type="untouched">Incorrect grammar. Those present
<disambig action="ignore_spelling"/>
</rule>
</rulegroup>

<!-- CENSORED_WORDS: marks asterisk-censored profanity so that its fragments are
     ignored by spell checking (disambig action "ignore_spelling").
     Assumes the tokenizer splits the word at "*" into three separate tokens - TODO confirm. -->
<rulegroup id="CENSORED_WORDS" name="ignore spelling of censored words">
<rule>
<!-- "f" + "*" + "ck", optionally followed by the suffix s / ed / ing -->
<pattern>
<token>f</token>
<token>*</token>
<token regexp="yes">ck(s|ed|ing)?</token>
</pattern>
<disambig action="ignore_spelling"/>
</rule>
<rule>
<!-- "sh" or "bullsh" + "*" + "t" -->
<pattern>
<token regexp="yes">(bull)?sh</token>
<token>*</token>
<token>t</token>
</pattern>
<disambig action="ignore_spelling"/>
</rule>
</rulegroup>
</rules>
Original file line number Diff line number Diff line change
Expand Up @@ -10970,6 +10970,11 @@ hardcode
hardcoded
DPA
DPAs
intl
decontrol
decontrols
decontrolled
decontrolling
Swiftie
Swifties
Miraidon
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -531,6 +531,8 @@ indemnifying
indemnifies
indemnifier
indemnifiers
controllability
controlment
organocatalyst
organocatalysts
organocatalysis
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -72199,7 +72199,7 @@ USA
<antipattern>
<token regexp="yes">an?</token>
<token>honors</token>
<token regexp="yes">thesis|major|student|graduate|class|degree|program|diploma|course</token>
<token regexp="yes" inflected="yes">thesis|major|student|graduate|class|degree|program|diploma|course</token>
</antipattern>
<antipattern>
<token>_</token>
Expand Down
Loading