diff --git a/languagetool-language-modules/pt/src/main/resources/org/languagetool/resource/pt/added.txt b/languagetool-language-modules/pt/src/main/resources/org/languagetool/resource/pt/added.txt index e9973de7bae39..f89e8b05b107e 100644 --- a/languagetool-language-modules/pt/src/main/resources/org/languagetool/resource/pt/added.txt +++ b/languagetool-language-modules/pt/src/main/resources/org/languagetool/resource/pt/added.txt @@ -211,3 +211,35 @@ Eds Ed NCMPS00 EF EF NCCS000 BT BT AQ0CN0 Linux Linux AQ0CN0 + +# To be added before 1.2.0 +Vermont Vermont NPMSG00 +Newport Newport NPCSG00 +Connecticut Connecticut NPCSG00 +Delaware Delaware NPCSG00 +Maryland Maryland NPCSG00 +Mississippi Mississippi NPMSG00 +cajun cajun AQ0CN0 +Tennessee Tennessee NPMSG00 +Nashville Nashville NPCSG00 +Kentucky Kentucky NPMSG00 +Iowa Iowa NPMSG00 +Dakota Dakota NPFSG00 +Nebraska Nebraska NPMSG00 +Idaho Idaho NPMSG00 +Oregon Oregon NPMSG00 +Seattle Seattle NPCSG00 +Yukon Yukon NPMSG00 +Saskatchewan Saskatchewan NPCSG00 +Saskatoon Saskatoon NPCSG00 +Manitoba Manitoba NPCSG00 +Winnipeg Winnipeg NPCSG00 +Niágara Niágara NPMSG00 +Hobart Hobart NPCSG00 +Brisbane Brisbane NPCSG00 +Cairns Cairns NPCSG00 +Perth Perth NPCSG00 +outback outback NCMS000 +outbacks outback NCMP000 +Erie Erie NPMSG00 +Huron Huron NPMSG00 diff --git a/languagetool-language-modules/pt/src/main/resources/org/languagetool/resource/pt/entities/english.ent b/languagetool-language-modules/pt/src/main/resources/org/languagetool/resource/pt/entities/english.ent index 1c0f75445d71f..5a9e7d0c651cf 100644 --- a/languagetool-language-modules/pt/src/main/resources/org/languagetool/resource/pt/entities/english.ent +++ b/languagetool-language-modules/pt/src/main/resources/org/languagetool/resource/pt/entities/english.ent @@ -10,7 +10,7 @@ - + @@ -214,10 +214,11 @@ kitchen|(bath|bed)room|survivors?|catch(es)?|caught|tells?|told|forbid(den)?| prohibit(ed|s|ing)?|cats?|strikes?|strikes?|afternoons?|soldiers?|troops?| 
count(y|ies|s)?|earls?|viscounts?|hells?|heavens?|damn|[fs]uck(ing|s|ed|ers?)| - stupid|good|bad|wors[et]|fast(er|est)?|royalty|defen[sc]es?|defend(ed|s|ers?)?| + stupid|good|bad|wors[et]|fast(er|est)?|royal(ty)?|defen[sc]es?|defend(ed|s|ers?)?| chemistry|chemical|chemist|grew|grow([sn]|ing)?|blew|blow([sn]|ing)?| boys?|girls?|ugl(y|ie(r|st))|beaut(y|ies)|robbers?|forever|big(ge(r|st))?| - small(er|est)?|slow(er|est|ly)?|tall(er|est)?|short(ly|er|est)? + small(er|est)?|slow(er|est|ly)?|tall(er|est)?|short(ly|er|est)?| + live[sd]|living|die[sd]|dying|free|gardens? "> diff --git a/languagetool-language-modules/pt/src/main/resources/org/languagetool/resource/pt/multiwords.txt b/languagetool-language-modules/pt/src/main/resources/org/languagetool/resource/pt/multiwords.txt index c78ee50efd526..8389783a778db 100644 --- a/languagetool-language-modules/pt/src/main/resources/org/languagetool/resource/pt/multiwords.txt +++ b/languagetool-language-modules/pt/src/main/resources/org/languagetool/resource/pt/multiwords.txt @@ -820,7 +820,7 @@ Chrome Store NPCNO00_ Ciudad Juárez NPCNG00_ Ciudad Real NPCNG00_ Cliff Richard NPMSSP0_ -Colúmbia Britànica NPCNG00_ +Colúmbia Britânica NPCNG00_ Compra Garantida NPMSO00_ Consell de Cent NPMSO00_ Copy Club NPCSO00_ @@ -12053,3 +12053,9 @@ code reviews NCCP000_ # Looks to be a pt-BR-only way of abbreviating the name of the RHCP lol Red Hot NPMNS00_ + +Nova Hampshire NPFSG00_ +Nova Jersey NPFSG00_ +Nova Jérsia NPFSG00_ +Monte Rushmore NPMSG00_ +Sydney Harbour Bridge NPFSG00_ diff --git a/languagetool-language-modules/pt/src/main/resources/org/languagetool/resource/pt/spelling.txt b/languagetool-language-modules/pt/src/main/resources/org/languagetool/resource/pt/spelling.txt index 32bc3db4ef692..0194b4db79605 100644 --- a/languagetool-language-modules/pt/src/main/resources/org/languagetool/resource/pt/spelling.txt +++ b/languagetool-language-modules/pt/src/main/resources/org/languagetool/resource/pt/spelling.txt @@ -303,3 +303,37 @@ 
maquillage surmenage assemblage paul + +# To be added before 1.2.0 + +Vermont +Newport +Connecticut +Delaware +Maryland +Mississippi +cajun +Tennessee +Nashville +Kentucky +Iowa +Dakota +Nebraska +Idaho +Oregon +Seattle +Yukon +Saskatchewan +Saskatoon +Manitoba +Winnipeg +Niágara +Hobart +Brisbane +Cairns +Perth +outback +outbacks +Erie +Huron +hidrologicamente diff --git a/languagetool-standalone/src/test/java/org/languagetool/JLanguageToolTest.java b/languagetool-standalone/src/test/java/org/languagetool/JLanguageToolTest.java index 715f63b0c427a..0c9f744a8c709 100644 --- a/languagetool-standalone/src/test/java/org/languagetool/JLanguageToolTest.java +++ b/languagetool-standalone/src/test/java/org/languagetool/JLanguageToolTest.java @@ -608,7 +608,8 @@ public void testIgnoreEnglishWordsInPortuguese() throws IOException { "Birmingham City Football Club.", "Narra, segundo o historiador americano Will Durant, uma das maiores aventuras da história humana.", "Duas décadas mais tarde, os Gipsy Kings incorporaram aquilo.", - "Valente teve três irmãos, um dos quais, Silvio Francesco, também esteve no show business." 
+ "Valente teve três irmãos, um dos quais, Silvio Francesco, também esteve no show business.", + "O lema do estado de Nova Hampshire é Livre Free or Die" }; for (String sentence : noErrorSentences) { List matches = lt.check(sentence); @@ -621,6 +622,7 @@ public void testIgnoreEnglishWordsInPortuguese() throws IOException { errorSentences.put("A comunidade do ghetto de Veneza.", "gueto"); // in isolation, it is not tagged with _english_ignore_ // because "as" is blocked and "Endeavour" is not in the list of 'common' English words, we don't tag with _english_ignore_ errorSentences.put("Acho que se chamava As Endeavour.", "EndeavourOS"); + errorSentences.put("Clique settings e veja o que acontece.", "sétimas"); // "settings" is isolated; "clique" is English but specifically blocked for (Map.Entry entry : errorSentences.entrySet()) { List matches = lt.check(entry.getKey()); assert !matches.isEmpty();