// Copyright (c) 2010 The Chromium Authors. All rights reserved. // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. #include "base/string_util.h" #include "base/utf_string_conversions.h" #include "chrome/browser/spellchecker_platform_engine.h" #include "testing/gtest/include/gtest/gtest.h" // Tests that words are properly ignored. Currently only enabled on OS X as it // is the only platform to support ignoring words. Note that in this test, we // supply a non-zero doc_tag, in order to test that ignored words are matched to // the correct document. TEST(PlatformSpellCheckTest, IgnoreWords_EN_US) { const char* kTestCases[] = { "teh", "morblier", "watre", "noooen", }; for (size_t i = 0; i < ARRAYSIZE_UNSAFE(kTestCases); ++i) { const string16 word(ASCIIToUTF16(kTestCases[i])); const int doc_tag = SpellCheckerPlatform::GetDocumentTag(); // The word should show up as misspelled. EXPECT_FALSE(SpellCheckerPlatform::CheckSpelling(word, doc_tag)) << word; // Ignore the word. SpellCheckerPlatform::IgnoreWord(word); // The word should now show up as correctly spelled. EXPECT_TRUE(SpellCheckerPlatform::CheckSpelling(word, doc_tag)) << word; // Close the docuemnt. Any words that we had previously ignored should no // longer be ignored and thus should show up as misspelled. SpellCheckerPlatform::CloseDocumentWithTag(doc_tag); // The word should now show be spelled wrong again EXPECT_FALSE(SpellCheckerPlatform::CheckSpelling(word, doc_tag)) << word; } } // Test IgnoreWords_EN_US TEST(PlatformSpellCheckTest, SpellCheckSuggestions_EN_US) { static const struct { const char* input; // A string to be tested. const char* suggested_word; // A suggested word that should occur. } kTestCases[] = { // We need to have separate test cases here, since hunspell and the OS X // spellchecking service occasionally differ on what they consider a valid // suggestion for a given word, although these lists could likely be // integrated somewhat. The test cases for non-Mac are in // chrome/renderer/spellcheck_unittest.cc // These words come from the wikipedia page of the most commonly // misspelled words in english. // (http://en.wikipedia.org/wiki/Commonly_misspelled_words). // However, 10.6 loads multiple dictionaries and enables many non-English // dictionaries by default. As a result, we have removed from the list any // word that is marked as correct because it is correct in another // language. {"absense", "absence"}, {"acceptible", "acceptable"}, {"accidentaly", "accidentally"}, {"acheive", "achieve"}, {"acknowlege", "acknowledge"}, {"acquaintence", "acquaintance"}, {"aquire", "acquire"}, {"aquit", "acquit"}, {"acrage", "acreage"}, {"adultary", "adultery"}, {"advertize", "advertise"}, {"adviseable", "advisable"}, {"alchohol", "alcohol"}, {"alege", "allege"}, {"allegaince", "allegiance"}, {"allmost", "almost"}, // Ideally, this test should pass. It works in firefox, but not in hunspell // or OS X. // {"alot", "a lot"}, {"amatuer", "amateur"}, {"ammend", "amend"}, {"amung", "among"}, {"anually", "annually"}, {"apparant", "apparent"}, {"artic", "arctic"}, {"arguement", "argument"}, {"athiest", "atheist"}, {"athelete", "athlete"}, {"avrage", "average"}, {"awfull", "awful"}, {"ballance", "balance"}, {"basicly", "basically"}, {"becuase", "because"}, {"becomeing", "becoming"}, {"befor", "before"}, {"begining", "beginning"}, {"beleive", "believe"}, {"bellweather", "bellwether"}, {"benifit", "benefit"}, {"bouy", "buoy"}, {"briliant", "brilliant"}, {"burgler", "burglar"}, {"camoflage", "camouflage"}, {"carefull", "careful"}, {"Carribean", "Caribbean"}, {"catagory", "category"}, {"cauhgt", "caught"}, {"cieling", "ceiling"}, {"cemetary", "cemetery"}, {"certin", "certain"}, {"changable", "changeable"}, {"cheif", "chief"}, {"citezen", "citizen"}, {"collaegue", "colleague"}, {"colum", "column"}, {"comming", "coming"}, {"commited", "committed"}, {"compitition", "competition"}, {"conceed", "concede"}, {"congradulate", "congratulate"}, {"consciencious", "conscientious"}, {"concious", "conscious"}, {"concensus", "consensus"}, {"contraversy", "controversy"}, {"conveniance", "convenience"}, {"critecize", "criticize"}, {"dacquiri", "daiquiri"}, {"decieve", "deceive"}, {"dicide", "decide"}, {"definate", "definite"}, {"definitly", "definitely"}, {"desparate", "desperate"}, {"develope", "develop"}, {"diffrence", "difference"}, {"disapear", "disappear"}, {"disapoint", "disappoint"}, {"disasterous", "disastrous"}, {"disipline", "discipline"}, {"drunkeness", "drunkenness"}, {"dumbell", "dumbbell"}, {"easely", "easily"}, {"eigth", "eight"}, {"embarass", "embarrass"}, {"enviroment", "environment"}, {"equiped", "equipped"}, {"equiptment", "equipment"}, {"exagerate", "exaggerate"}, {"exellent", "excellent"}, {"exsept", "except"}, {"exercize", "exercise"}, {"exilerate", "exhilarate"}, {"existance", "existence"}, {"experiance", "experience"}, {"experament", "experiment"}, {"explaination", "explanation"}, {"facinating", "fascinating"}, {"firey", "fiery"}, {"finaly", "finally"}, {"flourescent", "fluorescent"}, {"foriegn", "foreign"}, {"fourty", "forty"}, {"foreward", "forward"}, {"freind", "friend"}, {"fundemental", "fundamental"}, {"guage", "gauge"}, {"generaly", "generally"}, {"goverment", "government"}, {"gratefull", "grateful"}, {"garantee", "guarantee"}, {"guidence", "guidance"}, {"happyness", "happiness"}, {"harrass", "harass"}, {"heighth", "height"}, {"heirarchy", "hierarchy"}, {"humerous", "humorous"}, {"hygene", "hygiene"}, {"hipocrit", "hypocrite"}, {"idenity", "identity"}, {"ignorence", "ignorance"}, {"imaginery", "imaginary"}, {"immitate", "imitate"}, {"immitation", "imitation"}, {"imediately", "immediately"}, {"incidently", "incidentally"}, {"independant", "independent"}, {"indispensible", "indispensable"}, {"innoculate", "inoculate"}, {"inteligence", "intelligence"}, {"intresting", "interesting"}, {"interuption", "interruption"}, {"irrelevent", "irrelevant"}, {"irritible", "irritable"}, {"jellous", "jealous"}, {"knowlege", "knowledge"}, {"labratory", "laboratory"}, {"lenght", "length"}, {"liason", "liaison"}, {"libary", "library"}, {"lisence", "license"}, {"lonelyness", "loneliness"}, {"lieing", "lying"}, {"maintenence", "maintenance"}, {"manuever", "maneuver"}, {"marrige", "marriage"}, {"mathmatics", "mathematics"}, {"medcine", "medicine"}, {"miniture", "miniature"}, {"minite", "minute"}, {"mischevous", "mischievous"}, {"mispell", "misspell"}, // Maybe this one should pass, as it works in hunspell, but not in firefox. // {"misterius", "mysterious"}, {"naturaly", "naturally"}, {"neccessary", "necessary"}, {"neice", "niece"}, {"nieghbor", "neighbor"}, {"nieghbour", "neighbor"}, {"niether", "neither"}, {"noticable", "noticeable"}, {"occassion", "occasion"}, {"occasionaly", "occasionally"}, {"occurrance", "occurrence"}, {"occured", "occurred"}, {"ommision", "omission"}, {"oppurtunity", "opportunity"}, {"outragous", "outrageous"}, {"parrallel", "parallel"}, {"parliment", "parliament"}, {"particurly", "particularly"}, {"passtime", "pastime"}, {"peculier", "peculiar"}, {"percieve", "perceive"}, {"pernament", "permanent"}, {"perseverence", "perseverance"}, {"personaly", "personally"}, {"persaude", "persuade"}, {"pichure", "picture"}, {"peice", "piece"}, {"plagerize", "plagiarize"}, {"playright", "playwright"}, {"plesant", "pleasant"}, {"pollitical", "political"}, {"posession", "possession"}, {"potatos", "potatoes"}, {"practicle", "practical"}, {"preceed", "precede"}, {"predjudice", "prejudice"}, {"presance", "presence"}, {"privelege", "privilege"}, // This one should probably work. It does in FF and Hunspell. // {"probly", "probably"}, {"proffesional", "professional"}, {"promiss", "promise"}, {"pronounciation", "pronunciation"}, {"prufe", "proof"}, {"psycology", "psychology"}, {"publically", "publicly"}, {"quanity", "quantity"}, {"quarentine", "quarantine"}, {"questionaire", "questionnaire"}, {"readible", "readable"}, {"realy", "really"}, {"recieve", "receive"}, {"reciept", "receipt"}, {"reconize", "recognize"}, {"recomend", "recommend"}, {"refered", "referred"}, {"referance", "reference"}, {"relevent", "relevant"}, {"religous", "religious"}, {"repitition", "repetition"}, {"restarant", "restaurant"}, {"rythm", "rhythm"}, {"rediculous", "ridiculous"}, {"sacrefice", "sacrifice"}, {"saftey", "safety"}, {"sissors", "scissors"}, {"secratary", "secretary"}, {"seperate", "separate"}, {"sargent", "sergeant"}, {"shineing", "shining"}, {"similer", "similar"}, {"sinceerly", "sincerely"}, {"speach", "speech"}, {"strenght", "strength"}, {"succesful", "successful"}, {"supercede", "supersede"}, {"surelly", "surely"}, {"suprise", "surprise"}, {"temperture", "temperature"}, {"temprary", "temporary"}, {"tommorrow", "tomorrow"}, {"tounge", "tongue"}, {"truely", "truly"}, {"twelth", "twelfth"}, {"tyrany", "tyranny"}, {"underate", "underrate"}, {"untill", "until"}, {"unuseual", "unusual"}, {"upholstry", "upholstery"}, {"usible", "usable"}, {"useing", "using"}, {"usualy", "usually"}, {"vaccuum", "vacuum"}, {"vegatarian", "vegetarian"}, {"vehical", "vehicle"}, {"visious", "vicious"}, {"villege", "village"}, {"wierd", "weird"}, {"wellcome", "welcome"}, {"wellfare", "welfare"}, {"wilfull", "willful"}, {"withold", "withhold"}, {"writting", "writing"}, }; for (size_t i = 0; i < ARRAYSIZE_UNSAFE(kTestCases); ++i) { const string16 word(ASCIIToUTF16(kTestCases[i].input)); EXPECT_FALSE(SpellCheckerPlatform::CheckSpelling(word, 0)) << word; // Check if the suggested words occur. std::vector<string16> suggestions; SpellCheckerPlatform::FillSuggestionList(word, &suggestions); bool suggested_word_is_present = false; const string16 suggested_word(ASCIIToUTF16(kTestCases[i].suggested_word)); for (size_t j = 0; j < suggestions.size(); j++) { if (suggestions[j].compare(suggested_word) == 0) { suggested_word_is_present = true; break; } } EXPECT_TRUE(suggested_word_is_present) << suggested_word; } }