diff options
author | Kurt Zenker <kz@openoffice.org> | 2007-06-19 15:00:49 +0000 |
---|---|---|
committer | Kurt Zenker <kz@openoffice.org> | 2007-06-19 15:00:49 +0000 |
commit | 59b2c7ecaf555287f0607c16873711eb855fdbbc (patch) | |
tree | 8a10a575c5448e62c86710638e1e32d3b5eea54b | |
parent | 3150642bbb71441a8a945c6b4eaaaf40cb93b987 (diff) |
INTEGRATION: CWS languageguessing (1.1.2); FILE ADDED
2007/01/12 11:05:12 tl 1.1.2.1: #i73173# integrate Google SoC language-guessing
-rw-r--r-- | lingucomponent/source/languageguessing/guess.cxx | 165 |
1 files changed, 165 insertions, 0 deletions
diff --git a/lingucomponent/source/languageguessing/guess.cxx b/lingucomponent/source/languageguessing/guess.cxx new file mode 100644 index 000000000..233b2dab7 --- /dev/null +++ b/lingucomponent/source/languageguessing/guess.cxx @@ -0,0 +1,165 @@ +/*************************************************************************** + * Copyright (C) 2006 by Jocelyn Merand * + * joc.mer@gmail.com * + * * + * + * OpenOffice.org - a multi-platform office productivity suite + * + * $RCSfile: guess.cxx,v $ + * + * $Revision: 1.2 $ + * + * last change: $Author: kz $ $Date: 2007-06-19 16:00:49 $ + * + * The Contents of this file are made available subject to + * the terms of GNU Lesser General Public License Version 2.1. + * + * + * GNU Lesser General Public License Version 2.1 + * ============================================= + * Copyright 2005 by Sun Microsystems, Inc. + * 901 San Antonio Road, Palo Alto, CA 94303, USA + * + * This library is free software; you can redistribute it and/or + * modify it under the terms of the GNU Lesser General Public + * License version 2.1, as published by the Free Software Foundation. + * + * This library is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU + * Lesser General Public License for more details. + * + * You should have received a copy of the GNU Lesser General Public + * License along with this library; if not, write to the Free Software + * Foundation, Inc., 59 Temple Place, Suite 330, Boston, + * MA 02111-1307 USA + * + ************************************************************************/ + +#include <iostream> + +#include <libtextcat/textcat.h> +#include <altstrfunc.hxx> +#include <guess.hxx> + +using namespace std; + +Guess::Guess() +{ + language_str = DEFAULT_LANGUAGE; + country_str = DEFAULT_COUNTRY; + encoding_str = DEFAULT_ENCODING; + order = 0; +} + +Guess::Guess(string& lang, string& country, string& enc, int p_order) +{ + Guess(); + language_str=lang; + country_str=country; + encoding_str=enc; + order = p_order; +} + +/* +* this use a char * string to build the guess object +* a string like those is made as : [language-country-encoding]... +* +*/ + +Guess::Guess(char * guess_str, int p_order) +{ + Guess(); + order = p_order; + + string lang; + string country; + string enc; + + //if the guess is not like "UNKNOWN" or "SHORT", go into the brackets +// if(strncmp((const char*)(guess_str + 1), _TEXTCAT_RESULT_UNKOWN, strlen(_TEXTCAT_RESULT_UNKOWN)) != 0 +// && +// strncmp((const char*)(guess_str + 1), _TEXTCAT_RESULT_SHORT, strlen(_TEXTCAT_RESULT_SHORT)) != 0) +// { + if(strcmp((const char*)(guess_str + 1), _TEXTCAT_RESULT_UNKOWN) != 0 + && + strcmp((const char*)(guess_str + 1), _TEXTCAT_RESULT_SHORT) != 0) + { + + int current_pointer = 0; + + //this is to go to the first char of the guess string ( the '[' of "[en-US-utf8]" ) + while(!isSeparator(guess_str[current_pointer])){ + current_pointer++; + } + current_pointer++; + + //this is to pick up the language ( the "en" from "[en-US-utf8]" ) + while(!isSeparator(guess_str[current_pointer])){ + lang+=guess_str[current_pointer]; + current_pointer++; + } + current_pointer++; + + //this is to pick up the country ( the "US" from "[en-US-utf8]" ) + while(!isSeparator(guess_str[current_pointer])){ + country+=guess_str[current_pointer]; + current_pointer++; + } + current_pointer++; + + //this is to pick up the encoding ( the "utf8" from "[en-US-utf8]" ) + while(!isSeparator(guess_str[current_pointer])){ + enc+=guess_str[current_pointer]; + current_pointer++; + } + + if(lang!=""){//if not we use the default value + language_str=lang; + } + + if(/*country!=""*/1){ + country_str=country; + } + else{//if we don't have an availlable country, we use the language as a country + country_str=upperCase(language_str); + } + + if(enc!=""){//if not we use the default value + encoding_str=enc; + } + } +} + +Guess::~Guess(){} + +string Guess::GetLanguage() +{ + return language_str; +} + +string Guess::GetCountry() +{ + return country_str; +} + +string Guess::GetEncoding() +{ + return encoding_str; +} + +int Guess::GetOrder() +{ + return order; +} + +bool Guess::operator==(string lang) +{ + string toString; + toString += GetLanguage(); + toString += "-"; + toString += GetCountry(); + toString += "-"; + toString += GetEncoding(); + return start(toString, lang); +} |