summaryrefslogtreecommitdiff
path: root/lingucomponent/source/lingutil/lingutil.cxx
diff options
context:
space:
mode:
Diffstat (limited to 'lingucomponent/source/lingutil/lingutil.cxx')
-rw-r--r--lingucomponent/source/lingutil/lingutil.cxx272
1 files changed, 272 insertions, 0 deletions
diff --git a/lingucomponent/source/lingutil/lingutil.cxx b/lingucomponent/source/lingutil/lingutil.cxx
new file mode 100644
index 000000000000..ee7d71de4435
--- /dev/null
+++ b/lingucomponent/source/lingutil/lingutil.cxx
@@ -0,0 +1,272 @@
+/*************************************************************************
+ *
+ * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
+ *
+ * Copyright 2000, 2010 Oracle and/or its affiliates.
+ *
+ * OpenOffice.org - a multi-platform office productivity suite
+ *
+ * This file is part of OpenOffice.org.
+ *
+ * OpenOffice.org is free software: you can redistribute it and/or modify
+ * it under the terms of the GNU Lesser General Public License version 3
+ * only, as published by the Free Software Foundation.
+ *
+ * OpenOffice.org is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ * GNU Lesser General Public License version 3 for more details
+ * (a copy is included in the LICENSE file that accompanied this code).
+ *
+ * You should have received a copy of the GNU Lesser General Public License
+ * version 3 along with OpenOffice.org. If not, see
+ * <http://www.openoffice.org/license.html>
+ * for a copy of the LGPLv3 License.
+ *
+ ************************************************************************/
+
+// MARKER(update_precomp.py): autogen include statement, do not remove
+#include "precompiled_lingucomponent.hxx"
+
+#if defined(WNT)
+#include <tools/prewin.h>
+#endif
+
+#if defined(WNT)
+#include <Windows.h>
+#endif
+
+#if defined(WNT)
+#include <tools/postwin.h>
+#endif
+
+
+#include <osl/thread.h>
+#include <osl/file.hxx>
+#include <tools/debug.hxx>
+#include <tools/urlobj.hxx>
+#include <i18npool/mslangid.hxx>
+#include <unotools/lingucfg.hxx>
+#include <unotools/pathoptions.hxx>
+#include <rtl/ustring.hxx>
+#include <rtl/string.hxx>
+#include <linguistic/misc.hxx>
+
+#include <set>
+#include <vector>
+#include <string.h>
+
+#include <lingutil.hxx>
+#include <dictmgr.hxx>
+
+
+
+
+using ::com::sun::star::lang::Locale;
+using namespace ::com::sun::star;
+
+#if 0
+//////////////////////////////////////////////////////////////////////
+
+String GetDirectoryPathFromFileURL( const String &rFileURL )
+{
+ // get file URL
+ INetURLObject aURLObj;
+ aURLObj.SetSmartProtocol( INET_PROT_FILE );
+ aURLObj.SetSmartURL( rFileURL );
+ aURLObj.removeSegment();
+ DBG_ASSERT( !aURLObj.HasError(), "invalid URL" );
+ String aRes = aURLObj.GetMainURL( INetURLObject::DECODE_TO_IURI );
+ return aRes;
+}
+#endif
+
+#if defined(WNT)
+rtl::OString Win_GetShortPathName( const rtl::OUString &rLongPathName )
+{
+ rtl::OString aRes;
+
+ sal_Unicode aShortBuffer[1024] = {0};
+ sal_Int32 nShortBufSize = sizeof( aShortBuffer ) / sizeof( aShortBuffer[0] );
+
+ // use the version of 'GetShortPathName' that can deal with Unicode...
+ sal_Int32 nShortLen = GetShortPathNameW(
+ reinterpret_cast<LPCWSTR>( rLongPathName.getStr() ),
+ reinterpret_cast<LPWSTR>( aShortBuffer ),
+ nShortBufSize );
+
+ if (nShortLen < nShortBufSize) // conversion successful?
+ aRes = rtl::OString( OU2ENC( rtl::OUString( aShortBuffer, nShortLen ), osl_getThreadTextEncoding()) );
+ else
+ DBG_ERROR( "Win_GetShortPathName: buffer to short" );
+
+ return aRes;
+}
+#endif //defined(WNT)
+
+//////////////////////////////////////////////////////////////////////
+
+// build list of old style diuctionaries (not as extensions) to use.
+// User installed dictionaries (the ones residing in the user paths)
+// will get precedence over system installed ones for the same language.
+std::vector< SvtLinguConfigDictionaryEntry > GetOldStyleDics( const char *pDicType )
+{
+ std::vector< SvtLinguConfigDictionaryEntry > aRes;
+
+ if (!pDicType)
+ return aRes;
+
+ rtl::OUString aFormatName;
+ String aDicExtension;
+#ifdef SYSTEM_DICTS
+ rtl::OUString aSystemDir;
+ rtl::OUString aSystemPrefix;
+ rtl::OUString aSystemSuffix;
+#endif
+ bool bSpell = false;
+ bool bHyph = false;
+ bool bThes = false;
+ if (strcmp( pDicType, "DICT" ) == 0)
+ {
+ aFormatName = A2OU("DICT_SPELL");
+ aDicExtension = String::CreateFromAscii( ".dic" );
+#ifdef SYSTEM_DICTS
+ aSystemDir = A2OU( DICT_SYSTEM_DIR );
+ aSystemSuffix = aDicExtension;
+#endif
+ bSpell = true;
+ }
+ else if (strcmp( pDicType, "HYPH" ) == 0)
+ {
+ aFormatName = A2OU("DICT_HYPH");
+ aDicExtension = String::CreateFromAscii( ".dic" );
+#ifdef SYSTEM_DICTS
+ aSystemDir = A2OU( HYPH_SYSTEM_DIR );
+ aSystemPrefix = A2OU( "hyph_" );
+ aSystemSuffix = aDicExtension;
+#endif
+ bHyph = true;
+ }
+ else if (strcmp( pDicType, "THES" ) == 0)
+ {
+ aFormatName = A2OU("DICT_THES");
+ aDicExtension = String::CreateFromAscii( ".dat" );
+#ifdef SYSTEM_DICTS
+ aSystemDir = A2OU( THES_SYSTEM_DIR );
+ aSystemPrefix = A2OU( "th_" );
+ aSystemSuffix = A2OU( "_v2.dat" );
+#endif
+ bThes = true;
+ }
+
+
+ if (aFormatName.getLength() == 0 || aDicExtension.Len() == 0)
+ return aRes;
+
+ // set of languages to remember the language where it is already
+ // decided to make use of the dictionary.
+ std::set< LanguageType > aDicLangInUse;
+
+#ifdef SYSTEM_DICTS
+ osl::Directory aSystemDicts(aSystemDir);
+ if (aSystemDicts.open() == osl::FileBase::E_None)
+ {
+ osl::DirectoryItem aItem;
+ osl::FileStatus aFileStatus(FileStatusMask_FileURL);
+ while (aSystemDicts.getNextItem(aItem) == osl::FileBase::E_None)
+ {
+ aItem.getFileStatus(aFileStatus);
+ rtl::OUString sPath = aFileStatus.getFileURL();
+ if (sPath.lastIndexOf(aSystemSuffix) == sPath.getLength()-aSystemSuffix.getLength())
+ {
+ sal_Int32 nStartIndex = sPath.lastIndexOf(sal_Unicode('/')) + 1;
+ if (!sPath.match(aSystemPrefix, nStartIndex))
+ continue;
+ rtl::OUString sChunk = sPath.copy(0, sPath.getLength() - aSystemSuffix.getLength());
+ sal_Int32 nIndex = nStartIndex + aSystemPrefix.getLength();
+ rtl::OUString sLang = sChunk.getToken( 0, '_', nIndex );
+ if (!sLang.getLength())
+ continue;
+ rtl::OUString sRegion;
+ if (nIndex != -1)
+ sRegion = sChunk.copy( nIndex, sChunk.getLength() - nIndex );
+
+ // Thus we first get the language of the dictionary
+ LanguageType nLang = MsLangId::convertIsoNamesToLanguage(
+ sLang, sRegion );
+
+ if (aDicLangInUse.count( nLang ) == 0)
+ {
+ // remember the new language in use
+ aDicLangInUse.insert( nLang );
+
+ // add the dictionary to the resulting vector
+ SvtLinguConfigDictionaryEntry aDicEntry;
+ aDicEntry.aLocations.realloc(1);
+ aDicEntry.aLocaleNames.realloc(1);
+ rtl::OUString aLocaleName( MsLangId::convertLanguageToIsoString( nLang ) );
+ aDicEntry.aLocations[0] = sPath;
+ aDicEntry.aFormatName = aFormatName;
+ aDicEntry.aLocaleNames[0] = aLocaleName;
+ aRes.push_back( aDicEntry );
+ }
+ }
+ }
+ }
+
+#endif
+
+ return aRes;
+}
+
+
+void MergeNewStyleDicsAndOldStyleDics(
+ std::list< SvtLinguConfigDictionaryEntry > &rNewStyleDics,
+ const std::vector< SvtLinguConfigDictionaryEntry > &rOldStyleDics )
+{
+ // get list of languages supported by new style dictionaries
+ std::set< LanguageType > aNewStyleLanguages;
+ std::list< SvtLinguConfigDictionaryEntry >::const_iterator aIt;
+ for (aIt = rNewStyleDics.begin() ; aIt != rNewStyleDics.end(); ++aIt)
+ {
+ const uno::Sequence< rtl::OUString > aLocaleNames( aIt->aLocaleNames );
+ sal_Int32 nLocaleNames = aLocaleNames.getLength();
+ for (sal_Int32 k = 0; k < nLocaleNames; ++k)
+ {
+ LanguageType nLang = MsLangId::convertIsoStringToLanguage( aLocaleNames[k] );
+ aNewStyleLanguages.insert( nLang );
+ }
+ }
+
+ // now check all old style dictionaries if they will add a not yet
+ // added language. If so add them to the resulting vector
+ std::vector< SvtLinguConfigDictionaryEntry >::const_iterator aIt2;
+ for (aIt2 = rOldStyleDics.begin(); aIt2 != rOldStyleDics.end(); ++aIt2)
+ {
+ sal_Int32 nOldStyleDics = aIt2->aLocaleNames.getLength();
+
+ // old style dics should only have one language listed...
+ DBG_ASSERT( nOldStyleDics, "old style dictionary with more then one language found!");
+ if (nOldStyleDics > 0)
+ {
+ LanguageType nLang = MsLangId::convertIsoStringToLanguage( aIt2->aLocaleNames[0] );
+
+ if (nLang == LANGUAGE_DONTKNOW || nLang == LANGUAGE_NONE)
+ {
+ DBG_ERROR( "old style dictionary with invalid language found!" );
+ continue;
+ }
+
+ // language not yet added?
+ if (aNewStyleLanguages.count( nLang ) == 0)
+ rNewStyleDics.push_back( *aIt2 );
+ }
+ else
+ {
+ DBG_ERROR( "old style dictionary with no language found!" );
+ }
+ }
+}
+
+//////////////////////////////////////////////////////////////////////
+