blob: 99a819817c8b78fbcf9329c4a5a6c3939e838a87 [file] [log] [blame]
/**************************************************************
*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*
*************************************************************/
// MARKER(update_precomp.py): autogen include statement, do not remove
#include "precompiled_lingucomponent.hxx"
#if defined(WNT)
#include <tools/prewin.h>
#endif
#if defined(WNT)
#include <Windows.h>
#endif
#if defined(WNT)
#include <tools/postwin.h>
#endif
#include <osl/thread.h>
#include <osl/file.hxx>
#include <tools/debug.hxx>
#include <tools/urlobj.hxx>
#include <i18npool/mslangid.hxx>
#include <unotools/lingucfg.hxx>
#include <unotools/pathoptions.hxx>
#include <rtl/ustring.hxx>
#include <rtl/string.hxx>
#include <rtl/tencinfo.h>
#include <linguistic/misc.hxx>
#include <set>
#include <vector>
#include <string.h>
#include <lingutil.hxx>
using ::com::sun::star::lang::Locale;
using namespace ::com::sun::star;
#if 0
//////////////////////////////////////////////////////////////////////
// NOTE: this function is compiled out by the surrounding '#if 0' and is
// kept for reference only.
//
// Parses rFileURL as a file URL, calls removeSegment() on it (presumably
// dropping the trailing file-name segment - confirm against INetURLObject)
// and returns the resulting main URL decoded with DECODE_TO_IURI.
String GetDirectoryPathFromFileURL( const String &rFileURL )
{
// get file URL
INetURLObject aURLObj;
aURLObj.SetSmartProtocol( INET_PROT_FILE );
aURLObj.SetSmartURL( rFileURL );
aURLObj.removeSegment();
// debug-only check that the URL object is still valid after the edit
DBG_ASSERT( !aURLObj.HasError(), "invalid URL" );
String aRes = aURLObj.GetMainURL( INetURLObject::DECODE_TO_IURI );
return aRes;
}
#endif
#if defined(WNT)
// Converts rLongPathName to its Windows short path form and returns it
// encoded with the calling thread's text encoding.
//
// An empty string is returned when the conversion is not possible, i.e.
// when GetShortPathNameW reports a failure or when the short path does not
// fit into the fixed-size local buffer. Both cases are reported through
// DBG_ERROR.
rtl::OString Win_GetShortPathName( const rtl::OUString &rLongPathName )
{
    rtl::OString aRes;

    sal_Unicode aShortBuffer[1024] = {0};
    sal_Int32 nShortBufSize = sizeof( aShortBuffer ) / sizeof( aShortBuffer[0] );

    // use the version of 'GetShortPathName' that can deal with Unicode...
    sal_Int32 nShortLen = GetShortPathNameW(
            reinterpret_cast<LPCWSTR>( rLongPathName.getStr() ),
            reinterpret_cast<LPWSTR>( aShortBuffer ),
            nShortBufSize );

    if (nShortLen <= 0)
    {
        // a return value of 0 means the API call itself failed; this must
        // not be mistaken for a successful conversion to an empty path
        DBG_ERROR( "Win_GetShortPathName: GetShortPathNameW failed" );
    }
    else if (nShortLen < nShortBufSize) // conversion successful?
    {
        aRes = rtl::OString( OU2ENC( rtl::OUString( aShortBuffer, nShortLen ), osl_getThreadTextEncoding()) );
    }
    else
    {
        // the API returned the required size instead of the copied length
        DBG_ERROR( "Win_GetShortPathName: buffer to short" );
    }

    return aRes;
}
#endif //defined(WNT)
//////////////////////////////////////////////////////////////////////
// Build the list of old style dictionaries (i.e. dictionaries that are not
// installed as extensions) of the requested type.
//
// pDicType selects the kind of dictionary: "DICT" (spelling), "HYPH"
// (hyphenation) or "THES" (thesaurus). A null pointer or any other value
// yields an empty result.
//
// When SYSTEM_DICTS is defined, the system directory belonging to the
// dictionary type is scanned for files whose name has the form
//     <prefix><language>[_<region>]<suffix>
// and one entry is created per language; the first file found for a
// language is used, later files for the same language are ignored.
// When SYSTEM_DICTS is not defined nothing is scanned and the result is
// always empty.
std::vector< SvtLinguConfigDictionaryEntry > GetOldStyleDics( const char *pDicType )
{
    std::vector< SvtLinguConfigDictionaryEntry > aRes;

    if (!pDicType)
        return aRes;

    rtl::OUString aFormatName;
    String aDicExtension;
#ifdef SYSTEM_DICTS
    rtl::OUString aSystemDir;
    rtl::OUString aSystemPrefix;
    rtl::OUString aSystemSuffix;
#endif
    if (strcmp( pDicType, "DICT" ) == 0)
    {
        aFormatName = A2OU("DICT_SPELL");
        aDicExtension = String::CreateFromAscii( ".dic" );
#ifdef SYSTEM_DICTS
        aSystemDir = A2OU( DICT_SYSTEM_DIR );
        aSystemSuffix = aDicExtension;
#endif
    }
    else if (strcmp( pDicType, "HYPH" ) == 0)
    {
        aFormatName = A2OU("DICT_HYPH");
        aDicExtension = String::CreateFromAscii( ".dic" );
#ifdef SYSTEM_DICTS
        aSystemDir = A2OU( HYPH_SYSTEM_DIR );
        aSystemPrefix = A2OU( "hyph_" );
        aSystemSuffix = aDicExtension;
#endif
    }
    else if (strcmp( pDicType, "THES" ) == 0)
    {
        aFormatName = A2OU("DICT_THES");
        aDicExtension = String::CreateFromAscii( ".dat" );
#ifdef SYSTEM_DICTS
        aSystemDir = A2OU( THES_SYSTEM_DIR );
        aSystemPrefix = A2OU( "th_" );
        aSystemSuffix = A2OU( "_v2.dat" );
#endif
    }

    // unknown dictionary type requested
    if (aFormatName.getLength() == 0 || aDicExtension.Len() == 0)
        return aRes;

    // set of languages to remember the language where it is already
    // decided to make use of the dictionary.
    std::set< LanguageType > aDicLangInUse;

#ifdef SYSTEM_DICTS
    osl::Directory aSystemDicts(aSystemDir);
    if (aSystemDicts.open() == osl::FileBase::E_None)
    {
        osl::DirectoryItem aItem;
        osl::FileStatus aFileStatus(FileStatusMask_FileURL);
        while (aSystemDicts.getNextItem(aItem) == osl::FileBase::E_None)
        {
            // skip entries whose status cannot be queried; otherwise
            // aFileStatus would still describe the previous entry
            if (aItem.getFileStatus(aFileStatus) != osl::FileBase::E_None)
                continue;
            rtl::OUString sPath = aFileStatus.getFileURL();

            // the path has to end with the expected suffix; a path shorter
            // than the suffix can never match
            const sal_Int32 nSuffixPos = sPath.getLength() - aSystemSuffix.getLength();
            if (nSuffixPos < 0 || !sPath.match(aSystemSuffix, nSuffixPos))
                continue;

            // the file name (the part after the last '/') has to start
            // with the expected prefix
            sal_Int32 nStartIndex = sPath.lastIndexOf(sal_Unicode('/')) + 1;
            if (!sPath.match(aSystemPrefix, nStartIndex))
                continue;

            // path without the suffix; what follows the prefix is
            // "<language>" optionally followed by "_<region>"
            rtl::OUString sChunk = sPath.copy(0, nSuffixPos);
            sal_Int32 nIndex = nStartIndex + aSystemPrefix.getLength();
            rtl::OUString sLang = sChunk.getToken( 0, '_', nIndex );
            if (!sLang.getLength())
                continue;
            rtl::OUString sRegion;
            // getToken sets nIndex to -1 when no further token follows
            if (nIndex != -1)
                sRegion = sChunk.copy( nIndex, sChunk.getLength() - nIndex );

            // Thus we first get the language of the dictionary
            LanguageType nLang = MsLangId::convertIsoNamesToLanguage(
                    sLang, sRegion );

            // remember the language; only the first dictionary found for
            // a language is added to the result
            if (aDicLangInUse.insert( nLang ).second)
            {
                SvtLinguConfigDictionaryEntry aDicEntry;
                aDicEntry.aLocations.realloc(1);
                aDicEntry.aLocaleNames.realloc(1);
                rtl::OUString aLocaleName( MsLangId::convertLanguageToIsoString( nLang ) );
                aDicEntry.aLocations[0] = sPath;
                aDicEntry.aFormatName = aFormatName;
                aDicEntry.aLocaleNames[0] = aLocaleName;
                aRes.push_back( aDicEntry );
            }
        }
    }
#endif

    return aRes;
}
// Appends to rNewStyleDics every entry of rOldStyleDics whose (first)
// language is not covered by any of the entries that were in rNewStyleDics
// when the function was called.
//
// rNewStyleDics  list of new style dictionaries; extended in place.
// rOldStyleDics  old style dictionaries; each is expected to list exactly
//                one locale. Entries without a locale, or whose locale
//                maps to LANGUAGE_DONTKNOW or LANGUAGE_NONE, are skipped
//                and reported via DBG_ERROR.
void MergeNewStyleDicsAndOldStyleDics(
        std::list< SvtLinguConfigDictionaryEntry > &rNewStyleDics,
        const std::vector< SvtLinguConfigDictionaryEntry > &rOldStyleDics )
{
    // get list of languages supported by new style dictionaries
    std::set< LanguageType > aNewStyleLanguages;
    std::list< SvtLinguConfigDictionaryEntry >::const_iterator aIt;
    for (aIt = rNewStyleDics.begin() ; aIt != rNewStyleDics.end(); ++aIt)
    {
        const uno::Sequence< rtl::OUString > aLocaleNames( aIt->aLocaleNames );
        sal_Int32 nLocaleNames = aLocaleNames.getLength();
        for (sal_Int32 k = 0; k < nLocaleNames; ++k)
        {
            LanguageType nLang = MsLangId::convertIsoStringToLanguage( aLocaleNames[k] );
            aNewStyleLanguages.insert( nLang );
        }
    }

    // now check all old style dictionaries if they will add a not yet
    // added language. If so add them to the resulting list
    std::vector< SvtLinguConfigDictionaryEntry >::const_iterator aIt2;
    for (aIt2 = rOldStyleDics.begin(); aIt2 != rOldStyleDics.end(); ++aIt2)
    {
        sal_Int32 nOldStyleDics = aIt2->aLocaleNames.getLength();

        // old style dics should only have one language listed...
        // (the "no language" case is reported separately below)
        DBG_ASSERT( nOldStyleDics <= 1, "old style dictionary with more then one language found!");
        if (nOldStyleDics > 0)
        {
            // only the first listed language is taken into account
            LanguageType nLang = MsLangId::convertIsoStringToLanguage( aIt2->aLocaleNames[0] );

            if (nLang == LANGUAGE_DONTKNOW || nLang == LANGUAGE_NONE)
            {
                DBG_ERROR( "old style dictionary with invalid language found!" );
                continue;
            }

            // language not yet added?
            if (aNewStyleLanguages.count( nLang ) == 0)
                rNewStyleDics.push_back( *aIt2 );
        }
        else
        {
            DBG_ERROR( "old style dictionary with no language found!" );
        }
    }
}
// Maps a charset name to the corresponding rtl_TextEncoding.
//
// The name is looked up as a MIME charset first, then as a Unix charset,
// and finally compared against the literal name "ISCII-DEVANAGARI".
// RTL_TEXTENCODING_DONTKNOW is returned when pCharset is null or when none
// of these lookups recognizes the name.
rtl_TextEncoding getTextEncodingFromCharset(const sal_Char* pCharset)
{
    // nothing to look up
    if (!pCharset)
        return RTL_TEXTENCODING_DONTKNOW;

    const rtl_TextEncoding eMime = rtl_getTextEncodingFromMimeCharset(pCharset);
    if (eMime != RTL_TEXTENCODING_DONTKNOW)
        return eMime;

    const rtl_TextEncoding eUnix = rtl_getTextEncodingFromUnixCharset(pCharset);
    if (eUnix != RTL_TEXTENCODING_DONTKNOW)
        return eUnix;

    // last resort: name that is handled explicitly here
    if (strcmp("ISCII-DEVANAGARI", pCharset) == 0)
        return RTL_TEXTENCODING_ISCII_DEVANAGARI;

    // failed to get the proper encoding
    return RTL_TEXTENCODING_DONTKNOW;
}
//////////////////////////////////////////////////////////////////////