You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
442 lines
18 KiB
442 lines
18 KiB
/* This file is part of the KDE libraries
|
|
Copyright (C) 1999 Ian Zepp (icszepp@islc.net)
|
|
Copyright (C) 2000 Rik Hemsley (rikkus) <rik@kde.org>
|
|
|
|
This library is free software; you can redistribute it and/or
|
|
modify it under the terms of the GNU Library General Public
|
|
License version 2 as published by the Free Software Foundation.
|
|
|
|
This library is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
Library General Public License for more details.
|
|
|
|
You should have received a copy of the GNU Library General Public License
|
|
along with this library; see the file COPYING.LIB. If not, write to
|
|
the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor,
|
|
Boston, MA 02110-1301, USA.
|
|
*/
|
|
#ifndef KSTRINGHANDLER_H
|
|
#define KSTRINGHANDLER_H
|
|
|
|
#include <tqstring.h>
|
|
#include <tqstringlist.h>
|
|
#include <tqregexp.h> // for the word ranges
|
|
#include <tqfontmetrics.h>
|
|
#include "tdelibs_export.h"
|
|
|
|
/**
|
|
* This class contains utility functions for handling strings.
|
|
*
|
|
* This class is @em not a substitute for the TQString class. What
|
|
* I tried to do with this class is provide an easy way to
|
|
* cut/slice/splice words inside sentences in whatever order desired.
|
|
* While the main focus of this class are words (ie characters
|
|
* separated by spaces/tabs), the two core functions here ( split()
|
|
* and join() ) will function given any char to use as a separator.
|
|
* This will make it easy to redefine what a 'word' means in the
|
|
* future if needed.
|
|
*
|
|
* I freely stole some of the function names from python. I also think
|
|
* some of these were influenced by mIRC (yes, believe it if you will, I
|
|
* used to write a LOT of scripts in mIRC).
|
|
*
|
|
* The ranges are a fairly powerful way of getting/stripping words from
|
|
* a string. These ranges function, for the large part, as they would in
|
|
* python. See the word(const TQString&, const char *) and remword(const TQString&, uint) functions for more detail.
|
|
*
|
|
* This class contains no data members of its own. All strings are cut
|
|
* on the fly and returned as new qstrings/qstringlists.
|
|
*
|
|
* Quick example on how to use:
|
|
*
|
|
* \code
|
|
* KStringHandler kstr;
|
|
* TQString line = "This is a test of the strings";
|
|
*
|
|
* cout << "1> " << kstr.word( line , "4:" ) << "\n";
|
|
* cout << "2> " << kstr.remrange( line , "2:5" ) << "\n";
|
|
* cout << "2> " << kstr.reverse( line ) << "\n";
|
|
* cout << "2> " << kstr.center( kstr.word( line , 4 ) , 15 ) << "\n";
|
|
* \endcode
|
|
*
|
|
* and so forth.
|
|
*
|
|
* @short Class for manipulating words and sentences in strings
|
|
* @author Ian Zepp <icszepp@islc.net>
|
|
* @see KShell
|
|
*/
|
|
class TDECORE_EXPORT KStringHandler
|
|
{
|
|
public:
|
|
/** Returns the nth word in the string if found
|
|
* Returns a EMPTY (not null) string otherwise.
|
|
* Note that the FIRST index is 0.
|
|
* @param text the string to search for the words
|
|
* @param pos the position of the word to search
|
|
* @return the word, or an empty string if not found
|
|
* @deprecated use TQString::section instead
|
|
*/
|
|
static TQString word( const TQString &text , uint pos ) KDE_DEPRECATED;
|
|
|
|
/** Returns a range of words from that string.
|
|
* Ie:
|
|
* @li "0" returns the very first word
|
|
* @li "0:" returns the first to the last word
|
|
* @li "0:3" returns the first to fourth words
|
|
* @li ":3" returns everything up to the fourth word
|
|
*
|
|
* If you grok python, you're set.
|
|
* @param text the string to search for the words
|
|
* @param range the words to return (see description)
|
|
* @return the words, or an empty string if not found
|
|
*/
|
|
static TQString word( const TQString &text , const char *range );
|
|
|
|
/** Inserts a word into the string, and returns
|
|
* a new string with the word included. the first
|
|
* index is zero (0). If there are not @p pos words in the original
|
|
* string, the new word will be appended to the end.
|
|
* @param text the original text
|
|
* @param word the word to insert
|
|
* @param pos the position (in words) for the new word
|
|
* @return the resulting string
|
|
*/
|
|
static TQString insword( const TQString &text , const TQString &word , uint pos );
|
|
|
|
/** Replaces a word in the string, and returns
|
|
* a new string with the word included. the first
|
|
* index is zero (0). If there are not @p pos words in the original
|
|
* string, the new word will be appended to the end.
|
|
* @param text the original text
|
|
* @param word the word to insert
|
|
* @param pos the position (in words) for the new word
|
|
* @return the resulting string
|
|
*/
|
|
static TQString setword( const TQString &text , const TQString &word , uint pos );
|
|
|
|
/** Removes a word or ranges of words from the string,
|
|
* and returns a new string. The ranges definitions
|
|
* follow the definitions for the word() function.
|
|
*
|
|
* @li "0" removes the very first word
|
|
* @li "0:" removes the first the the last word
|
|
* @li "0:3" removes the first to fourth words
|
|
* @li ":3" removes everything up to the fourth word
|
|
* @param text the original text
|
|
* @param range the words to remove (see description)
|
|
* @return the resulting string
|
|
*/
|
|
static TQString remrange( const TQString &text , const char *range );
|
|
|
|
|
|
/** Removes a word at the given index, and returns a
|
|
* new string. The first index is zero (0).
|
|
* @param text the original text
|
|
* @param pos the position (in words) of thw word to delete
|
|
* @return the resulting string
|
|
*/
|
|
static TQString remword( const TQString &text , uint pos );
|
|
|
|
/** Removes a matching word from the string, and returns
|
|
* a new string. Note that only ONE match is removed.
|
|
* @param text the original text
|
|
* @param word the word to remove
|
|
* @return the resulting string
|
|
*/
|
|
static TQString remword( const TQString &text , const TQString &word );
|
|
|
|
/** Capitalizes each word in the string
|
|
* "hello there" becomes "Hello There" (string)
|
|
* @param text the text to capitalize
|
|
* @return the resulting string
|
|
*/
|
|
static TQString capwords( const TQString &text );
|
|
|
|
/** Capitalizes each word in the list
|
|
* [hello, there] becomes [Hello, There] (list)
|
|
* @param list the list to capitalize
|
|
* @return the resulting list
|
|
*/
|
|
static TQStringList capwords( const TQStringList &list );
|
|
|
|
/** Reverses the order of the words in a string
|
|
* "hello there" becomes "there hello" (string)
|
|
* @param text the text to reverse
|
|
* @return the resulting string
|
|
*/
|
|
static TQString reverse( const TQString &text );
|
|
|
|
/** Reverses the order of the words in a list
|
|
* [hello, there] becomes [there, hello] (list)
|
|
* @param list the list to reverse
|
|
* @return the resulting list
|
|
*/
|
|
static TQStringList reverse( const TQStringList &list );
|
|
|
|
/** Left-justifies a string and returns a string at least 'width' characters
|
|
* wide.
|
|
* If the string is longer than the @p width, the original
|
|
* string is returned. It is never truncated.
|
|
* @param text the text to justify
|
|
* @param width the desired width of the new string
|
|
* @return the resulting string
|
|
* @deprecated use TQString::leftJustify instead
|
|
*/
|
|
static TQString ljust( const TQString &text , uint width ) KDE_DEPRECATED;
|
|
|
|
/** Right-justifies a string and returns a string at least 'width' characters
|
|
* wide.
|
|
* If the string is longer than the @p width, the original
|
|
* string is returned. It is never truncated.
|
|
* @param text the text to justify
|
|
* @param width the desired width of the new string
|
|
* @return the resulting string
|
|
* @deprecated use TQString::rightJustify instead
|
|
*/
|
|
static TQString rjust( const TQString &text , uint width ) KDE_DEPRECATED;
|
|
|
|
/** Centers a string and returns a string at least 'width' characters
|
|
* wide.
|
|
* If the string is longer than the @p width, the original
|
|
* string is returned. It is never truncated.
|
|
* @param text the text to justify
|
|
* @param width the desired width of the new string
|
|
* @return the resulting string
|
|
*/
|
|
static TQString center( const TQString &text , uint width );
|
|
|
|
/** Substitute characters at the beginning of a string by "...".
|
|
* @param str is the string to modify
|
|
* @param maxlen is the maximum length the modified string will have
|
|
* If the original string is shorter than "maxlen", it is returned verbatim
|
|
* @return the modified string
|
|
*/
|
|
static TQString lsqueeze( const TQString & str, uint maxlen = 40 );
|
|
|
|
/** Substitute characters at the beginning of a string by "...". Similar to
|
|
* method above, except that it truncates based on pixel width rather than
|
|
* the number of characters
|
|
* @param name is the string to modify
|
|
* @param fontMetrics is the font metrics to use to calculate character sizes
|
|
* @param maxlen is the maximum length in ems the modified string will have
|
|
* If the original string is shorter than "maxlen", it is returned verbatim
|
|
* @return the modified string
|
|
* @since 3.2
|
|
*/
|
|
static TQString lEmSqueeze( const TQString & name,
|
|
const TQFontMetrics& fontMetrics,
|
|
uint maxlen = 30 );
|
|
|
|
/** Substitute characters at the beginning of a string by "...". Similar to
|
|
* method above, except that maxlen is the width in pixels to truncate to
|
|
* @param name is the string to modify
|
|
* @param fontMetrics is the font metrics to use to calculate character sizes
|
|
* @param maxPixels is the maximum pixel length the modified string will have
|
|
* If the original string is shorter than "maxlen", it is returned verbatim
|
|
* @return the modified string
|
|
* @since 3.2
|
|
*/
|
|
static TQString lPixelSqueeze( const TQString & name,
|
|
const TQFontMetrics& fontMetrics,
|
|
uint maxPixels );
|
|
|
|
/** Substitute characters at the middle of a string by "...".
|
|
* @param str is the string to modify
|
|
* @param maxlen is the maximum length the modified string will have
|
|
* If the original string is shorter than "maxlen", it is returned verbatim
|
|
* @return the modified string
|
|
*/
|
|
static TQString csqueeze( const TQString & str, uint maxlen = 40 );
|
|
|
|
/** Substitute characters in the middle of a string by "...". Similar to
|
|
* method above, except that it truncates based on pixel width rather than
|
|
* the number of characters
|
|
* @param name is the string to modify
|
|
* @param fontMetrics is the font metrics to use to calculate character sizes
|
|
* @param maxlen is the maximum length in ems the modified string will have
|
|
* If the original string is shorter than "maxlen", it is returned verbatim
|
|
* @return the modified string
|
|
* @since 3.2
|
|
*/
|
|
static TQString cEmSqueeze( const TQString & name,
|
|
const TQFontMetrics& fontMetrics,
|
|
uint maxlen = 30 );
|
|
|
|
/** Substitute characters in the middle of a string by "...". Similar to
|
|
* method above, except that maxlen is the width in pixels to truncate to
|
|
* @param name is the string to modify
|
|
* @param fontMetrics is the font metrics to use to calculate character sizes
|
|
* @param maxPixels is the maximum pixel length the modified string will have
|
|
* If the original string is shorter than "maxlen", it is returned verbatim
|
|
* @return the modified string
|
|
* @since 3.2
|
|
*/
|
|
static TQString cPixelSqueeze( const TQString & name,
|
|
const TQFontMetrics& fontMetrics,
|
|
uint maxPixels );
|
|
|
|
/** Substitute characters at the end of a string by "...".
|
|
* @param str is the string to modify
|
|
* @param maxlen is the maximum length the modified string will have
|
|
* If the original string is shorter than "maxlen", it is returned verbatim
|
|
* @return the modified string
|
|
*/
|
|
static TQString rsqueeze( const TQString & str, uint maxlen = 40 );
|
|
|
|
/** Substitute characters at the end of a string by "...". Similar to
|
|
* method above, except that it truncates based on pixel width rather than
|
|
* the number of characters
|
|
* @param name is the string to modify
|
|
* @param fontMetrics is the font metrics to use to calculate character sizes
|
|
* @param maxlen is the maximum length in ems the modified string will have
|
|
* If the original string is shorter than "maxlen", it is returned verbatim
|
|
* @return the modified string
|
|
* @since 3.2
|
|
*/
|
|
static TQString rEmSqueeze( const TQString & name,
|
|
const TQFontMetrics& fontMetrics,
|
|
uint maxlen = 30 );
|
|
|
|
/** Substitute characters at the end of a string by "...". Similar to
|
|
* method above, except that maxlen is the width in pixels to truncate to
|
|
* @param name is the string to modify
|
|
* @param fontMetrics is the font metrics to use to calculate character sizes
|
|
* @param maxPixels is the maximum pixel length the modified string will have
|
|
* If the original string is shorter than "maxlen", it is returned verbatim
|
|
* @return the modified string
|
|
* @since 3.2
|
|
*/
|
|
static TQString rPixelSqueeze( const TQString & name,
|
|
const TQFontMetrics& fontMetrics,
|
|
uint maxPixels );
|
|
|
|
/**
|
|
* Match a filename.
|
|
* @param filename is the real decoded filename (or dirname
|
|
* without trailing '/').
|
|
* @param pattern is a pattern like *.txt, *.tar.gz, Makefile.*, *README*, etc.
|
|
* Patterns with two asterisks like "*.*pk" are not supported.
|
|
* @return true if the given filename matches the given pattern
|
|
*/
|
|
static bool matchFileName( const TQString& filename, const TQString& pattern );
|
|
// KDE4: move to KShell
|
|
|
|
/**
|
|
* Split a TQString into a TQStringList in a similar fashion to the static
|
|
* TQStringList function in Qt, except you can specify a maximum number
|
|
* of tokens. If max is specified (!= 0) then only that number of tokens
|
|
* will be extracted. The final token will be the remainder of the string.
|
|
*
|
|
* Example:
|
|
* \code
|
|
* perlSplit("__", "some__string__for__you__here", 4)
|
|
* TQStringList contains: "some", "string", "for", "you__here"
|
|
* \endcode
|
|
*
|
|
* @param sep is the string to use to delimit s.
|
|
* @param s is the input string
|
|
* @param max is the maximum number of extractions to perform, or 0.
|
|
* @return A TQStringList containing tokens extracted from s.
|
|
*/
|
|
static TQStringList perlSplit
|
|
(const TQString & sep, const TQString & s, uint max = 0);
|
|
|
|
/**
|
|
* Split a TQString into a TQStringList in a similar fashion to the static
|
|
* TQStringList function in Qt, except you can specify a maximum number
|
|
* of tokens. If max is specified (!= 0) then only that number of tokens
|
|
* will be extracted. The final token will be the remainder of the string.
|
|
*
|
|
* Example:
|
|
* \code
|
|
* perlSplit(' ', "tdeparts reaches the parts other parts can't", 3)
|
|
* TQStringList contains: "tdeparts", "reaches", "the parts other parts can't"
|
|
* \endcode
|
|
*
|
|
* @param sep is the character to use to delimit s.
|
|
* @param s is the input string
|
|
* @param max is the maximum number of extractions to perform, or 0.
|
|
* @return A TQStringList containing tokens extracted from s.
|
|
*/
|
|
static TQStringList perlSplit
|
|
(const TQChar & sep, const TQString & s, uint max = 0);
|
|
|
|
/**
|
|
* Split a TQString into a TQStringList in a similar fashion to the static
|
|
* TQStringList function in Qt, except you can specify a maximum number
|
|
* of tokens. If max is specified (!= 0) then only that number of tokens
|
|
* will be extracted. The final token will be the remainder of the string.
|
|
*
|
|
* Example:
|
|
* \code
|
|
* perlSplit(TQRegExp("[! ]", "Split me up ! I'm bored ! OK ?", 3)
|
|
* TQStringList contains: "Split", "me", "up ! I'm bored, OK ?"
|
|
* \endcode
|
|
*
|
|
* @param sep is the regular expression to use to delimit s.
|
|
* @param s is the input string
|
|
* @param max is the maximum number of extractions to perform, or 0.
|
|
* @return A TQStringList containing tokens extracted from s.
|
|
*/
|
|
static TQStringList perlSplit
|
|
(const TQRegExp & sep, const TQString & s, uint max = 0);
|
|
|
|
/**
|
|
* This method auto-detects URLs in strings, and adds HTML markup to them
|
|
* so that richtext or HTML-enabled widgets (such as KActiveLabel)
|
|
* will display the URL correctly.
|
|
* @param text the string which may contain URLs
|
|
* @return the resulting text
|
|
* @since 3.1
|
|
*/
|
|
static TQString tagURLs( const TQString& text );
|
|
|
|
/**
|
|
Obscure string by using a simple symmetric encryption. Applying the
|
|
function to a string obscured by this function will result in the original
|
|
string.
|
|
|
|
The function can be used to obscure passwords stored to configuration
|
|
files. Note that this won't give you any more security than preventing
|
|
that the password is directly copied and pasted.
|
|
|
|
@param str string to be obscured
|
|
@return obscured string
|
|
@since 3.2
|
|
*/
|
|
static TQString obscure( const TQString &str );
|
|
|
|
/**
|
|
Guess whether a string is UTF8 encoded.
|
|
|
|
@param str the string to check
|
|
@return true if UTF8. If false, the string is probably in Local8Bit.
|
|
@since 3.2
|
|
*/
|
|
static bool isUtf8( const char *str );
|
|
|
|
/**
|
|
Construct TQString from a c string, guessing whether it is UTF8- or
|
|
Local8Bit-encoded.
|
|
|
|
@param str the input string
|
|
@return the (hopefully correctly guessed) TQString representation of @p str
|
|
@since 3.2
|
|
*/
|
|
static TQString from8Bit( const char *str );
|
|
|
|
#ifdef KDE_NO_COMPAT
|
|
private:
|
|
#endif
|
|
/**
|
|
* @deprecated Use matchFileName () instead.
|
|
*/
|
|
static KDE_DEPRECATED bool matchFilename( const TQString& filename, const TQString& pattern )
|
|
{
|
|
return matchFileName (filename, pattern);
|
|
}
|
|
|
|
};
|
|
#endif
|