001/*
002 * $Id: DefaultSplitCharacter.java 4784 2011-03-15 08:33:00Z blowagie $
003 *
004 * This file is part of the iText (R) project.
005 * Copyright (c) 1998-2011 1T3XT BVBA
006 * Authors: Bruno Lowagie, Paulo Soares, et al.
007 *
008 * This program is free software; you can redistribute it and/or modify
009 * it under the terms of the GNU Affero General Public License version 3
010 * as published by the Free Software Foundation with the addition of the
011 * following permission added to Section 15 as permitted in Section 7(a):
012 * FOR ANY PART OF THE COVERED WORK IN WHICH THE COPYRIGHT IS OWNED BY 1T3XT,
013 * 1T3XT DISCLAIMS THE WARRANTY OF NON INFRINGEMENT OF THIRD PARTY RIGHTS.
014 *
015 * This program is distributed in the hope that it will be useful, but
016 * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
017 * or FITNESS FOR A PARTICULAR PURPOSE.
018 * See the GNU Affero General Public License for more details.
019 * You should have received a copy of the GNU Affero General Public License
020 * along with this program; if not, see http://www.gnu.org/licenses or write to
021 * the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor,
022 * Boston, MA, 02110-1301 USA, or download the license from the following URL:
023 * http://itextpdf.com/terms-of-use/
024 *
025 * The interactive user interfaces in modified source and object code versions
026 * of this program must display Appropriate Legal Notices, as required under
027 * Section 5 of the GNU Affero General Public License.
028 *
029 * In accordance with Section 7(b) of the GNU Affero General Public License,
030 * a covered work must retain the producer line in every PDF that is created
031 * or manipulated using iText.
032 *
033 * You can be released from the requirements of the license by purchasing
034 * a commercial license. Buying such a license is mandatory as soon as you
035 * develop commercial activities involving the iText software without
036 * disclosing the source code of your own applications.
037 * These activities include: offering paid services to customers as an ASP,
038 * serving PDFs on the fly in a web application, shipping iText with a closed
039 * source product.
040 *
041 * For more information, please contact iText Software Corp. at this
042 * address: sales@itextpdf.com
043 */
044package com.itextpdf.text.pdf;
045
046import com.itextpdf.text.SplitCharacter;
047
048/**
049 * The default class that is used to determine whether or not a character
050 * is a split character. You can subclass this class to define your own
051 * split characters.
052 * @since       2.1.2
053 */
054public class DefaultSplitCharacter implements SplitCharacter {
055        
056        /**
057         * An instance of the default SplitCharacter.
058         */
059        public static final SplitCharacter DEFAULT = new DefaultSplitCharacter();
060        
061        /**
062         * Checks if a character can be used to split a <CODE>PdfString</CODE>.
063         * <P>
064         * for the moment every character less than or equal to SPACE, the character '-'
065         * and some specific unicode ranges are 'splitCharacters'.
066         * 
067         * @param start start position in the array
068         * @param current current position in the array
069         * @param end end position in the array
070         * @param       cc              the character array that has to be checked
071         * @param ck chunk array
072         * @return      <CODE>true</CODE> if the character can be used to split a string, <CODE>false</CODE> otherwise
073         */
074    public boolean isSplitCharacter(int start, int current, int end, char[] cc, PdfChunk[] ck) {
075        char c = getCurrentCharacter(current, cc, ck);
076        if (c <= ' ' || c == '-' || c == '\u2010') {
077            return true;
078        }
079        if (c < 0x2002)
080            return false;
081        return ((c >= 0x2002 && c <= 0x200b)
082        || (c >= 0x2e80 && c < 0xd7a0)
083        || (c >= 0xf900 && c < 0xfb00)
084        || (c >= 0xfe30 && c < 0xfe50)
085        || (c >= 0xff61 && c < 0xffa0));
086    }
087
088    /**
089     * Returns the current character
090         * @param current current position in the array
091         * @param       cc              the character array that has to be checked
092         * @param ck chunk array
093     * @return  the current character
094     */
095    protected char getCurrentCharacter(int current, char[] cc, PdfChunk[] ck) {
096        if (ck == null) {
097                return cc[current];
098        }
099        return (char)ck[Math.min(current, ck.length - 1)].getUnicodeEquivalent(cc[current]);
100    }
101}