Package xbird.xquery.func.string

Source Code of xbird.xquery.func.string.NormalizeUnicode

/*
* @(#)$Id: NormalizeUnicode.java 3619 2008-03-26 07:23:03Z yui $
*
* Copyright 2006-2008 Makoto YUI
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
*     http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*
* Contributors:
*     Makoto YUI - initial implementation
*/
package xbird.xquery.func.string;

import xbird.xquery.DynamicError;
import xbird.xquery.XQueryException;
import xbird.xquery.dm.value.Item;
import xbird.xquery.dm.value.Sequence;
import xbird.xquery.dm.value.literal.XString;
import xbird.xquery.dm.value.sequence.ValueSequence;
import xbird.xquery.func.BuiltInFunction;
import xbird.xquery.func.FunctionSignature;
import xbird.xquery.meta.DynamicContext;
import xbird.xquery.type.Type;
import xbird.xquery.type.TypeRegistry;
import xbird.xquery.type.xs.StringType;

import com.ibm.icu.text.Normalizer;

/**
* fn:normalize-unicode.
* <DIV lang="en">
* Returns the value of $arg normalized according to the normalization criteria
* for a normalization form identified by the value of $normalizationForm.
* <ul>
* <li>fn:normalize-unicode($arg as xs:string?) as xs:string</li>
* <li>fn:normalize-unicode($arg as xs:string?, $normalizationForm as xs:string) as xs:string</li>
* </ul>
* </DIV>
* <DIV lang="ja"></DIV>
*
* @author Makoto YUI (yuin405+xbird@gmail.com)
* @link http://www.w3.org/TR/xquery-operators/#func-normalize-unicode
*/
public final class NormalizeUnicode extends BuiltInFunction {
    private static final long serialVersionUID = 2651492084383157264L;
    public static final String SYMBOL = "fn:normalize-unicode";

    public NormalizeUnicode() {
        super(SYMBOL, StringType.STRING);
    }

    protected FunctionSignature[] signatures() {
        final FunctionSignature[] s = new FunctionSignature[2];
        s[0] = new FunctionSignature(getName(), new Type[] { TypeRegistry.safeGet("xs:string?") });
        s[1] = new FunctionSignature(getName(), new Type[] { TypeRegistry.safeGet("xs:string?"),
                StringType.STRING });
        return s;
    }

    public Sequence eval(Sequence<? extends Item> contextSeq, ValueSequence argv, DynamicContext dynEnv) throws XQueryException {
        assert (argv != null);
        final int arglen = argv.size();
        assert (arglen == 1 || arglen == 2);
        Item firstItem = argv.getItem(0);
        // If the value of $arg is the empty sequence, returns the zero-length string.
        if(firstItem.isEmpty()) {
            return XString.valueOf("");
        }
        String arg = firstItem.stringValue();
        // If the $normalizationForm is absent, as in the first format above,
        // it shall be assumed to be "NFC"
        String nform = "NFC";
        if(arglen == 2) {
            Item secondItem = argv.getItem(1);
            nform = secondItem.stringValue();
        }
        final String normed;
        if("NFC".equalsIgnoreCase(nform)) {
            normed = Normalizer.normalize(arg, Normalizer.NFC);
        } else if("NFD".equalsIgnoreCase(nform)) {
            normed = Normalizer.normalize(arg, Normalizer.NFD);
        } else if("NFKC".equalsIgnoreCase(nform)) {
            normed = Normalizer.normalize(arg, Normalizer.NFKC);
        } else if("NFKD".equalsIgnoreCase(nform) || "FULLY-NORMALIZED".equalsIgnoreCase(nform)) {
            normed = Normalizer.normalize(arg, Normalizer.NFKD);
        } else {
            // TODO "FULLY-NORMALIZED"
            throw new DynamicError("err:FOCH0003", "Unsupported normalizationForm: " + nform);
        }
        return XString.valueOf(normed);
    }

}
TOP

Related Classes of xbird.xquery.func.string.NormalizeUnicode

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code are property of their respective owners. Java is a trademark of Sun Microsystems, Inc and owned by ORACLE Inc. Contact coftware#gmail.com.