Package com.caucho.quercus.lib.gettext

Source Code of com.caucho.quercus.lib.gettext.POFileParser

/*
* Copyright (c) 1998-2008 Caucho Technology -- all rights reserved
*
* This file is part of Resin(R) Open Source
*
* Each copy or derived work must preserve the copyright notice and this
* notice unmodified.
*
* Resin Open Source is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; either version 2 of the License, or
* (at your option) any later version.
*
* Resin Open Source is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE, or any warranty
* of NON-INFRINGEMENT.  See the GNU General Public License for more
* details.
*
* You should have received a copy of the GNU General Public License
* along with Resin Open Source; if not, write to the
*
*   Free Software Foundation, Inc.
*   59 Temple Place, Suite 330
*   Boston, MA 02111-1307  USA
*
* @author Nam Nguyen
*/

package com.caucho.quercus.lib.gettext;

import com.caucho.quercus.env.StringValue;
import com.caucho.quercus.env.Env;
import com.caucho.quercus.env.UnicodeBuilderValue;
import com.caucho.quercus.lib.gettext.expr.PluralExpr;
import com.caucho.vfs.Path;
import com.caucho.vfs.ReadStream;

import java.io.IOException;
import java.util.ArrayList;
import java.util.HashMap;

/**
* Parses Gettext PO files.
*/
class POFileParser extends GettextParser
{
  // Parsing constants and variables
  private static final int MSGID = 256;
  private static final int MSGID_PLURAL = 257;
  private static final int MSGSTR = 258;

  private static final int UNKNOWN = 260;

  private ReadStream _in;

  private int _peekChar;
  private StringValue _string;

  POFileParser(Env env, Path path)
    throws IOException
  {
    init(path);
  }

  void init(Path path)
    throws IOException
  {
    _in = path.openRead();
    _peekChar = -1;

    StringValue metadata = getMetadata();

    _pluralExpr = PluralExpr.getPluralExpr(metadata);
    _charset = getCharset(metadata);

    _in.setEncoding(_charset);
  }

  private StringValue getMetadata()
    throws IOException
  {
    StringValue metadata = null;

    int token = readToken();

    while (token >= 0 && token != UNKNOWN) {
      if (token == MSGID && _string.length() == 0) {

        if (readToken() == MSGSTR)
          metadata = _string;

        break;
      }
    }

    _peekChar = -1;
    _in.setPosition(0);

    return metadata;
  }

  /**
   * Returns the gettext translations.
   *
   * @return translations from file, or null on error
   */
  HashMap<StringValue, ArrayList<StringValue>> readTranslations()
    throws IOException
  {
    HashMap<StringValue, ArrayList<StringValue>> translations =
            new HashMap<StringValue, ArrayList<StringValue>>();

    int token = readToken();

    while (token >= 0) {
      if (token != MSGID)
        return null;

      StringValue msgid = _string;

      token = readToken();
      if (token == MSGID_PLURAL)
        token = readToken();

      ArrayList<StringValue> msgstrs = new ArrayList<StringValue>();

      for (; token == MSGSTR; token = readToken()) {
        msgstrs.add(_string);
      }

      translations.put(msgid, msgstrs);
    }

    return translations;
  }

  private int readToken()
    throws IOException
  {
    int ch = skipWhitespace();

    switch (ch) {
      case '#':
        skipLine();
        return readToken();

      case 'm':
        if (read() == 's' &&
            read() == 'g') {
          return readMsgToken();
        }
        else
          return UNKNOWN;

      case -1:
        return -1;

      default:
        return UNKNOWN;
    }
  }

  private int readMsgToken()
    throws IOException
  {
    int ch = read();

    switch (ch) {
      case 'i':
        if (read() == 'd')
          return readMsgidToken();
        else
          return UNKNOWN;

      case 's':
        if (read() == 't' &&
            read() == 'r')
          return readMsgstrToken();
        else
          return UNKNOWN;

      default:
        return UNKNOWN;
    }
  }

  private int readMsgidToken()
    throws IOException
  {
    int token;
    int ch = skipWhitespace();

    if (ch == '_') {
      if (read() == 'p' &&
          read() == 'l' &&
          read() == 'u' &&
          read() == 'r' &&
          read() == 'a' &&
          read() == 'l') {
        token = MSGID_PLURAL;

        ch = skipWhitespace();
      }
      else
        return UNKNOWN;
    }
    else
      token = MSGID;

    if (ch != '"')
      return UNKNOWN;

    return readString(token);   
  }

  private int readMsgstrToken()
    throws IOException
  {
    int ch = skipWhitespace();

    if (ch == '[') {
      ch = read();

      while (ch >= 0 && ch != ']') {
        ch = read();
      }

      ch = skipWhitespace();
    }

    if (ch != '"')
      return UNKNOWN;

    return readString(MSGSTR);
  }

  /**
   * Reads a string in quotes.
   */
  private int readString(int token)
    throws IOException
  {
    return readString(new UnicodeBuilderValue(), token);
  }

  /**
   * XXX: any other possible character escapes?
   */
  private int readString(StringValue sb, int token)
    throws IOException
  {
    for (int ch = read(); ch != '"'; ch = read()) {
      switch (ch) {
        case '\\':
          ch = read();
          switch (ch) {
            case 'n':
              sb.append('\n');
              break;
            case 'r':
              sb.append('\r');
              break;
            case 't':
              sb.append('\t');
              break;
            case '\r':
              ch = read();
              if (ch != '\n')
                _peekChar = ch;
              break;
            case '\n':
              break;
            default:
              _peekChar = ch;
              sb.append('\\');
          }
          break;

        case -1:
          return UNKNOWN;

        default:
          sb.append((char)ch);
      }
    }

    // String may be continued on the next line.

    int ch = skipWhitespace();

    if (ch == '"')
      return readString(sb, token);
    else
      _peekChar = ch;

    _string = sb;
    return token;
  }

  private int read()
    throws IOException
  {
    if (_peekChar >= 0) {
      int swap = _peekChar;
      _peekChar = -1;
      return swap;
    }

    return _in.readChar();
  }

  private void skipLine()
    throws IOException
  {
    int ch = read();

    while (ch >= 0) {
      switch (ch) {
        case '\r':
          ch = read();

          if (ch != '\n')
            _peekChar = ch;

          return;

        case '\n':
          return;
      }

      ch = read();
    }
  }

  private int skipWhitespace()
    throws IOException
  {
    while (true) {
      int ch = read();

      switch (ch) {
        case ' ':
        case '\r':
        case '\n':
        case '\t':
          continue;
        default:
          return ch;
      }
    }
  }

  void close()
  {
    if (_in != null)
      _in.close();
  }
}
TOP

Related Classes of com.caucho.quercus.lib.gettext.POFileParser

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and is owned by Oracle Inc. Contact coftware#gmail.com.