Package com.hp.hpl.jena.sparql.engine.http

Source Code of com.hp.hpl.jena.sparql.engine.http.HttpQuery

/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements.  See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership.  The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License.  You may obtain a copy of the License at
*
*     http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/

package com.hp.hpl.jena.sparql.engine.http;

import java.io.* ;
import java.net.HttpURLConnection ;
import java.net.MalformedURLException ;
import java.net.SocketTimeoutException ;
import java.net.URL ;
import java.util.ArrayList ;
import java.util.Iterator ;
import java.util.List ;
import java.util.Map ;
import java.util.regex.Pattern ;
import java.util.zip.DeflaterInputStream ;
import java.util.zip.GZIPInputStream ;
import java.util.zip.InflaterInputStream ;

import org.apache.commons.codec.binary.Base64 ;
import org.apache.jena.atlas.lib.StrUtils ;
import org.apache.jena.riot.WebContent ;
import org.slf4j.Logger ;
import org.slf4j.LoggerFactory ;

import com.hp.hpl.jena.query.ARQ ;
import com.hp.hpl.jena.query.QueryExecException ;
import com.hp.hpl.jena.shared.JenaException ;
import com.hp.hpl.jena.sparql.ARQInternalErrorException ;
import com.hp.hpl.jena.sparql.util.Convert ;
import com.hp.hpl.jena.util.FileUtils ;

/** Create an execution object for performing a query on a model
*  over HTTP.  This is the main protocol engine for HTTP query.
*  There are higher level classes for doing a query and presenting
*  the results in an API fashion.
*
*  If the query string is large, then HTTP POST is used. */
public class HttpQuery extends Params
{
    static final Logger log = LoggerFactory.getLogger(HttpQuery.class.getName()) ;
   
    /** The definition of "large" queries */
    // Not final so that other code can change it.
    static public /*final*/ int urlLimit = 2*1024 ;
   
    String serviceURL ;
   
    String contentTypeResult = WebContent.contentTypeResultsXML ;
    HttpURLConnection httpConnection = null ;
   
    // An object indicate no value associated with parameter name
    final static Object noValue = new Object() ;
    String user = null ;
    char[] password = null ;
   
    int responseCode = 0;
    String responseMessage = null ;
    boolean forcePOST = false ;
    String queryString = null ;
    boolean serviceParams = false ;
    private final Pattern queryParamPattern = Pattern.compile(".+[&|\\?]query=.*") ;
   
    int connectTimeout = 0;
    int readTimeout = 0;
   
    private boolean allowGZip = false ;
    private boolean allowDeflate = false;
   
    //static final String ENC_UTF8 = "UTF-8" ;
   
    /** Create a execution object for a whole model GET
     * @param serviceURL     The model
     */
   
    public HttpQuery(String serviceURL)
    {
        init(serviceURL) ;
    }
       

    /** Create a execution object for a whole model GET
     * @param url           The model
     */
   
    public HttpQuery(URL url)
    {
        init(url.toString()) ;
    }
       

    private void init(String serviceURL)
    {
        if ( log.isTraceEnabled())
            log.trace("URL: "+serviceURL) ;
        if ( serviceURL.indexOf('?') >= 0 )
            serviceParams = true ;

        if ( queryParamPattern.matcher(serviceURL).matches() )
            throw new QueryExecException("SERVICE URL overrides the 'query' SPARQL protocol parameter") ;

        this.serviceURL = serviceURL ;
    }
   
    private String getQueryString()
    {
        if ( queryString == null )
            queryString = super.httpString() ;
        return queryString ;
    }

    public HttpURLConnection getConnection() { return httpConnection ; }
   
    /** Set the content type (Accept header) for the results
     */
    public void setAccept(String contentType)
    {
        contentTypeResult = contentType ;
    }
   
    /**
     * Gets the Content Type, if the query has been made this reflects the Content-Type header returns, if it has not been made this reflects only the Accept header that will be sent (as set via the {@link #setAccept(String)} method)
     */
    public String getContentType()
    {
      return contentTypeResult;
    }
   
    /**
     * Gets the HTTP Response Code returned by the request (returns 0 if request has yet to be made)
     */
    public int getResponseCode()
    {
      return responseCode;
    }
   
    /**
     * Sets whether the HTTP request will include a Accept-Encoding: gzip header
     */
    public void setAllowGZip(boolean allow)
    {
      allowGZip = allow;
    }
   
    /**
     * Sets whether the HTTP request will include a Accept-Encoding: deflate header
     */
    public void setAllowDeflate(boolean allow)
    {
      allowDeflate = allow;
    }
   
    /**
     * Sets basic authentication
     * @param user Username
     * @param password Password
     */
    public void setBasicAuthentication(String user, char[] password)
    {
        this.user = user ;
        this.password = password ;
    }
   
    /** Return whether this request will go by GET or POST
     *  @return boolean
     */
    public boolean usesPOST()
    {
        if ( forcePOST )
            return true ;
        String s = getQueryString() ;
       
        return serviceURL.length()+s.length() >= urlLimit ;
    }

    /** Force the use of HTTP POST for the query operation
     */

    public void setForcePOST()
    {
        forcePOST = true ;
    }
   
    /**
     * Sets HTTP Connection timeout, any value <= 0 is taken to mean no timeout
     */
    public void setConnectTimeout(int timeout)
    {
      connectTimeout = timeout;
    }
   
    /**
     * Gets the HTTP Connection timeout
     */
    public int getConnectTimeout()
    {
      return connectTimeout;
    }
   
    /**
     * Sets HTTP Read timeout, any value <= 0 is taken to mean no timeout
     */
    public void setReadTimeout(int timeout)
    {
      readTimeout = timeout;
    }
   
    /**
     * Gets the HTTP Read timeout
     */
    public int getReadTimeout()
    {
      return readTimeout;
    }

    /** Execute the operation
     * @return Model    The resulting model
     * @throws QueryExceptionHTTP
     */
    public InputStream exec() throws QueryExceptionHTTP
    {
        try {
            if (usesPOST())
                return execPost();
            return execGet();
        } catch (QueryExceptionHTTP httpEx)
        {
            log.trace("Exception in exec", httpEx);
            throw httpEx;
        }
        catch (JenaException jEx)
        {
            log.trace("JenaException in exec", jEx);
            throw jEx ;
        }
    }

    private InputStream execGet() throws QueryExceptionHTTP
    {
        URL target = null ;
        String qs = getQueryString() ;
       
        ARQ.getHttpRequestLogger().trace(qs) ;
       
        try {
            if ( count() == 0 )
                target = new URL(serviceURL) ;
            else
                target = new URL(serviceURL+(serviceParams ? "&" : "?")+qs) ;
        }
        catch (MalformedURLException malEx)
        { throw new QueryExceptionHTTP(0, "Malformed URL: "+malEx) ; }
        log.trace("GET "+target.toExternalForm()) ;
       
        try
        {
            httpConnection = (HttpURLConnection) target.openConnection();
            // This is the default setting - but be clear about it.
            httpConnection.setInstanceFollowRedirects(true) ;      
            httpConnection.setRequestProperty("Accept", contentTypeResult) ;
           
            int x = httpConnection.getReadTimeout() ;
           
            // By default, following 3xx redirects is true
            //conn.setFollowRedirects(true) ;
            basicAuthentication(httpConnection) ;
            applyTimeouts(httpConnection);
            applyEncodings(httpConnection);
           
            httpConnection.setDoInput(true);
            httpConnection.connect();
            try
            {
                return execCommon();
            }
            catch (QueryExceptionHTTP qEx)
            {
                // Back-off and try POST if something complain about long URIs
                // Broken
                if (qEx.getResponseCode() == 414 /*HttpServletResponse.SC_REQUEST_URI_TOO_LONG*/ )
                    return execPost();
                throw qEx;
            }
        }
        catch (java.net.ConnectException connEx)
        { throw new QueryExceptionHTTP(QueryExceptionHTTP.NoServer, "Failed to connect to remote server"); }
        catch (IOException ioEx)
        { throw new QueryExceptionHTTP(ioEx); }
    }
   
    private InputStream execPost() throws QueryExceptionHTTP
    {
        URL target = null;
        try { target = new URL(serviceURL); }
        catch (MalformedURLException malEx)
        { throw new QueryExceptionHTTP(0, "Malformed URL: " + malEx); }
        log.trace("POST "+target.toExternalForm()) ;
       
        ARQ.getHttpRequestLogger().trace(target.toExternalForm()) ;

        try
        {
            httpConnection = (HttpURLConnection) target.openConnection();
            httpConnection.setRequestMethod("POST") ;
            httpConnection.setRequestProperty("Accept", contentTypeResult) ;
            httpConnection.setRequestProperty("Content-Type", "application/x-www-form-urlencoded") ;
            basicAuthentication(httpConnection) ;
            applyTimeouts(httpConnection);
            applyEncodings(httpConnection);
            httpConnection.setDoOutput(true) ;
           
            boolean first = true ;
            OutputStream out = httpConnection.getOutputStream() ;
            for ( Iterator<Pair> iter = pairs().listIterator() ; iter.hasNext() ; )
            {
                if ( ! first )
                    out.write('&') ;
                first = false ;
                Pair p = iter.next() ;
                out.write(p.getName().getBytes()) ;
                out.write('=') ;
                String x = p.getValue() ;
                x = Convert.encWWWForm(x) ;
                out.write(x.getBytes()) ;
                ARQ.getHttpRequestLogger().trace("Param: "+x) ;
            }
            out.flush() ;
            httpConnection.connect() ;
            return execCommon() ;
        }
        catch (java.net.ConnectException connEx)
        { throw new QueryExceptionHTTP(-1, "Failed to connect to remote server"); }
        catch (SocketTimeoutException timeoutEx)
        { throw new QueryExceptionHTTP(-1, "Failed to connect to remove server within specified timeout"); }
        catch (IOException ioEx)
        { throw new QueryExceptionHTTP(ioEx); }
    }
   
    private void basicAuthentication(HttpURLConnection httpConnection2)
    {
        // Do basic authentication : do directly, not via an Authenticator, because it
        // avoids an extra round trip (Java normally does the request without authetication,
        // then reties with)

        if ( user != null || password != null)
        {
            try
            {
                if ( user == null || password == null )
                    log.warn("Only one of user/password is set") ;
                // We want: "Basic user:password" except user:password is base 64 encoded.
                // Build string, get as UTF-8, bytes, translate to base 64.
                StringBuffer x = new StringBuffer() ;
                byte b[] = x.append(user).append(":").append(password).toString().getBytes("UTF-8") ;
                String y = Base64.encodeBase64String(b) ;
                httpConnection.setRequestProperty("Authorization", "Basic "+y) ;
                // Overwrite any password details we copied.
                // Still leaves the copy in the HTTP connection.  But this only basic auth.
                for ( int i = 0 ; i < x.length() ; i++ ) x.setCharAt(i, '*') ;
                for ( int i = 0 ; i < b.length ; i++ ) b[i] = (byte)0 ;
            } catch (UnsupportedEncodingException ex)
            {
                // Can't happen - UTF-8 is required of all Java platforms.
                throw new ARQInternalErrorException("UTF-8 is broken on this platform", ex) ;
            }
        }
    }

    private void applyTimeouts(HttpURLConnection conn)
    {
      if (connectTimeout > 0)
      {
        conn.setConnectTimeout(connectTimeout);
      }
      if (readTimeout > 0)
      {
        conn.setReadTimeout(readTimeout);
      }
    }
   
    private void applyEncodings(HttpURLConnection conn)
    {
      List<String> encodings = new ArrayList<String>();
      if (allowGZip) encodings.add("gzip");
      if (allowDeflate) encodings.add("deflate");
      if (encodings.size() > 0)
      {
        //Apply the Accept-Encoding header if at least one encoding has been selected
        conn.setRequestProperty("Accept-Encoding", StrUtils.strjoin(", ", encodings));
      }
    }

    private InputStream execCommon() throws QueryExceptionHTTP
    {
        try {
            try {
                responseCode = httpConnection.getResponseCode() ;
                responseMessage = Convert.decWWWForm(httpConnection.getResponseMessage()) ;
            } catch (NullPointerException ex) {
                // This happens if you talk to a non-HTTP port.
                // e.g. memcached!
                throw new QueryExceptionHTTP("Problems with HTTP response (was it an HTTP server?)", ex) ;
            }
            // 1xx: Informational
            // 2xx: Success
            // 3xx: Redirection
            // 4xx: Client Error
            // 5xx: Server Error
           
            if ( 300 <= responseCode && responseCode < 400 )
                throw new QueryExceptionHTTP(responseCode, responseMessage) ;
           
            // Other 400 and 500 - errors
           
            if ( responseCode >= 400 )
            {
               
                InputStream x = httpConnection.getErrorStream() ;
                if ( x != null )
                {
                    //String ct = httpConnection.getContentType() ;
                    //httpConnection.getContentEncoding() ;
                    String str = FileUtils.readWholeFileAsUTF8(x) ;
                    throw new QueryExceptionHTTP(responseCode, responseMessage+"\n"+str) ;
                }
                else
                    throw new QueryExceptionHTTP(responseCode, responseMessage) ;
            }
           
            // Request succeeded
            //httpConnection.setReadTimeout(10) ;
            InputStream in = httpConnection.getInputStream() ;

            //Get the returned content type so we can expose this later via the getContentType() method
            //We strip any parameters off the returned content type e.g. ;charset=UTF-8 since code that
            //consumes our getContentType() method will expect a bare MIME type
            contentTypeResult = httpConnection.getContentType() ;
            if (contentTypeResult.contains(";"))
            {
              contentTypeResult = contentTypeResult.substring(0, contentTypeResult.indexOf(';'));
            }
           
           
            //If compression was enabled and we got a compressed response as indicated by the presence of
            //a Content-Encoding header we need to ensure the input stream is appropriately wrapped in
            //the relevant stream type but checking that the JVM hasn't been clever enough to do
            //this for us already
            String contentEnc = httpConnection.getContentEncoding() ;
           
            if (contentEnc != null)
            {
              if (contentEnc.equalsIgnoreCase("gzip"))
              {
                if (!(in instanceof GZIPInputStream))
                {
                  in = new GZIPInputStream(in);
                }
              }
              else if (contentEnc.equalsIgnoreCase("deflate"))
              {
                if (!(in instanceof DeflaterInputStream))
                {
                  in = new DeflaterInputStream(in);
                }
              }
            }
           
            if ( false )
            {
                // Dump the header
                Map<String,List<String>> map = httpConnection.getHeaderFields() ;
                for ( Iterator<String> iter = map.keySet().iterator() ; iter.hasNext() ; )
                {
                    String k = iter.next();
                    List<String> v = map.get(k) ;
                    System.out.println(k+" = "+v) ;
                }
            }
           
            // Dump response body
            if ( false )
            {
                StringBuffer b = new StringBuffer(1000) ;
                byte[] chars = new byte[1000] ;
                while(true)
                {
                    int x = in.read(chars) ;
                    if ( x < 0 ) break ;
                    b.append(new String(chars, 0, x, FileUtils.encodingUTF8)) ;
                }
                System.out.println(b.toString()) ;
                System.out.flush() ;
                // Reset
                in = new ByteArrayInputStream(b.toString().getBytes(FileUtils.encodingUTF8)) ;
            }
           
           
            // +++ WORKAROUND for badly behaved apps.
            // Apps sometimes call QueryExecution.close straight after .execSelect.
            // that results in some resuls being seen, not all of them => XMl parse errors.
//            byte[] bytes = IO.readWholeFile(in) ;
//            in.close()           
//            in = new ByteArrayInputStream(bytes) ;
            // +++
          
            return in ;
        }
        catch (IOException ioEx)
        {
            throw new QueryExceptionHTTP(ioEx) ;
        }
        catch (QueryExceptionHTTP httpEx)
        {
          //We want to throw this upwards and not catch it in the next block and inadvertently rewrap it
          //since that can hide the real error details from the user
          throw httpEx;
        }
        catch (JenaException rdfEx)
        {
            throw new QueryExceptionHTTP(rdfEx) ;
        }
    }
   
    @Override
    public String toString()
    {
        String s = httpString() ;
        if ( s != null && s.length() > 0 )
            return serviceURL+"?"+s ;
        return serviceURL ;
    }
}
TOP

Related Classes of com.hp.hpl.jena.sparql.engine.http.HttpQuery

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and owned by ORACLE Inc. Contact coftware#gmail.com.