[prev in list] [next in list] [prev in thread] [next in thread] 

List:       httpclient-commons-dev
Subject:    [jira] Commented: (HTTPCLIENT-778) DefaultRedirectHandler not encoding url before making http request
From:       "Sam Berlin (JIRA)" <jira () apache ! org>
Date:       2008-05-27 16:16:02
Message-ID: 209794026.1211904962768.JavaMail.jira () brutus
[Download RAW message or body]


    [ https://issues.apache.org/jira/browse/HTTPCLIENT-778?page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel&focusedCommentId=12600173#action_12600173 ]

Sam Berlin commented on HTTPCLIENT-778:
---------------------------------------

FWIW, HttpClient 4.0 is set up so that you can set your own RedirectHandler, which can \
allow interacting with malformed servers.

> DefaultRedirectHandler not encoding url before making http request. 
> --------------------------------------------------------------------
> 
> Key: HTTPCLIENT-778
> URL: https://issues.apache.org/jira/browse/HTTPCLIENT-778
> Project: HttpComponents HttpClient
> Issue Type: Bug
> Components: HttpClient
> Affects Versions: 4.0 Alpha 4
> Environment: Windows XP, JRE_1.5.0_14
> Reporter: Mark Hankey
> 
> The redirect URL returned by the server contains a space, which should be encoded as %20 before \
> the redirect request is made.  The following test class reproduces the issue: /*
> * $HeadURL: https://svn.apache.org/repos/asf/httpcomponents/httpclient/tags/4.0-alph \
> a4/module-client/src/examples/org/apache/http/examples/client/ClientFormLogin.java \
>                 $
> * $Revision: 645074 $
> * $Date: 2008-04-05 12:59:59 +0200 (Sat, 05 Apr 2008) $
> * ====================================================================
> *
> *  Licensed to the Apache Software Foundation (ASF) under one or more
> *  contributor license agreements.  See the NOTICE file distributed with
> *  this work for additional information regarding copyright ownership.
> *  The ASF licenses this file to You under the Apache License, Version 2.0
> *  (the "License"); you may not use this file except in compliance with
> *  the License.  You may obtain a copy of the License at
> *
> *      http://www.apache.org/licenses/LICENSE-2.0
> *
> *  Unless required by applicable law or agreed to in writing, software
> *  distributed under the License is distributed on an "AS IS" BASIS,
> *  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
> *  See the License for the specific language governing permissions and
> *  limitations under the License.
> * ====================================================================
> *
> * This software consists of voluntary contributions made by many
> * individuals on behalf of the Apache Software Foundation.  For more
> * information on the Apache Software Foundation, please see
> * <http://www.apache.org/>.
> *
> */
> package org.apache.http.examples.client;
> import java.util.ArrayList;
> import java.util.List;
> import java.util.Iterator;
> import au.id.jericho.lib.html.*;
> import java.util.*;
> import org.apache.http.Header;
> import org.apache.http.message.*;
> import org.apache.http.HttpEntity;
> import org.apache.http.HttpHost;
> import org.apache.http.HttpResponse;
> import org.apache.http.NameValuePair;
> import org.apache.http.client.entity.UrlEncodedFormEntity;
> import org.apache.http.client.methods.HttpGet;
> import org.apache.http.client.methods.HttpPost;
> import org.apache.http.client.params.CookiePolicy;
> import org.apache.http.client.params.ClientPNames;
> import org.apache.http.conn.params.ConnRoutePNames;
> import org.apache.http.cookie.Cookie;
> import org.apache.http.impl.client.DefaultHttpClient;
> import org.apache.http.message.BasicNameValuePair;
> import org.apache.http.protocol.HTTP;
> import org.apache.http.util.EntityUtils;
> import org.apache.http.params.*;
> /**
> * An example that demonstrates how HttpClient APIs can be used to perform
> * form-based logon.
> */
> public class ClientFormLogin {
> public static void main(String[] args) throws Exception {
> DefaultHttpClient httpclient = new DefaultHttpClient();
> final HttpHost proxy =        	
> // new HttpHost("127.0.0.1", 8666, "http");
> new HttpHost("135.214.42.162", 8080, "http");
> //added
> HttpResponse response = null;
> HttpEntity entity = null;
> httpclient.getParams().setParameter(
> ClientPNames.COOKIE_POLICY, CookiePolicy.BROWSER_COMPATIBILITY);
> httpclient.getParams().setParameter(
> ClientPNames.DEFAULT_HOST, "http://www.fultonassessor.org");
> 
> 
> //httpclient.getParams().setParameter(   ClientPNames.DEFAULT_HEADERS, \
> "Accept-Language=en-us"); httpclient.getParams().setParameter("User-Agent", \
> "Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; .NET CLR 1.1.4322; .NET \
> CLR 2.0.50727; .NET CLR 3.0.04506.30; InfoPath.1)"); \
> //httpclient.getParams().setParameter("http.language.Accept-Language", "en-us"); \
> //httpclient.getParams().setParameter("Accept", "image/gif, image/x-xbitmap, \
> image/jpeg, image/pjpeg, application/vnd.ms-excel, application/vnd.ms-powerpoint, \
> application/msword,*/*"); 
> 
> httpclient.getParams().setParameter(ConnRoutePNames.DEFAULT_PROXY, proxy);
> 
> //HttpGet httpget = new \
> HttpGet("http://www.fultonassessor.org/Forms/Datalets.aspx?idx=1&parid=14%20007700061068&jur=000&roll=RE&taxyear=2007&ownseq=1&sIndex=0");
>  //httpget.addHeader("Accept", "application/xaml+xml, image/gif, image/x-xbitmap, \
> image/jpeg, image/pjpeg, application/vnd.ms-excel, application/vnd.ms-powerpoint, \
> application/msword,*/*"); 
> /*
> HttpResponse response = httpclient.execute(httpget);
> HttpEntity entity = response.getEntity();
> System.out.println("Login form get: " + response.getStatusLine());
> if (entity != null) {
> entity.consumeContent();
> }
> System.out.println("Initial set of cookies:");
> List<Cookie> cookies = httpclient.getCookieStore().getCookies();
> if (cookies.isEmpty()) {
> System.out.println("None");
> } else {
> for (int i = 0; i < cookies.size(); i++) {
> System.out.println("- " + cookies.get(i).toString());
> }
> }
> 		*/
> HttpPost httpost = new \
> HttpPost("http://www.fultonassessor.org/Search/GenericSearch.aspx?mode=PARID"); 
> List <NameValuePair> nvps = new ArrayList <NameValuePair>();
> /*
> nvps.add(new BasicNameValuePair("PARID", "14 007700061068"));
> nvps.add(new BasicNameValuePair("inpParid", "14 007700061068"));  
> nvps.add(new BasicNameValuePair("ReportsListParIDs", "14007700061068"));
> nvps.add(new BasicNameValuePair("selPageSize", "15"));  
> nvps.add(new BasicNameValuePair("selSortDir", "Ascending")); 
> nvps.add(new BasicNameValuePair("lblRoll", "Roll Type"));
> nvps.add(new BasicNameValuePair("inpRoll", "-Any-"));
> nvps.add(new BasicNameValuePair("selSortBy", "PARID"));
> nvps.add(new BasicNameValuePair("SortBy", "Parcel ID"));
> nvps.add(new BasicNameValuePair("SortDir", " asc"));
> nvps.add(new BasicNameValuePair("selSortBy", "Parcel ID"));
> nvps.add(new BasicNameValuePair("PageSize", "15"));
> */
> //nvps.add(new BasicNameValuePair("hdIDX", "14007700061068"));
> //nvps.add(new BasicNameValuePair("hdPin", "14 007700061068"));
> //nvps.add(new BasicNameValuePair("hdTaxYear", "2007"));
> //nvps.add(new BasicNameValuePair("hdJur", "000"));
> //nvps.add(new BasicNameValuePair("hdOwnSeq", "1"));
> //nvps.add(new BasicNameValuePair("hdMask", "1"));
> //nvps.add(new BasicNameValuePair("hdsIndex", "0"));   
> 
> nvps.add(new BasicNameValuePair("PageNum", "1"));
> nvps.add(new BasicNameValuePair("SortBy", "PARID"));
> nvps.add(new BasicNameValuePair("SortDir", " asc"));
> nvps.add(new BasicNameValuePair("PageSize", "15"));
> nvps.add(new BasicNameValuePair("mode", "PARID"));
> nvps.add(new BasicNameValuePair("hdAction", "Search"));
> nvps.add(new BasicNameValuePair("hdListType", "PA"));
> nvps.add(new BasicNameValuePair("sIndex", "-1"));
> nvps.add(new BasicNameValuePair("inpParid", "14 -0056-0005-058-7"));
> nvps.add(new BasicNameValuePair("selSortBy", "PARID"));
> nvps.add(new BasicNameValuePair("selSortDir", " asc"));
> nvps.add(new BasicNameValuePair("selPageSize", "15"));
> 
> nvps.add(new BasicNameValuePair("hdSelected", ""));
> nvps.add(new BasicNameValuePair("hdsIndex", ""));
> nvps.add(new BasicNameValuePair("hdSkip", ""));
> nvps.add(new BasicNameValuePair("inpRoll", ""));
> 
> nvps.add(new BasicNameValuePair("__VIEWSTATE", \
> "dDwtMTg0MjE5NjgzODt0PEAwPDtvPHQ+Oz47bDxpPDA+Oz47bDx0PDtsPGk8Nj47PjtsPHQ8cDxwPGw8VmlzaWJsZTs+O2w8bzxmPjs+Pjs+Ozs+Oz4+Oz4+Oz4="));
>  
> 
> 
> 
> 
> //nvps.add(new BasicNameValuePair("IDToken2", "password"));
> httpost.setEntity(new UrlEncodedFormEntity(nvps, HTTP.UTF_8));
> //response = httpclient.execute(httpost);
> // Add default headers
> List<BasicHeader> defaultHeaders = new ArrayList();
> defaultHeaders.add(new BasicHeader("Accept-Language", "en-us"));
> defaultHeaders.add(new BasicHeader("Accept", "image/gif, image/x-xbitmap, \
> image/jpeg, image/pjpeg, application/xaml+xml, application/vnd.ms-xpsdocument, \
> application/x-ms-xbap, application/x-ms-application, application/x-shockwave-flash, \
> application/vnd.ms-excel, application/vnd.ms-powerpoint, application/msword, \
> */*")); defaultHeaders.add(new BasicHeader("Pragma", "no-cache"));
> defaultHeaders.add(new BasicHeader("Proxy-Connection", "Keep-Alive"));
> //defaultHeaders.add(new BasicHeader("Referer", \
> "http://www.fultonassessor.org/Search/GenericSearch.aspx?mode=PARID")); 
> 
> 
> defaultHeaders.add(new BasicHeader("Content-Type", \
> "application/x-www-form-urlencoded")); 
> //httpget.getParams().setParameter(ClientPNames.DEFAULT_HEADERS,defaultHeaders);
> httpost.getParams().setParameter(ClientPNames.DEFAULT_HEADERS,defaultHeaders);
> 
> //response = httpclient.execute(httpget);
> response = httpclient.execute(httpost);
> entity = response.getEntity();
> try{
> entity = response.getEntity();
> System.out.println("----------------------------------------");
> System.out.println(response.getStatusLine());
> Header[] headers = response.getAllHeaders();
> for (int i=0; i<headers.length; i++) {
> System.out.println(headers[i]);
> }
> System.out.println("----------------------------------------");
> String responseString = null;
> if (response.getEntity() != null) {
> 	responseString = EntityUtils.toString(response.getEntity());
> System.out.println(responseString);
> }
> 
> //parseInJerico(responseString);
> } finally {
> // If we could be sure that the stream of the entity has been
> // closed, we wouldn't need this code to release the connection.
> // However, EntityUtils.toString(...) can throw an exception.
> // if there is no entity, the connection is already released
> if (entity != null)
> entity.consumeContent(); // release connection gracefully
> }
> System.out.println("Login form get: " + response.getStatusLine());
> if (entity != null) {
> entity.consumeContent();
> }
> System.out.println("Post logon cookies:");
> /*
> cookies = httpclient.getCookieStore().getCookies();
> if (cookies.isEmpty()) {
> System.out.println("None");
> } else {
> for (int i = 0; i < cookies.size(); i++) {
> System.out.println("- " + cookies.get(i).toString());
> }
> }
> */
> }
> 
> /*
> 
> 	public  static void parseInJerico(String htmlString) throws Exception {
> 		System.out.println("----------------------------------------");
> 		System.out.println("---PARSING IN JERICO---");
> 		System.out.println("----------------------------------------");
> 		// Call fullSequentialParse manually as most of the source will be parsed.
> 		Source source  = new Source(htmlString);
> 		source.fullSequentialParse();
> 		System.out.println("Document title:");
> 		String title=getTitle(source);
> 		System.out.println(title==null ? "(none)" : title);
> 		System.out.println("\nDocument description:");
> 		String description=getMetaValue(source,"description");
> 		System.out.println(description==null ? "(none)" : description);
> 		System.out.println("\nDocument keywords:");
> 		String keywords=getMetaValue(source,"keywords");
> 		System.out.println(keywords==null ? "(none)" : keywords);
> 	
> 		System.out.println("\nLinks to other documents:");
> 		List linkElements=source.findAllElements(HTMLElementName.A);
> 		for (Iterator i=linkElements.iterator(); i.hasNext();) {
> 			Element linkElement=(Element)i.next();
> 			String href=linkElement.getAttributeValue("href");
> 			if (href==null) continue;
> 			// A element can contain other tags so need to extract the text from it:
> 			String label=linkElement.getContent().getTextExtractor().toString();
> 			System.out.println(label+" <"+href+'>');
> 		}
> 		System.out.println("\nAll text from file (exluding content inside SCRIPT and \
> STYLE elements):\n");  \
> System.out.println(source.getTextExtractor().setIncludeAttributes(true).toString());
>   System.out.println("\nSame again but this time extend the TextExtractor class to \
> also exclude text from P elements and any elements with class=\"control\":\n");  \
> TextExtractor textExtractor=new TextExtractor(source) {  public boolean \
> excludeElement(StartTag startTag) {  return startTag.getName()==HTMLElementName.P \
> || "control".equalsIgnoreCase(startTag.getAttributeValue("class"));  }
> 		};
> 		System.out.println(textExtractor.setIncludeAttributes(true).toString());
> }
> 	private static String getTitle(Source source) {
> 		Element titleElement=source.findNextElement(0,HTMLElementName.TITLE);
> 		if (titleElement==null) return null;
> 		// TITLE element never contains other tags so just decode it collapsing \
> whitespace:  return \
> CharacterReference.decodeCollapseWhiteSpace(titleElement.getContent());  }
> 	private static String getMetaValue(Source source, String key) {
> 		for (int pos=0; pos<source.length();) {
> 			StartTag startTag=source.findNextStartTag(pos,"name",key,false);
> 			if (startTag==null) return null;
> 			if (startTag.getName()==HTMLElementName.META)
> 				return startTag.getAttributeValue("content"); // Attribute values are \
> automatically decoded  pos=startTag.getEnd();
> 		}
> 		return null;
> 	}
> 	*/
> }

-- 
This message is automatically generated by JIRA.
-
You can reply to this email to add a comment to the issue online.


---------------------------------------------------------------------
To unsubscribe, e-mail: dev-unsubscribe@hc.apache.org
For additional commands, e-mail: dev-help@hc.apache.org


[prev in list] [next in list] [prev in thread] [next in thread] 

Configure | About | News | Add a list | Sponsored by KoreLogic