tests/org.eclipse.wst.html.tests.encoding/src/org/eclipse/wst/html/tests/encoding/html/HTMLHeadTokenizerTester.java - sourceediting/webtools.sourceediting.tests - Git at Google

 /*******************************************************************************
  * Copyright (c) 2004 IBM Corporation and others.
  * All rights reserved. This program and the accompanying materials
  * are made available under the terms of the Eclipse Public License v1.0
  * which accompanies this distribution, and is available at
  * http://www.eclipse.org/legal/epl-v10.html
  *
  * Contributors:
  *     IBM Corporation - initial API and implementation
  *******************************************************************************/
 package org.eclipse.wst.html.tests.encoding.html;

 import java.io.IOException;
 import java.io.Reader;
 import java.util.regex.Pattern;

 import junit.framework.TestCase;

 import org.eclipse.wst.html.core.internal.contenttype.HTMLHeadTokenizer;
 import org.eclipse.wst.html.core.internal.contenttype.HTMLHeadTokenizerConstants;
 import org.eclipse.wst.html.core.internal.contenttype.HeadParserToken;
 import org.eclipse.wst.html.tests.encoding.HTMLEncodingTestsPlugin;
 import org.eclipse.wst.xml.core.internal.contenttype.EncodingParserConstants;

 public class HTMLHeadTokenizerTester extends TestCase {
 	private boolean DEBUG = false;
 	private String fCharset;

 	private String fContentTypeValue;
 	private final String fileDir = "html/";
 	private final String fileHome = "testfiles/";
 	private final String fileLocation = fileHome + fileDir;
 	private String fPageEncodingValue = null;
 	private String fXMLDecEncodingName;

 	private void doTestFile(String filename, String expectedName) throws IOException {
 		doTestFile(filename, expectedName, null);
 	}

 	private void doTestFile(String filename, String expectedName, String finalTokenType) throws IOException {
 		HTMLHeadTokenizer tokenizer = null;
 		Reader fileReader = null;
 		try {
 			if (DEBUG) {
 				System.out.println();
 				System.out.println("       " + filename);
 				System.out.println();
 			}
 			fileReader = HTMLEncodingTestsPlugin.getTestReader(filename);
 			tokenizer = new HTMLHeadTokenizer(fileReader);
 		}
 		catch (IOException e) {
 			System.out.println("Error opening file \"" + filename + "\"");
 		}

 		HeadParserToken resultToken = null;
 		HeadParserToken token = parseHeader(tokenizer);
 		String resultValue = getAppropriateEncoding();
 		fileReader.close();
 		if (finalTokenType != null) {
 			assertTrue("did not end as expected. found:  " + token.getType(), finalTokenType.equals(token.getType()));
 		}
 		else {
 			if (expectedName == null) {
 				assertTrue("expected no encoding, but found: " + resultValue, resultToken == null);
 			}
 			else {
 				// TODO: need to work on case issues
 				assertTrue("expected " + expectedName + " but found " + resultValue, expectedName.equals(resultValue.toUpperCase()));
 			}
 		}

 	}

 	// public void testMalformedNoEncoding() {
 	// String filename = fileLocation + "MalformedNoEncoding.jsp";
 	// doTestFile(filename);
 	// }
 	// public void testMalformedNoEncodingXSL() {
 	// String filename = fileLocation + "MalformedNoEncodingXSL.jsp";
 	// doTestFile(filename);
 	// }
 	// public void testNoEncoding() {
 	// String filename = fileLocation + "NoEncoding.jsp";
 	// doTestFile(filename);
 	// }
 	// public void testNormalNonDefault() {
 	// String filename = fileLocation + "NormalNonDefault.jsp";
 	// doTestFile(filename);
 	// }
 	// public void testNormalPageCaseNonDefault() {
 	// String filename = fileLocation + "NormalPageCaseNonDefault.jsp";
 	// doTestFile(filename);
 	// }
 	// public void testdefect223365() {
 	// String filename = fileLocation + "SelColBeanRow12ResultsForm.jsp";
 	// doTestFile(filename);
 	// }
 	/**
 	 * returns encoding according to priority: 1. XML Declaration 2. page
 	 * directive pageEncoding name 3. page directive contentType charset name
 	 */
 	private String getAppropriateEncoding() {
 		String result = null;
 		if (fXMLDecEncodingName != null)
 			result = fXMLDecEncodingName;
 		else if (fPageEncodingValue != null)
 			result = fPageEncodingValue;
 		else if (fCharset != null)
 			result = fCharset;
 		return result;
 	}

 	private boolean isLegalString(String tokenType) {
 		if (tokenType == null)
 			return false;
 		else
 			return tokenType.equals(EncodingParserConstants.StringValue) || tokenType.equals(EncodingParserConstants.UnDelimitedStringValue) || tokenType.equals(EncodingParserConstants.InvalidTerminatedStringValue) || tokenType.equals(EncodingParserConstants.InvalidTermintatedUnDelimitedStringValue);
 	}

 	private void parseContentTypeValue(String contentType) {
 		Pattern pattern = Pattern.compile(";\\s*charset\\s*=\\s*");
 		String[] parts = pattern.split(contentType);
 		if (parts.length > 0) {
 			// if only one item, it can still be charset instead of
 			// contentType
 			if (parts.length == 1) {
 				if (parts[0].length() > 6) {
 					String checkForCharset = parts[0].substring(0, 7);
 					if (checkForCharset.equalsIgnoreCase("charset")) {
 						int eqpos = parts[0].indexOf('=');
 						eqpos = eqpos + 1;
 						if (eqpos < parts[0].length()) {
 							fCharset = parts[0].substring(eqpos);
 							fCharset = fCharset.trim();
 						}
 					}
 				}
 			}
 			else {
 				// fContentType = parts[0];
 			}

 		}
 		if (parts.length > 1) {
 			fCharset = parts[1];
 		}
 	}

 	/**
 	 * Give's priority to encoding value, if found else, looks for contentType
 	 * value;
 	 */
 	private HeadParserToken parseHeader(HTMLHeadTokenizer tokenizer) throws IOException {
 		fPageEncodingValue = null;
 		fCharset = null;
 		/*
 		 * if (tokenType == XMLHeadTokenizerConstants.XMLDelEncoding) { if
 		 * (tokenizer.hasMoreTokens()) { ITextHeadRegion valueToken =
 		 * tokenizer.getNextToken(); String valueTokenType =
 		 * valueToken.getType(); if (isLegal(valueTokenType)) { resultValue =
 		 * valueToken.getText(); if (DEBUG) { System.out.println("XML Head
 		 * Tokenizer Found Encoding: " + resultValue); } } } }
 		 */
 		HeadParserToken token = null;
 		HeadParserToken finalToken = null;
 		do {
 			token = tokenizer.getNextToken();
 			if (DEBUG) {
 				System.out.println(token);
 			}
 			String tokenType = token.getType();
 			if (tokenType == HTMLHeadTokenizerConstants.MetaTagContentType) {
 				if (tokenizer.hasMoreTokens()) {
 					HeadParserToken valueToken = tokenizer.getNextToken();
 					if (DEBUG) {
 						System.out.println(valueToken);
 					}
 					String valueTokenType = valueToken.getType();
 					if (isLegalString(valueTokenType)) {
 						fContentTypeValue = valueToken.getText();

 					}
 				}
 			}

 		}
 		while (tokenizer.hasMoreTokens());
 		if (fContentTypeValue != null) {
 			parseContentTypeValue(fContentTypeValue);
 		}
 		finalToken = token;
 		return finalToken;

 	}

 	public void testBestCase() throws IOException {
 		String filename = fileLocation + "NormalNonDefault.html";
 		doTestFile(filename, "UTF-8");

 	}

 	// public void testIllFormed() {
 	// String filename = fileLocation + "testIllFormed.jsp";
 	// doTestFile(filename);
 	// }
 	// public void testIllFormed2() {
 	// String filename = fileLocation + "testIllFormed2.jsp";
 	// doTestFile(filename);
 	// }
 	// public void testIllformedNormalNonDefault() {
 	// String filename = fileLocation + "IllformedNormalNonDefault.jsp";
 	// doTestFile(filename);
 	// }
 	public void testEmptyFile() throws IOException {
 		String filename = fileLocation + "EmptyFile.html";
 		doTestFile(filename, null);
 	}

 	public void testIllFormedNormalNonDefault() throws IOException {
 		String filename = fileLocation + "IllformedNormalNonDefault.html";
 		doTestFile(filename, "UTF-8");
 	}

 	public void testLargeCase() throws IOException {
 		String filename = fileLocation + "LargeNonDefault.html";
 		doTestFile(filename, "ISO-8859-1");

 	}

 	public void testLargeNoEncoding() throws IOException {
 		String filename = fileLocation + "LargeNoEncoding.html";
 		doTestFile(filename, null, EncodingParserConstants.MAX_CHARS_REACHED);

 	}

 	public void testMultiNonDefault() throws IOException {
 		String filename = fileLocation + "MultiNonDefault.html";
 		doTestFile(filename, "ISO-8859-6");
 	}

 	public void testNoEncoding() throws IOException {
 		String filename = fileLocation + "NoEncoding.html";
 		doTestFile(filename, null);
 	}

 	public void testnoquotes() throws IOException {
 		String filename = fileLocation + "noquotes.html";
 		doTestFile(filename, "UTF-8");

 	}

 }
	/*******************************************************************************
	* Copyright (c) 2004 IBM Corporation and others.
	* All rights reserved. This program and the accompanying materials
	* are made available under the terms of the Eclipse Public License v1.0
	* which accompanies this distribution, and is available at
	* http://www.eclipse.org/legal/epl-v10.html
	*
	* Contributors:
	* IBM Corporation - initial API and implementation
	*******************************************************************************/
	package org.eclipse.wst.html.tests.encoding.html;

	import java.io.IOException;
	import java.io.Reader;
	import java.util.regex.Pattern;

	import junit.framework.TestCase;

	import org.eclipse.wst.html.core.internal.contenttype.HTMLHeadTokenizer;
	import org.eclipse.wst.html.core.internal.contenttype.HTMLHeadTokenizerConstants;
	import org.eclipse.wst.html.core.internal.contenttype.HeadParserToken;
	import org.eclipse.wst.html.tests.encoding.HTMLEncodingTestsPlugin;
	import org.eclipse.wst.xml.core.internal.contenttype.EncodingParserConstants;

	public class HTMLHeadTokenizerTester extends TestCase {
	private boolean DEBUG = false;
	private String fCharset;

	private String fContentTypeValue;
	private final String fileDir = "html/";
	private final String fileHome = "testfiles/";
	private final String fileLocation = fileHome + fileDir;
	private String fPageEncodingValue = null;
	private String fXMLDecEncodingName;

	private void doTestFile(String filename, String expectedName) throws IOException {
	doTestFile(filename, expectedName, null);
	}

	private void doTestFile(String filename, String expectedName, String finalTokenType) throws IOException {
	HTMLHeadTokenizer tokenizer = null;
	Reader fileReader = null;
	try {
	if (DEBUG) {
	System.out.println();
	System.out.println(" " + filename);
	System.out.println();
	}
	fileReader = HTMLEncodingTestsPlugin.getTestReader(filename);
	tokenizer = new HTMLHeadTokenizer(fileReader);
	}
	catch (IOException e) {
	System.out.println("Error opening file \"" + filename + "\"");
	}

	HeadParserToken resultToken = null;
	HeadParserToken token = parseHeader(tokenizer);
	String resultValue = getAppropriateEncoding();
	fileReader.close();
	if (finalTokenType != null) {
	assertTrue("did not end as expected. found: " + token.getType(), finalTokenType.equals(token.getType()));
	}
	else {
	if (expectedName == null) {
	assertTrue("expected no encoding, but found: " + resultValue, resultToken == null);
	}
	else {
	// TODO: need to work on case issues
	assertTrue("expected " + expectedName + " but found " + resultValue, expectedName.equals(resultValue.toUpperCase()));
	}
	}

	}

	// public void testMalformedNoEncoding() {
	// String filename = fileLocation + "MalformedNoEncoding.jsp";
	// doTestFile(filename);
	// }
	// public void testMalformedNoEncodingXSL() {
	// String filename = fileLocation + "MalformedNoEncodingXSL.jsp";
	// doTestFile(filename);
	// }
	// public void testNoEncoding() {
	// String filename = fileLocation + "NoEncoding.jsp";
	// doTestFile(filename);
	// }
	// public void testNormalNonDefault() {
	// String filename = fileLocation + "NormalNonDefault.jsp";
	// doTestFile(filename);
	// }
	// public void testNormalPageCaseNonDefault() {
	// String filename = fileLocation + "NormalPageCaseNonDefault.jsp";
	// doTestFile(filename);
	// }
	// public void testdefect223365() {
	// String filename = fileLocation + "SelColBeanRow12ResultsForm.jsp";
	// doTestFile(filename);
	// }
	/**
	* returns encoding according to priority: 1. XML Declaration 2. page
	* directive pageEncoding name 3. page directive contentType charset name
	*/
	private String getAppropriateEncoding() {
	String result = null;
	if (fXMLDecEncodingName != null)
	result = fXMLDecEncodingName;
	else if (fPageEncodingValue != null)
	result = fPageEncodingValue;
	else if (fCharset != null)
	result = fCharset;
	return result;
	}

	private boolean isLegalString(String tokenType) {
	if (tokenType == null)
	return false;
	else
	return tokenType.equals(EncodingParserConstants.StringValue) \|\| tokenType.equals(EncodingParserConstants.UnDelimitedStringValue) \|\| tokenType.equals(EncodingParserConstants.InvalidTerminatedStringValue) \|\| tokenType.equals(EncodingParserConstants.InvalidTermintatedUnDelimitedStringValue);
	}

	private void parseContentTypeValue(String contentType) {
	Pattern pattern = Pattern.compile(";\\scharset\\s=\\s*");
	String[] parts = pattern.split(contentType);
	if (parts.length > 0) {
	// if only one item, it can still be charset instead of
	// contentType
	if (parts.length == 1) {
	if (parts[0].length() > 6) {
	String checkForCharset = parts[0].substring(0, 7);
	if (checkForCharset.equalsIgnoreCase("charset")) {
	int eqpos = parts[0].indexOf('=');
	eqpos = eqpos + 1;
	if (eqpos < parts[0].length()) {
	fCharset = parts[0].substring(eqpos);
	fCharset = fCharset.trim();
	}
	}
	}
	}
	else {
	// fContentType = parts[0];
	}

	}
	if (parts.length > 1) {
	fCharset = parts[1];
	}
	}

	/**
	* Give's priority to encoding value, if found else, looks for contentType
	* value;
	*/
	private HeadParserToken parseHeader(HTMLHeadTokenizer tokenizer) throws IOException {
	fPageEncodingValue = null;
	fCharset = null;
	/*
	* if (tokenType == XMLHeadTokenizerConstants.XMLDelEncoding) { if
	* (tokenizer.hasMoreTokens()) { ITextHeadRegion valueToken =
	* tokenizer.getNextToken(); String valueTokenType =
	* valueToken.getType(); if (isLegal(valueTokenType)) { resultValue =
	* valueToken.getText(); if (DEBUG) { System.out.println("XML Head
	* Tokenizer Found Encoding: " + resultValue); } } } }
	*/
	HeadParserToken token = null;
	HeadParserToken finalToken = null;
	do {
	token = tokenizer.getNextToken();
	if (DEBUG) {
	System.out.println(token);
	}
	String tokenType = token.getType();
	if (tokenType == HTMLHeadTokenizerConstants.MetaTagContentType) {
	if (tokenizer.hasMoreTokens()) {
	HeadParserToken valueToken = tokenizer.getNextToken();
	if (DEBUG) {
	System.out.println(valueToken);
	}
	String valueTokenType = valueToken.getType();
	if (isLegalString(valueTokenType)) {
	fContentTypeValue = valueToken.getText();

	}
	}
	}

	}
	while (tokenizer.hasMoreTokens());
	if (fContentTypeValue != null) {
	parseContentTypeValue(fContentTypeValue);
	}
	finalToken = token;
	return finalToken;

	}

	public void testBestCase() throws IOException {
	String filename = fileLocation + "NormalNonDefault.html";
	doTestFile(filename, "UTF-8");

	}

	// public void testIllFormed() {
	// String filename = fileLocation + "testIllFormed.jsp";
	// doTestFile(filename);
	// }
	// public void testIllFormed2() {
	// String filename = fileLocation + "testIllFormed2.jsp";
	// doTestFile(filename);
	// }
	// public void testIllformedNormalNonDefault() {
	// String filename = fileLocation + "IllformedNormalNonDefault.jsp";
	// doTestFile(filename);
	// }
	public void testEmptyFile() throws IOException {
	String filename = fileLocation + "EmptyFile.html";
	doTestFile(filename, null);
	}

	public void testIllFormedNormalNonDefault() throws IOException {
	String filename = fileLocation + "IllformedNormalNonDefault.html";
	doTestFile(filename, "UTF-8");
	}

	public void testLargeCase() throws IOException {
	String filename = fileLocation + "LargeNonDefault.html";
	doTestFile(filename, "ISO-8859-1");

	}

	public void testLargeNoEncoding() throws IOException {
	String filename = fileLocation + "LargeNoEncoding.html";
	doTestFile(filename, null, EncodingParserConstants.MAX_CHARS_REACHED);

	}

	public void testMultiNonDefault() throws IOException {
	String filename = fileLocation + "MultiNonDefault.html";
	doTestFile(filename, "ISO-8859-6");
	}

	public void testNoEncoding() throws IOException {
	String filename = fileLocation + "NoEncoding.html";
	doTestFile(filename, null);
	}

	public void testnoquotes() throws IOException {
	String filename = fileLocation + "noquotes.html";
	doTestFile(filename, "UTF-8");

	}

	}