From 6ffe56b42c2b045c856455ca21302bbce5e38b0c Mon Sep 17 00:00:00 2001
From: Yasser Ganjisaffar
Date: Tue, 3 Feb 2015 22:27:09 -0800
Subject: [PATCH] [style] re-format code

---
 .../ics/crawler4j/crawler/CrawlConfig.java | 8 +-
 .../crawler4j/crawler/CrawlController.java | 30 +++--
 .../edu/uci/ics/crawler4j/crawler/Page.java | 12 +-
 .../uci/ics/crawler4j/crawler/WebCrawler.java | 103 +++++++++---------
 .../crawler/authentication/AuthInfo.java | 12 +-
 .../crawler/authentication/BasicAuthInfo.java | 6 +-
 .../crawler/authentication/FormAuthInfo.java | 12 +-
 .../crawler/exceptions/RedirectException.java | 3 +-
 .../crawler4j/fetcher/PageFetchResult.java | 8 +-
 .../ics/crawler4j/fetcher/PageFetcher.java | 84 +++++++-------
 .../uci/ics/crawler4j/frontier/Counters.java | 24 ++--
 .../ics/crawler4j/frontier/DocIDServer.java | 12 +-
 .../uci/ics/crawler4j/frontier/Frontier.java | 10 +-
 .../crawler4j/frontier/InProcessPagesDB.java | 9 +-
 .../ics/crawler4j/frontier/WorkQueues.java | 19 +++-
 .../ics/crawler4j/parser/BinaryParseData.java | 12 +-
 .../crawler4j/parser/HtmlContentHandler.java | 11 +-
 .../ics/crawler4j/parser/HtmlParseData.java | 4 +-
 .../parser/NotAllowedContentException.java | 6 +-
 .../uci/ics/crawler4j/parser/ParseData.java | 4 +-
 .../edu/uci/ics/crawler4j/parser/Parser.java | 12 +-
 .../ics/crawler4j/parser/TextParseData.java | 4 +-
 .../crawler4j/robotstxt/RobotstxtServer.java | 21 ++--
 .../edu/uci/ics/crawler4j/url/TLDList.java | 14 ++-
 .../ics/crawler4j/url/URLCanonicalizer.java | 22 ++--
 .../uci/ics/crawler4j/url/UrlResolver.java | 13 +--
 .../edu/uci/ics/crawler4j/url/WebURL.java | 2 +-
 .../java/edu/uci/ics/crawler4j/util/IO.java | 7 +-
 .../java/edu/uci/ics/crawler4j/util/Net.java | 25 ++---
 .../java/edu/uci/ics/crawler4j/util/Util.java | 25 +++--
 .../examples/basic/BasicCrawlController.java | 6 +-
 .../examples/basic/BasicCrawler.java | 20 ++--
 .../imagecrawler/ImageCrawlController.java | 9 +-
 .../examples/imagecrawler/ImageCrawler.java | 9 +-
 .../examples/localdata/Downloader.java | 9 +-
 .../LocalDataCollectorController.java | 75 ++++++-------
 .../localdata/LocalDataCollectorCrawler.java | 22 ++--
 .../examples/multiple/BasicCrawler.java | 10 +-
 .../multiple/MultipleCrawlerController.java | 9 +-
 .../examples/shutdown/BasicCrawler.java | 16 +--
 .../shutdown/ControllerWithShutdown.java | 5 +-
 .../StatusHandlerCrawlController.java | 5 +-
 .../statushandler/StatusHandlerCrawler.java | 72 ++++++------
 .../uci/ics/crawler4j/tests/TLDListTest.java | 9 +-
 .../crawler4j/tests/URLCanonicalizerTest.java | 43 ++++----
 .../uci/ics/crawler4j/tests/WebURLTest.java | 3 +-
 46 files changed, 467 insertions(+), 389 deletions(-)

diff --git a/src/main/java/edu/uci/ics/crawler4j/crawler/CrawlConfig.java b/src/main/java/edu/uci/ics/crawler4j/crawler/CrawlConfig.java
index 941c40a9c..3d79c97e4 100644
--- a/src/main/java/edu/uci/ics/crawler4j/crawler/CrawlConfig.java
+++ b/src/main/java/edu/uci/ics/crawler4j/crawler/CrawlConfig.java
@@ -17,11 +17,11 @@
 
 package edu.uci.ics.crawler4j.crawler;
 
-import edu.uci.ics.crawler4j.crawler.authentication.AuthInfo;
-
 import java.util.ArrayList;
 import java.util.List;
 
+import edu.uci.ics.crawler4j.crawler.authentication.AuthInfo;
+
 public class CrawlConfig {
 
   /**
@@ -133,8 +133,8 @@ public class CrawlConfig {
   private String proxyPassword = null;
 
   /**
-     * List of possible authentications needed by crawler
-     */
+   * List of possible authentications needed by crawler
+   */
   private List<AuthInfo> authInfos;
 
   public CrawlConfig() {

diff --git a/src/main/java/edu/uci/ics/crawler4j/crawler/CrawlController.java b/src/main/java/edu/uci/ics/crawler4j/crawler/CrawlController.java
index 0cabbab59..34a90becd 100644
--- a/src/main/java/edu/uci/ics/crawler4j/crawler/CrawlController.java
+++ b/src/main/java/edu/uci/ics/crawler4j/crawler/CrawlController.java
@@ -17,8 +17,16 @@
 
 package edu.uci.ics.crawler4j.crawler;
 
+import java.io.File;
+import java.util.ArrayList;
+import java.util.List;
+
+import org.slf4j.Logger;
+import org.slf4j.LoggerFactory;
+
 import com.sleepycat.je.Environment;
 import com.sleepycat.je.EnvironmentConfig;
+
 import edu.uci.ics.crawler4j.fetcher.PageFetcher;
 import edu.uci.ics.crawler4j.frontier.DocIDServer;
 import edu.uci.ics.crawler4j.frontier.Frontier;
@@ -26,12 +34,6 @@ import edu.uci.ics.crawler4j.url.URLCanonicalizer;
 import edu.uci.ics.crawler4j.url.WebURL;
 import edu.uci.ics.crawler4j.util.IO;
 
-import org.slf4j.Logger;
-import org.slf4j.LoggerFactory;
-
-import java.io.File;
-import java.util.ArrayList;
-import java.util.List;
-
 /**
  * The controller that manages a crawling session. This class creates the
@@ -74,14 +76,16 @@ public class CrawlController extends Configurable {
   protected final Object waitingLock = new Object();
   protected final Environment env;
 
-  public CrawlController(CrawlConfig config, PageFetcher pageFetcher, RobotstxtServer robotstxtServer) throws Exception {
+  public CrawlController(CrawlConfig config, PageFetcher pageFetcher, RobotstxtServer robotstxtServer)
+      throws Exception {
     super(config);
     config.validate();
     File folder = new File(config.getCrawlStorageFolder());
     if (!folder.exists()) {
       if (!folder.mkdirs()) {
-        throw new Exception("couldn't create the storage folder: " + folder.getAbsolutePath() + " does it already exist ?");
+        throw new Exception(
+            "couldn't create the storage folder: " + folder.getAbsolutePath() + " does it already exist ?");
       } else {
         logger.debug("Created folder: " + folder.getAbsolutePath());
       }
@@ -214,7 +218,9 @@ public void run() {
             if (queueLength > 0) {
               continue;
             }
-            logger.info("No thread is working and no more URLs are in queue waiting for another 10 seconds to make sure...");
+            logger.info(
+                "No thread is working and no more URLs are in queue waiting for another 10 seconds to make " +
+                "sure...");
             sleep(10);
             queueLength = frontier.getQueueLength();
             if (queueLength > 0) {
@@ -282,7 +288,8 @@ public void waitUntilFinish() {
   }
 
   /**
-   * Once the crawling session finishes the controller collects the local data of the crawler threads and stores them in a List.
+   * Once the crawling session finishes the controller collects the local data of the crawler threads and stores them
+   * in a List.
    * This function returns the reference to this list.
   *
   * @return List of Objects which are your local data
@@ -354,7 +361,8 @@ public void addSeed(String pageUrl, int docId) {
     webUrl.setDocid(docId);
     webUrl.setDepth((short) 0);
     if (!robotstxtServer.allows(webUrl)) {
-      logger.warn("Robots.txt does not allow this seed: {}", pageUrl); // using the WARN level here, as the user specifically asked to add this seed
+      logger.warn("Robots.txt does not allow this seed: {}",
+          pageUrl); // using the WARN level here, as the user specifically asked to add this seed
     } else {
       frontier.schedule(webUrl);
     }

diff --git a/src/main/java/edu/uci/ics/crawler4j/crawler/Page.java b/src/main/java/edu/uci/ics/crawler4j/crawler/Page.java
index 39148f5a4..a926ad33d 100644
--- a/src/main/java/edu/uci/ics/crawler4j/crawler/Page.java
+++ b/src/main/java/edu/uci/ics/crawler4j/crawler/Page.java
@@ -40,8 +40,8 @@ public class Page {
   protected WebURL url;
 
   /**
-     * Redirection flag
-     */
+   * Redirection flag
+   */
   protected boolean redirect;
 
   /**
@@ -50,8 +50,8 @@ public class Page {
   protected String redirectedToUrl;
 
   /**
-     * Status of the page
-     */
+   * Status of the page
+   */
   protected int statusCode;
 
   /**
@@ -78,8 +78,8 @@ public class Page {
   protected String contentCharset;
 
   /**
-     * Language of the Content.
-     */
+   * Language of the Content.
+   */
   private String language;
 
   /**

diff --git a/src/main/java/edu/uci/ics/crawler4j/crawler/WebCrawler.java b/src/main/java/edu/uci/ics/crawler4j/crawler/WebCrawler.java
index ff227ff26..015197dac 100644
--- a/src/main/java/edu/uci/ics/crawler4j/crawler/WebCrawler.java
+++ b/src/main/java/edu/uci/ics/crawler4j/crawler/WebCrawler.java
@@ -17,6 +17,13 @@
 
 package edu.uci.ics.crawler4j.crawler;
 
+import java.util.ArrayList;
+import java.util.List;
+import java.util.Locale;
+
+import org.apache.http.HttpStatus;
+import org.apache.http.impl.EnglishReasonPhraseCatalog;
+
 import edu.uci.ics.crawler4j.crawler.exceptions.ContentFetchException;
 import edu.uci.ics.crawler4j.crawler.exceptions.PageBiggerThanMaxSizeException;
 import edu.uci.ics.crawler4j.crawler.exceptions.ParseException;
@@ -30,18 +37,10 @@ import edu.uci.ics.crawler4j.parser.Parser;
 import edu.uci.ics.crawler4j.robotstxt.RobotstxtServer;
 import edu.uci.ics.crawler4j.url.WebURL;
-
-import org.apache.http.HttpStatus;
-
-import org.apache.http.impl.EnglishReasonPhraseCatalog;
 import uk.org.lidalia.slf4jext.Level;
 import uk.org.lidalia.slf4jext.Logger;
 import uk.org.lidalia.slf4jext.LoggerFactory;
 
-import java.util.ArrayList;
-import java.util.List;
-import java.util.Locale;
-
 /**
  * WebCrawler class in the Runnable class that is executed by each crawler thread.
  *
@@ -168,26 +167,26 @@ protected void handlePageStatusCode(WebURL webUrl, int statusCode, String status
     // Sub-classed can override this to add their custom functionality
   }
 
-    /**
-     * This function is called before processing of the page's URL
-     * It can be overridden by subclasses for tweaking of the url before processing it.
+   * For example, http://abc.com/def?a=123 - http://abc.com/def
+   *
+   * @param curURL current URL which can be tweaked before processing
+   * @return tweaked WebURL
+   */
+  protected WebURL handleUrlBeforeProcess(WebURL curURL) {
+    return curURL;
+  }
 
-    /**
-     * This function is called if the content of a url is bigger than allowed size.
-     *
-     * @param urlStr - The URL which it's content is bigger than allowed size
-     */
-    protected void onPageBiggerThanMaxSize(String urlStr, long pageSize) {
-      logger.warn("Skipping a URL: {} which was bigger ( {} ) than max allowed size", urlStr, pageSize);
-    }
+  /**
+   * This function is called if the content of a url is bigger than allowed size.
+   *
+   * @param urlStr - The URL which it's content is bigger than allowed size
+   */
+  protected void onPageBiggerThanMaxSize(String urlStr, long pageSize) {
+    logger.warn("Skipping a URL: {} which was bigger ( {} ) than max allowed size", urlStr, pageSize);
+  }
 
   /**
   * This function is called if the crawler encountered an unexpected http status code ( a status code other than 3xx)
@@ -197,11 +196,11 @@ protected void onPageBiggerThanMaxSize(String urlStr, long pageSize) {
   * @param contentType Type of Content
   * @param description Error Description
   */
-    protected void onUnexpectedStatusCode(String urlStr, int statusCode, String contentType, String description) {
-      logger.warn("Skipping URL: {}, StatusCode: {}, {}, {}", urlStr, statusCode, contentType, description);
-      // Do nothing by default (except basic logging)
-      // Sub-classed can override this to add their custom functionality
-    }
+  protected void onUnexpectedStatusCode(String urlStr, int statusCode, String contentType, String description) {
+    logger.warn("Skipping URL: {}, StatusCode: {}, {}, {}", urlStr, statusCode, contentType, description);
+    // Do nothing by default (except basic logging)
+    // Sub-classed can override this to add their custom functionality
+  }
 
   /**
   * This function is called if the content of a url could not be fetched.
@@ -271,18 +270,18 @@ public void run() {
   }
 
   /**
-     * Classes that extends WebCrawler should overwrite this function to tell the
-     * crawler whether the given url should be crawled or not. The following
-     * implementation indicates that all urls should be included in the crawl.
-     *
-     * @param url
-     *            the url which we are interested to know whether it should be
-     *            included in the crawl or not.
-     * @param page
-     *            Page context from which this URL was scraped
-     * @return if the url should be included in the crawl it returns true,
-     *         otherwise false is returned.
+   */
   public boolean shouldVisit(Page page, WebURL url) {
     return true;
   }
@@ -308,15 +307,17 @@ private void processPage(WebURL curURL) {
       fetchResult = pageFetcher.fetchPage(curURL);
       int statusCode = fetchResult.getStatusCode();
-      handlePageStatusCode(curURL, statusCode, EnglishReasonPhraseCatalog.INSTANCE.getReason(statusCode, Locale.ENGLISH)); // Finds the status reason for all known statuses
+      handlePageStatusCode(curURL, statusCode, EnglishReasonPhraseCatalog.INSTANCE
+          .getReason(statusCode, Locale.ENGLISH)); // Finds the status reason for all known statuses
 
       Page page = new Page(curURL);
       page.setFetchResponseHeaders(fetchResult.getResponseHeaders());
       page.setStatusCode(statusCode);
       if (statusCode != HttpStatus.SC_OK) { // Not 200
-        if (statusCode == HttpStatus.SC_MOVED_PERMANENTLY || statusCode == HttpStatus.SC_MOVED_TEMPORARILY
-            || statusCode == HttpStatus.SC_MULTIPLE_CHOICES || statusCode == HttpStatus.SC_SEE_OTHER
-            || statusCode == HttpStatus.SC_TEMPORARY_REDIRECT || statusCode == 308) { // is 3xx todo follow https://issues.apache.org/jira/browse/HTTPCORE-389
+        if (statusCode == HttpStatus.SC_MOVED_PERMANENTLY || statusCode == HttpStatus.SC_MOVED_TEMPORARILY ||
+            statusCode == HttpStatus.SC_MULTIPLE_CHOICES || statusCode == HttpStatus.SC_SEE_OTHER ||
+            statusCode == HttpStatus.SC_TEMPORARY_REDIRECT ||
+            statusCode == 308) { // is 3xx todo follow https://issues.apache.org/jira/browse/HTTPCORE-389
           page.setRedirect(true);
 
           if (myController.getConfig().isFollowRedirects()) {
@@ -350,8 +351,10 @@ private void processPage(WebURL curURL) {
           }
         }
       } else { // All other http codes other than 3xx & 200
-        String description = EnglishReasonPhraseCatalog.INSTANCE.getReason(fetchResult.getStatusCode(), Locale.ENGLISH); // Finds the status reason for all known statuses
-        String contentType = fetchResult.getEntity() == null ? "" : fetchResult.getEntity().getContentType().getValue();
+        String description = EnglishReasonPhraseCatalog.INSTANCE
+            .getReason(fetchResult.getStatusCode(), Locale.ENGLISH); // Finds the status reason for all known statuses
+        String contentType =
+            fetchResult.getEntity() == null ? "" : fetchResult.getEntity().getContentType().getValue();
         onUnexpectedStatusCode(curURL.getURL(), fetchResult.getStatusCode(), contentType, description);
       }
 
diff --git a/src/main/java/edu/uci/ics/crawler4j/crawler/authentication/AuthInfo.java b/src/main/java/edu/uci/ics/crawler4j/crawler/authentication/AuthInfo.java
index b2ede2223..b03fbbef3 100644
--- a/src/main/java/edu/uci/ics/crawler4j/crawler/authentication/AuthInfo.java
+++ b/src/main/java/edu/uci/ics/crawler4j/crawler/authentication/AuthInfo.java
@@ -1,20 +1,23 @@
 package edu.uci.ics.crawler4j.crawler.authentication;
-import javax.swing.text.html.FormSubmitEvent.MethodType;
 import java.net.MalformedURLException;
 import java.net.URL;
 
+import javax.swing.text.html.FormSubmitEvent.MethodType;
+
 /**
  * Created by Avi Hayun on 11/23/2014.
  *
  * Abstract class containing authentication information needed to login into a user/password protected site<br>
- * This class should be extended by specific authentication types like form authentication and basic authentication etc<br>
+ * This class should be extended by specific authentication types like form authentication and basic authentication
+ * etc<br>
  *<br>
  * This class contains all of the mutual authentication data for all authentication types
  */
 public abstract class AuthInfo {
 
   public enum AuthenticationType {
-    BASIC_AUTHENTICATION, FORM_AUTHENTICATION
+    BASIC_AUTHENTICATION,
+    FORM_AUTHENTICATION
   }
 
   protected AuthenticationType authenticationType;
@@ -41,7 +44,8 @@ public AuthInfo() {
   *
   * @throws MalformedURLException Make sure your URL is valid
   */
-  protected AuthInfo(AuthenticationType authenticationType, MethodType httpMethod, String loginUrl, String username, String password) throws MalformedURLException {
+  protected AuthInfo(AuthenticationType authenticationType, MethodType httpMethod, String loginUrl, String username,
+      String password) throws MalformedURLException {
     this.authenticationType = authenticationType;
     this.httpMethod = httpMethod;
     URL url = new URL(loginUrl);

diff --git a/src/main/java/edu/uci/ics/crawler4j/crawler/authentication/BasicAuthInfo.java b/src/main/java/edu/uci/ics/crawler4j/crawler/authentication/BasicAuthInfo.java
index 6437f07ef..50b585047 100644
--- a/src/main/java/edu/uci/ics/crawler4j/crawler/authentication/BasicAuthInfo.java
+++ b/src/main/java/edu/uci/ics/crawler4j/crawler/authentication/BasicAuthInfo.java
@@ -1,12 +1,14 @@
 package edu.uci.ics.crawler4j.crawler.authentication;
-import javax.swing.text.html.FormSubmitEvent.MethodType;
 import java.net.MalformedURLException;
 
+import javax.swing.text.html.FormSubmitEvent.MethodType;
+
 /**
  * Created by Avi Hayun on 11/25/2014.
  *
- * BasicAuthInfo contains the authentication information needed for BASIC authentication (extending AuthInfo which has all common auth info in it)
+ * BasicAuthInfo contains the authentication information needed for BASIC authentication (extending AuthInfo which
+ * has all common auth info in it)
  *
  * BASIC authentication in PHP:
  *