GeekHubJava4WebThursday · MykolaMorhun · Jan 23, 2016 · Jan 23, 2016 · Jan 23, 2016
diff --git a/.gitignore b/.gitignore
@@ -0,0 +1,3 @@
+/out
+.idea
+*.iml
diff --git a/org/geekhub/ConnectionUtils.java b/org/geekhub/ConnectionUtils.java
diff --git a/src/org/geekhub/ConnectionUtils.java b/src/org/geekhub/ConnectionUtils.java
@@ -0,0 +1,33 @@
+package org.geekhub;
+
+import java.io.BufferedInputStream;
+import java.io.ByteArrayOutputStream;
+import java.io.IOException;
+import java.net.URL;
+import java.net.URLConnection;
+
+/**
+ * Utility class with helper methods for working with {@link URLConnection}.
+ */
+public class ConnectionUtils {
+
+    /**
+     * Opens a connection to the given URL and reads the whole response into memory.
+     * Use it for small resources only: all content is accumulated in a ByteArrayOutputStream before returning.
+     * @param url URL of the resource (for example a web page) to download
+     * @return the downloaded content as a byte array
+     * @throws IOException if the connection cannot be opened or reading from its input stream fails
+     */
+    public static byte[] getData(URL url) throws IOException {
+        URLConnection connection = url.openConnection();
+        ByteArrayOutputStream outputStream = new ByteArrayOutputStream();
+        try (BufferedInputStream in = new BufferedInputStream(connection.getInputStream())) { // stream is closed on exit
+            int b;
+            while ((b = in.read()) != -1) { // read() returns -1 at end of stream
+                outputStream.write(b);
+            }
+        }
+        return outputStream.toByteArray();
+    }
+
+}
diff --git a/org/geekhub/ImageCrawler.java → src/org/geekhub/ImageCrawler.java b/org/geekhub/ImageCrawler.java → src/org/geekhub/ImageCrawler.java
@@ -3,6 +3,7 @@
 import java.io.*;
 import java.net.MalformedURLException;
 import java.net.URL;
+import java.util.Collection;
 import java.util.concurrent.ExecutorService;
 import java.util.concurrent.Executors;
 
@@ -25,11 +26,14 @@ public ImageCrawler(String folder) throws MalformedURLException {
 
     /**
      * Call this method to start download images from specified URL.
-     * @param urlToPage
+     * @param urlToPage URL of the web page whose image links should be downloaded
      * @throws IOException
      */
     public void downloadImages(String urlToPage) throws IOException {
-        //implement me
+        Page page = new Page(new URL(urlToPage)); // the Page constructor downloads the page content
+        page.getImageLinks().stream()
+                .filter(this::isImageURL) // keep only the links that isImageURL accepts
+                .forEach(url -> executorService.submit(new ImageTask(url, folder))); // one ImageTask per image
     }
 
     /**
@@ -39,12 +43,11 @@ public void stop() {
         executorService.shutdown();
     }
 
-    //detects is current url is an image. Checking for popular extensions should be enough
     private boolean isImageURL(URL url) {
-        //implement me
-        return false;
+        String u = url.toString(); // full URL text, including any query string or fragment
+        return u.endsWith(".png") || u.endsWith(".jpg") || u.endsWith(".jpeg") || // case-sensitive suffix match
+                u.endsWith(".gif") || u.endsWith(".ico") || u.endsWith(".svg") ||
+                u.endsWith(".bmp"); // NOTE(review): "photo.JPG" and "a.png?x=1" are rejected - confirm intended
     }
 
-
-
 }
diff --git a/org/geekhub/ImageTask.java → src/org/geekhub/ImageTask.java b/org/geekhub/ImageTask.java → src/org/geekhub/ImageTask.java
@@ -1,5 +1,6 @@
 package org.geekhub;
 
+import java.io.*;
 import java.net.URL;
 
 /**
@@ -20,11 +21,24 @@ public ImageTask(URL url, String folder) {
      */
     @Override
     public void run() {
-       //implement me
+        try ( // both streams are closed automatically when the block exits
+            BufferedInputStream inputStream = new BufferedInputStream(url.openStream());
+            BufferedOutputStream outputStream = new BufferedOutputStream(new FileOutputStream(folder + buildFileName(url))) // no separator is added between folder and file name
+        ) {
+            int b;
+            while ((b = inputStream.read()) != -1) { // read() returns -1 at end of stream
+                outputStream.write(b);
+            }
+        } catch (IOException e) { // the exception is not rethrown; only the message below is printed
+            System.out.println("Error while loading data from " + url);
+        }
     }
 
-    //converts URL to unique file name
+    /**
+     * Derives a file name from the URL: every character except ASCII letters, digits, '-', '_' and '.' becomes '_'. NOTE(review): distinct URLs can map to the same name, so uniqueness is not guaranteed.
+     */
     private String buildFileName(URL url) {
         return url.toString().replaceAll("[^a-zA-Z0-9-_\\.]", "_");
     }
+
 }
diff --git a/org/geekhub/Main.java → src/org/geekhub/Main.java b/org/geekhub/Main.java → src/org/geekhub/Main.java
@@ -5,7 +5,7 @@
 
 public class Main {
 
-    public static final String FOLDER_TO_DOWNLOAD = "d:/images/";
+    public static final String FOLDER_TO_DOWNLOAD = "/tmp/images/";
 
     public static void main(String[] args) throws IOException {
         ImageCrawler imageCrawler = new ImageCrawler(FOLDER_TO_DOWNLOAD);

diff --git a/org/geekhub/Page.java → src/org/geekhub/Page.java b/org/geekhub/Page.java → src/org/geekhub/Page.java
@@ -20,7 +20,7 @@ public class Page {
 
     /**
      * Be careful, constructor downloads content, it could be slow.
-     * @param url
+     * @param url URL of the web page to download
      * @throws IOException
      */
     public Page(URL url) throws IOException {
@@ -53,4 +53,5 @@ private Collection<URL> extractMatches(Matcher matcher) throws MalformedURLExcep
         }
         return links;
     }
+
 }
-Original file line number
+Diff line change
@@ -0,0 +1,3 @@
+    /out
+    .idea
+    *.iml