AakashSasikumar · jwong101 · Oct 25, 2016
diff --git a/.classpath b/.classpath
@@ -0,0 +1,9 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<classpath>
+	<classpathentry kind="src" path="src"/>
+	<classpathentry kind="con" path="org.eclipse.jdt.launching.JRE_CONTAINER/org.eclipse.jdt.internal.debug.ui.launcher.StandardVMType/JavaSE-1.8"/>
+	<classpathentry kind="lib" path="lib/jsoup-1.10.1.jar"/>
+	<classpathentry kind="lib" path="lib/commons-io-2.5.jar"/>
+	<classpathentry kind="lib" path="lib/ui4j-ide-1.1.0.jar"/>
+	<classpathentry kind="output" path="bin"/>
+</classpath>
diff --git a/.project b/.project
@@ -0,0 +1,17 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<projectDescription>
+	<name>YoutubeScraper</name>
+	<comment></comment>
+	<projects>
+	</projects>
+	<buildSpec>
+		<buildCommand>
+			<name>org.eclipse.jdt.core.javabuilder</name>
+			<arguments>
+			</arguments>
+		</buildCommand>
+	</buildSpec>
+	<natures>
+		<nature>org.eclipse.jdt.core.javanature</nature>
+	</natures>
+</projectDescription>
diff --git a/.settings/org.eclipse.jdt.core.prefs b/.settings/org.eclipse.jdt.core.prefs
@@ -0,0 +1,11 @@
+eclipse.preferences.version=1
+org.eclipse.jdt.core.compiler.codegen.inlineJsrBytecode=enabled
+org.eclipse.jdt.core.compiler.codegen.targetPlatform=1.8
+org.eclipse.jdt.core.compiler.codegen.unusedLocal=preserve
+org.eclipse.jdt.core.compiler.compliance=1.8
+org.eclipse.jdt.core.compiler.debug.lineNumber=generate
+org.eclipse.jdt.core.compiler.debug.localVariable=generate
+org.eclipse.jdt.core.compiler.debug.sourceFile=generate
+org.eclipse.jdt.core.compiler.problem.assertIdentifier=error
+org.eclipse.jdt.core.compiler.problem.enumIdentifier=error
+org.eclipse.jdt.core.compiler.source=1.8
diff --git a/lib/commons-io-2.5.jar b/lib/commons-io-2.5.jar
diff --git a/lib/jsoup-1.10.1.jar b/lib/jsoup-1.10.1.jar
diff --git a/lib/ui4j-ide-1.1.0.jar b/lib/ui4j-ide-1.1.0.jar
diff --git a/src/YouTubeScraper.java b/src/YouTubeScraper.java
@@ -2,10 +2,10 @@
 import java.io.IOException;
 import java.net.HttpURLConnection;
 import java.net.URL;
-import java.net.URLEncoder;
+import java.util.ArrayList;
+import java.util.List;
 import java.util.Scanner;
 import java.util.concurrent.TimeUnit;
-import java.util.logging.Level;
 
 import org.apache.commons.io.FileUtils;
 import org.jsoup.Jsoup;
@@ -29,92 +29,92 @@ public static void main(String[] args) throws IOException, InterruptedException{
 		//closing in on the target,(class name is lockup-title)
 		Elements subdiv = website.select("h3.yt-lockup-title>a");
 		//System.out.println(subdiv);---checking to see if .select worked 
-		String[] seperateLinks = new String[subdiv.size()];
-		String[] title = new String[subdiv.size()];
-		int i =0;
+		List<String> separateLinks = new ArrayList<>(); 
+		List<String> titles = new ArrayList<>();
 		for(Element temp:subdiv)
-		{	String a = temp.attr("href");
-		//youtube has playlists, and these contail "list" in the URL and we dont need these playlists
+		{	
+			String a = temp.attr("href");
+			//youtube has playlists, and these contain "list" in the URL and we don't need these playlists
 			if(a.contains("list"))
 			{
 				continue;
 			}
 			else{
 				//adding the non playlist URL's into my link array
-				seperateLinks[i] = "https://www.youtube.com"+temp.attr("href");
-				title[i] = temp.text();
-				i++;
+				separateLinks.add("https://www.youtube.com"+temp.attr("href"));
+				titles.add(temp.text());
 			}
 		}
-			for(int j=0; j<seperateLinks.length;j++){
-				System.out.println((j+1)+": "+title[j]);
-				//System.out.println(seplinks[j]);---checking to see if the links are proper
-			}
-			System.out.println("Please enter your choice");
-			int choice = in.nextInt();
-			choice--;
-			String userchoice = seperateLinks[choice];
-			//System.out.println(userchoice);---final URL selected
-
-
-			//-------------Done with Scraping youtube-------------------
-
-
-			//Start of scraping the second website
-
-			BrowserEngine browser = BrowserFactory.getWebKit();
-			//java.util.logging.Logger.getLogger("com.ui4j").setLevel(Level.OFF);
-			com.ui4j.api.browser.Page docu = browser.navigate("http://www.listentoyoutube.com/");
-			com.ui4j.api.dom.Document process = docu.getDocument();
-			process.query("input[type='text']").get().setValue(userchoice);
-			process.query("input[type='submit']").get().click();
-			//copied over the url and clicked the button
-			TimeUnit.SECONDS.sleep(20);//delay to make it work for slow networks
-			String ur =(String) docu.executeScript("window.location.href");//got the current URL
-			if(ur.contains("captcha")){//found a temporary solution for the captcha issue
-				System.out.println("Please go to http://www.listentoyoutube.com/captcha.php and prove you're not a robot and run the program again");
-				System.exit(0);
-			}
-			ur=ur.substring(49, ur.length());
-			/*There are three parameters
-  			 * 1. The Server number
-  			 * 2.The hash
- 			 * 3.The file name
- 			 * so i got the url and split it at '&'
-   			 */
-			String[] segments = ur.split("&");
-			segments[1]=segments[1].substring(5, segments[1].length());
-			/* segments[0] is the server number
-			 * segments[1] is the hash code
-			 * segments[2] is the file name
-			 */
-			segments[1]=segments[1].replaceAll("%253D%253D","");
-			segments[2]=segments[2].substring(5, segments[2].length());
-			String finalur = "http://"+segments[0]+".listentoyoutube.com/download/"+segments[1]+"==/"+segments[2];
-			URL url = new URL(finalur);
-			HttpURLConnection httpConnection = (HttpURLConnection) (url.openConnection());//this connection is to get the file size
-			long fileSize = httpConnection.getContentLength();
-			System.out.println(title[choice]+"\t\tSize : "+fileSize/1048576f+" mb");//----this will calcluate the total file size in mb
-			segments[2]=segments[2].replace("%7C", "");
-			segments[2]=segments[2].replace("%22", "");
-			segments[2]=segments[2].replace("%3F", "");
-			segments[2]=java.net.URLDecoder.decode(segments[2], "UTF-8");//java doesnt allow ", ?, | to be in the file name
-			String path = ""+segments[2]+".mp3";//downloads in the file where the jar file is located
-			File file = new File(path);
-			TimeUnit.SECONDS.sleep(5);
-			try
-			{	System.out.println("Downloading....");
-				FileUtils.copyURLToFile(url, file);
-				System.out.println("Download Complete");
-			}
-			catch(Exception e)
-			{
-				System.out.println("Got an IOException: " + e.getMessage());
-				System.out.println("Download Failed");
-			}
-			finally{
-				System.exit(0);
-			}
-			in.close();			
+		for(int j=0; j<separateLinks.size();j++){
+			System.out.println((j+1)+": "+titles.get(j));
+			//System.out.println(seplinks[j]);---checking to see if the links are proper
+		}
+		System.out.println("Please enter your choice");
+		int choice = in.nextInt();
+		choice--;
+		String userchoice = separateLinks.get(choice);
+		//System.out.println(userchoice);---final URL selected
+
+
+		//-------------Done with Scraping youtube-------------------
+
+
+		//Start of scraping the second website
+
+		BrowserEngine browser = BrowserFactory.getWebKit();
+		//java.util.logging.Logger.getLogger("com.ui4j").setLevel(Level.OFF);
+		com.ui4j.api.browser.Page docu = browser.navigate("http://www.listentoyoutube.com/");
+		com.ui4j.api.dom.Document process = docu.getDocument();
+		process.query("input[type='text']").setValue(userchoice);
+		process.query("input[type='submit']").click();
+		//copied over the url and clicked the button
+		TimeUnit.SECONDS.sleep(20);//delay to make it work for slow networks
+		String ur =(String) docu.executeScript("window.location.href");//got the current URL
+		if(ur.contains("captcha")){//found a temporary solution for the captcha issue
+			System.out.println("Please go to http://www.listentoyoutube.com/captcha.php and prove you're not a robot and run the program again");
+			System.exit(0);
+		}
+		System.out.println(ur);
+		ur=ur.substring(49, ur.length());
+		/* There are three parameters:
+		 * 1. The server number
+		 * 2. The hash
+		 * 3. The file name
+		 * so I take the URL and split it at '&'
+		 */
+		String[] segments = ur.split("&");
+		segments[1]=segments[1].substring(5, segments[1].length());
+		/* segments[0] is the server number
+		 * segments[1] is the hash code
+		 * segments[2] is the file name
+		 */
+		segments[1]=segments[1].replaceAll("%253D%253D","");
+		segments[2]=segments[2].substring(5, segments[2].length());
+		String finalur = "http://"+segments[0]+".listentoyoutube.com/download/"+segments[1]+"==/"+segments[2];
+		URL url = new URL(finalur);
+		HttpURLConnection httpConnection = (HttpURLConnection) (url.openConnection());//this connection is to get the file size
+		long fileSize = httpConnection.getContentLength();
+		System.out.println(titles.get(choice)+"\t\tSize : "+fileSize/1048576f+" mb");//----this will calcluate the total file size in mb
+		segments[2]=segments[2].replace("%7C", "");
+		segments[2]=segments[2].replace("%22", "");
+		segments[2]=segments[2].replace("%3F", "");
+		segments[2]=java.net.URLDecoder.decode(segments[2], "UTF-8");//java doesnt allow ", ?, | to be in the file name
+		String path = ""+segments[2]+".mp3";//downloads in the file where the jar file is located
+		File file = new File(path);
+		TimeUnit.SECONDS.sleep(5);
+		try
+		{	System.out.println("Downloading....");
+			FileUtils.copyURLToFile(url, file);
+			System.out.println("Download Complete");
+		}
+		catch(IOException ex)
+		{
+			System.out.println("Got an IOException: " + ex.getMessage());
+			System.out.println("Download failed");
+		}
+		finally{
+			System.exit(0);
+		}
+		in.close();			
 	}
 }