Skip to content

Big Data CJimenez #81

New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Open
wants to merge 1 commit into
base: master
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 2 additions & 0 deletions pom.xml
Original file line number Diff line number Diff line change
Expand Up @@ -12,6 +12,8 @@

<properties>
<!-- Source files are read as UTF-8. -->
<project.build.sourceEncoding>UTF-8</project.build.sourceEncoding>
<!-- Compile with Java 7 language level and emit Java 7 compatible bytecode. -->
<maven.compiler.source>7</maven.compiler.source>
<maven.compiler.target>7</maven.compiler.target>
</properties>

<dependencies>
Expand Down
Original file line number Diff line number Diff line change
@@ -0,0 +1,111 @@

package nearsoft.academy.bigdata.recommendation;

import com.google.common.collect.BiMap;
import com.google.common.collect.HashBiMap;
import java.io.BufferedReader;
import java.io.BufferedWriter;
import java.io.File;
import java.io.FileNotFoundException;
import java.io.FileReader;
import java.io.FileWriter;
import java.io.IOException;
import java.util.ArrayList;
import java.util.HashMap;
import java.util.List;
import org.apache.mahout.cf.taste.common.TasteException;
import org.apache.mahout.cf.taste.impl.model.file.FileDataModel;
import org.apache.mahout.cf.taste.impl.neighborhood.ThresholdUserNeighborhood;
import org.apache.mahout.cf.taste.impl.recommender.GenericUserBasedRecommender;
import org.apache.mahout.cf.taste.impl.similarity.PearsonCorrelationSimilarity;
import org.apache.mahout.cf.taste.model.DataModel;
import org.apache.mahout.cf.taste.neighborhood.UserNeighborhood;
import org.apache.mahout.cf.taste.recommender.RecommendedItem;
import org.apache.mahout.cf.taste.recommender.UserBasedRecommender;
import org.apache.mahout.cf.taste.similarity.UserSimilarity;

/**
 * User-based movie recommender backed by Apache Mahout.
 *
 * <p>On construction the review file is scanned line by line. Lines whose first
 * space-separated token is {@code product/productId:}, {@code review/userId:} or
 * {@code review/score:} are used; every other line is ignored. String ids are
 * mapped to consecutive integers (starting at 1) and one {@code user,product,score}
 * row is written per score line to an intermediate CSV, which is then loaded
 * into a Mahout {@link FileDataModel}.
 *
 * @author carlo
 */
public class MovieRecommender {

    private static final String PRODUCT_KEY = "product/productId:";
    private static final String USER_KEY = "review/userId:";
    private static final String SCORE_KEY = "review/score:";

    /** Number of items requested from Mahout per recommendation call. */
    private static final int MAX_RECOMMENDATIONS = 3;

    /** Minimum similarity for a user to be part of the neighborhood. */
    private static final double NEIGHBORHOOD_THRESHOLD = 0.1;

    private final UserBasedRecommender recommender;
    private final HashMap<String, Integer> users = new HashMap<>();
    private final BiMap<String, Integer> products = HashBiMap.create();
    private int totalReviews = 0;

    /**
     * Parses the review file and builds the recommender.
     *
     * @param path location of the uncompressed review file
     * @throws IOException if the review file cannot be read or the intermediate
     *         CSV cannot be written
     * @throws TasteException if Mahout fails to build the similarity model
     */
    public MovieRecommender(String path) throws IOException, TasteException {
        // A temp file keeps the class usable on any machine; the previous
        // implementation wrote to an absolute path on the author's disk.
        File ratingsCsv = File.createTempFile("movies", ".csv");
        ratingsCsv.deleteOnExit();
        writeRatingsCsv(new File(path), ratingsCsv);
        this.recommender = buildRecommender(ratingsCsv);
    }

    /** Converts the review file into a {@code user,product,score} CSV and fills the id maps. */
    private void writeRatingsCsv(File reviews, File ratingsCsv) throws IOException {
        int currentUser = 0;
        int currentProduct = 0;

        // try-with-resources closes both streams even when parsing fails, and
        // guarantees the CSV is flushed before Mahout reads it.
        try (BufferedReader reader = new BufferedReader(new FileReader(reviews));
             BufferedWriter writer = new BufferedWriter(new FileWriter(ratingsCsv))) {
            String line;
            while ((line = reader.readLine()) != null) {
                int separator = line.indexOf(' ');
                if (separator <= 0) {
                    // Blank line or a key without any value: nothing to extract.
                    continue;
                }
                switch (line.substring(0, separator)) {
                    case PRODUCT_KEY:
                        currentProduct = idFor(products, fieldValue(line, separator));
                        break;
                    case USER_KEY:
                        currentUser = idFor(users, fieldValue(line, separator));
                        break;
                    case SCORE_KEY:
                        writer.write(currentUser + "," + currentProduct + ","
                                + fieldValue(line, separator) + "\n");
                        totalReviews++;
                        break;
                    default:
                        break;
                }
            }
        }
    }

    /** Builds the Pearson-correlation, threshold-neighborhood recommender from the CSV. */
    private static UserBasedRecommender buildRecommender(File ratingsCsv)
            throws IOException, TasteException {
        DataModel model = new FileDataModel(ratingsCsv);
        UserSimilarity similarity = new PearsonCorrelationSimilarity(model);
        UserNeighborhood neighborhood =
                new ThresholdUserNeighborhood(NEIGHBORHOOD_THRESHOLD, similarity, model);
        return new GenericUserBasedRecommender(model, neighborhood, similarity);
    }

    /** Returns the token that follows the space at {@code separator}, up to the next space. */
    private static String fieldValue(String line, int separator) {
        int start = separator + 1;
        int end = line.indexOf(' ', start);
        return end < 0 ? line.substring(start) : line.substring(start, end);
    }

    /** Returns the numeric id registered for {@code key}, assigning the next free one if absent. */
    private static int idFor(java.util.Map<String, Integer> ids, String key) {
        Integer known = ids.get(key);
        if (known != null) {
            return known;
        }
        int assigned = ids.size() + 1;
        ids.put(key, assigned);
        return assigned;
    }

    /** @return number of {@code review/score:} lines found in the input */
    public int getTotalReviews() {
        return totalReviews;
    }

    /** @return number of distinct product ids found in the input */
    public int getTotalProducts() {
        return products.size();
    }

    /** @return number of distinct user ids found in the input */
    public int getTotalUsers() {
        return users.size();
    }

    /**
     * Recommends up to three products for the given user.
     *
     * @param userId user id exactly as it appears in the review file
     * @return the original product ids of the recommended items; empty when the
     *         user id was never seen in the input
     * @throws TasteException if Mahout fails while computing recommendations
     */
    public List<String> getRecommendationsForUser(String userId) throws TasteException {
        List<String> productIds = new ArrayList<>();
        Integer known = users.get(userId);
        if (known == null) {
            // Unknown user: previously this failed with a NullPointerException on unboxing.
            return productIds;
        }
        int id = known;
        BiMap<Integer, String> productById = products.inverse();
        for (RecommendedItem item : recommender.recommend(id, MAX_RECOMMENDATIONS)) {
            // Item ids were assigned from an int counter, so the narrowing cast is lossless.
            productIds.add(productById.get((int) item.getItemID()));
        }
        return productIds;
    }

}
Original file line number Diff line number Diff line change
Expand Up @@ -15,7 +15,7 @@ public class MovieRecommenderTest {
public void testDataInfo() throws IOException, TasteException {
//download movies.txt.gz from
// http://snap.stanford.edu/data/web-Movies.html
MovieRecommender recommender = new MovieRecommender("/path/to/movies.txt.gz");
MovieRecommender recommender = new MovieRecommender("D:/Charlitos/Nearsoft/programs/Semana_3/movies.txt");
assertEquals(7911684, recommender.getTotalReviews());
assertEquals(253059, recommender.getTotalProducts());
assertEquals(889176, recommender.getTotalUsers());
Expand Down
Binary file added target/big-data-1.0-SNAPSHOT.jar
Binary file not shown.
5 changes: 5 additions & 0 deletions target/maven-archiver/pom.properties
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
#Generated by Maven
#Sun Apr 19 21:24:13 MST 2020
groupId=nearsoft.academy
artifactId=big-data
version=1.0-SNAPSHOT
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
nearsoft\academy\bigdata\recommendation\MovieRecommender.class
nearsoft\academy\bigdata\recommendation\MovieRecommenderTest.class
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
D:\NetBeansProjects\big-data-exercises-master\src\test\java\nearsoft\academy\bigdata\recommendation\MovieRecommenderTest.java
D:\NetBeansProjects\big-data-exercises-master\src\test\java\nearsoft\academy\bigdata\recommendation\MovieRecommender.java
Original file line number Diff line number Diff line change
@@ -0,0 +1,61 @@
<?xml version="1.0" encoding="UTF-8" ?>
<testsuite tests="1" failures="0" name="nearsoft.academy.bigdata.recommendation.MovieRecommenderTest" time="520.675" errors="0" skipped="0">
<properties>
<property name="java.runtime.name" value="Java(TM) SE Runtime Environment"/>
<property name="java.vm.version" value="14.0.1+7"/>
<property name="sun.boot.library.path" value="C:\Program Files\Java\jdk-14.0.1\bin"/>
<property name="maven.multiModuleProjectDirectory" value="D:\NetBeansProjects\big-data-exercises-master"/>
<property name="java.vm.vendor" value="Oracle Corporation"/>
<property name="java.vendor.url" value="https://java.oracle.com/"/>
<property name="guice.disable.misplaced.annotation.check" value="true"/>
<property name="path.separator" value=";"/>
<property name="java.vm.name" value="Java HotSpot(TM) 64-Bit Server VM"/>
<property name="sun.os.patch.level" value=""/>
<property name="user.script" value=""/>
<property name="user.country" value="MX"/>
<property name="sun.java.launcher" value="SUN_STANDARD"/>
<property name="java.vm.specification.name" value="Java Virtual Machine Specification"/>
<property name="user.dir" value="D:\NetBeansProjects\big-data-exercises-master"/>
<property name="java.vm.compressedOopsMode" value="32-bit"/>
<property name="java.runtime.version" value="14.0.1+7"/>
<property name="os.arch" value="amd64"/>
<property name="java.io.tmpdir" value="C:\Users\carlo\AppData\Local\Temp\"/>
<property name="line.separator" value="
"/>
<property name="java.vm.specification.vendor" value="Oracle Corporation"/>
<property name="user.variant" value=""/>
<property name="os.name" value="Windows 10"/>
<property name="maven.ext.class.path" value="D:\Program Files\NetBeans-11.3\netbeans\java\maven-nblib\netbeans-eventspy.jar"/>
<property name="classworlds.conf" value="D:\Program Files\NetBeans-11.3\netbeans\java\maven\bin\m2.conf"/>
<property name="sun.jnu.encoding" value="Cp1252"/>
<property name="java.library.path" value="C:\Program Files\Java\jdk-14.0.1\bin;C:\WINDOWS\Sun\Java\bin;C:\WINDOWS\system32;C:\WINDOWS;C:\Program Files (x86)\Common Files\Oracle\Java\javapath;C:\ProgramData\Oracle\Java\javapath;C:\Program Files (x86)\Common Files\Intel\Shared Libraries\redist\intel64\compiler;C:\Program Files (x86)\Java\jre1.8.0_161;C:\Program Files (x86)\Intel\iCLS Client\;C:\Program Files\Intel\iCLS Client\;C:\WINDOWS\system32;C:\WINDOWS;C:\WINDOWS\System32\Wbem;C:\WINDOWS\System32\WindowsPowerShell\v1.0\;C:\Program Files (x86)\Intel\Intel(R) Management Engine Components\DAL;C:\Program Files\Intel\Intel(R) Management Engine Components\DAL;C:\Program Files (x86)\Intel\Intel(R) Management Engine Components\IPT;C:\Program Files\Intel\Intel(R) Management Engine Components\IPT;C:\Program Files (x86)\Microsoft SQL Server\100\Tools\Binn\VSShell\Common7\IDE\;C:\Program Files (x86)\Microsoft SQL Server\100\Tools\Binn\;C:\Program Files\Microsoft SQL Server\100\Tools\Binn\;C:\Program Files (x86)\Microsoft SQL Server\100\DTS\Binn\;C:\Program Files\Microsoft SQL Server\100\DTS\Binn\;C:\WINDOWS\System32\OpenSSH\;D:\Program Files (x86)\Git\cmd;C:\Program Files\Java\jdk1.8.0_161\bin;D:\Program Files (x86)\QuickTime\QTSystem\;C:\Users\carlo\AppData\Local\Microsoft\WindowsApps;D:\Program Files\apache-maven-3.6.3\bin;C:\Program Files\Java\jdk1.8.0_251\bin;D:\Program Files (x86)\Microsoft VS Code\bin;;."/>
<property name="jdk.debug" value="release"/>
<property name="java.class.version" value="58.0"/>
<property name="java.specification.name" value="Java Platform API Specification"/>
<property name="sun.management.compiler" value="HotSpot 64-Bit Tiered Compilers"/>
<property name="os.version" value="10.0"/>
<property name="user.home" value="C:\Users\carlo"/>
<property name="user.timezone" value="America/Hermosillo"/>
<property name="file.encoding" value="UTF-8"/>
<property name="java.specification.version" value="14"/>
<property name="user.name" value="carlo"/>
<property name="java.class.path" value="D:\Program Files\NetBeans-11.3\netbeans\java\maven\boot\plexus-classworlds-2.5.2.jar"/>
<property name="java.vm.specification.version" value="14"/>
<property name="sun.arch.data.model" value="64"/>
<property name="sun.java.command" value="org.codehaus.plexus.classworlds.launcher.Launcher -Dmaven.ext.class.path=D:\Program Files\NetBeans-11.3\netbeans\java\maven-nblib\netbeans-eventspy.jar -Dfile.encoding=UTF-8 install"/>
<property name="java.home" value="C:\Program Files\Java\jdk-14.0.1"/>
<property name="user.language" value="es"/>
<property name="java.specification.vendor" value="Oracle Corporation"/>
<property name="java.vm.info" value="mixed mode, sharing"/>
<property name="java.version" value="14.0.1"/>
<property name="java.vendor" value="Oracle Corporation"/>
<property name="maven.home" value="D:\Program Files\NetBeans-11.3\netbeans\java\maven"/>
<property name="file.separator" value="\"/>
<property name="java.version.date" value="2020-04-14"/>
<property name="java.vendor.url.bug" value="https://bugreport.java.com/bugreport/"/>
<property name="sun.io.unicode.encoding" value="UnicodeLittle"/>
<property name="sun.cpu.endian" value="little"/>
<property name="sun.cpu.isalist" value="amd64"/>
</properties>
<testcase classname="nearsoft.academy.bigdata.recommendation.MovieRecommenderTest" name="testDataInfo" time="520.675"/>
</testsuite>
Original file line number Diff line number Diff line change
@@ -0,0 +1,4 @@
-------------------------------------------------------------------------------
Test set: nearsoft.academy.bigdata.recommendation.MovieRecommenderTest
-------------------------------------------------------------------------------
Tests run: 1, Failures: 0, Errors: 0, Skipped: 0, Time elapsed: 520.792 sec
Binary file not shown.
Binary file not shown.