From 4e2ebab1541ee415a5c82003281ddc58f7993ec8 Mon Sep 17 00:00:00 2001 From: lromero Date: Mon, 7 Oct 2019 23:58:54 -0700 Subject: [PATCH 1/8] Movies recommender working --- pom.xml | 1 + .../recommendation/MovieRecommenderTest.java | 19 ++++++++++++++++--- 2 files changed, 17 insertions(+), 3 deletions(-) diff --git a/pom.xml b/pom.xml index 8169ff7..810bf09 100644 --- a/pom.xml +++ b/pom.xml @@ -26,5 +26,6 @@ 4.7 test + diff --git a/src/test/java/nearsoft/academy/bigdata/recommendation/MovieRecommenderTest.java b/src/test/java/nearsoft/academy/bigdata/recommendation/MovieRecommenderTest.java index 0d0b1fe..eb999af 100644 --- a/src/test/java/nearsoft/academy/bigdata/recommendation/MovieRecommenderTest.java +++ b/src/test/java/nearsoft/academy/bigdata/recommendation/MovieRecommenderTest.java @@ -15,11 +15,19 @@ public class MovieRecommenderTest { public void testDataInfo() throws IOException, TasteException { //download movies.txt.gz from // http://snap.stanford.edu/data/web-Movies.html - MovieRecommender recommender = new MovieRecommender("/path/to/movies.txt.gz"); - assertEquals(7911684, recommender.getTotalReviews()); - assertEquals(253059, recommender.getTotalProducts()); + MovieRecommender recommender = new MovieRecommender("/Desktop/LuisMario/AmazonProblem/movies.txt.gz"); + assertEquals(7911684, recommender.getTotalReviews()); // + assertEquals(253059, recommender.getTotalProducts()); // product/productId: assertEquals(889176, recommender.getTotalUsers()); + // get a token with a review and saved it if it's not already defined, but if it's already defined plus one + // + + + // total reviews : 7911684 + // total products : 253059 + // total users : 889176 + List recommendations = recommender.getRecommendationsForUser("A141HP4LYPWMSR"); assertThat(recommendations, hasItem("B0002O7Y8U")); assertThat(recommendations, hasItem("B00004CQTF")); @@ -27,4 +35,9 @@ public void testDataInfo() throws IOException, TasteException { } + public static void main(String[] args) throws IOException, TasteException { + MovieRecommenderTest call = new MovieRecommenderTest(); + call.testDataInfo(); + } + } From 956a52043f88a24ed5f4687a5e9b0fa9764efea8 Mon Sep 17 00:00:00 2001 From: lromero Date: Tue, 8 Oct 2019 03:24:16 -0700 Subject: [PATCH 2/8] Applying changes --- .idea/$PRODUCT_WORKSPACE_FILE$ | 19 ++ .idea/.gitignore | 3 + .idea/.name | 1 + .idea/compiler.xml | 16 ++ .idea/encodings.xml | 6 + .idea/libraries/Maven__asm_asm_3_1.xml | 13 ++ .../Maven__com_google_guava_guava_16_0.xml | 13 ++ .../Maven__com_sun_jersey_jersey_core_1_8.xml | 13 ++ .../Maven__com_sun_jersey_jersey_json_1_8.xml | 13 ++ ...aven__com_sun_jersey_jersey_server_1_8.xml | 13 ++ ...en__com_sun_xml_bind_jaxb_impl_2_2_3_1.xml | 13 ++ ...com_thoughtworks_xstream_xstream_1_4_4.xml | 13 ++ ...mons_beanutils_commons_beanutils_1_7_0.xml | 13 ++ ...beanutils_commons_beanutils_core_1_8_0.xml | 13 ++ .../Maven__commons_cli_commons_cli_1_2.xml | 13 ++ ...Maven__commons_codec_commons_codec_1_4.xml | 13 ++ ..._collections_commons_collections_3_2_1.xml | 13 ++ ...onfiguration_commons_configuration_1_6.xml | 13 ++ ..._commons_digester_commons_digester_1_8.xml | 13 ++ .../Maven__commons_el_commons_el_1_0.xml | 13 ++ ...ns_httpclient_commons_httpclient_3_0_1.xml | 13 ++ .../Maven__commons_io_commons_io_2_1.xml | 13 ++ .../Maven__commons_lang_commons_lang_2_4.xml | 13 ++ ..._commons_logging_commons_logging_1_0_3.xml | 13 ++ .../Maven__commons_net_commons_net_1_4_1.xml | 13 ++ ...Maven__javax_activation_activation_1_1.xml | 13 ++ .../Maven__javax_xml_bind_jaxb_api_2_2_2.xml | 13 ++ ...Maven__javax_xml_stream_stax_api_1_0_2.xml | 13 ++ .idea/libraries/Maven__junit_junit_4_7.xml | 13 ++ ...__org_apache_commons_commons_lang3_3_1.xml | 13 ++ ...__org_apache_commons_commons_math3_3_2.xml | 13 ++ ...n__org_apache_commons_commons_math_2_1.xml | 13 ++ ...n__org_apache_hadoop_hadoop_core_1_2_1.xml | 13 ++ ...e_lucene_lucene_analyzers_common_4_6_1.xml | 13 ++ ...n__org_apache_lucene_lucene_core_4_6_1.xml | 13 ++ ..._mahout_commons_commons_cli_2_0_mahout.xml | 13 ++ ...ven__org_apache_mahout_mahout_core_0_9.xml | 13 ++ ...ven__org_apache_mahout_mahout_math_0_9.xml | 13 ++ ...org_apache_solr_solr_commons_csv_3_5_0.xml | 13 ++ ...dehaus_jackson_jackson_core_asl_1_9_12.xml | 13 ++ ...g_codehaus_jackson_jackson_jaxrs_1_7_1.xml | 13 ++ ...haus_jackson_jackson_mapper_asl_1_9_12.xml | 13 ++ ..._org_codehaus_jackson_jackson_xc_1_7_1.xml | 13 ++ ...en__org_codehaus_jettison_jettison_1_1.xml | 13 ++ .../Maven__org_slf4j_slf4j_api_1_7_5.xml | 13 ++ .../libraries/Maven__stax_stax_api_1_0_1.xml | 13 ++ .../Maven__xmlpull_xmlpull_1_1_3_1.xml | 13 ++ .../libraries/Maven__xpp3_xpp3_min_1_1_4c.xml | 13 ++ .idea/misc.xml | 13 ++ .idea/modules.xml | 8 + .idea/vcs.xml | 6 + big-data.iml | 56 +++++ .../recommendation/MovieRecommender.java | 216 ++++++++++++++++++ .../recommendation/MovieRecommenderTest.java | 8 +- .../academy/bigdata/recommendation/test.java | 176 ++++++++++++++ .../default-testCompile/createdFiles.lst | 0 .../default-testCompile/inputFiles.lst | 3 + ...ta.recommendation.MovieRecommenderTest.xml | 68 ++++++ ...ta.recommendation.MovieRecommenderTest.txt | 4 + .../recommendation/MovieRecommender.class | Bin 0 -> 7365 bytes .../recommendation/MovieRecommenderTest.class | Bin 0 -> 1739 bytes .../academy/bigdata/recommendation/test.class | Bin 0 -> 4156 bytes 62 files changed, 1158 insertions(+), 4 deletions(-) create mode 100644 .idea/$PRODUCT_WORKSPACE_FILE$ create mode 100644 .idea/.gitignore create mode 100644 .idea/.name create mode 100644 .idea/compiler.xml create mode 100644 .idea/encodings.xml create mode 100644 .idea/libraries/Maven__asm_asm_3_1.xml create mode 100644 .idea/libraries/Maven__com_google_guava_guava_16_0.xml create mode 100644 .idea/libraries/Maven__com_sun_jersey_jersey_core_1_8.xml create mode 100644 .idea/libraries/Maven__com_sun_jersey_jersey_json_1_8.xml create mode 100644 .idea/libraries/Maven__com_sun_jersey_jersey_server_1_8.xml create mode 100644 .idea/libraries/Maven__com_sun_xml_bind_jaxb_impl_2_2_3_1.xml create mode 100644 .idea/libraries/Maven__com_thoughtworks_xstream_xstream_1_4_4.xml create mode 100644 .idea/libraries/Maven__commons_beanutils_commons_beanutils_1_7_0.xml create mode 100644 .idea/libraries/Maven__commons_beanutils_commons_beanutils_core_1_8_0.xml create mode 100644 .idea/libraries/Maven__commons_cli_commons_cli_1_2.xml create mode 100644 .idea/libraries/Maven__commons_codec_commons_codec_1_4.xml create mode 100644 .idea/libraries/Maven__commons_collections_commons_collections_3_2_1.xml create mode 100644 .idea/libraries/Maven__commons_configuration_commons_configuration_1_6.xml create mode 100644 .idea/libraries/Maven__commons_digester_commons_digester_1_8.xml create mode 100644 .idea/libraries/Maven__commons_el_commons_el_1_0.xml create mode 100644 .idea/libraries/Maven__commons_httpclient_commons_httpclient_3_0_1.xml create mode 100644 .idea/libraries/Maven__commons_io_commons_io_2_1.xml create mode 100644 .idea/libraries/Maven__commons_lang_commons_lang_2_4.xml create mode 100644 .idea/libraries/Maven__commons_logging_commons_logging_1_0_3.xml create mode 100644 .idea/libraries/Maven__commons_net_commons_net_1_4_1.xml create mode 100644 .idea/libraries/Maven__javax_activation_activation_1_1.xml create mode 100644 .idea/libraries/Maven__javax_xml_bind_jaxb_api_2_2_2.xml create mode 100644 .idea/libraries/Maven__javax_xml_stream_stax_api_1_0_2.xml create mode 100644 .idea/libraries/Maven__junit_junit_4_7.xml create mode 100644 .idea/libraries/Maven__org_apache_commons_commons_lang3_3_1.xml create mode 100644 .idea/libraries/Maven__org_apache_commons_commons_math3_3_2.xml create mode 100644 .idea/libraries/Maven__org_apache_commons_commons_math_2_1.xml create mode 100644 .idea/libraries/Maven__org_apache_hadoop_hadoop_core_1_2_1.xml create mode 100644 .idea/libraries/Maven__org_apache_lucene_lucene_analyzers_common_4_6_1.xml create mode 100644 .idea/libraries/Maven__org_apache_lucene_lucene_core_4_6_1.xml create mode 100644 .idea/libraries/Maven__org_apache_mahout_commons_commons_cli_2_0_mahout.xml create mode 100644 .idea/libraries/Maven__org_apache_mahout_mahout_core_0_9.xml create mode 100644 .idea/libraries/Maven__org_apache_mahout_mahout_math_0_9.xml create mode 100644 .idea/libraries/Maven__org_apache_solr_solr_commons_csv_3_5_0.xml create mode 100644 .idea/libraries/Maven__org_codehaus_jackson_jackson_core_asl_1_9_12.xml create mode 100644 .idea/libraries/Maven__org_codehaus_jackson_jackson_jaxrs_1_7_1.xml create mode 100644 .idea/libraries/Maven__org_codehaus_jackson_jackson_mapper_asl_1_9_12.xml create mode 100644 .idea/libraries/Maven__org_codehaus_jackson_jackson_xc_1_7_1.xml create mode 100644 .idea/libraries/Maven__org_codehaus_jettison_jettison_1_1.xml create mode 100644 .idea/libraries/Maven__org_slf4j_slf4j_api_1_7_5.xml create mode 100644 .idea/libraries/Maven__stax_stax_api_1_0_1.xml create mode 100644 .idea/libraries/Maven__xmlpull_xmlpull_1_1_3_1.xml create mode 100644 .idea/libraries/Maven__xpp3_xpp3_min_1_1_4c.xml create mode 100644 .idea/misc.xml create mode 100644 .idea/modules.xml create mode 100644 .idea/vcs.xml create mode 100644 big-data.iml create mode 100644 src/test/java/nearsoft/academy/bigdata/recommendation/MovieRecommender.java create mode 100644 src/test/java/nearsoft/academy/bigdata/recommendation/test.java create mode 100644 target/maven-status/maven-compiler-plugin/testCompile/default-testCompile/createdFiles.lst create mode 100644 target/maven-status/maven-compiler-plugin/testCompile/default-testCompile/inputFiles.lst create mode 100644 target/surefire-reports/TEST-nearsoft.academy.bigdata.recommendation.MovieRecommenderTest.xml create mode 100644 target/surefire-reports/nearsoft.academy.bigdata.recommendation.MovieRecommenderTest.txt create mode 100644 target/test-classes/nearsoft/academy/bigdata/recommendation/MovieRecommender.class create mode 100644 target/test-classes/nearsoft/academy/bigdata/recommendation/MovieRecommenderTest.class create mode 100644 target/test-classes/nearsoft/academy/bigdata/recommendation/test.class diff --git a/.idea/$PRODUCT_WORKSPACE_FILE$ b/.idea/$PRODUCT_WORKSPACE_FILE$ new file mode 100644 index 0000000..3733e0d --- /dev/null +++ b/.idea/$PRODUCT_WORKSPACE_FILE$ @@ -0,0 +1,19 @@ + + + + + + + 1.8 + + + + + + + + \ No newline at end of file diff --git a/.idea/.gitignore b/.idea/.gitignore new file mode 100644 index 0000000..0e40fe8 --- /dev/null +++ b/.idea/.gitignore @@ -0,0 +1,3 @@ + +# Default ignored files +/workspace.xml \ No newline at end of file diff --git a/.idea/.name b/.idea/.name new file mode 100644 index 0000000..a6f69a2 --- /dev/null +++ b/.idea/.name @@ -0,0 +1 @@ +big-data \ No newline at end of file diff --git a/.idea/compiler.xml b/.idea/compiler.xml new file mode 100644 index 0000000..81ad3ee --- /dev/null +++ b/.idea/compiler.xml @@ -0,0 +1,16 @@ + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/encodings.xml b/.idea/encodings.xml new file mode 100644 index 0000000..b26911b --- /dev/null +++ b/.idea/encodings.xml @@ -0,0 +1,6 @@ + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__asm_asm_3_1.xml b/.idea/libraries/Maven__asm_asm_3_1.xml new file mode 100644 index 0000000..3386f10 --- /dev/null +++ b/.idea/libraries/Maven__asm_asm_3_1.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__com_google_guava_guava_16_0.xml b/.idea/libraries/Maven__com_google_guava_guava_16_0.xml new file mode 100644 index 0000000..91cff2f --- /dev/null +++ b/.idea/libraries/Maven__com_google_guava_guava_16_0.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__com_sun_jersey_jersey_core_1_8.xml b/.idea/libraries/Maven__com_sun_jersey_jersey_core_1_8.xml new file mode 100644 index 0000000..bf486c9 --- /dev/null +++ b/.idea/libraries/Maven__com_sun_jersey_jersey_core_1_8.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__com_sun_jersey_jersey_json_1_8.xml b/.idea/libraries/Maven__com_sun_jersey_jersey_json_1_8.xml new file mode 100644 index 0000000..ab01cdd --- /dev/null +++ b/.idea/libraries/Maven__com_sun_jersey_jersey_json_1_8.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__com_sun_jersey_jersey_server_1_8.xml b/.idea/libraries/Maven__com_sun_jersey_jersey_server_1_8.xml new file mode 100644 index 0000000..e7e8ba0 --- /dev/null +++ b/.idea/libraries/Maven__com_sun_jersey_jersey_server_1_8.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__com_sun_xml_bind_jaxb_impl_2_2_3_1.xml b/.idea/libraries/Maven__com_sun_xml_bind_jaxb_impl_2_2_3_1.xml new file mode 100644 index 0000000..1165a3b --- /dev/null +++ b/.idea/libraries/Maven__com_sun_xml_bind_jaxb_impl_2_2_3_1.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__com_thoughtworks_xstream_xstream_1_4_4.xml b/.idea/libraries/Maven__com_thoughtworks_xstream_xstream_1_4_4.xml new file mode 100644 index 0000000..2c3025b --- /dev/null +++ b/.idea/libraries/Maven__com_thoughtworks_xstream_xstream_1_4_4.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__commons_beanutils_commons_beanutils_1_7_0.xml b/.idea/libraries/Maven__commons_beanutils_commons_beanutils_1_7_0.xml new file mode 100644 index 0000000..1cb64ed --- /dev/null +++ b/.idea/libraries/Maven__commons_beanutils_commons_beanutils_1_7_0.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__commons_beanutils_commons_beanutils_core_1_8_0.xml b/.idea/libraries/Maven__commons_beanutils_commons_beanutils_core_1_8_0.xml new file mode 100644 index 0000000..3fda2c0 --- /dev/null +++ b/.idea/libraries/Maven__commons_beanutils_commons_beanutils_core_1_8_0.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__commons_cli_commons_cli_1_2.xml b/.idea/libraries/Maven__commons_cli_commons_cli_1_2.xml new file mode 100644 index 0000000..cec2493 --- /dev/null +++ b/.idea/libraries/Maven__commons_cli_commons_cli_1_2.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__commons_codec_commons_codec_1_4.xml b/.idea/libraries/Maven__commons_codec_commons_codec_1_4.xml new file mode 100644 index 0000000..2b149c4 --- /dev/null +++ b/.idea/libraries/Maven__commons_codec_commons_codec_1_4.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__commons_collections_commons_collections_3_2_1.xml b/.idea/libraries/Maven__commons_collections_commons_collections_3_2_1.xml new file mode 100644 index 0000000..3caee7e --- /dev/null +++ b/.idea/libraries/Maven__commons_collections_commons_collections_3_2_1.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__commons_configuration_commons_configuration_1_6.xml b/.idea/libraries/Maven__commons_configuration_commons_configuration_1_6.xml new file mode 100644 index 0000000..ae96781 --- /dev/null +++ b/.idea/libraries/Maven__commons_configuration_commons_configuration_1_6.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__commons_digester_commons_digester_1_8.xml b/.idea/libraries/Maven__commons_digester_commons_digester_1_8.xml new file mode 100644 index 0000000..49f1def --- /dev/null +++ b/.idea/libraries/Maven__commons_digester_commons_digester_1_8.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__commons_el_commons_el_1_0.xml b/.idea/libraries/Maven__commons_el_commons_el_1_0.xml new file mode 100644 index 0000000..598d1b0 --- /dev/null +++ b/.idea/libraries/Maven__commons_el_commons_el_1_0.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__commons_httpclient_commons_httpclient_3_0_1.xml b/.idea/libraries/Maven__commons_httpclient_commons_httpclient_3_0_1.xml new file mode 100644 index 0000000..f040f16 --- /dev/null +++ b/.idea/libraries/Maven__commons_httpclient_commons_httpclient_3_0_1.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__commons_io_commons_io_2_1.xml b/.idea/libraries/Maven__commons_io_commons_io_2_1.xml new file mode 100644 index 0000000..3b78142 --- /dev/null +++ b/.idea/libraries/Maven__commons_io_commons_io_2_1.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__commons_lang_commons_lang_2_4.xml b/.idea/libraries/Maven__commons_lang_commons_lang_2_4.xml new file mode 100644 index 0000000..5e8b8d3 --- /dev/null +++ b/.idea/libraries/Maven__commons_lang_commons_lang_2_4.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__commons_logging_commons_logging_1_0_3.xml b/.idea/libraries/Maven__commons_logging_commons_logging_1_0_3.xml new file mode 100644 index 0000000..e20ca3a --- /dev/null +++ b/.idea/libraries/Maven__commons_logging_commons_logging_1_0_3.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__commons_net_commons_net_1_4_1.xml b/.idea/libraries/Maven__commons_net_commons_net_1_4_1.xml new file mode 100644 index 0000000..7fb71b5 --- /dev/null +++ b/.idea/libraries/Maven__commons_net_commons_net_1_4_1.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__javax_activation_activation_1_1.xml b/.idea/libraries/Maven__javax_activation_activation_1_1.xml new file mode 100644 index 0000000..180d587 --- /dev/null +++ b/.idea/libraries/Maven__javax_activation_activation_1_1.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__javax_xml_bind_jaxb_api_2_2_2.xml b/.idea/libraries/Maven__javax_xml_bind_jaxb_api_2_2_2.xml new file mode 100644 index 0000000..a3054d2 --- /dev/null +++ b/.idea/libraries/Maven__javax_xml_bind_jaxb_api_2_2_2.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__javax_xml_stream_stax_api_1_0_2.xml b/.idea/libraries/Maven__javax_xml_stream_stax_api_1_0_2.xml new file mode 100644 index 0000000..2a4dd7a --- /dev/null +++ b/.idea/libraries/Maven__javax_xml_stream_stax_api_1_0_2.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__junit_junit_4_7.xml b/.idea/libraries/Maven__junit_junit_4_7.xml new file mode 100644 index 0000000..4402995 --- /dev/null +++ b/.idea/libraries/Maven__junit_junit_4_7.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__org_apache_commons_commons_lang3_3_1.xml b/.idea/libraries/Maven__org_apache_commons_commons_lang3_3_1.xml new file mode 100644 index 0000000..32bfe3b --- /dev/null +++ b/.idea/libraries/Maven__org_apache_commons_commons_lang3_3_1.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__org_apache_commons_commons_math3_3_2.xml b/.idea/libraries/Maven__org_apache_commons_commons_math3_3_2.xml new file mode 100644 index 0000000..dde81ab --- /dev/null +++ b/.idea/libraries/Maven__org_apache_commons_commons_math3_3_2.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__org_apache_commons_commons_math_2_1.xml b/.idea/libraries/Maven__org_apache_commons_commons_math_2_1.xml new file mode 100644 index 0000000..eaa8a65 --- /dev/null +++ b/.idea/libraries/Maven__org_apache_commons_commons_math_2_1.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__org_apache_hadoop_hadoop_core_1_2_1.xml b/.idea/libraries/Maven__org_apache_hadoop_hadoop_core_1_2_1.xml new file mode 100644 index 0000000..cd8023f --- /dev/null +++ b/.idea/libraries/Maven__org_apache_hadoop_hadoop_core_1_2_1.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__org_apache_lucene_lucene_analyzers_common_4_6_1.xml b/.idea/libraries/Maven__org_apache_lucene_lucene_analyzers_common_4_6_1.xml new file mode 100644 index 0000000..2717cd6 --- /dev/null +++ b/.idea/libraries/Maven__org_apache_lucene_lucene_analyzers_common_4_6_1.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__org_apache_lucene_lucene_core_4_6_1.xml b/.idea/libraries/Maven__org_apache_lucene_lucene_core_4_6_1.xml new file mode 100644 index 0000000..66fc4a9 --- /dev/null +++ b/.idea/libraries/Maven__org_apache_lucene_lucene_core_4_6_1.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__org_apache_mahout_commons_commons_cli_2_0_mahout.xml b/.idea/libraries/Maven__org_apache_mahout_commons_commons_cli_2_0_mahout.xml new file mode 100644 index 0000000..c672cac --- /dev/null +++ b/.idea/libraries/Maven__org_apache_mahout_commons_commons_cli_2_0_mahout.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__org_apache_mahout_mahout_core_0_9.xml b/.idea/libraries/Maven__org_apache_mahout_mahout_core_0_9.xml new file mode 100644 index 0000000..79debcc --- /dev/null +++ b/.idea/libraries/Maven__org_apache_mahout_mahout_core_0_9.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__org_apache_mahout_mahout_math_0_9.xml b/.idea/libraries/Maven__org_apache_mahout_mahout_math_0_9.xml new file mode 100644 index 0000000..98bd640 --- /dev/null +++ b/.idea/libraries/Maven__org_apache_mahout_mahout_math_0_9.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__org_apache_solr_solr_commons_csv_3_5_0.xml b/.idea/libraries/Maven__org_apache_solr_solr_commons_csv_3_5_0.xml new file mode 100644 index 0000000..36db039 --- /dev/null +++ b/.idea/libraries/Maven__org_apache_solr_solr_commons_csv_3_5_0.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__org_codehaus_jackson_jackson_core_asl_1_9_12.xml b/.idea/libraries/Maven__org_codehaus_jackson_jackson_core_asl_1_9_12.xml new file mode 100644 index 0000000..a02acc0 --- /dev/null +++ b/.idea/libraries/Maven__org_codehaus_jackson_jackson_core_asl_1_9_12.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__org_codehaus_jackson_jackson_jaxrs_1_7_1.xml b/.idea/libraries/Maven__org_codehaus_jackson_jackson_jaxrs_1_7_1.xml new file mode 100644 index 0000000..9039684 --- /dev/null +++ b/.idea/libraries/Maven__org_codehaus_jackson_jackson_jaxrs_1_7_1.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__org_codehaus_jackson_jackson_mapper_asl_1_9_12.xml b/.idea/libraries/Maven__org_codehaus_jackson_jackson_mapper_asl_1_9_12.xml new file mode 100644 index 0000000..2e3cd1a --- /dev/null +++ b/.idea/libraries/Maven__org_codehaus_jackson_jackson_mapper_asl_1_9_12.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__org_codehaus_jackson_jackson_xc_1_7_1.xml b/.idea/libraries/Maven__org_codehaus_jackson_jackson_xc_1_7_1.xml new file mode 100644 index 0000000..dc10a10 --- /dev/null +++ b/.idea/libraries/Maven__org_codehaus_jackson_jackson_xc_1_7_1.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__org_codehaus_jettison_jettison_1_1.xml b/.idea/libraries/Maven__org_codehaus_jettison_jettison_1_1.xml new file mode 100644 index 0000000..d62802e --- /dev/null +++ b/.idea/libraries/Maven__org_codehaus_jettison_jettison_1_1.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__org_slf4j_slf4j_api_1_7_5.xml b/.idea/libraries/Maven__org_slf4j_slf4j_api_1_7_5.xml new file mode 100644 index 0000000..6f808f1 --- /dev/null +++ b/.idea/libraries/Maven__org_slf4j_slf4j_api_1_7_5.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__stax_stax_api_1_0_1.xml b/.idea/libraries/Maven__stax_stax_api_1_0_1.xml new file mode 100644 index 0000000..0b13335 --- /dev/null +++ b/.idea/libraries/Maven__stax_stax_api_1_0_1.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__xmlpull_xmlpull_1_1_3_1.xml b/.idea/libraries/Maven__xmlpull_xmlpull_1_1_3_1.xml new file mode 100644 index 0000000..0f2d9ef --- /dev/null +++ b/.idea/libraries/Maven__xmlpull_xmlpull_1_1_3_1.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/libraries/Maven__xpp3_xpp3_min_1_1_4c.xml b/.idea/libraries/Maven__xpp3_xpp3_min_1_1_4c.xml new file mode 100644 index 0000000..6726a2d --- /dev/null +++ b/.idea/libraries/Maven__xpp3_xpp3_min_1_1_4c.xml @@ -0,0 +1,13 @@ + + + + + + + + + + + + + \ No newline at end of file diff --git a/.idea/misc.xml b/.idea/misc.xml new file mode 100644 index 0000000..d30d09e --- /dev/null +++ b/.idea/misc.xml @@ -0,0 +1,13 @@ + + + + + + + + + \ No newline at end of file diff --git a/.idea/modules.xml b/.idea/modules.xml new file mode 100644 index 0000000..6237568 --- /dev/null +++ b/.idea/modules.xml @@ -0,0 +1,8 @@ + + + + + + + + \ No newline at end of file diff --git a/.idea/vcs.xml b/.idea/vcs.xml new file mode 100644 index 0000000..35eb1dd --- /dev/null +++ b/.idea/vcs.xml @@ -0,0 +1,6 @@ + + + + + + \ No newline at end of file diff --git a/big-data.iml b/big-data.iml new file mode 100644 index 0000000..38c1e5e --- /dev/null +++ b/big-data.iml @@ -0,0 +1,56 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/src/test/java/nearsoft/academy/bigdata/recommendation/MovieRecommender.java b/src/test/java/nearsoft/academy/bigdata/recommendation/MovieRecommender.java new file mode 100644 index 0000000..96da4f9 --- /dev/null +++ b/src/test/java/nearsoft/academy/bigdata/recommendation/MovieRecommender.java @@ -0,0 +1,216 @@ +package nearsoft.academy.bigdata.recommendation; +import org.apache.mahout.cf.taste.common.TasteException; +import org.apache.mahout.cf.taste.impl.model.file.FileDataModel; +import org.apache.mahout.cf.taste.impl.neighborhood.ThresholdUserNeighborhood; +import org.apache.mahout.cf.taste.impl.recommender.GenericUserBasedRecommender; +import org.apache.mahout.cf.taste.impl.similarity.PearsonCorrelationSimilarity; +import org.apache.mahout.cf.taste.model.DataModel; +import org.apache.mahout.cf.taste.neighborhood.UserNeighborhood; +import org.apache.mahout.cf.taste.recommender.Recommender; +import org.apache.mahout.cf.taste.recommender.UserBasedRecommender; +import org.apache.mahout.cf.taste.recommender.RecommendedItem; +import org.apache.mahout.cf.taste.similarity.UserSimilarity; + +import java.io.*; +import java.util.*; +import java.util.zip.GZIPInputStream; + +public class MovieRecommender { + + String path; + private DataModel model; + private UserSimilarity similarity; + private UserNeighborhood neighborhood; + private UserBasedRecommender recommender; + + private HashMap products = new HashMap(); + private HashMap productsToString = new HashMap(); + private HashMap users = new HashMap(); + + private int keyProducts = 0; + private int keyPUsers = 0; + + + public MovieRecommender() throws IOException, TasteException { + createReccommendedFile("/Users/lromero/Desktop/LuisMario/AmazonProblem/recommenderFile.csv"); + + + } + + + int getTotalReviews(String archivo) throws FileNotFoundException, IOException { + String cadena; + String [] arreglo_datos; + InputStream stream = new GZIPInputStream(new FileInputStream("/Users/lromero/Desktop/LuisMario/AmazonProblem/movies.txt.gz")); + BufferedReader b = new BufferedReader(new InputStreamReader(stream, "US-ASCII")); + int i = 0; + String path = ""; + String TRV = ""; + char slash; + char u; + int contador = 0; + //char e; + HashSet set = new HashSet(); + while((cadena = b.readLine())!=null) { + try{ + if(cadena.contains("/summary:")){ + contador++; + } + }catch (IndexOutOfBoundsException ioub){ +// System.out.println("LLEGO VACIO EXCEPTION"); + } + } + + return contador; + } + + + int getTotalProducts(String archivo) throws FileNotFoundException, IOException { + String cadena; + String [] arreglo_datos; + InputStream stream = new GZIPInputStream(new FileInputStream("/Users/lromero/Desktop/LuisMario/AmazonProblem/movies.txt.gz")); + BufferedReader b = new BufferedReader(new InputStreamReader(stream, "US-ASCII")); + int i = 0; + String path = ""; + String TP = ""; + char slash; + char u; + //char e; + HashSet set = new HashSet(); + while((cadena = b.readLine())!=null) { + try{ + if(cadena.contains("/productId:")){ + TP = cadena.split(" ")[1]; + set.add(TP); + } + }catch (IndexOutOfBoundsException ioub){ +// System.out.println("LLEGO VACIO EXCEPTION"); + } + } + Iterator itr = set.iterator(); + int productID = 0; + while(itr.hasNext()) { + itr.next(); + productID++; + } + System.out.println("Total PID: "+productID); + b.close(); + return productID; + } + + + int getTotalUsers(String archivo) throws FileNotFoundException, IOException { + String cadena; + String [] arreglo_datos; + InputStream stream = new GZIPInputStream(new FileInputStream("/Users/lromero/Desktop/LuisMario/AmazonProblem/movies.txt.gz")); + BufferedReader b = new BufferedReader(new InputStreamReader(stream, "US-ASCII")); + int i = 0; + String path = ""; + String pdID = ""; + char slash; + char u; + //char e; + HashSet set = new HashSet(); + while((cadena = b.readLine())!=null) { + try{ + if(cadena.startsWith("review/user")){ + pdID = cadena.split(" ")[1]; + set.add(pdID); + } + }catch (IndexOutOfBoundsException ioub){ +// System.out.println("LLEGO VACIO EXCEPTION"); + } + } + Iterator itr = set.iterator(); + int totalUsers = 0; + while(itr.hasNext()) { + itr.next(); + totalUsers++; + } + System.out.println("Total users: "+totalUsers); + b.close(); + return totalUsers; + } + + void createReccommendedFile(String archivo) throws IOException, TasteException { + InputStream stream = new GZIPInputStream(new FileInputStream("/Users/lromero/Desktop/LuisMario/AmazonProblem/movies.txt.gz")); + BufferedReader b = new BufferedReader(new InputStreamReader(stream, "US-ASCII")); + String cadena; + File csv = new File("/Users/lromero/Desktop/LuisMario/AmazonProblem/recommenderFile.csv"); + if (!csv.exists()) { + csv.createNewFile(); + } + FileWriter fw = new FileWriter(csv); + BufferedWriter bw = new BufferedWriter(fw); + + long productId = 0, userId = 0; + while((cadena = b.readLine())!=null) { + String prefijo = cadena.split(" ")[0]; + if(prefijo.equals("product/productId:")) { + String pdID = cadena.split(" ")[1]; + if (products.containsKey(pdID)) { + productId = products.get(pdID); + }else { +// System.out.println("Product " + key); + products.put(pdID, (long) keyProducts); + productsToString.put((long) keyProducts, pdID); + productId = keyProducts; + keyProducts++; + } + } + + if(prefijo.equals("review/userId:")){ + String usID = cadena.split(" ")[1]; + if (users.containsKey(usID)) { + userId = users.get(usID); + }else { +// System.out.println("User: " + key); + users.put(usID, (long) keyPUsers); + userId = keyPUsers; + keyPUsers++; + + } + } + + if(prefijo.equals("review/score:")){ + String rvSC = cadena.split(" ")[1]; +// System.out.println("Score " + rvSC); + bw.write(userId + "," + productId + "," + rvSC+"\n"); + } + + } + bw.close(); + + + + + } + + + + public List getRecommendationsForUser(String user) throws IOException, TasteException { + List stringList = new ArrayList(); + //List recommendations = new ArrayList(); + DataModel model = new FileDataModel(new File("/Users/lromero/Desktop/LuisMario/AmazonProblem/recommenderFile.csv")); + UserSimilarity similarity = new PearsonCorrelationSimilarity(model); + UserNeighborhood neighborhood = new ThresholdUserNeighborhood(0.1, similarity, model); + UserBasedRecommender recommender = new GenericUserBasedRecommender(model, neighborhood, similarity); + + System.out.println("User: " + users.get(user)); + //List recommendations = recommender.recommend(users.get(user), 3); + for (RecommendedItem recommendation : recommender.recommend(users.get(user), 3)) { + System.out.println(recommendation.getItemID()); + stringList.add(productsToString.get(recommendation.getItemID())); + + } +// List getValues = new ArrayList(); + System.out.println(stringList); + return stringList; + } + +// public static void main(String[] args) throws IOException, TasteException { +// MovieRecommender call = new MovieRecommender(); +// call.getRecommendationsForUser("A141HP4LYPWMSR"); +// } + +} diff --git a/src/test/java/nearsoft/academy/bigdata/recommendation/MovieRecommenderTest.java b/src/test/java/nearsoft/academy/bigdata/recommendation/MovieRecommenderTest.java index eb999af..7b46acf 100644 --- a/src/test/java/nearsoft/academy/bigdata/recommendation/MovieRecommenderTest.java +++ b/src/test/java/nearsoft/academy/bigdata/recommendation/MovieRecommenderTest.java @@ -15,10 +15,10 @@ public class MovieRecommenderTest { public void testDataInfo() throws IOException, TasteException { //download movies.txt.gz from // http://snap.stanford.edu/data/web-Movies.html - MovieRecommender recommender = new MovieRecommender("/Desktop/LuisMario/AmazonProblem/movies.txt.gz"); - assertEquals(7911684, recommender.getTotalReviews()); // - assertEquals(253059, recommender.getTotalProducts()); // product/productId: - assertEquals(889176, recommender.getTotalUsers()); + MovieRecommender recommender = new MovieRecommender(); + assertEquals(7911684, recommender.getTotalReviews("Users/Desktop/LuisMario/AmazonProblem/movies.txt.gz")); // + assertEquals(253059, recommender.getTotalProducts("Users/Desktop/LuisMario/AmazonProblem/movies.txt.gz")); // product/productId: + assertEquals(889176, recommender.getTotalUsers("Users/Desktop/LuisMario/AmazonProblem/movies.txt.gz")); // get a token with a review and saved it if it's not already defined, but if it's already defined plus one // diff --git a/src/test/java/nearsoft/academy/bigdata/recommendation/test.java b/src/test/java/nearsoft/academy/bigdata/recommendation/test.java new file mode 100644 index 0000000..779ee15 --- /dev/null +++ b/src/test/java/nearsoft/academy/bigdata/recommendation/test.java @@ -0,0 +1,176 @@ +package nearsoft.academy.bigdata.recommendation; + +import java.io.*; +import java.util.*; +import java.util.zip.GZIPInputStream; + +public class test { + +// void muestraContenido(String archivo) throws FileNotFoundException, IOException { +// String cadena; +// String [] arreglo_datos; +//// FileReader f = new FileReader("/Users/lromero/Desktop/LuisMario/AmazonProblem/movies.txt.gz"); +//// BufferedReader b = new BufferedReader(f); +// InputStream stream = new GZIPInputStream(new FileInputStream("/Users/lromero/Desktop/LuisMario/AmazonProblem/moviesTest2.txt.gz")); +// BufferedReader b = new BufferedReader(new InputStreamReader(stream, "US-ASCII")); +// int i = 0; +// String path = ""; +// String pdID = ""; +// HashSet set = new HashSet(); +// while((cadena = b.readLine())!=null) { +// if(!(cadena.equals(""))){ +// pdID = ""; +// path = ""; +// for (int j = 0; j < cadena.length(); j++) { +// if(!(path.equals("product/productId:"))){ +// path += cadena.charAt(j); +// }else{ +// for (int k = 0; k < 10; k++) { +// pdID += cadena.charAt(j+1); +// j++; +// if(pdID.length() == 10) { +// j = cadena.length(); +// break; +// } +// } +// } +// } +// if(!(pdID.equals(""))) { +// //System.out.println("PRODUCT ID CATCHED: " + pdID); +// set.add(pdID); +// } +// +// }else { +// for (int j = 0; j < cadena.length(); j++) { +// if(!(path.equals("product/productId:"))){ +// path += cadena.charAt(j); +// }else{ +// for (int k = 0; k < 10; k++) { +// pdID += cadena.charAt(j+1); +// j++; +// if(pdID.length() == 10){ +// j = cadena.length(); +// break; +// } +// +// } +// } +// } +// if(!(pdID.equals(""))) { +// //System.out.println("PRODUCT ID CATCHED: " + pdID); +// set.add(pdID); +// } +// } +// } +// Iterator itr = set.iterator(); +// int pdIDCounter = 0; +// while(itr.hasNext()) { +// System.out.println(itr.next()); +// pdIDCounter++; +// } +// System.out.println("Numero sin repetir de Products Id: "+pdIDCounter); +// b.close(); +// } + + + int getTotalUsers(String archivo) throws FileNotFoundException, IOException { + String cadena; + String [] arreglo_datos; + InputStream stream = new GZIPInputStream(new FileInputStream("/Users/lromero/Desktop/LuisMario/AmazonProblem/movies.txt.gz")); + BufferedReader b = new BufferedReader(new InputStreamReader(stream, "US-ASCII")); + int i = 0; + String path = ""; + String pdID = ""; + char slash; + char u; + //char e; + HashSet set = new HashSet(); + while((cadena = b.readLine())!=null) { + try{ + if(cadena.startsWith("review/user")){ + pdID = cadena.split(" ")[1]; + set.add(pdID); + } + }catch (IndexOutOfBoundsException ioub){ +// System.out.println("LLEGO VACIO EXCEPTION"); + } + } + Iterator itr = set.iterator(); + int totalUsers = 0; + while(itr.hasNext()) { + itr.next(); + totalUsers++; + } + System.out.println("Total users: "+totalUsers); + b.close(); + return totalUsers; + } + + + + int getTotalReviews(String archivo) throws FileNotFoundException, IOException { + String cadena; + String [] arreglo_datos; +// FileReader f = new FileReader("/Users/lromero/Desktop/LuisMario/AmazonProblem/movies.txt.gz"); +// BufferedReader b = new BufferedReader(f); + InputStream stream = new GZIPInputStream(new FileInputStream("/Users/lromero/Desktop/LuisMario/AmazonProblem/moviesTest3.txt.gz")); + BufferedReader b = new BufferedReader(new InputStreamReader(stream, "US-ASCII")); + int i = 0; + String path = ""; + String pdID = ""; + char slash; + char t; + char e; + int reviewCounter = 0; + + HashSet set = new HashSet(); + while((cadena = b.readLine())!=null) { + try{ + slash = cadena.charAt(6); + t = cadena.charAt(7); + e = cadena.charAt(8); + if(slash == '/' && t == 't' && e == 'e'){ + reviewCounter++; + } +// + }catch (IndexOutOfBoundsException ioub){ +// System.out.println("LLEGO VACIO EXCEPTION"); + } + + + } + + System.out.println("Total Reviews: "+reviewCounter); + return reviewCounter; + } + + public Map findDuplicateString(String str) { + String[] stringArrays = str.split(" "); + Map map = new HashMap(); + Set words = new HashSet(Arrays.asList(stringArrays)); + int count = 0; + for (String word : words) { + for (String temp : stringArrays) { + if (word.equals(temp)) { + ++count; + } + } + map.put(word, count); + count = 0; + } + + return map; + + } + + public static void main(String[] args) throws IOException { + test call = new test(); + //call.muestraContenido("/Users/lromero/Desktop/LuisMario/AmazonProblem/smalltest.txt "); + //call.findDuplicateString("d"); + //call.getTotalReviews("/Users/lromero/Desktop/LuisMario/AmazonProblem/smalltest.txt "); + //call.getTotalReviews("/Users/lromero/Desktop/LuisMario/AmazonProblem/smalltest.txt "); + call.getTotalUsers("/Users/lromero/Desktop/LuisMario/AmazonProblem/movies.txt.gz "); + + } + +} diff --git a/target/maven-status/maven-compiler-plugin/testCompile/default-testCompile/createdFiles.lst b/target/maven-status/maven-compiler-plugin/testCompile/default-testCompile/createdFiles.lst new file mode 100644 index 0000000..e69de29 diff --git a/target/maven-status/maven-compiler-plugin/testCompile/default-testCompile/inputFiles.lst b/target/maven-status/maven-compiler-plugin/testCompile/default-testCompile/inputFiles.lst new file mode 100644 index 0000000..fa44f53 --- /dev/null +++ b/target/maven-status/maven-compiler-plugin/testCompile/default-testCompile/inputFiles.lst @@ -0,0 +1,3 @@ +/Users/lromero/Desktop/LuisMario/AmazonProblem/big-data-exercises/src/test/java/nearsoft/academy/bigdata/recommendation/MovieRecommender.java +/Users/lromero/Desktop/LuisMario/AmazonProblem/big-data-exercises/src/test/java/nearsoft/academy/bigdata/recommendation/test.java +/Users/lromero/Desktop/LuisMario/AmazonProblem/big-data-exercises/src/test/java/nearsoft/academy/bigdata/recommendation/MovieRecommenderTest.java diff --git a/target/surefire-reports/TEST-nearsoft.academy.bigdata.recommendation.MovieRecommenderTest.xml b/target/surefire-reports/TEST-nearsoft.academy.bigdata.recommendation.MovieRecommenderTest.xml new file mode 100644 index 0000000..80f0636 --- /dev/null +++ b/target/surefire-reports/TEST-nearsoft.academy.bigdata.recommendation.MovieRecommenderTest.xml @@ -0,0 +1,68 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/target/surefire-reports/nearsoft.academy.bigdata.recommendation.MovieRecommenderTest.txt b/target/surefire-reports/nearsoft.academy.bigdata.recommendation.MovieRecommenderTest.txt new file mode 100644 index 0000000..57dcd7a --- /dev/null +++ b/target/surefire-reports/nearsoft.academy.bigdata.recommendation.MovieRecommenderTest.txt @@ -0,0 +1,4 @@ +------------------------------------------------------------------------------- +Test set: nearsoft.academy.bigdata.recommendation.MovieRecommenderTest +------------------------------------------------------------------------------- +Tests run: 1, Failures: 0, Errors: 0, Skipped: 0, Time elapsed: 609.375 sec diff --git a/target/test-classes/nearsoft/academy/bigdata/recommendation/MovieRecommender.class b/target/test-classes/nearsoft/academy/bigdata/recommendation/MovieRecommender.class new file mode 100644 index 0000000000000000000000000000000000000000..3aaedc53f8a2bf3ee68207765c43904a2ac27cdc GIT binary patch literal 7365 zcmcIp33waTwf?UyYsRB-APP<*2x~&(7~4t$*g;MLN!$bnCvjsF$3WALrLjFh(umP0 ziCv&AP2MYADU`k!ULSqkUfR-9N0{LpBencu?cBs9;LL zLn=;a(D6HlLTx7c_hkUy>rftl}$D$X8W- zO~KbS#HBTHd_y+hRPZeg7vtLszN6t%d{@QyL+ayZA(Qu^{`&$h=@H+*+4_|)bnEbm-Lm&R2;Ex*m z@h263mV*8g!C&#W2%f;l6r7A;uK*7qgdE|)zbNVyQLl)QKqzOp;{wsX1I9rko;I>$ z@d4MdvSZx>4H-LSrUlyiY-cQPY#Cr_a*eQG5rsb`S zl{Os9oe=1pZ*O&B{OY{v4EXyfMbDbn*!YO;jN5ifATghu;8IW0uE1W(ia2J{&ScDN z%5(%a&L=9c(v!5s$eXD>)$Np~<{Ud!NV<7}MJ3n@u9c2oY2?Ru8aXa#9I(c+hFfq< zfv(vrHq6F4Fw$oe`%RQ`dPU8kU1H=P3iGxGM3sq@!Ws(1mj*|!Hz)di^F=R>l_L^; z&W1NwSmmv$E!{LT1Et291$4N1}ap(n#+m#qzy87;?ug%1HEO zO~c9Cqi)&}vURoHTQCHm`^VMTDt+%yb8B z*GTU%x%?0{G`Gw?<7%EnF`VSMbPTqA)Bf~wVEtVbc&E^U&k>N0L5hDUi z{kbiL(NWWpd~?4er!8VJxQAG%NjvKrDVzRNpEupv)DM_0H!QA2W+GQXXH`jw?@U4N0%e3eZIvZ+suO6c=qmd_ zD3_8FG*@C?9$TCwT(0D*a*a~kEa?byQXxI3ke5P2&cT7LBqryWqt*cuQ=iNq6jcdH>i95@H7_m!96smlzM`dza^N`E9l%Pb9En zE*A>G+Gph@n+s|^R$%>84IRE>Ge!KRr`1_2JY1xDjc&;hE47g9*?L#Z7#vK5(0Og+`9daRI1>p)H0ff2I89)=r@%|bz06sMcNg5< zqg(7kHkJ1SBx8BJa^q78`u=&kI9)8%MN}-(#TlYm5sP)PL@d=sOq{8RvvjdcoLvDf zkm$D*thARGBVL$2ufMk^L0RXBb7jNc`9fF31-e*HWW);T6U?VF7RTjP)5V2iCBsN* zvmD7M&SUznU?h3f#VTn>i&)Cs5u7O9Vu{k~IqdyBE#;@!g3++~c#a<1e|^zLq5 zY!Dk2!TO?e9;<^YW`t2)TrLS+F0PQxX2#=xw$@IUYQmIF6e1VTu+thrj}o+>4Tz^(NbFRCssmn>3* z%4D6AH5+qk%j(%XYtCM(5i9kLm1TW(Rxqt>9XFf-^M-<%O`6@SuVE#b&!sJbwJNx( zB&B=xwR35!H&RT;HKjrcaZjEq^Smr!7yv5P*3>P`ou!yjGs>!B+{o`T57QJ@t28W> z^Vk-tO+u^p8g<%NJsabC^LrKH?QKb6I{_sxSIL8EIfOU3BDIG;Z#UB@4xG=83e z{cP*-Ogzhb8W{1ONu<1|iBa##nwMpq<@FD6J$1H7s@H~aCQidy zY?t9eoP$=J%O9hb^B1I*C~$>d(uRXL#J9uzglWkHCfR#7t?{f9YdE@qBm1Wj8J>nd z9BrDyf+?Jq2ulaI`t0@T1muMy9cthgg!(V+}M!E+I! z{PlPqZb1XJT#DzDn=o~)^}ImgvmHmcL#5tU9OZ0;dd|mx;6I7s3uvoEvNUol`xPW# zNGyRD`AELCjO0D1jARAIh!5k+w&*es#^$!@*+rZaT9;5`k(gS|G!*bfk&k|MY$=pT-I@bYXO55v!V;ifAcfbrG#n(M8Qo zl9nD`f)SsVy=dm4wiCQ730p4#+d+7)B1pSQSwC0r!A=q~ghB4x$DMn5W%lvQ;Wc#r zYw7OS(Yc;MkoV(OUar@{z#F+rI%JN(0{8fo-BYG)GYQi=$Pua~rWs`WZ zM_GazB~cM---wssr6lMETKY25*yNG7n66M-b*sPXwpld3{NF`mTM_NY@UNn=_4ce&FWQI2-0t;1Xu zdKOayHC^s$dU~yht1vmhs4z zHwYbX6zAYg;zGPx#PK$98SWE3xL@3W2Zf8Gn838>wJ&A9xdm5K(|!hq$FY?<*yGxE zYLa6a5u(2R3=I&Il_14lDX%OPmKU1puv`pzp{X9v6lZyXD})Zw$MAa>Gt72zF)e-- zy>E|bq0M(g!PT_x)%ZVVn0?{`yoNo^&muA(3!dq9%!{lN#Esn9NVFcA#x_Ro?R3{G znT5*^I)z?(>yF{}DO@EJbl>n9*cl7)b$6m+8vVoVv4&V^3Qtdj1Hpd}xslXgR79eP zfpQ86SB6Ti7(Ri)5KhooB$Sv^&L~~7$BgnY_9j${jHxFuBv8b@Hg0byzj|()IDz3h zFg<;c>lpT~X}gc-C}sO~5>*OO@qWbc0eZnBSjT^nU4aiVNqmIdKSoqOiigPYG(O2y zpYm9{j#%8m>gM%$1NYv9P56I$g(C5(FvQ+*vc@m7co$>Tn|S|YOfs^vtEZmVFaeFQ p23SYtWp&p;okt++yRe_zOFQ4pot4}!St(V0_fYa%sILxh{X6JrxKIE9 literal 0 HcmV?d00001 diff --git a/target/test-classes/nearsoft/academy/bigdata/recommendation/MovieRecommenderTest.class b/target/test-classes/nearsoft/academy/bigdata/recommendation/MovieRecommenderTest.class new file mode 100644 index 0000000000000000000000000000000000000000..85e50ce2f726ece948fd8d2575823d125429cb40 GIT binary patch literal 1739 zcmbVNT~{MT5WSrQ60*aG0iyVcin|FxIzVJ`LDnoEk~mo)1d!uX6Pjc&GlMgomEBj5 zKfs^j3ybbK`{1L$!QbMsdL{u}^F$t|s%}qJ->O?l{`%*S*8t{ln8XAMaeR?P1cg4r zfQ#Q_2`p;hVG>LDGDM?)|E!@$VKn&bcRE^5U`5-n5?D>*F}~Ib#RQ%tuolO95@{6l zVb9*43F+yohlDsmkJ0F*%9+hJQKXFtQI$|;QI7`dwYJ~?QiOhcUQu=C7cG|Q=a8C zmRISLdaIC1Y6F_oe6ab?N`0 z+;eWWEx$s0;qsy_UbxPV=TgTux3$*(th!LMjTZ(=D97=w0TUGiPf<3ojWWYfajr18 zwNo&Ub`C3hRRcTNrCy%o^ZEJhheu2MaS*tNnt^@Lf(9q~!rE?)mNyI*7Y>)^8CLGv zk=DS#$9gIw!EOZlZXch?x}uo}5Or7DzLuFGuO$@cqTZC;7EQOUc>RO6U_GQXty%!_hnl$v2 zc3siYU>6EhqD`Rq`WqLn;HK;8Lx!nd1m4(r+V9C5KDJQQGO1tQr}eFLB8GTV_$4K6 zhUwci!yztbOyg^E{E_<)}M0XT>c$v46m@DU~{Vp@4BqLcqbj69(F3X!9ih?--F5Zi2rhh z#25yG;9eLQK`^9)Tx$3dBbAxdTUSV3VRR-n)^)~1M>B~AOzvZV{1g%x#W=?B2|YP+ zStK@(iOUutyO;`?PKIncOcN;6*{8&Kk=Rb*GwSU=)zbZh$OA$$g!GfmVj8)?XP6;7 zfX^{YxbCw=HbQpr71Gq_+h*<(@7xS)D7f|kQOr>BY(OO)CJ@y;B__~Ee^irn@$Ksv K=IJbgg?|Ap7Pxr; literal 0 HcmV?d00001 diff --git a/target/test-classes/nearsoft/academy/bigdata/recommendation/test.class b/target/test-classes/nearsoft/academy/bigdata/recommendation/test.class new file mode 100644 index 0000000000000000000000000000000000000000..40c91822ba0c8a00caffe02c12853f2c6e2e5d95 GIT binary patch literal 4156 zcmbVP>wgqi8Ga^vna%7hgoUMS3j%UWAjw)<*Sb(NB!zBG2qi!a#o}alk__zbY-VPY zkXA||Xp5It?L{iKNY&H=l~&zAqu6>ut=CU}@ta@$AH?U(-c9`dw7>jz&Y5%G^Io3k zecvs$e@z8F?Aw0ayw=uoX1Hkx`H_5x}H^0HzekI2pjSj3*R?V2bxA z1Nef1tvD6HQ(`!0h|}(m&M~N;_+1lU&C`k z-}3={UFi8n0N<4Hf`U!L&Wm_S=zBScZ{e(r3qs-*1>eTSAijfFWxS@KQ|P@U#_!6w zEWy9i$QjNq37*!r!xFsRW?Gl9wAaY#`wH1%-8!fZXSfpXHB(yVux1(Jy}amk#td6R zXKzl|EZZD$Vp>W|>)DgBVPiC{IaT^P%0oY;<~YgsBPi5X@rnadX( zs^T&YO2ZOXRrhumMn-f?Pan{E-V)mef3)Y#YtEP$(#akoV(X5C<)vc<$H>GU*6gtX zT}0q9981EAy1k^MTbg4Eb&69L+sa1ZPUb7%ZK*q4R=l&cR1d>0>MNt;x==CmUqqFM zrc!!dU~S8IUB>swWd-a5`h=lR5^kTJVIT~-n?Hsqk>8Nz?sl7n90Ot4BStRWQ^;qG zl;-FqP9$ttjHtRe`m{X#^*VYs&q1@Sjnwqm!l<~J(R18vGWhULnpRriEihI2B>!EO zrJba&o~%YyOBdMii8I`<-zib!ONkgH#2e2n0$812Nk%=&To7KU%Et6%Njb%;d zfZgd#Ih~`^!ut2c;|GkRVxqA)Bt$D4b#_aIBO!2TprdP`JDC(pX2s(T36QX?7Ed{| zRs0ZdN(h#+ELLFMtGI%zOult0uHh{eKf-ll@1ArEAel?+Q~d>}e`GfaP21JXR`E98 zk?~^{KfzB`6fq~`hKiebw}Mn%0qrgr85TJc+-*4Pgk?KHoAdaYc>G+&Exak?7b@Np zV7xE*==xBo9we*xRiXVQe#Pu887)^{V%-90STHhvt>QPhE#UjDjNeIUsew=`JQcsk zbr~P1_yhhZ<4-F7jK4@||9{%9gapLun<`4g(a%}apx_3?t1 zVMi}Dw{nYeZwi1q&*xiV!3yFA`lHm14XPDoW1k+ggSfYZ_!{8D-)_G9*U|rahHS( zSSDtxBn-}kq}e&3FtVB5j=}A zybc3z;J6E29zg+56}l_fi3jOH7x#B@)~r!&!hnjbkq!rsf>qlX!##jdS%gJP|@K?X9HVl2l(+Y9FQgx##EJentsKS)uVF zSC?|-VwJ{^{*N?z;%bG-P?gCY?JfQyHpH9TTVydR?JZ<+Lp&I1Zi!vOiipzUTtX-k zY|$^lKckYj+leK!ciyifZ=)bjt&$f}1#f#XNfau)JwogNhtC4Bn;>eF#A}L3J<04o zMQonpiKiL$8FF`)+|5w>9Hq`v%QKWZPl@M<|MMbA76@ zCehjucSZ4~nZGI#IK9oSm%e#yV%~4wCkSc3fh}`rO?W+VU(|aOZ4wgxsJ~n@{bI(N zc@J9?ay!c`a4X*Ii7OE$(tH_fqJfCAos}tza@%%+6#1kXg)IG}BPvIHH_(0)9Ucr) z_w1c(9oOkYsgmOK7I=Z#`Xck`C9KBFSj&GdcM;=3yaJ8?Tc$Zbj#tUkYpj|}?XLVdn!&6K1@t5Rc>YGySbrv}k0dpS07Y?((V zp^o)#3xBMLdk1T6a|zD^v-JBaZNBA3CaRHVaDtwII{{?aNF}!#y&NCqFUy@K Date: Wed, 9 Oct 2019 13:08:26 -0700 Subject: [PATCH 3/8] This class was made for sending the total of users, products and reviews as well as for sending recommendations to a specific user --- .idea/$PRODUCT_WORKSPACE_FILE$ | 19 -- .idea/.gitignore | 3 - .idea/.name | 1 - .idea/compiler.xml | 16 -- .idea/encodings.xml | 6 - .idea/libraries/Maven__asm_asm_3_1.xml | 13 -- .../Maven__com_google_guava_guava_16_0.xml | 13 -- .../Maven__com_sun_jersey_jersey_core_1_8.xml | 13 -- .../Maven__com_sun_jersey_jersey_json_1_8.xml | 13 -- ...aven__com_sun_jersey_jersey_server_1_8.xml | 13 -- ...en__com_sun_xml_bind_jaxb_impl_2_2_3_1.xml | 13 -- ...com_thoughtworks_xstream_xstream_1_4_4.xml | 13 -- ...mons_beanutils_commons_beanutils_1_7_0.xml | 13 -- ...beanutils_commons_beanutils_core_1_8_0.xml | 13 -- .../Maven__commons_cli_commons_cli_1_2.xml | 13 -- ...Maven__commons_codec_commons_codec_1_4.xml | 13 -- ..._collections_commons_collections_3_2_1.xml | 13 -- ...onfiguration_commons_configuration_1_6.xml | 13 -- ..._commons_digester_commons_digester_1_8.xml | 13 -- .../Maven__commons_el_commons_el_1_0.xml | 13 -- ...ns_httpclient_commons_httpclient_3_0_1.xml | 13 -- .../Maven__commons_io_commons_io_2_1.xml | 13 -- .../Maven__commons_lang_commons_lang_2_4.xml | 13 -- ..._commons_logging_commons_logging_1_0_3.xml | 13 -- .../Maven__commons_net_commons_net_1_4_1.xml | 13 -- ...Maven__javax_activation_activation_1_1.xml | 13 -- .../Maven__javax_xml_bind_jaxb_api_2_2_2.xml | 13 -- ...Maven__javax_xml_stream_stax_api_1_0_2.xml | 13 -- .idea/libraries/Maven__junit_junit_4_7.xml | 13 -- ...__org_apache_commons_commons_lang3_3_1.xml | 13 -- ...__org_apache_commons_commons_math3_3_2.xml | 13 -- ...n__org_apache_commons_commons_math_2_1.xml | 13 -- ...n__org_apache_hadoop_hadoop_core_1_2_1.xml | 13 -- ...e_lucene_lucene_analyzers_common_4_6_1.xml | 13 -- ...n__org_apache_lucene_lucene_core_4_6_1.xml | 13 -- ..._mahout_commons_commons_cli_2_0_mahout.xml | 13 -- ...ven__org_apache_mahout_mahout_core_0_9.xml | 13 -- ...ven__org_apache_mahout_mahout_math_0_9.xml | 13 -- ...org_apache_solr_solr_commons_csv_3_5_0.xml | 13 -- ...dehaus_jackson_jackson_core_asl_1_9_12.xml | 13 -- ...g_codehaus_jackson_jackson_jaxrs_1_7_1.xml | 13 -- ...haus_jackson_jackson_mapper_asl_1_9_12.xml | 13 -- ..._org_codehaus_jackson_jackson_xc_1_7_1.xml | 13 -- ...en__org_codehaus_jettison_jettison_1_1.xml | 13 -- .../Maven__org_slf4j_slf4j_api_1_7_5.xml | 13 -- .../libraries/Maven__stax_stax_api_1_0_1.xml | 13 -- .../Maven__xmlpull_xmlpull_1_1_3_1.xml | 13 -- .../libraries/Maven__xpp3_xpp3_min_1_1_4c.xml | 13 -- .idea/misc.xml | 13 -- .idea/modules.xml | 8 - .idea/vcs.xml | 6 - .../recommendation/MovieRecommender.java | 162 +++--------------- 52 files changed, 26 insertions(+), 767 deletions(-) delete mode 100644 .idea/$PRODUCT_WORKSPACE_FILE$ delete mode 100644 .idea/.gitignore delete mode 100644 .idea/.name delete mode 100644 .idea/compiler.xml delete mode 100644 .idea/encodings.xml delete mode 100644 .idea/libraries/Maven__asm_asm_3_1.xml delete mode 100644 .idea/libraries/Maven__com_google_guava_guava_16_0.xml delete mode 100644 .idea/libraries/Maven__com_sun_jersey_jersey_core_1_8.xml delete mode 100644 .idea/libraries/Maven__com_sun_jersey_jersey_json_1_8.xml delete mode 100644 .idea/libraries/Maven__com_sun_jersey_jersey_server_1_8.xml delete mode 100644 .idea/libraries/Maven__com_sun_xml_bind_jaxb_impl_2_2_3_1.xml delete mode 100644 .idea/libraries/Maven__com_thoughtworks_xstream_xstream_1_4_4.xml delete mode 100644 .idea/libraries/Maven__commons_beanutils_commons_beanutils_1_7_0.xml delete mode 100644 .idea/libraries/Maven__commons_beanutils_commons_beanutils_core_1_8_0.xml delete mode 100644 .idea/libraries/Maven__commons_cli_commons_cli_1_2.xml delete mode 100644 .idea/libraries/Maven__commons_codec_commons_codec_1_4.xml delete mode 100644 .idea/libraries/Maven__commons_collections_commons_collections_3_2_1.xml delete mode 100644 .idea/libraries/Maven__commons_configuration_commons_configuration_1_6.xml delete mode 100644 .idea/libraries/Maven__commons_digester_commons_digester_1_8.xml delete mode 100644 .idea/libraries/Maven__commons_el_commons_el_1_0.xml delete mode 100644 .idea/libraries/Maven__commons_httpclient_commons_httpclient_3_0_1.xml delete mode 100644 .idea/libraries/Maven__commons_io_commons_io_2_1.xml delete mode 100644 .idea/libraries/Maven__commons_lang_commons_lang_2_4.xml delete mode 100644 .idea/libraries/Maven__commons_logging_commons_logging_1_0_3.xml delete mode 100644 .idea/libraries/Maven__commons_net_commons_net_1_4_1.xml delete mode 100644 .idea/libraries/Maven__javax_activation_activation_1_1.xml delete mode 100644 .idea/libraries/Maven__javax_xml_bind_jaxb_api_2_2_2.xml delete mode 100644 .idea/libraries/Maven__javax_xml_stream_stax_api_1_0_2.xml delete mode 100644 .idea/libraries/Maven__junit_junit_4_7.xml delete mode 100644 .idea/libraries/Maven__org_apache_commons_commons_lang3_3_1.xml delete mode 100644 .idea/libraries/Maven__org_apache_commons_commons_math3_3_2.xml delete mode 100644 .idea/libraries/Maven__org_apache_commons_commons_math_2_1.xml delete mode 100644 .idea/libraries/Maven__org_apache_hadoop_hadoop_core_1_2_1.xml delete mode 100644 .idea/libraries/Maven__org_apache_lucene_lucene_analyzers_common_4_6_1.xml delete mode 100644 .idea/libraries/Maven__org_apache_lucene_lucene_core_4_6_1.xml delete mode 100644 .idea/libraries/Maven__org_apache_mahout_commons_commons_cli_2_0_mahout.xml delete mode 100644 .idea/libraries/Maven__org_apache_mahout_mahout_core_0_9.xml delete mode 100644 .idea/libraries/Maven__org_apache_mahout_mahout_math_0_9.xml delete mode 100644 .idea/libraries/Maven__org_apache_solr_solr_commons_csv_3_5_0.xml delete mode 100644 .idea/libraries/Maven__org_codehaus_jackson_jackson_core_asl_1_9_12.xml delete mode 100644 .idea/libraries/Maven__org_codehaus_jackson_jackson_jaxrs_1_7_1.xml delete mode 100644 .idea/libraries/Maven__org_codehaus_jackson_jackson_mapper_asl_1_9_12.xml delete mode 100644 .idea/libraries/Maven__org_codehaus_jackson_jackson_xc_1_7_1.xml delete mode 100644 .idea/libraries/Maven__org_codehaus_jettison_jettison_1_1.xml delete mode 100644 .idea/libraries/Maven__org_slf4j_slf4j_api_1_7_5.xml delete mode 100644 .idea/libraries/Maven__stax_stax_api_1_0_1.xml delete mode 100644 .idea/libraries/Maven__xmlpull_xmlpull_1_1_3_1.xml delete mode 100644 .idea/libraries/Maven__xpp3_xpp3_min_1_1_4c.xml delete mode 100644 .idea/misc.xml delete mode 100644 .idea/modules.xml delete mode 100644 .idea/vcs.xml diff --git a/.idea/$PRODUCT_WORKSPACE_FILE$ b/.idea/$PRODUCT_WORKSPACE_FILE$ deleted file mode 100644 index 3733e0d..0000000 --- a/.idea/$PRODUCT_WORKSPACE_FILE$ +++ /dev/null @@ -1,19 +0,0 @@ - - - - - - - 1.8 - - - - - - - - \ No newline at end of file diff --git a/.idea/.gitignore b/.idea/.gitignore deleted file mode 100644 index 0e40fe8..0000000 --- a/.idea/.gitignore +++ /dev/null @@ -1,3 +0,0 @@ - -# Default ignored files -/workspace.xml \ No newline at end of file diff --git a/.idea/.name b/.idea/.name deleted file mode 100644 index a6f69a2..0000000 --- a/.idea/.name +++ /dev/null @@ -1 +0,0 @@ -big-data \ No newline at end of file diff --git a/.idea/compiler.xml b/.idea/compiler.xml deleted file mode 100644 index 81ad3ee..0000000 --- a/.idea/compiler.xml +++ /dev/null @@ -1,16 +0,0 @@ - - - - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/encodings.xml b/.idea/encodings.xml deleted file mode 100644 index b26911b..0000000 --- a/.idea/encodings.xml +++ /dev/null @@ -1,6 +0,0 @@ - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__asm_asm_3_1.xml b/.idea/libraries/Maven__asm_asm_3_1.xml deleted file mode 100644 index 3386f10..0000000 --- a/.idea/libraries/Maven__asm_asm_3_1.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__com_google_guava_guava_16_0.xml b/.idea/libraries/Maven__com_google_guava_guava_16_0.xml deleted file mode 100644 index 91cff2f..0000000 --- a/.idea/libraries/Maven__com_google_guava_guava_16_0.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__com_sun_jersey_jersey_core_1_8.xml b/.idea/libraries/Maven__com_sun_jersey_jersey_core_1_8.xml deleted file mode 100644 index bf486c9..0000000 --- a/.idea/libraries/Maven__com_sun_jersey_jersey_core_1_8.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__com_sun_jersey_jersey_json_1_8.xml b/.idea/libraries/Maven__com_sun_jersey_jersey_json_1_8.xml deleted file mode 100644 index ab01cdd..0000000 --- a/.idea/libraries/Maven__com_sun_jersey_jersey_json_1_8.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__com_sun_jersey_jersey_server_1_8.xml b/.idea/libraries/Maven__com_sun_jersey_jersey_server_1_8.xml deleted file mode 100644 index e7e8ba0..0000000 --- a/.idea/libraries/Maven__com_sun_jersey_jersey_server_1_8.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__com_sun_xml_bind_jaxb_impl_2_2_3_1.xml b/.idea/libraries/Maven__com_sun_xml_bind_jaxb_impl_2_2_3_1.xml deleted file mode 100644 index 1165a3b..0000000 --- a/.idea/libraries/Maven__com_sun_xml_bind_jaxb_impl_2_2_3_1.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__com_thoughtworks_xstream_xstream_1_4_4.xml b/.idea/libraries/Maven__com_thoughtworks_xstream_xstream_1_4_4.xml deleted file mode 100644 index 2c3025b..0000000 --- a/.idea/libraries/Maven__com_thoughtworks_xstream_xstream_1_4_4.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__commons_beanutils_commons_beanutils_1_7_0.xml b/.idea/libraries/Maven__commons_beanutils_commons_beanutils_1_7_0.xml deleted file mode 100644 index 1cb64ed..0000000 --- a/.idea/libraries/Maven__commons_beanutils_commons_beanutils_1_7_0.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__commons_beanutils_commons_beanutils_core_1_8_0.xml b/.idea/libraries/Maven__commons_beanutils_commons_beanutils_core_1_8_0.xml deleted file mode 100644 index 3fda2c0..0000000 --- a/.idea/libraries/Maven__commons_beanutils_commons_beanutils_core_1_8_0.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__commons_cli_commons_cli_1_2.xml b/.idea/libraries/Maven__commons_cli_commons_cli_1_2.xml deleted file mode 100644 index cec2493..0000000 --- a/.idea/libraries/Maven__commons_cli_commons_cli_1_2.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__commons_codec_commons_codec_1_4.xml b/.idea/libraries/Maven__commons_codec_commons_codec_1_4.xml deleted file mode 100644 index 2b149c4..0000000 --- a/.idea/libraries/Maven__commons_codec_commons_codec_1_4.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__commons_collections_commons_collections_3_2_1.xml b/.idea/libraries/Maven__commons_collections_commons_collections_3_2_1.xml deleted file mode 100644 index 3caee7e..0000000 --- a/.idea/libraries/Maven__commons_collections_commons_collections_3_2_1.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__commons_configuration_commons_configuration_1_6.xml b/.idea/libraries/Maven__commons_configuration_commons_configuration_1_6.xml deleted file mode 100644 index ae96781..0000000 --- a/.idea/libraries/Maven__commons_configuration_commons_configuration_1_6.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__commons_digester_commons_digester_1_8.xml b/.idea/libraries/Maven__commons_digester_commons_digester_1_8.xml deleted file mode 100644 index 49f1def..0000000 --- a/.idea/libraries/Maven__commons_digester_commons_digester_1_8.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__commons_el_commons_el_1_0.xml b/.idea/libraries/Maven__commons_el_commons_el_1_0.xml deleted file mode 100644 index 598d1b0..0000000 --- a/.idea/libraries/Maven__commons_el_commons_el_1_0.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__commons_httpclient_commons_httpclient_3_0_1.xml b/.idea/libraries/Maven__commons_httpclient_commons_httpclient_3_0_1.xml deleted file mode 100644 index f040f16..0000000 --- a/.idea/libraries/Maven__commons_httpclient_commons_httpclient_3_0_1.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__commons_io_commons_io_2_1.xml b/.idea/libraries/Maven__commons_io_commons_io_2_1.xml deleted file mode 100644 index 3b78142..0000000 --- a/.idea/libraries/Maven__commons_io_commons_io_2_1.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__commons_lang_commons_lang_2_4.xml b/.idea/libraries/Maven__commons_lang_commons_lang_2_4.xml deleted file mode 100644 index 5e8b8d3..0000000 --- a/.idea/libraries/Maven__commons_lang_commons_lang_2_4.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__commons_logging_commons_logging_1_0_3.xml b/.idea/libraries/Maven__commons_logging_commons_logging_1_0_3.xml deleted file mode 100644 index e20ca3a..0000000 --- a/.idea/libraries/Maven__commons_logging_commons_logging_1_0_3.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__commons_net_commons_net_1_4_1.xml b/.idea/libraries/Maven__commons_net_commons_net_1_4_1.xml deleted file mode 100644 index 7fb71b5..0000000 --- a/.idea/libraries/Maven__commons_net_commons_net_1_4_1.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__javax_activation_activation_1_1.xml b/.idea/libraries/Maven__javax_activation_activation_1_1.xml deleted file mode 100644 index 180d587..0000000 --- a/.idea/libraries/Maven__javax_activation_activation_1_1.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__javax_xml_bind_jaxb_api_2_2_2.xml b/.idea/libraries/Maven__javax_xml_bind_jaxb_api_2_2_2.xml deleted file mode 100644 index a3054d2..0000000 --- a/.idea/libraries/Maven__javax_xml_bind_jaxb_api_2_2_2.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__javax_xml_stream_stax_api_1_0_2.xml b/.idea/libraries/Maven__javax_xml_stream_stax_api_1_0_2.xml deleted file mode 100644 index 2a4dd7a..0000000 --- a/.idea/libraries/Maven__javax_xml_stream_stax_api_1_0_2.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__junit_junit_4_7.xml b/.idea/libraries/Maven__junit_junit_4_7.xml deleted file mode 100644 index 4402995..0000000 --- a/.idea/libraries/Maven__junit_junit_4_7.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__org_apache_commons_commons_lang3_3_1.xml b/.idea/libraries/Maven__org_apache_commons_commons_lang3_3_1.xml deleted file mode 100644 index 32bfe3b..0000000 --- a/.idea/libraries/Maven__org_apache_commons_commons_lang3_3_1.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__org_apache_commons_commons_math3_3_2.xml b/.idea/libraries/Maven__org_apache_commons_commons_math3_3_2.xml deleted file mode 100644 index dde81ab..0000000 --- a/.idea/libraries/Maven__org_apache_commons_commons_math3_3_2.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__org_apache_commons_commons_math_2_1.xml b/.idea/libraries/Maven__org_apache_commons_commons_math_2_1.xml deleted file mode 100644 index eaa8a65..0000000 --- a/.idea/libraries/Maven__org_apache_commons_commons_math_2_1.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__org_apache_hadoop_hadoop_core_1_2_1.xml b/.idea/libraries/Maven__org_apache_hadoop_hadoop_core_1_2_1.xml deleted file mode 100644 index cd8023f..0000000 --- a/.idea/libraries/Maven__org_apache_hadoop_hadoop_core_1_2_1.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__org_apache_lucene_lucene_analyzers_common_4_6_1.xml b/.idea/libraries/Maven__org_apache_lucene_lucene_analyzers_common_4_6_1.xml deleted file mode 100644 index 2717cd6..0000000 --- a/.idea/libraries/Maven__org_apache_lucene_lucene_analyzers_common_4_6_1.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__org_apache_lucene_lucene_core_4_6_1.xml b/.idea/libraries/Maven__org_apache_lucene_lucene_core_4_6_1.xml deleted file mode 100644 index 66fc4a9..0000000 --- a/.idea/libraries/Maven__org_apache_lucene_lucene_core_4_6_1.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__org_apache_mahout_commons_commons_cli_2_0_mahout.xml b/.idea/libraries/Maven__org_apache_mahout_commons_commons_cli_2_0_mahout.xml deleted file mode 100644 index c672cac..0000000 --- a/.idea/libraries/Maven__org_apache_mahout_commons_commons_cli_2_0_mahout.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__org_apache_mahout_mahout_core_0_9.xml b/.idea/libraries/Maven__org_apache_mahout_mahout_core_0_9.xml deleted file mode 100644 index 79debcc..0000000 --- a/.idea/libraries/Maven__org_apache_mahout_mahout_core_0_9.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__org_apache_mahout_mahout_math_0_9.xml b/.idea/libraries/Maven__org_apache_mahout_mahout_math_0_9.xml deleted file mode 100644 index 98bd640..0000000 --- a/.idea/libraries/Maven__org_apache_mahout_mahout_math_0_9.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__org_apache_solr_solr_commons_csv_3_5_0.xml b/.idea/libraries/Maven__org_apache_solr_solr_commons_csv_3_5_0.xml deleted file mode 100644 index 36db039..0000000 --- a/.idea/libraries/Maven__org_apache_solr_solr_commons_csv_3_5_0.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__org_codehaus_jackson_jackson_core_asl_1_9_12.xml b/.idea/libraries/Maven__org_codehaus_jackson_jackson_core_asl_1_9_12.xml deleted file mode 100644 index a02acc0..0000000 --- a/.idea/libraries/Maven__org_codehaus_jackson_jackson_core_asl_1_9_12.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__org_codehaus_jackson_jackson_jaxrs_1_7_1.xml b/.idea/libraries/Maven__org_codehaus_jackson_jackson_jaxrs_1_7_1.xml deleted file mode 100644 index 9039684..0000000 --- a/.idea/libraries/Maven__org_codehaus_jackson_jackson_jaxrs_1_7_1.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__org_codehaus_jackson_jackson_mapper_asl_1_9_12.xml b/.idea/libraries/Maven__org_codehaus_jackson_jackson_mapper_asl_1_9_12.xml deleted file mode 100644 index 2e3cd1a..0000000 --- a/.idea/libraries/Maven__org_codehaus_jackson_jackson_mapper_asl_1_9_12.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__org_codehaus_jackson_jackson_xc_1_7_1.xml b/.idea/libraries/Maven__org_codehaus_jackson_jackson_xc_1_7_1.xml deleted file mode 100644 index dc10a10..0000000 --- a/.idea/libraries/Maven__org_codehaus_jackson_jackson_xc_1_7_1.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__org_codehaus_jettison_jettison_1_1.xml b/.idea/libraries/Maven__org_codehaus_jettison_jettison_1_1.xml deleted file mode 100644 index d62802e..0000000 --- a/.idea/libraries/Maven__org_codehaus_jettison_jettison_1_1.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__org_slf4j_slf4j_api_1_7_5.xml b/.idea/libraries/Maven__org_slf4j_slf4j_api_1_7_5.xml deleted file mode 100644 index 6f808f1..0000000 --- a/.idea/libraries/Maven__org_slf4j_slf4j_api_1_7_5.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__stax_stax_api_1_0_1.xml b/.idea/libraries/Maven__stax_stax_api_1_0_1.xml deleted file mode 100644 index 0b13335..0000000 --- a/.idea/libraries/Maven__stax_stax_api_1_0_1.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__xmlpull_xmlpull_1_1_3_1.xml b/.idea/libraries/Maven__xmlpull_xmlpull_1_1_3_1.xml deleted file mode 100644 index 0f2d9ef..0000000 --- a/.idea/libraries/Maven__xmlpull_xmlpull_1_1_3_1.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/libraries/Maven__xpp3_xpp3_min_1_1_4c.xml b/.idea/libraries/Maven__xpp3_xpp3_min_1_1_4c.xml deleted file mode 100644 index 6726a2d..0000000 --- a/.idea/libraries/Maven__xpp3_xpp3_min_1_1_4c.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - - - - - \ No newline at end of file diff --git a/.idea/misc.xml b/.idea/misc.xml deleted file mode 100644 index d30d09e..0000000 --- a/.idea/misc.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - - - - - \ No newline at end of file diff --git a/.idea/modules.xml b/.idea/modules.xml deleted file mode 100644 index 6237568..0000000 --- a/.idea/modules.xml +++ /dev/null @@ -1,8 +0,0 @@ - - - - - - - - \ No newline at end of file diff --git a/.idea/vcs.xml b/.idea/vcs.xml deleted file mode 100644 index 35eb1dd..0000000 --- a/.idea/vcs.xml +++ /dev/null @@ -1,6 +0,0 @@ - - - - - - \ No newline at end of file diff --git a/src/test/java/nearsoft/academy/bigdata/recommendation/MovieRecommender.java b/src/test/java/nearsoft/academy/bigdata/recommendation/MovieRecommender.java index 96da4f9..d0abc36 100644 --- a/src/test/java/nearsoft/academy/bigdata/recommendation/MovieRecommender.java +++ b/src/test/java/nearsoft/academy/bigdata/recommendation/MovieRecommender.java @@ -6,7 +6,6 @@ import org.apache.mahout.cf.taste.impl.similarity.PearsonCorrelationSimilarity; import org.apache.mahout.cf.taste.model.DataModel; import org.apache.mahout.cf.taste.neighborhood.UserNeighborhood; -import org.apache.mahout.cf.taste.recommender.Recommender; import org.apache.mahout.cf.taste.recommender.UserBasedRecommender; import org.apache.mahout.cf.taste.recommender.RecommendedItem; import org.apache.mahout.cf.taste.similarity.UserSimilarity; @@ -17,200 +16,91 @@ public class MovieRecommender { - String path; - private DataModel model; - private UserSimilarity similarity; - private UserNeighborhood neighborhood; - private UserBasedRecommender recommender; private HashMap products = new HashMap(); private HashMap productsToString = new HashMap(); private HashMap users = new HashMap(); - private int keyProducts = 0; private int keyPUsers = 0; + int totalReviews = 0; + int totalProducts = 0; + int totalUsers = 0; - public MovieRecommender() throws IOException, TasteException { - createReccommendedFile("/Users/lromero/Desktop/LuisMario/AmazonProblem/recommenderFile.csv"); - + public MovieRecommender(String movies) throws IOException, TasteException { + createReccommendedFile(movies); } - - int getTotalReviews(String archivo) throws FileNotFoundException, IOException { - String cadena; - String [] arreglo_datos; - InputStream stream = new GZIPInputStream(new FileInputStream("/Users/lromero/Desktop/LuisMario/AmazonProblem/movies.txt.gz")); - BufferedReader b = new BufferedReader(new InputStreamReader(stream, "US-ASCII")); - int i = 0; - String path = ""; - String TRV = ""; - char slash; - char u; - int contador = 0; - //char e; - HashSet set = new HashSet(); - while((cadena = b.readLine())!=null) { - try{ - if(cadena.contains("/summary:")){ - contador++; - } - }catch (IndexOutOfBoundsException ioub){ -// System.out.println("LLEGO VACIO EXCEPTION"); - } - } - - return contador; + int getTotalReviews() throws IOException { + return totalReviews; } - - int getTotalProducts(String archivo) throws FileNotFoundException, IOException { - String cadena; - String [] arreglo_datos; - InputStream stream = new GZIPInputStream(new FileInputStream("/Users/lromero/Desktop/LuisMario/AmazonProblem/movies.txt.gz")); - BufferedReader b = new BufferedReader(new InputStreamReader(stream, "US-ASCII")); - int i = 0; - String path = ""; - String TP = ""; - char slash; - char u; - //char e; - HashSet set = new HashSet(); - while((cadena = b.readLine())!=null) { - try{ - if(cadena.contains("/productId:")){ - TP = cadena.split(" ")[1]; - set.add(TP); - } - }catch (IndexOutOfBoundsException ioub){ -// System.out.println("LLEGO VACIO EXCEPTION"); - } - } - Iterator itr = set.iterator(); - int productID = 0; - while(itr.hasNext()) { - itr.next(); - productID++; - } - System.out.println("Total PID: "+productID); - b.close(); - return productID; + int getTotalProducts() throws FileNotFoundException, IOException { + return totalProducts; } - int getTotalUsers(String archivo) throws FileNotFoundException, IOException { - String cadena; - String [] arreglo_datos; - InputStream stream = new GZIPInputStream(new FileInputStream("/Users/lromero/Desktop/LuisMario/AmazonProblem/movies.txt.gz")); - BufferedReader b = new BufferedReader(new InputStreamReader(stream, "US-ASCII")); - int i = 0; - String path = ""; - String pdID = ""; - char slash; - char u; - //char e; - HashSet set = new HashSet(); - while((cadena = b.readLine())!=null) { - try{ - if(cadena.startsWith("review/user")){ - pdID = cadena.split(" ")[1]; - set.add(pdID); - } - }catch (IndexOutOfBoundsException ioub){ -// System.out.println("LLEGO VACIO EXCEPTION"); - } - } - Iterator itr = set.iterator(); - int totalUsers = 0; - while(itr.hasNext()) { - itr.next(); - totalUsers++; - } - System.out.println("Total users: "+totalUsers); - b.close(); + int getTotalUsers() throws FileNotFoundException, IOException { return totalUsers; } - void createReccommendedFile(String archivo) throws IOException, TasteException { - InputStream stream = new GZIPInputStream(new FileInputStream("/Users/lromero/Desktop/LuisMario/AmazonProblem/movies.txt.gz")); + void createReccommendedFile(String pathToMovies) throws IOException, TasteException { + InputStream stream = new GZIPInputStream(new FileInputStream(pathToMovies)); BufferedReader b = new BufferedReader(new InputStreamReader(stream, "US-ASCII")); - String cadena; - File csv = new File("/Users/lromero/Desktop/LuisMario/AmazonProblem/recommenderFile.csv"); + String line; + File csv = new File("recommenderFile.csv"); if (!csv.exists()) { csv.createNewFile(); } FileWriter fw = new FileWriter(csv); BufferedWriter bw = new BufferedWriter(fw); - long productId = 0, userId = 0; - while((cadena = b.readLine())!=null) { - String prefijo = cadena.split(" ")[0]; - if(prefijo.equals("product/productId:")) { - String pdID = cadena.split(" ")[1]; + while((line = b.readLine())!=null) { + String prefix = line.split(" ")[0]; + if(prefix.equals("product/productId:")) { + String pdID = line.split(" ")[1]; if (products.containsKey(pdID)) { productId = products.get(pdID); }else { -// System.out.println("Product " + key); products.put(pdID, (long) keyProducts); productsToString.put((long) keyProducts, pdID); productId = keyProducts; keyProducts++; + totalProducts++; } } - - if(prefijo.equals("review/userId:")){ - String usID = cadena.split(" ")[1]; + if(prefix.equals("review/userId:")){ + String usID = line.split(" ")[1]; if (users.containsKey(usID)) { userId = users.get(usID); }else { -// System.out.println("User: " + key); users.put(usID, (long) keyPUsers); userId = keyPUsers; keyPUsers++; - + totalUsers++; } } - - if(prefijo.equals("review/score:")){ - String rvSC = cadena.split(" ")[1]; -// System.out.println("Score " + rvSC); + if(prefix.equals("review/score:")){ + totalReviews++; + String rvSC = line.split(" ")[1]; bw.write(userId + "," + productId + "," + rvSC+"\n"); } - } bw.close(); - - - - } - - public List getRecommendationsForUser(String user) throws IOException, TasteException { List stringList = new ArrayList(); - //List recommendations = new ArrayList(); - DataModel model = new FileDataModel(new File("/Users/lromero/Desktop/LuisMario/AmazonProblem/recommenderFile.csv")); + DataModel model = new FileDataModel(new File("recommenderFile.csv")); UserSimilarity similarity = new PearsonCorrelationSimilarity(model); UserNeighborhood neighborhood = new ThresholdUserNeighborhood(0.1, similarity, model); UserBasedRecommender recommender = new GenericUserBasedRecommender(model, neighborhood, similarity); - - System.out.println("User: " + users.get(user)); - //List recommendations = recommender.recommend(users.get(user), 3); for (RecommendedItem recommendation : recommender.recommend(users.get(user), 3)) { - System.out.println(recommendation.getItemID()); stringList.add(productsToString.get(recommendation.getItemID())); - } -// List getValues = new ArrayList(); - System.out.println(stringList); return stringList; } -// public static void main(String[] args) throws IOException, TasteException { -// MovieRecommender call = new MovieRecommender(); -// call.getRecommendationsForUser("A141HP4LYPWMSR"); -// } } From 96259d9a8fb8d1f85376cbf532f55d3b7690a886 Mon Sep 17 00:00:00 2001 From: lromero Date: Wed, 9 Oct 2019 13:15:38 -0700 Subject: [PATCH 4/8] Deleted unnecessary files --- .../default-testCompile/createdFiles.lst | 0 .../default-testCompile/inputFiles.lst | 3 - ...ta.recommendation.MovieRecommenderTest.xml | 68 ------------------ ...ta.recommendation.MovieRecommenderTest.txt | 4 -- .../recommendation/MovieRecommender.class | Bin 7365 -> 0 bytes .../recommendation/MovieRecommenderTest.class | Bin 1739 -> 0 bytes .../academy/bigdata/recommendation/test.class | Bin 4156 -> 0 bytes 7 files changed, 75 deletions(-) delete mode 100644 target/maven-status/maven-compiler-plugin/testCompile/default-testCompile/createdFiles.lst delete mode 100644 target/maven-status/maven-compiler-plugin/testCompile/default-testCompile/inputFiles.lst delete mode 100644 target/surefire-reports/TEST-nearsoft.academy.bigdata.recommendation.MovieRecommenderTest.xml delete mode 100644 target/surefire-reports/nearsoft.academy.bigdata.recommendation.MovieRecommenderTest.txt delete mode 100644 target/test-classes/nearsoft/academy/bigdata/recommendation/MovieRecommender.class delete mode 100644 target/test-classes/nearsoft/academy/bigdata/recommendation/MovieRecommenderTest.class delete mode 100644 target/test-classes/nearsoft/academy/bigdata/recommendation/test.class diff --git a/target/maven-status/maven-compiler-plugin/testCompile/default-testCompile/createdFiles.lst b/target/maven-status/maven-compiler-plugin/testCompile/default-testCompile/createdFiles.lst deleted file mode 100644 index e69de29..0000000 diff --git a/target/maven-status/maven-compiler-plugin/testCompile/default-testCompile/inputFiles.lst b/target/maven-status/maven-compiler-plugin/testCompile/default-testCompile/inputFiles.lst deleted file mode 100644 index fa44f53..0000000 --- a/target/maven-status/maven-compiler-plugin/testCompile/default-testCompile/inputFiles.lst +++ /dev/null @@ -1,3 +0,0 @@ -/Users/lromero/Desktop/LuisMario/AmazonProblem/big-data-exercises/src/test/java/nearsoft/academy/bigdata/recommendation/MovieRecommender.java -/Users/lromero/Desktop/LuisMario/AmazonProblem/big-data-exercises/src/test/java/nearsoft/academy/bigdata/recommendation/test.java -/Users/lromero/Desktop/LuisMario/AmazonProblem/big-data-exercises/src/test/java/nearsoft/academy/bigdata/recommendation/MovieRecommenderTest.java diff --git a/target/surefire-reports/TEST-nearsoft.academy.bigdata.recommendation.MovieRecommenderTest.xml b/target/surefire-reports/TEST-nearsoft.academy.bigdata.recommendation.MovieRecommenderTest.xml deleted file mode 100644 index 80f0636..0000000 --- a/target/surefire-reports/TEST-nearsoft.academy.bigdata.recommendation.MovieRecommenderTest.xml +++ /dev/null @@ -1,68 +0,0 @@ - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - \ No newline at end of file diff --git a/target/surefire-reports/nearsoft.academy.bigdata.recommendation.MovieRecommenderTest.txt b/target/surefire-reports/nearsoft.academy.bigdata.recommendation.MovieRecommenderTest.txt deleted file mode 100644 index 57dcd7a..0000000 --- a/target/surefire-reports/nearsoft.academy.bigdata.recommendation.MovieRecommenderTest.txt +++ /dev/null @@ -1,4 +0,0 @@ -------------------------------------------------------------------------------- -Test set: nearsoft.academy.bigdata.recommendation.MovieRecommenderTest -------------------------------------------------------------------------------- -Tests run: 1, Failures: 0, Errors: 0, Skipped: 0, Time elapsed: 609.375 sec diff --git a/target/test-classes/nearsoft/academy/bigdata/recommendation/MovieRecommender.class b/target/test-classes/nearsoft/academy/bigdata/recommendation/MovieRecommender.class deleted file mode 100644 index 3aaedc53f8a2bf3ee68207765c43904a2ac27cdc..0000000000000000000000000000000000000000 GIT binary patch literal 0 HcmV?d00001 literal 7365 zcmcIp33waTwf?UyYsRB-APP<*2x~&(7~4t$*g;MLN!$bnCvjsF$3WALrLjFh(umP0 ziCv&AP2MYADU`k!ULSqkUfR-9N0{LpBencu?cBs9;LL zLn=;a(D6HlLTx7c_hkUy>rftl}$D$X8W- zO~KbS#HBTHd_y+hRPZeg7vtLszN6t%d{@QyL+ayZA(Qu^{`&$h=@H+*+4_|)bnEbm-Lm&R2;Ex*m z@h263mV*8g!C&#W2%f;l6r7A;uK*7qgdE|)zbNVyQLl)QKqzOp;{wsX1I9rko;I>$ z@d4MdvSZx>4H-LSrUlyiY-cQPY#Cr_a*eQG5rsb`S zl{Os9oe=1pZ*O&B{OY{v4EXyfMbDbn*!YO;jN5ifATghu;8IW0uE1W(ia2J{&ScDN z%5(%a&L=9c(v!5s$eXD>)$Np~<{Ud!NV<7}MJ3n@u9c2oY2?Ru8aXa#9I(c+hFfq< zfv(vrHq6F4Fw$oe`%RQ`dPU8kU1H=P3iGxGM3sq@!Ws(1mj*|!Hz)di^F=R>l_L^; z&W1NwSmmv$E!{LT1Et291$4N1}ap(n#+m#qzy87;?ug%1HEO zO~c9Cqi)&}vURoHTQCHm`^VMTDt+%yb8B z*GTU%x%?0{G`Gw?<7%EnF`VSMbPTqA)Bf~wVEtVbc&E^U&k>N0L5hDUi z{kbiL(NWWpd~?4er!8VJxQAG%NjvKrDVzRNpEupv)DM_0H!QA2W+GQXXH`jw?@U4N0%e3eZIvZ+suO6c=qmd_ zD3_8FG*@C?9$TCwT(0D*a*a~kEa?byQXxI3ke5P2&cT7LBqryWqt*cuQ=iNq6jcdH>i95@H7_m!96smlzM`dza^N`E9l%Pb9En zE*A>G+Gph@n+s|^R$%>84IRE>Ge!KRr`1_2JY1xDjc&;hE47g9*?L#Z7#vK5(0Og+`9daRI1>p)H0ff2I89)=r@%|bz06sMcNg5< zqg(7kHkJ1SBx8BJa^q78`u=&kI9)8%MN}-(#TlYm5sP)PL@d=sOq{8RvvjdcoLvDf zkm$D*thARGBVL$2ufMk^L0RXBb7jNc`9fF31-e*HWW);T6U?VF7RTjP)5V2iCBsN* zvmD7M&SUznU?h3f#VTn>i&)Cs5u7O9Vu{k~IqdyBE#;@!g3++~c#a<1e|^zLq5 zY!Dk2!TO?e9;<^YW`t2)TrLS+F0PQxX2#=xw$@IUYQmIF6e1VTu+thrj}o+>4Tz^(NbFRCssmn>3* z%4D6AH5+qk%j(%XYtCM(5i9kLm1TW(Rxqt>9XFf-^M-<%O`6@SuVE#b&!sJbwJNx( zB&B=xwR35!H&RT;HKjrcaZjEq^Smr!7yv5P*3>P`ou!yjGs>!B+{o`T57QJ@t28W> z^Vk-tO+u^p8g<%NJsabC^LrKH?QKb6I{_sxSIL8EIfOU3BDIG;Z#UB@4xG=83e z{cP*-Ogzhb8W{1ONu<1|iBa##nwMpq<@FD6J$1H7s@H~aCQidy zY?t9eoP$=J%O9hb^B1I*C~$>d(uRXL#J9uzglWkHCfR#7t?{f9YdE@qBm1Wj8J>nd z9BrDyf+?Jq2ulaI`t0@T1muMy9cthgg!(V+}M!E+I! z{PlPqZb1XJT#DzDn=o~)^}ImgvmHmcL#5tU9OZ0;dd|mx;6I7s3uvoEvNUol`xPW# zNGyRD`AELCjO0D1jARAIh!5k+w&*es#^$!@*+rZaT9;5`k(gS|G!*bfk&k|MY$=pT-I@bYXO55v!V;ifAcfbrG#n(M8Qo zl9nD`f)SsVy=dm4wiCQ730p4#+d+7)B1pSQSwC0r!A=q~ghB4x$DMn5W%lvQ;Wc#r zYw7OS(Yc;MkoV(OUar@{z#F+rI%JN(0{8fo-BYG)GYQi=$Pua~rWs`WZ zM_GazB~cM---wssr6lMETKY25*yNG7n66M-b*sPXwpld3{NF`mTM_NY@UNn=_4ce&FWQI2-0t;1Xu zdKOayHC^s$dU~yht1vmhs4z zHwYbX6zAYg;zGPx#PK$98SWE3xL@3W2Zf8Gn838>wJ&A9xdm5K(|!hq$FY?<*yGxE zYLa6a5u(2R3=I&Il_14lDX%OPmKU1puv`pzp{X9v6lZyXD})Zw$MAa>Gt72zF)e-- zy>E|bq0M(g!PT_x)%ZVVn0?{`yoNo^&muA(3!dq9%!{lN#Esn9NVFcA#x_Ro?R3{G znT5*^I)z?(>yF{}DO@EJbl>n9*cl7)b$6m+8vVoVv4&V^3Qtdj1Hpd}xslXgR79eP zfpQ86SB6Ti7(Ri)5KhooB$Sv^&L~~7$BgnY_9j${jHxFuBv8b@Hg0byzj|()IDz3h zFg<;c>lpT~X}gc-C}sO~5>*OO@qWbc0eZnBSjT^nU4aiVNqmIdKSoqOiigPYG(O2y zpYm9{j#%8m>gM%$1NYv9P56I$g(C5(FvQ+*vc@m7co$>Tn|S|YOfs^vtEZmVFaeFQ p23SYtWp&p;okt++yRe_zOFQ4pot4}!St(V0_fYa%sILxh{X6JrxKIE9 diff --git a/target/test-classes/nearsoft/academy/bigdata/recommendation/MovieRecommenderTest.class b/target/test-classes/nearsoft/academy/bigdata/recommendation/MovieRecommenderTest.class deleted file mode 100644 index 85e50ce2f726ece948fd8d2575823d125429cb40..0000000000000000000000000000000000000000 GIT binary patch literal 0 HcmV?d00001 literal 1739 zcmbVNT~{MT5WSrQ60*aG0iyVcin|FxIzVJ`LDnoEk~mo)1d!uX6Pjc&GlMgomEBj5 zKfs^j3ybbK`{1L$!QbMsdL{u}^F$t|s%}qJ->O?l{`%*S*8t{ln8XAMaeR?P1cg4r zfQ#Q_2`p;hVG>LDGDM?)|E!@$VKn&bcRE^5U`5-n5?D>*F}~Ib#RQ%tuolO95@{6l zVb9*43F+yohlDsmkJ0F*%9+hJQKXFtQI$|;QI7`dwYJ~?QiOhcUQu=C7cG|Q=a8C zmRISLdaIC1Y6F_oe6ab?N`0 z+;eWWEx$s0;qsy_UbxPV=TgTux3$*(th!LMjTZ(=D97=w0TUGiPf<3ojWWYfajr18 zwNo&Ub`C3hRRcTNrCy%o^ZEJhheu2MaS*tNnt^@Lf(9q~!rE?)mNyI*7Y>)^8CLGv zk=DS#$9gIw!EOZlZXch?x}uo}5Or7DzLuFGuO$@cqTZC;7EQOUc>RO6U_GQXty%!_hnl$v2 zc3siYU>6EhqD`Rq`WqLn;HK;8Lx!nd1m4(r+V9C5KDJQQGO1tQr}eFLB8GTV_$4K6 zhUwci!yztbOyg^E{E_<)}M0XT>c$v46m@DU~{Vp@4BqLcqbj69(F3X!9ih?--F5Zi2rhh z#25yG;9eLQK`^9)Tx$3dBbAxdTUSV3VRR-n)^)~1M>B~AOzvZV{1g%x#W=?B2|YP+ zStK@(iOUutyO;`?PKIncOcN;6*{8&Kk=Rb*GwSU=)zbZh$OA$$g!GfmVj8)?XP6;7 zfX^{YxbCw=HbQpr71Gq_+h*<(@7xS)D7f|kQOr>BY(OO)CJ@y;B__~Ee^irn@$Ksv K=IJbgg?|Ap7Pxr; diff --git a/target/test-classes/nearsoft/academy/bigdata/recommendation/test.class b/target/test-classes/nearsoft/academy/bigdata/recommendation/test.class deleted file mode 100644 index 40c91822ba0c8a00caffe02c12853f2c6e2e5d95..0000000000000000000000000000000000000000 GIT binary patch literal 0 HcmV?d00001 literal 4156 zcmbVP>wgqi8Ga^vna%7hgoUMS3j%UWAjw)<*Sb(NB!zBG2qi!a#o}alk__zbY-VPY zkXA||Xp5It?L{iKNY&H=l~&zAqu6>ut=CU}@ta@$AH?U(-c9`dw7>jz&Y5%G^Io3k zecvs$e@z8F?Aw0ayw=uoX1Hkx`H_5x}H^0HzekI2pjSj3*R?V2bxA z1Nef1tvD6HQ(`!0h|}(m&M~N;_+1lU&C`k z-}3={UFi8n0N<4Hf`U!L&Wm_S=zBScZ{e(r3qs-*1>eTSAijfFWxS@KQ|P@U#_!6w zEWy9i$QjNq37*!r!xFsRW?Gl9wAaY#`wH1%-8!fZXSfpXHB(yVux1(Jy}amk#td6R zXKzl|EZZD$Vp>W|>)DgBVPiC{IaT^P%0oY;<~YgsBPi5X@rnadX( zs^T&YO2ZOXRrhumMn-f?Pan{E-V)mef3)Y#YtEP$(#akoV(X5C<)vc<$H>GU*6gtX zT}0q9981EAy1k^MTbg4Eb&69L+sa1ZPUb7%ZK*q4R=l&cR1d>0>MNt;x==CmUqqFM zrc!!dU~S8IUB>swWd-a5`h=lR5^kTJVIT~-n?Hsqk>8Nz?sl7n90Ot4BStRWQ^;qG zl;-FqP9$ttjHtRe`m{X#^*VYs&q1@Sjnwqm!l<~J(R18vGWhULnpRriEihI2B>!EO zrJba&o~%YyOBdMii8I`<-zib!ONkgH#2e2n0$812Nk%=&To7KU%Et6%Njb%;d zfZgd#Ih~`^!ut2c;|GkRVxqA)Bt$D4b#_aIBO!2TprdP`JDC(pX2s(T36QX?7Ed{| zRs0ZdN(h#+ELLFMtGI%zOult0uHh{eKf-ll@1ArEAel?+Q~d>}e`GfaP21JXR`E98 zk?~^{KfzB`6fq~`hKiebw}Mn%0qrgr85TJc+-*4Pgk?KHoAdaYc>G+&Exak?7b@Np zV7xE*==xBo9we*xRiXVQe#Pu887)^{V%-90STHhvt>QPhE#UjDjNeIUsew=`JQcsk zbr~P1_yhhZ<4-F7jK4@||9{%9gapLun<`4g(a%}apx_3?t1 zVMi}Dw{nYeZwi1q&*xiV!3yFA`lHm14XPDoW1k+ggSfYZ_!{8D-)_G9*U|rahHS( zSSDtxBn-}kq}e&3FtVB5j=}A zybc3z;J6E29zg+56}l_fi3jOH7x#B@)~r!&!hnjbkq!rsf>qlX!##jdS%gJP|@K?X9HVl2l(+Y9FQgx##EJentsKS)uVF zSC?|-VwJ{^{*N?z;%bG-P?gCY?JfQyHpH9TTVydR?JZ<+Lp&I1Zi!vOiipzUTtX-k zY|$^lKckYj+leK!ciyifZ=)bjt&$f}1#f#XNfau)JwogNhtC4Bn;>eF#A}L3J<04o zMQonpiKiL$8FF`)+|5w>9Hq`v%QKWZPl@M<|MMbA76@ zCehjucSZ4~nZGI#IK9oSm%e#yV%~4wCkSc3fh}`rO?W+VU(|aOZ4wgxsJ~n@{bI(N zc@J9?ay!c`a4X*Ii7OE$(tH_fqJfCAos}tza@%%+6#1kXg)IG}BPvIHH_(0)9Ucr) z_w1c(9oOkYsgmOK7I=Z#`Xck`C9KBFSj&GdcM;=3yaJ8?Tc$Zbj#tUkYpj|}?XLVdn!&6K1@t5Rc>YGySbrv}k0dpS07Y?((V zp^o)#3xBMLdk1T6a|zD^v-JBaZNBA3CaRHVaDtwII{{?aNF}!#y&NCqFUy@K Date: Wed, 9 Oct 2019 13:18:47 -0700 Subject: [PATCH 5/8] Deteletd unnecessary file --- .../academy/bigdata/recommendation/test.java | 176 ------------------ 1 file changed, 176 deletions(-) delete mode 100644 src/test/java/nearsoft/academy/bigdata/recommendation/test.java diff --git a/src/test/java/nearsoft/academy/bigdata/recommendation/test.java b/src/test/java/nearsoft/academy/bigdata/recommendation/test.java deleted file mode 100644 index 779ee15..0000000 --- a/src/test/java/nearsoft/academy/bigdata/recommendation/test.java +++ /dev/null @@ -1,176 +0,0 @@ -package nearsoft.academy.bigdata.recommendation; - -import java.io.*; -import java.util.*; -import java.util.zip.GZIPInputStream; - -public class test { - -// void muestraContenido(String archivo) throws FileNotFoundException, IOException { -// String cadena; -// String [] arreglo_datos; -//// FileReader f = new FileReader("/Users/lromero/Desktop/LuisMario/AmazonProblem/movies.txt.gz"); -//// BufferedReader b = new BufferedReader(f); -// InputStream stream = new GZIPInputStream(new FileInputStream("/Users/lromero/Desktop/LuisMario/AmazonProblem/moviesTest2.txt.gz")); -// BufferedReader b = new BufferedReader(new InputStreamReader(stream, "US-ASCII")); -// int i = 0; -// String path = ""; -// String pdID = ""; -// HashSet set = new HashSet(); -// while((cadena = b.readLine())!=null) { -// if(!(cadena.equals(""))){ -// pdID = ""; -// path = ""; -// for (int j = 0; j < cadena.length(); j++) { -// if(!(path.equals("product/productId:"))){ -// path += cadena.charAt(j); -// }else{ -// for (int k = 0; k < 10; k++) { -// pdID += cadena.charAt(j+1); -// j++; -// if(pdID.length() == 10) { -// j = cadena.length(); -// break; -// } -// } -// } -// } -// if(!(pdID.equals(""))) { -// //System.out.println("PRODUCT ID CATCHED: " + pdID); -// set.add(pdID); -// } -// -// }else { -// for (int j = 0; j < cadena.length(); j++) { -// if(!(path.equals("product/productId:"))){ -// path += cadena.charAt(j); -// }else{ -// for (int k = 0; k < 10; k++) { -// pdID += cadena.charAt(j+1); -// j++; -// if(pdID.length() == 10){ -// j = cadena.length(); -// break; -// } -// -// } -// } -// } -// if(!(pdID.equals(""))) { -// //System.out.println("PRODUCT ID CATCHED: " + pdID); -// set.add(pdID); -// } -// } -// } -// Iterator itr = set.iterator(); -// int pdIDCounter = 0; -// while(itr.hasNext()) { -// System.out.println(itr.next()); -// pdIDCounter++; -// } -// System.out.println("Numero sin repetir de Products Id: "+pdIDCounter); -// b.close(); -// } - - - int getTotalUsers(String archivo) throws FileNotFoundException, IOException { - String cadena; - String [] arreglo_datos; - InputStream stream = new GZIPInputStream(new FileInputStream("/Users/lromero/Desktop/LuisMario/AmazonProblem/movies.txt.gz")); - BufferedReader b = new BufferedReader(new InputStreamReader(stream, "US-ASCII")); - int i = 0; - String path = ""; - String pdID = ""; - char slash; - char u; - //char e; - HashSet set = new HashSet(); - while((cadena = b.readLine())!=null) { - try{ - if(cadena.startsWith("review/user")){ - pdID = cadena.split(" ")[1]; - set.add(pdID); - } - }catch (IndexOutOfBoundsException ioub){ -// System.out.println("LLEGO VACIO EXCEPTION"); - } - } - Iterator itr = set.iterator(); - int totalUsers = 0; - while(itr.hasNext()) { - itr.next(); - totalUsers++; - } - System.out.println("Total users: "+totalUsers); - b.close(); - return totalUsers; - } - - - - int getTotalReviews(String archivo) throws FileNotFoundException, IOException { - String cadena; - String [] arreglo_datos; -// FileReader f = new FileReader("/Users/lromero/Desktop/LuisMario/AmazonProblem/movies.txt.gz"); -// BufferedReader b = new BufferedReader(f); - InputStream stream = new GZIPInputStream(new FileInputStream("/Users/lromero/Desktop/LuisMario/AmazonProblem/moviesTest3.txt.gz")); - BufferedReader b = new BufferedReader(new InputStreamReader(stream, "US-ASCII")); - int i = 0; - String path = ""; - String pdID = ""; - char slash; - char t; - char e; - int reviewCounter = 0; - - HashSet set = new HashSet(); - while((cadena = b.readLine())!=null) { - try{ - slash = cadena.charAt(6); - t = cadena.charAt(7); - e = cadena.charAt(8); - if(slash == '/' && t == 't' && e == 'e'){ - reviewCounter++; - } -// - }catch (IndexOutOfBoundsException ioub){ -// System.out.println("LLEGO VACIO EXCEPTION"); - } - - - } - - System.out.println("Total Reviews: "+reviewCounter); - return reviewCounter; - } - - public Map findDuplicateString(String str) { - String[] stringArrays = str.split(" "); - Map map = new HashMap(); - Set words = new HashSet(Arrays.asList(stringArrays)); - int count = 0; - for (String word : words) { - for (String temp : stringArrays) { - if (word.equals(temp)) { - ++count; - } - } - map.put(word, count); - count = 0; - } - - return map; - - } - - public static void main(String[] args) throws IOException { - test call = new test(); - //call.muestraContenido("/Users/lromero/Desktop/LuisMario/AmazonProblem/smalltest.txt "); - //call.findDuplicateString("d"); - //call.getTotalReviews("/Users/lromero/Desktop/LuisMario/AmazonProblem/smalltest.txt "); - //call.getTotalReviews("/Users/lromero/Desktop/LuisMario/AmazonProblem/smalltest.txt "); - call.getTotalUsers("/Users/lromero/Desktop/LuisMario/AmazonProblem/movies.txt.gz "); - - } - -} From 1cb76d43b45817941d4dde94e9a7be7124b00635 Mon Sep 17 00:00:00 2001 From: lromero Date: Wed, 9 Oct 2019 13:20:04 -0700 Subject: [PATCH 6/8] Deleted unnecessary file --- big-data.iml | 56 ---------------------------------------------------- 1 file changed, 56 deletions(-) delete mode 100644 big-data.iml diff --git a/big-data.iml b/big-data.iml deleted file mode 100644 index 38c1e5e..0000000 --- a/big-data.iml +++ /dev/null @@ -1,56 +0,0 @@ - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - \ No newline at end of file From 39b256e0f091aa38097e2a1b33aab11ed4a2d744 Mon Sep 17 00:00:00 2001 From: lromero Date: Wed, 9 Oct 2019 13:24:11 -0700 Subject: [PATCH 7/8] Deleted unnecessary lines --- pom.xml | 2 -- 1 file changed, 2 deletions(-) diff --git a/pom.xml b/pom.xml index 810bf09..7ce31f8 100644 --- a/pom.xml +++ b/pom.xml @@ -13,7 +13,6 @@ UTF-8 - org.apache.mahout @@ -26,6 +25,5 @@ 4.7 test - From 3746dbb5a203ce955a3ba43fb4d182e9645959fc Mon Sep 17 00:00:00 2001 From: lromero Date: Wed, 9 Oct 2019 13:26:08 -0700 Subject: [PATCH 8/8] Changed unnecessary lines --- .../recommendation/MovieRecommenderTest.java | 23 ++++--------------- 1 file changed, 4 insertions(+), 19 deletions(-) diff --git a/src/test/java/nearsoft/academy/bigdata/recommendation/MovieRecommenderTest.java b/src/test/java/nearsoft/academy/bigdata/recommendation/MovieRecommenderTest.java index 7b46acf..2e7b3b1 100644 --- a/src/test/java/nearsoft/academy/bigdata/recommendation/MovieRecommenderTest.java +++ b/src/test/java/nearsoft/academy/bigdata/recommendation/MovieRecommenderTest.java @@ -15,29 +15,14 @@ public class MovieRecommenderTest { public void testDataInfo() throws IOException, TasteException { //download movies.txt.gz from // http://snap.stanford.edu/data/web-Movies.html - MovieRecommender recommender = new MovieRecommender(); - assertEquals(7911684, recommender.getTotalReviews("Users/Desktop/LuisMario/AmazonProblem/movies.txt.gz")); // - assertEquals(253059, recommender.getTotalProducts("Users/Desktop/LuisMario/AmazonProblem/movies.txt.gz")); // product/productId: - assertEquals(889176, recommender.getTotalUsers("Users/Desktop/LuisMario/AmazonProblem/movies.txt.gz")); - - // get a token with a review and saved it if it's not already defined, but if it's already defined plus one - // - - - // total reviews : 7911684 - // total products : 253059 - // total users : 889176 + MovieRecommender recommender = new MovieRecommender("/Users/lromero/Desktop/LuisMario/AmazonProblem/big-data-exercises/src/test/java/nearsoft/academy/bigdata/recommendation/movies.txt.gz"); + assertEquals(7911684, recommender.getTotalReviews()); + assertEquals(253059, recommender.getTotalProducts()); + assertEquals(889176, recommender.getTotalUsers()); List recommendations = recommender.getRecommendationsForUser("A141HP4LYPWMSR"); assertThat(recommendations, hasItem("B0002O7Y8U")); assertThat(recommendations, hasItem("B00004CQTF")); assertThat(recommendations, hasItem("B000063W82")); - } - - public static void main(String[] args) throws IOException, TasteException { - MovieRecommenderTest call = new MovieRecommenderTest(); - call.testDataInfo(); - } - }