diff --git a/gonna need a bigger bot.ipynb b/gonna need a bigger bot.ipynb index 16bb34f..e78ed77 100644 --- a/gonna need a bigger bot.ipynb +++ b/gonna need a bigger bot.ipynb @@ -14,7 +14,7 @@ "\n", "While some tags are straight forward (`Star Trek`) others are much tougher (`boxing` or `french art movie`) where its unlikely any text has a match. \n", "\n", - "We're not going to solve those problems here, but we give this to you as a sandbox to apply your skills after the class to see how close you can get to approximating the genome tags data\n" + "We're not going to solve those problems here, but we give this to you as a sandbox to apply your skills after the class to see how close you can get to approximating the genome tags data. \n" ] }, { diff --git a/netfix movies.ipynb b/netfix movies.ipynb index 1b815bd..dcf0534 100644 --- a/netfix movies.ipynb +++ b/netfix movies.ipynb @@ -28346,7 +28346,7 @@ }, { "cell_type": "code", - "execution_count": 10, + "execution_count": 6, "metadata": {}, "outputs": [ { @@ -28370,7 +28370,7 @@ " \"featureset\": {\n", " \"features\": [\n", " {\n", - " \"name\": \"title_phrase\",\n", + " \"name\": \"title_has_phrase\",\n", " \"params\": [\"keywords\"],\n", " \"template\": {\n", " \"constant_score\": {\n", @@ -28382,7 +28382,7 @@ " }\n", " },\n", " {\n", - " \"name\": \"title\",\n", + " \"name\": \"title_has_terms\",\n", " \"params\": [\"keywords\"],\n", " \"template\": {\n", " \"constant_score\": {\n", @@ -28459,7 +28459,7 @@ }, { "cell_type": "code", - "execution_count": 6, + "execution_count": 3, "metadata": {}, "outputs": [ { @@ -28546,7 +28546,8 @@ "Searching tmdb - [{'terms': {'_id': [ [Status: 200]\n", "REBUILDING TRAINING DATA for how to train your dragon 2 (38/40)\n", "Searching tmdb - [{'terms': {'_id': [ [Status: 200]\n", - "REBUILDING TRAINING DATA for star wars (39/40)\n" + "REBUILDING TRAINING DATA for star wars (39/40)\n", + "Discarded 0 Keep 1390\n" ] } ], @@ -28578,100 +28579,109 @@ "text": [ "Running java -jar 
data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1] TEST NDCG@10=0.9071 after cost 0.9071\n", + "Trying features [1] TEST NDCG@10=0.9071\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [2] TEST NDCG@10=0.9067 after cost 0.9067\n", + "Trying features [2] TEST NDCG@10=0.9067\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [3] TEST NDCG@10=0.8754 after cost 0.8754\n", + "Trying features [3] TEST NDCG@10=0.8754\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [4] TEST NDCG@10=0.5022 after cost 0.5022\n", + "Trying features [4] TEST NDCG@10=0.5022\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [5] TEST NDCG@10=0.7247 after cost 0.7247\n", + "Trying features [5] TEST NDCG@10=0.7247\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [6] TEST NDCG@10=0.8084 after cost 0.8084\n", + "Trying features [6] TEST NDCG@10=0.8084\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save 
data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [7] TEST NDCG@10=0.2794 after cost 0.2794\n", + "Trying features [7] TEST NDCG@10=0.2794\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 2] TEST NDCG@10=0.9067 after cost 0.9067\n", + "Trying features [1, 2] TEST NDCG@10=0.9067\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 3] TEST NDCG@10=0.8737 after cost 0.8737\n", + "Trying features [1, 3] TEST NDCG@10=0.8737\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 4] TEST NDCG@10=0.8057 after cost 0.8057\n", + "Trying features [1, 4] TEST NDCG@10=0.8057\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 5] TEST NDCG@10=0.8597 after cost 0.8597\n", + "Trying features [1, 5] TEST NDCG@10=0.8597\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 6] TEST NDCG@10=0.8654 after cost 0.8654\n", + "Trying features [1, 6] TEST NDCG@10=0.8654\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 7] TEST 
NDCG@10=0.7869 after cost 0.7869\n", + "Trying features [1, 7] TEST NDCG@10=0.7869\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [2, 3] TEST NDCG@10=0.8754 after cost 0.8754\n", + "Trying features [2, 3] TEST NDCG@10=0.8754\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [2, 4] TEST NDCG@10=0.5979 after cost 0.5979\n", + "Trying features [2, 4] TEST NDCG@10=0.5979\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [2, 5] TEST NDCG@10=0.8498 after cost 0.8498\n", + "Trying features [2, 5] TEST NDCG@10=0.8498\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [2, 6] TEST NDCG@10=0.8061 after cost 0.8061\n", + "Trying features [2, 6] TEST NDCG@10=0.8061\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [2, 7] TEST NDCG@10=0.5268 after cost 0.5268\n", + "Trying features [2, 7] TEST NDCG@10=0.5268\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [3, 4] TEST NDCG@10=0.8693 after cost 0.8693\n", + "Trying features [3, 4] TEST NDCG@10=0.8693\n", "Running 
java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [3, 5] TEST NDCG@10=0.8822 after cost 0.8822\n", + "Trying features [3, 5] TEST NDCG@10=0.8822\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [3, 6] TEST NDCG@10=0.8959 after cost 0.8959\n", + "Trying features [3, 6] TEST NDCG@10=0.8959\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [3, 7] TEST NDCG@10=0.8778 after cost 0.8778\n", + "Trying features [3, 7] TEST NDCG@10=0.8778\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [4, 5] TEST NDCG@10=0.4874 after cost 0.4874\n", + "Trying features [4, 5] TEST NDCG@10=0.4874\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [4, 6] TEST NDCG@10=0.8286 after cost 0.8286\n", + "Trying features [4, 6] TEST NDCG@10=0.8286\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [4, 7] TEST NDCG@10=0.4166 after cost 0.4166\n", + "Trying features [4, 7] TEST NDCG@10=0.4166\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train 
data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [5, 6] TEST NDCG@10=0.7694 after cost 0.7694\n", + "Trying features [5, 6] TEST NDCG@10=0.7694\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [5, 7] TEST NDCG@10=0.3976 after cost 0.3976\n", + "Trying features [5, 7] TEST NDCG@10=0.3976\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [6, 7] TEST NDCG@10=0.7877 after cost 0.7877\n", + "Trying features [6, 7] TEST NDCG@10=0.7877\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 2, 3] TEST NDCG@10=0.8737 after cost 0.8737\n", + "Trying features [1, 2, 3] TEST NDCG@10=0.8737\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 2, 4] TEST NDCG@10=0.7967 after cost 0.7967\n", + "Trying features [1, 2, 4] TEST NDCG@10=0.7967\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 2, 5] TEST NDCG@10=0.863 after cost 0.863\n", + "Trying features [1, 2, 5] TEST NDCG@10=0.863\n", + "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt 
-kcv 15 \n", + "DONE\n", + "Trying features [1, 2, 6] TEST NDCG@10=0.8779\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 2, 6] TEST NDCG@10=0.8779 after cost 0.8779\n", + "Trying features [1, 2, 7] TEST NDCG@10=0.7955\n", + "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", + "DONE\n", + "Trying features [1, 3, 4] TEST NDCG@10=0.9011\n", + "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", + "DONE\n", + "Trying features [1, 3, 5] TEST NDCG@10=0.8822\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n" ] }, @@ -28680,103 +28690,109 @@ "output_type": "stream", "text": [ "DONE\n", - "Trying features [1, 2, 7] TEST NDCG@10=0.7955 after cost 0.7955\n", + "Trying features [1, 3, 6] TEST NDCG@10=0.879\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 3, 4] TEST NDCG@10=0.9011 after cost 0.9011\n", + "Trying features [1, 3, 7] TEST NDCG@10=0.8756\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 3, 5] TEST NDCG@10=0.8822 after cost 0.8822\n", + "Trying features [1, 4, 5] TEST NDCG@10=0.8321\n", "Running java -jar data/RankyMcRankFace.jar -ranker 
6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 3, 6] TEST NDCG@10=0.879 after cost 0.879\n", + "Trying features [1, 4, 6] TEST NDCG@10=0.8822\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 3, 7] TEST NDCG@10=0.8756 after cost 0.8756\n", + "Trying features [1, 4, 7] TEST NDCG@10=0.8098\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 4, 5] TEST NDCG@10=0.8321 after cost 0.8321\n", + "Trying features [1, 5, 6] TEST NDCG@10=0.8777\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 4, 6] TEST NDCG@10=0.8822 after cost 0.8822\n", + "Trying features [1, 5, 7] TEST NDCG@10=0.7773\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 4, 7] TEST NDCG@10=0.8098 after cost 0.8098\n", + "Trying features [1, 6, 7] TEST NDCG@10=0.8282\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 5, 6] TEST NDCG@10=0.8777 after cost 0.8777\n", + "Trying features [2, 3, 4] TEST NDCG@10=0.8693\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train 
data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 5, 7] TEST NDCG@10=0.7773 after cost 0.7773\n", + "Trying features [2, 3, 5] TEST NDCG@10=0.8822\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 6, 7] TEST NDCG@10=0.8282 after cost 0.8282\n", + "Trying features [2, 3, 6] TEST NDCG@10=0.8959\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [2, 3, 4] TEST NDCG@10=0.8693 after cost 0.8693\n", + "Trying features [2, 3, 7] TEST NDCG@10=0.8778\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [2, 3, 5] TEST NDCG@10=0.8822 after cost 0.8822\n", + "Trying features [2, 4, 5] TEST NDCG@10=0.6083\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [2, 3, 6] TEST NDCG@10=0.8959 after cost 0.8959\n", + "Trying features [2, 4, 6] TEST NDCG@10=0.8016\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [2, 3, 7] TEST NDCG@10=0.8778 after cost 0.8778\n", + "Trying features [2, 4, 7] TEST NDCG@10=0.5786\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt 
-feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [2, 4, 5] TEST NDCG@10=0.6083 after cost 0.6083\n", + "Trying features [2, 5, 6] TEST NDCG@10=0.8065\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [2, 4, 6] TEST NDCG@10=0.8016 after cost 0.8016\n", + "Trying features [2, 5, 7] TEST NDCG@10=0.5996\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [2, 4, 7] TEST NDCG@10=0.5786 after cost 0.5786\n", + "Trying features [2, 6, 7] TEST NDCG@10=0.8102\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [2, 5, 6] TEST NDCG@10=0.8065 after cost 0.8065\n", + "Trying features [3, 4, 5] TEST NDCG@10=0.854\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [2, 5, 7] TEST NDCG@10=0.5996 after cost 0.5996\n", + "Trying features [3, 4, 6] TEST NDCG@10=0.889\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [2, 6, 7] TEST NDCG@10=0.8102 after cost 0.8102\n", + "Trying features [3, 4, 7] TEST NDCG@10=0.8815\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features 
[3, 4, 5] TEST NDCG@10=0.854 after cost 0.854\n", + "Trying features [3, 5, 6] TEST NDCG@10=0.8813\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [3, 4, 6] TEST NDCG@10=0.889 after cost 0.889\n", + "Trying features [3, 5, 7] TEST NDCG@10=0.8657\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [3, 4, 7] TEST NDCG@10=0.8815 after cost 0.8815\n", + "Trying features [3, 6, 7] TEST NDCG@10=0.8753\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [3, 5, 6] TEST NDCG@10=0.8813 after cost 0.8813\n", + "Trying features [4, 5, 6] TEST NDCG@10=0.8144\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [3, 5, 7] TEST NDCG@10=0.8657 after cost 0.8657\n", + "Trying features [4, 5, 7] TEST NDCG@10=0.3601\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [3, 6, 7] TEST NDCG@10=0.8753 after cost 0.8753\n", + "Trying features [4, 6, 7] TEST NDCG@10=0.8208\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [4, 5, 6] TEST NDCG@10=0.8144 after cost 0.8144\n", + "Trying 
features [5, 6, 7] TEST NDCG@10=0.798\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [4, 5, 7] TEST NDCG@10=0.3601 after cost 0.3601\n", + "Trying features [1, 2, 3, 4] TEST NDCG@10=0.9011\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [4, 6, 7] TEST NDCG@10=0.8208 after cost 0.8208\n", + "Trying features [1, 2, 3, 5] TEST NDCG@10=0.8822\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [5, 6, 7] TEST NDCG@10=0.798 after cost 0.798\n", + "Trying features [1, 2, 3, 6] TEST NDCG@10=0.879\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 2, 3, 4] TEST NDCG@10=0.9011 after cost 0.9011\n", + "Trying features [1, 2, 3, 7] TEST NDCG@10=0.8756\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 2, 3, 5] TEST NDCG@10=0.8822 after cost 0.8822\n", + "Trying features [1, 2, 4, 5] TEST NDCG@10=0.8296\n", + "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", + "DONE\n", + "Trying features [1, 2, 4, 6] TEST NDCG@10=0.8822\n", + "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t 
NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", + "DONE\n", + "Trying features [1, 2, 4, 7] TEST NDCG@10=0.8054\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n" ] }, @@ -28785,100 +28801,109 @@ "output_type": "stream", "text": [ "DONE\n", - "Trying features [1, 2, 3, 6] TEST NDCG@10=0.879 after cost 0.879\n", + "Trying features [1, 2, 5, 6] TEST NDCG@10=0.8838\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 2, 3, 7] TEST NDCG@10=0.8756 after cost 0.8756\n", + "Trying features [1, 2, 5, 7] TEST NDCG@10=0.7935\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 2, 4, 5] TEST NDCG@10=0.8296 after cost 0.8296\n", + "Trying features [1, 2, 6, 7] TEST NDCG@10=0.8447\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 2, 4, 6] TEST NDCG@10=0.8822 after cost 0.8822\n", + "Trying features [1, 3, 4, 5] TEST NDCG@10=0.907\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 2, 4, 7] TEST NDCG@10=0.8054 after cost 0.8054\n", + "Trying features [1, 3, 4, 6] TEST NDCG@10=0.9022\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train 
data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 2, 5, 6] TEST NDCG@10=0.8838 after cost 0.8838\n", + "Trying features [1, 3, 4, 7] TEST NDCG@10=0.9119\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 2, 5, 7] TEST NDCG@10=0.7935 after cost 0.7935\n", + "Trying features [1, 3, 5, 6] TEST NDCG@10=0.8876\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 2, 6, 7] TEST NDCG@10=0.8447 after cost 0.8447\n", + "Trying features [1, 3, 5, 7] TEST NDCG@10=0.8644\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 3, 4, 5] TEST NDCG@10=0.907 after cost 0.907\n", + "Trying features [1, 3, 6, 7] TEST NDCG@10=0.8747\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 3, 4, 6] TEST NDCG@10=0.9022 after cost 0.9022\n", + "Trying features [1, 4, 5, 6] TEST NDCG@10=0.8826\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 3, 4, 7] TEST NDCG@10=0.9119 after cost 0.9119\n", + "Trying features [1, 4, 5, 7] TEST NDCG@10=0.8222\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train 
data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 3, 5, 6] TEST NDCG@10=0.8876 after cost 0.8876\n", + "Trying features [1, 4, 6, 7] TEST NDCG@10=0.8953\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 3, 5, 7] TEST NDCG@10=0.8644 after cost 0.8644\n", + "Trying features [1, 5, 6, 7] TEST NDCG@10=0.8504\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 3, 6, 7] TEST NDCG@10=0.8747 after cost 0.8747\n", + "Trying features [2, 3, 4, 5] TEST NDCG@10=0.854\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 4, 5, 6] TEST NDCG@10=0.8826 after cost 0.8826\n", + "Trying features [2, 3, 4, 6] TEST NDCG@10=0.889\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 4, 5, 7] TEST NDCG@10=0.8222 after cost 0.8222\n", + "Trying features [2, 3, 4, 7] TEST NDCG@10=0.8815\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 4, 6, 7] TEST NDCG@10=0.8953 after cost 0.8953\n", + "Trying features [2, 3, 5, 6] TEST NDCG@10=0.8813\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train 
data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 5, 6, 7] TEST NDCG@10=0.8504 after cost 0.8504\n", + "Trying features [2, 3, 5, 7] TEST NDCG@10=0.8657\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [2, 3, 4, 5] TEST NDCG@10=0.854 after cost 0.854\n", + "Trying features [2, 3, 6, 7] TEST NDCG@10=0.8753\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [2, 3, 4, 6] TEST NDCG@10=0.889 after cost 0.889\n", + "Trying features [2, 4, 5, 6] TEST NDCG@10=0.7876\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [2, 3, 4, 7] TEST NDCG@10=0.8815 after cost 0.8815\n", + "Trying features [2, 4, 5, 7] TEST NDCG@10=0.6095\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [2, 3, 5, 6] TEST NDCG@10=0.8813 after cost 0.8813\n", + "Trying features [2, 4, 6, 7] TEST NDCG@10=0.8212\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [2, 3, 5, 7] TEST NDCG@10=0.8657 after cost 0.8657\n", + "Trying features [2, 5, 6, 7] TEST NDCG@10=0.8167\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train 
data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [2, 3, 6, 7] TEST NDCG@10=0.8753 after cost 0.8753\n", + "Trying features [3, 4, 5, 6] TEST NDCG@10=0.8849\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [2, 4, 5, 6] TEST NDCG@10=0.7876 after cost 0.7876\n", + "Trying features [3, 4, 5, 7] TEST NDCG@10=0.8877\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [2, 4, 5, 7] TEST NDCG@10=0.6095 after cost 0.6095\n", + "Trying features [3, 4, 6, 7] TEST NDCG@10=0.8605\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [2, 4, 6, 7] TEST NDCG@10=0.8212 after cost 0.8212\n", + "Trying features [3, 5, 6, 7] TEST NDCG@10=0.8503\n", + "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", + "DONE\n", + "Trying features [4, 5, 6, 7] TEST NDCG@10=0.7956\n", + "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", + "DONE\n", + "Trying features [1, 2, 3, 4, 5] TEST NDCG@10=0.907\n", + "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", + "DONE\n", + "Trying features [1, 2, 3, 4, 6] TEST 
NDCG@10=0.9022\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [2, 5, 6, 7] TEST NDCG@10=0.8167 after cost 0.8167\n", + "Trying features [1, 2, 3, 4, 7] TEST NDCG@10=0.9119\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [3, 4, 5, 6] TEST NDCG@10=0.8849 after cost 0.8849\n", + "Trying features [1, 2, 3, 5, 6] TEST NDCG@10=0.8876\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [3, 4, 5, 7] TEST NDCG@10=0.8877 after cost 0.8877\n", + "Trying features [1, 2, 3, 5, 7] TEST NDCG@10=0.8644\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [3, 4, 6, 7] TEST NDCG@10=0.8605 after cost 0.8605\n", + "Trying features [1, 2, 3, 6, 7] TEST NDCG@10=0.8747\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [3, 5, 6, 7] TEST NDCG@10=0.8503 after cost 0.8503\n", + "Trying features [1, 2, 4, 5, 6] TEST NDCG@10=0.8828\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n" ] }, @@ -28887,94 +28912,70 @@ "output_type": "stream", "text": [ "DONE\n", - "Trying features [4, 5, 6, 7] TEST NDCG@10=0.7956 
after cost 0.7956\n", - "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", - "DONE\n", - "Trying features [1, 2, 3, 4, 5] TEST NDCG@10=0.907 after cost 0.907\n", - "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", - "DONE\n", - "Trying features [1, 2, 3, 4, 6] TEST NDCG@10=0.9022 after cost 0.9022\n", - "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", - "DONE\n", - "Trying features [1, 2, 3, 4, 7] TEST NDCG@10=0.9119 after cost 0.9119\n", - "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", - "DONE\n", - "Trying features [1, 2, 3, 5, 6] TEST NDCG@10=0.8876 after cost 0.8876\n", - "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", - "DONE\n", - "Trying features [1, 2, 3, 5, 7] TEST NDCG@10=0.8644 after cost 0.8644\n", - "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", - "DONE\n", - "Trying features [1, 2, 3, 6, 7] TEST NDCG@10=0.8747 after cost 0.8747\n", - "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", - "DONE\n", - "Trying features [1, 2, 4, 5, 6] TEST NDCG@10=0.8828 after cost 0.8828\n", - "Running java 
-jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", - "DONE\n", - "Trying features [1, 2, 4, 5, 7] TEST NDCG@10=0.815 after cost 0.815\n", + "Trying features [1, 2, 4, 5, 7] TEST NDCG@10=0.815\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 2, 4, 6, 7] TEST NDCG@10=0.8953 after cost 0.8953\n", + "Trying features [1, 2, 4, 6, 7] TEST NDCG@10=0.8953\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 2, 5, 6, 7] TEST NDCG@10=0.8493 after cost 0.8493\n", + "Trying features [1, 2, 5, 6, 7] TEST NDCG@10=0.8493\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 3, 4, 5, 6] TEST NDCG@10=0.8978 after cost 0.8978\n", + "Trying features [1, 3, 4, 5, 6] TEST NDCG@10=0.8978\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 3, 4, 5, 7] TEST NDCG@10=0.906 after cost 0.906\n", + "Trying features [1, 3, 4, 5, 7] TEST NDCG@10=0.906\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 3, 4, 6, 7] TEST NDCG@10=0.8951 after cost 0.8951\n", + "Trying features [1, 3, 4, 6, 7] TEST NDCG@10=0.8951\n", 
"Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 3, 5, 6, 7] TEST NDCG@10=0.8709 after cost 0.8709\n", + "Trying features [1, 3, 5, 6, 7] TEST NDCG@10=0.8709\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 4, 5, 6, 7] TEST NDCG@10=0.8837 after cost 0.8837\n", + "Trying features [1, 4, 5, 6, 7] TEST NDCG@10=0.8837\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [2, 3, 4, 5, 6] TEST NDCG@10=0.8849 after cost 0.8849\n", + "Trying features [2, 3, 4, 5, 6] TEST NDCG@10=0.8849\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [2, 3, 4, 5, 7] TEST NDCG@10=0.8877 after cost 0.8877\n", + "Trying features [2, 3, 4, 5, 7] TEST NDCG@10=0.8877\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [2, 3, 4, 6, 7] TEST NDCG@10=0.8605 after cost 0.8605\n", + "Trying features [2, 3, 4, 6, 7] TEST NDCG@10=0.8605\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [2, 3, 5, 6, 7] TEST NDCG@10=0.8503 after cost 0.8503\n", + "Trying features [2, 3, 5, 6, 7] TEST 
NDCG@10=0.8503\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [2, 4, 5, 6, 7] TEST NDCG@10=0.8083 after cost 0.8083\n", + "Trying features [2, 4, 5, 6, 7] TEST NDCG@10=0.8083\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [3, 4, 5, 6, 7] TEST NDCG@10=0.8659 after cost 0.8659\n", + "Trying features [3, 4, 5, 6, 7] TEST NDCG@10=0.8659\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 2, 3, 4, 5, 6] TEST NDCG@10=0.8978 after cost 0.8978\n", + "Trying features [1, 2, 3, 4, 5, 6] TEST NDCG@10=0.8978\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 2, 3, 4, 5, 7] TEST NDCG@10=0.906 after cost 0.906\n", + "Trying features [1, 2, 3, 4, 5, 7] TEST NDCG@10=0.906\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 2, 3, 4, 6, 7] TEST NDCG@10=0.8951 after cost 0.8951\n", + "Trying features [1, 2, 3, 4, 6, 7] TEST NDCG@10=0.8951\n", "Running java -jar data/RankyMcRankFace.jar -ranker 6 -metric2t NDCG@10 -tree 20 -leaf 20 -train data/title_judgments_train.txt -save data/temp_model.txt -feature features.txt -kcv 15 \n", "DONE\n", - "Trying features [1, 2, 3, 5, 6, 7] TEST NDCG@10=0.8709 after cost 0.8709\n", + "Trying 
import csv

from ltr.client import ElasticClient
from ltr.judgments import judgments_from_file


def train_to_csv(client, feature_set, in_filename, out_filename, index='tmdb'):
    """Write the judgments in *in_filename* to *out_filename* as CSV.

    The CSV has the columns ``keywords``, ``qid`` and ``grade`` followed by
    one column per feature of the feature set, named after the feature.

    Args:
        client: Object exposing ``feature_set(name=..., index=...)``. The
            first element of its return value is iterated as a sequence of
            dicts that each carry a ``'name'`` key.
        feature_set: Name of the feature set whose feature names become the
            CSV feature columns.
        in_filename: Path of the judgments file, passed to
            ``judgments_from_file``.
        out_filename: Path of the CSV file to create (overwritten if it
            already exists).
        index: Index the feature set is looked up in. Defaults to ``'tmdb'``.

    Raises:
        ValueError: If a judgment carries a different number of feature
            values than the feature set has features.
    """
    features = client.feature_set(name=feature_set, index=index)[0]
    feature_names = [feature['name'] for feature in features]
    fieldnames = ['keywords', 'qid', 'grade'] + feature_names

    # newline='' hands line-ending control to the csv module; without it,
    # platforms that translate '\n' end up with a blank row after each record.
    with open(out_filename, 'w', newline='') as csvfile:
        writer = csv.DictWriter(csvfile, fieldnames=fieldnames)
        writer.writeheader()

        # Read the file the caller asked for, not a hard-coded path.
        for judgment in judgments_from_file(filename=in_filename):
            # Explicit check instead of `assert`, which is stripped under -O.
            if len(judgment.features) != len(feature_names):
                raise ValueError(
                    'judgment for qid %s has %d feature values but feature '
                    'set %r defines %d features'
                    % (judgment.qid, len(judgment.features),
                       feature_set, len(feature_names)))

            record = {
                'keywords': judgment.keywords,
                'qid': judgment.qid,
                'grade': judgment.grade,
            }
            # Feature values are positional: the i-th value belongs to the
            # i-th feature name of the feature set.
            record.update(zip(feature_names, judgment.features))
            writer.writerow(record)


if __name__ == "__main__":
    import sys

    # Positional arguments: judgments file, feature set name, output CSV.
    if len(sys.argv) < 4:
        sys.exit('usage: train_to_csv.py IN_FILENAME FEATURE_SET OUT_FILENAME')

    client = ElasticClient()
    train_to_csv(client=client, in_filename=sys.argv[1],
                 feature_set=sys.argv[2], out_filename=sys.argv[3])