瀏覽代碼

demo测试代码

zhangbo 5 月之前
父節點
當前提交
59d557a2b5
共有 1 個文件被更改,包括 29 次插入和 48 次删除
  1. + 29 - 48
      src/main/java/com/tzld/piaoquan/recommend/similarity/word2vec/Demo.java

+ 29 - 48
src/main/java/com/tzld/piaoquan/recommend/similarity/word2vec/Demo.java

@@ -32,59 +32,40 @@ public class Demo {
         } catch (IOException e) {
             e.printStackTrace();
         }
-
-//        String[] s = new String[]{
-//                "🔴终于找到了这首歌,献给你!",
-//                "各位退休的同学,请听!",
-//                "这首歌太好听了,听醉了别怪我!",
-//                "老了真的很难!",
-//                "老同学在聚会上的演讲幽默是太实在了💢",
-//                "🔥🔥🔥一篇关于养老金问题的文章,请过来看看",
-//                "🔴老人考级的标准出台!符合6个条件的了不得🔥",
-//                "超级贵的景色,看过的彻底傻眼了📣",
-//                "她走了!泪目!留下了这段话,让人潸然泪下!",
-//                "🔴老同学❗️好久不见了,大家来看看吧!",
-//                "⭕谁写的?把人《一辈子》写明白了,给老友看看吧 ~!",
-//                "太美了,难得一见的美景~"
-//        };
-
-        String[] s = new String[]{
-                "九九重阳节快乐🔴",
-                "不结婚不生孩子,老了之后就是这个下场!",
-                "🔴瞠目结舌!朝鲜这个国家有多狠!",
-                "⭕九九重阳节,将出现“双月同天”的天文景象",
-                "🍑⭕《九九重阳节》",
-                "⭕这个建议实在是太及时了,忍不住为他鼓掌",
-                "⭕老外做梦也想不到,我国又出了一位像袁隆平一样的农业奇才",
-                "重阳节快乐🚩",
-                "🔴《知心朋友》一首好听的歌,说的好,",
-                "⚡为什么农历九月九为“重阳节”为什么又叫“老人节”",
-                "🔥📢🔴十分通透的一段话,写得太棒了,请朋友们收好!",
-                "🔴重阳将至,小宝贝送来最美最真挚的祝福,愿老友吉祥幸福",
-                "🔴老外惊掉下巴!中国竟在天上造机场,巫山机场太牛了",
-                "这就是人生,听完我哭了",
-                "⭕很多人都在找这首歌,太美了,太好听了!",
-                "⭕九九重阳节,将出现“双月同天”的珍贵天文景象",
-                "想念老同学",
-                "⭕今年的重阳节有什么讲究?看完你就明白了",
-                "⭕养老院的真实生活,看完让人泪目",
-                "早上好,有你相伴,幸运满满"
+        String[] s1 = new String[]{
+            "中医", "书法", "食疗", "固气", "唱歌", "太极",
+                "瑜伽", "短剧", "营养健康", "国画"
+        };
+        String[] s2 = new String[]{
+//                "人生忠告",
+//                "知识科普",
+//                "祝福音乐",
+//                "搞笑段子",
+//                "怀念时光",
+//                "生活小妙招",
+//                "中国历史影像",
+//                "国家力量",
+//                "早中晚好",
+//                "美食教程",
+//                "风景实拍",
+//                "民生政策",
+//                "节日祝福",
+//                "亲情音乐",
+//                "动物萌宠",
+//                "旅行攻略",
+//                "中国战争史",
+
+                "情感","音乐","搞笑","历史","生活记录","文化","旅行","美食","医疗健康","三农","科普","时政","教育","舞蹈","科技","艺术","军事","动物","财经","奇人异象","公益","随拍","母婴","综艺","法律","名人","时尚","生活家居","体育","宗教","汽车","剧情","摄影摄像","职场","地域本地","游戏","收藏品","二次元","电影","短剧","电视剧"
         };
-
-
 //分词,获取词语列表
-        List<String>[] words = new ArrayList[s.length];
-        for (int i = 0; i < s.length; i++) {
-            words[i] = Segment.getWords(s[i]);
-        }
-
-        for (int i = 0; i < words.length - 1; i++) {
-            for (int j = i + 1; j < words.length; j++) {
-                System.out.println(s[i] + "\t" + s[j] + "\t" + vec.fastSentenceSimilarity(words[i], words[j]) + "\t" + vec.sentenceSimilarity(words[i], words[j]));
+        for (String a : s1){
+            List<String> worda = Segment.getWords(a);
+            for (String b : s2){
+                List<String> wordb = Segment.getWords(b);
+                System.out.println(a + "\t" + b + "\t" + vec.sentenceSimilarity(worda, wordb));
             }
         }
 
-
 //句子相似度(名词、动词权值设为1,其他设为0.8)
 //        float[] weightArray1 = Segment.getPOSWeightArray(Segment.getPOS(s1));
 //        float[] weightArray2 = Segment.getPOSWeightArray(Segment.getPOS(s2));