Commit b681eb8

update evaluation logic (#90)
1 parent a141bd3 commit b681eb8

File tree

18 files changed: +569 −74 lines

.github/ISSUE_TEMPLATE/bug_report.md

Lines changed: 1 addition & 1 deletion

@@ -20,7 +20,7 @@ Steps to reproduce the behavior:
 **Operating environment(运行环境):**
 - python version [e.g. 3.6, 3.7, 3.8]
 - tensorflow version [e.g. 1.9.0, 1.14.0, 2.5.0]
-- deepmatch version [e.g. 0.3.0,]
+- deepmatch version [e.g. 0.3.1,]
 
 **Additional context**
 Add any other context about the problem here.

.github/ISSUE_TEMPLATE/question.md

Lines changed: 1 addition & 1 deletion

@@ -17,4 +17,4 @@ Add any other context about the problem here.
 **Operating environment(运行环境):**
 - python version [e.g. 3.6, 3.7, 3.8]
 - tensorflow version [e.g. 1.9.0, 1.14.0, 2.5.0]
-- deepmatch version [e.g. 0.3.0,]
+- deepmatch version [e.g. 0.3.1,]

.github/workflows/ci.yml

Lines changed: 19 additions & 2 deletions

@@ -17,7 +17,7 @@ jobs:
     timeout-minutes: 120
     strategy:
       matrix:
-        python-version: [3.6,3.7,3.8]
+        python-version: [3.6,3.7,3.8,3.9,3.10.7]
         tf-version: [1.9.0,1.14.0,2.5.0]
 
         exclude:
@@ -57,12 +57,28 @@ jobs:
           tf-version: 2.8.0
         - python-version: 3.6
          tf-version: 2.9.0
+        - python-version: 3.6
+          tf-version: 2.10.0
         - python-version: 3.9
           tf-version: 1.4.0
+        - python-version: 3.9
+          tf-version: 1.9.0
         - python-version: 3.9
           tf-version: 1.15.0
         - python-version: 3.9
-          tf-version: 2.2.0
+          tf-version: 1.14.0
+        - python-version: 3.10.7
+          tf-version: 1.4.0
+        - python-version: 3.10.7
+          tf-version: 1.9.0
+        - python-version: 3.10.7
+          tf-version: 1.15.0
+        - python-version: 3.10.7
+          tf-version: 1.14.0
+        - python-version: 3.10.7
+          tf-version: 2.5.0
+        - python-version: 3.10.7
+          tf-version: 2.6.0
 
     steps:
 
@@ -75,6 +91,7 @@ jobs:
 
       - name: Install dependencies
        run: |
+          sudo apt update && sudo apt install -y pkg-config libhdf5-dev
           pip3 install -q tensorflow==${{ matrix.tf-version }}
           pip install -q protobuf==3.19.0
           pip install -q requests

.gitignore

Lines changed: 1 addition & 0 deletions

@@ -1,3 +1,4 @@
+.idea
 # Byte-compiled / optimized / DLL files
 __pycache__/
 *.py[cod]

deepmatch/__init__.py

Lines changed: 1 addition & 1 deletion

@@ -1,4 +1,4 @@
 from .utils import check_version
 
-__version__ = '0.3.0'
+__version__ = '0.3.1'
 check_version(__version__)

deepmatch/models/comirec.py

Lines changed: 18 additions & 20 deletions

@@ -13,18 +13,20 @@
 from deepctr.layers.utils import NoMask, combined_dnn_input, add_func
 from tensorflow.python.keras.layers import Concatenate, Lambda
 from tensorflow.python.keras.models import Model
+
 from ..inputs import create_embedding_matrix
-from ..layers.core import CapsuleLayer, PoolingLayer, LabelAwareAttention, SampledSoftmaxLayer, EmbeddingIndex
+from ..layers.core import CapsuleLayer, PoolingLayer, MaskUserEmbedding, LabelAwareAttention, SampledSoftmaxLayer, \
+    EmbeddingIndex
 from ..layers.interaction import SoftmaxWeightedSum
 from ..utils import get_item_embedding
 
 
-def tile_user_otherfeat(user_other_feature, interest_num):
-    return tf.tile(tf.expand_dims(user_other_feature, -2), [1, interest_num, 1])
+def tile_user_otherfeat(user_other_feature, k_max):
+    return tf.tile(tf.expand_dims(user_other_feature, -2), [1, k_max, 1])
 
 
-def tile_user_his_mask(hist_len, seq_max_len, interest_num):
-    return tf.tile(tf.sequence_mask(hist_len, seq_max_len), [1, interest_num, 1])
+def tile_user_his_mask(hist_len, seq_max_len, k_max):
+    return tf.tile(tf.sequence_mask(hist_len, seq_max_len), [1, k_max, 1])
 
 
 def softmax_Weighted_Sum(input):
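
For intuition, here is a small self-contained sketch (not part of the commit) of what the renamed tile_user_his_mask helper computes: one boolean validity mask per interest, i.e. shape [batch_size, k_max, seq_max_len]. It runs eagerly under TF 2.x.

import tensorflow as tf

# sequence_mask turns history lengths into boolean masks over positions,
# and tile repeats that mask k_max times, once per user interest.
hist_len = tf.constant([[2], [3]])  # two users with histories of length 2 and 3
seq_max_len, k_max = 4, 2
mask = tf.tile(tf.sequence_mask(hist_len, seq_max_len), [1, k_max, 1])
print(mask.shape)   # (2, 2, 4)
print(mask[0, 0])   # [True, True, False, False]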
@@ -37,20 +39,19 @@ def softmax_Weighted_Sum(input):
     return high_capsule
 
 
-def ComiRec(user_feature_columns, item_feature_columns, interest_num=2, p=100, interest_extractor='sa', add_pos=False,
+def ComiRec(user_feature_columns, item_feature_columns, k_max=2, p=100, interest_extractor='sa',
+            add_pos=True,
             user_dnn_hidden_units=(64, 32), dnn_activation='relu', dnn_use_bn=False, l2_reg_dnn=0,
             l2_reg_embedding=1e-6,
             dnn_dropout=0, output_activation='linear', sampler_config=None, seed=1024):
     """Instantiates the ComiRec Model architecture.
 
     :param user_feature_columns: An iterable containing user's features used by the model.
     :param item_feature_columns: An iterable containing item's features used by the model.
-    :param num_sampled: int, the number of classes to randomly sample per batch.
-    :param interest_num: int, the max size of user interest embedding
+    :param k_max: int, the max size of user interest embedding
     :param p: float,the parameter for adjusting the attention distribution in LabelAwareAttention.
     :param interest_extractor: string, type of a multi-interest extraction module, 'sa' means self-attentive and 'dr' means dynamic routing
     :param add_pos: bool. Whether use positional encoding layer
-    :param dnn_use_bn: bool. Whether use BatchNormalization before activation or not in deep net
     :param user_dnn_hidden_units: list,list of positive integer or empty list, the layer number and units in each layer of user tower
     :param dnn_activation: Activation function to use in deep net
     :param dnn_use_bn: bool. Whether use BatchNormalization before activation or not in deep net
@@ -131,29 +132,25 @@ def ComiRec(user_feature_columns, item_feature_columns, interest_num=2, p=100, i
     if interest_extractor.lower() == 'dr':
         high_capsule = CapsuleLayer(input_units=item_embedding_dim,
                                     out_units=item_embedding_dim, max_len=seq_max_len,
-                                    k_max=interest_num)((history_emb, hist_len))
+                                    k_max=k_max)((history_emb, hist_len))
     elif interest_extractor.lower() == 'sa':
         history_emb_add_pos = history_emb
         if add_pos:
             position_embedding = PositionEncoding()(history_emb)
             history_emb_add_pos = add_func([history_emb_add_pos, position_embedding])  # [None, max_len, emb_dim]
 
-        attn = DNN((item_embedding_dim * 4, interest_num), activation='tanh', l2_reg=l2_reg_dnn,
+        attn = DNN((item_embedding_dim * 4, k_max), activation='tanh', l2_reg=l2_reg_dnn,
                    dropout_rate=dnn_dropout, use_bn=dnn_use_bn, output_activation=None, seed=seed,
                    name="user_dnn_attn")(history_emb_add_pos)
-        mask = Lambda(tile_user_his_mask, arguments={'interest_num': interest_num,
+        mask = Lambda(tile_user_his_mask, arguments={'k_max': k_max,
                                                      'seq_max_len': seq_max_len})(
-            hist_len)  # [None, interest_num, max_len]
-        # high_capsule = SoftmaxWeightedSum(dropout_rate=0, future_binding=False,
-        #                                   seed=seed)([attn, history_emb_add_pos, mask])
+            hist_len)  # [None, k_max, max_len]
+
         high_capsule = Lambda(softmax_Weighted_Sum)((history_emb_add_pos, mask, attn))
 
-    print("high_capsule",
-          high_capsule)  # Tensor("softmax_weighted_sum/MatMul:0", shape=(None, 2, 32), dtype=float32) Tensor("capsule_layer/Reshape_1:0", shape=(None, 2, 32), dtype=float32)
     if len(dnn_input_emb_list) > 0 or len(dense_value_list) > 0:
         user_other_feature = combined_dnn_input(dnn_input_emb_list, dense_value_list)
-        other_feature_tile = Lambda(tile_user_otherfeat, arguments={'interest_num': interest_num})(user_other_feature)
-        print("other_feature_tile", other_feature_tile, "NoMask", NoMask()(other_feature_tile))
+        other_feature_tile = Lambda(tile_user_otherfeat, arguments={'k_max': k_max})(user_other_feature)
         user_deep_input = Concatenate()([NoMask()(other_feature_tile), high_capsule])
     else:
         user_deep_input = high_capsule
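
The body of softmax_Weighted_Sum is only partially visible in this diff. A plausible sketch, assuming it mirrors the SoftmaxWeightedSum layer whose commented-out call it replaces: transpose the DNN attention logits, mask out padded history positions, softmax over the sequence axis, and take a weighted sum of the history embeddings. Shapes follow the inline comments above; this is an illustration, not the library code.

import tensorflow as tf

def softmax_weighted_sum_sketch(inputs):
    # history_emb: [None, max_len, emb_dim]; mask: [None, k_max, max_len];
    # attn: [None, max_len, k_max] (output of the "user_dnn_attn" DNN)
    history_emb, mask, attn = inputs
    attn = tf.transpose(attn, [0, 2, 1])              # [None, k_max, max_len]
    paddings = tf.ones_like(attn) * (-2 ** 32 + 1.0)  # large negative for padding
    attn = tf.where(mask, attn, paddings)             # drop padded positions
    attn = tf.nn.softmax(attn, axis=-1)               # attention per interest
    return tf.matmul(attn, history_emb)               # [None, k_max, emb_dim]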
@@ -173,7 +170,8 @@ def ComiRec(user_feature_columns, item_feature_columns, interest_num=2, p=100, i
 
     pooling_item_embedding_weight = PoolingLayer()([item_embedding_weight])
 
-    user_embedding_final = LabelAwareAttention(k_max=interest_num, pow_p=p)((user_embeddings, target_emb))
+    user_embedding_final = LabelAwareAttention(k_max=k_max, pow_p=p)((user_embeddings, target_emb))
+
     output = SampledSoftmaxLayer(sampler_config._asdict())(
         [pooling_item_embedding_weight, user_embedding_final, item_features[item_feature_name]])
     model = Model(inputs=inputs_list + item_inputs_list, outputs=output)
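
One practical consequence of this file's changes: the keyword argument is renamed, so existing calls that pass interest_num will raise a TypeError. A minimal before/after call-site sketch, assuming ComiRec is exported from deepmatch.models like the other models and that the feature columns and sampler_config placeholders are built as in the deepmatch examples:

from deepmatch.models import ComiRec

# Before this commit:
# model = ComiRec(user_feature_columns, item_feature_columns,
#                 interest_num=2, add_pos=False, sampler_config=sampler_config)

# After this commit: `interest_num` becomes `k_max`, and `add_pos`
# now defaults to True.
model = ComiRec(user_feature_columns, item_feature_columns,
                k_max=2, p=100, interest_extractor='sa',
                sampler_config=sampler_config)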

deepmatch/models/mind.py

Lines changed: 1 addition & 3 deletions

@@ -53,11 +53,9 @@ def MIND(user_feature_columns, item_feature_columns, k_max=2, p=100, dynamic_k=F
 
     :param user_feature_columns: An iterable containing user's features used by the model.
     :param item_feature_columns: An iterable containing item's features used by the model.
-    :param num_sampled: int, the number of classes to randomly sample per batch.
     :param k_max: int, the max size of user interest embedding
     :param p: float,the parameter for adjusting the attention distribution in LabelAwareAttention.
     :param dynamic_k: bool, whether or not use dynamic interest number
-    :param dnn_use_bn: bool. Whether use BatchNormalization before activation or not in deep net
     :param user_dnn_hidden_units: list,list of positive integer or empty list, the layer number and units in each layer of user tower
     :param dnn_activation: Activation function to use in deep net
     :param dnn_use_bn: bool. Whether use BatchNormalization before activation or not in deep net
@@ -169,7 +167,7 @@ def MIND(user_feature_columns, item_feature_columns, k_max=2, p=100, dynamic_k=F
         user_embedding_final = LabelAwareAttention(k_max=k_max, pow_p=p)((user_embeddings, target_emb, interest_num))
     else:
         user_embedding_final = LabelAwareAttention(k_max=k_max, pow_p=p)((user_embeddings, target_emb))
-    print("swc")
+
     output = SampledSoftmaxLayer(sampler_config._asdict())(
         [pooling_item_embedding_weight, user_embedding_final, item_features[item_feature_name]])
     model = Model(inputs=inputs_list + item_inputs_list, outputs=output)
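
For context on the unchanged LabelAwareAttention lines above, a condensed sketch of what that layer computes per the MIND paper (the real implementation lives in deepmatch.layers.core; this is an illustration, not the library code):

import tensorflow as tf

def label_aware_attention_sketch(user_embeddings, target_emb, pow_p=100.0):
    # user_embeddings: [None, k_max, dim]; target_emb: [None, 1, dim]
    weight = tf.reduce_sum(user_embeddings * target_emb, axis=-1, keepdims=True)
    weight = tf.pow(weight, pow_p)          # pow_p sharpens the distribution
    weight = tf.nn.softmax(weight, axis=1)  # attention over the k_max interests
    return tf.reduce_sum(user_embeddings * weight, axis=1)  # [None, dim]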

deepmatch/models/sdm.py

Lines changed: 0 additions & 1 deletion

@@ -30,7 +30,6 @@ def SDM(user_feature_columns, item_feature_columns, history_feature_list, units=
     :param user_feature_columns: An iterable containing user's features used by the model.
     :param item_feature_columns: An iterable containing item's features used by the model.
     :param history_feature_list: list,to indicate short and prefer sequence sparse field
-    :param num_sampled: int, the number of classes to randomly sample per batch.
     :param units: int, dimension for each output layer
     :param rnn_layers: int, layer number of rnn
     :param dropout_rate: float in [0,1), the probability we will drop out a given DNN coordinate.

deepmatch/models/youtubednn.py

Lines changed: 0 additions & 1 deletion

@@ -23,7 +23,6 @@ def YoutubeDNN(user_feature_columns, item_feature_columns,
 
     :param user_feature_columns: An iterable containing user's features used by the model.
     :param item_feature_columns: An iterable containing item's features used by the model.
-    :param num_sampled: int, the number of classes to randomly sample per batch.
     :param user_dnn_hidden_units: list,list of positive integer or empty list, the layer number and units in each layer of user tower
     :param dnn_activation: Activation function to use in deep net
     :param dnn_use_bn: bool. Whether use BatchNormalization before activation or not in deep net

docs/source/History.md

Lines changed: 1 addition & 0 deletions

@@ -1,4 +1,5 @@
 # History
+- 10/31/2022 : [v0.3.1](https://github.com/shenweichen/DeepMatch/releases/tag/v0.3.1) released.Add `ComiRec` model .
 - 07/04/2022 : [v0.3.0](https://github.com/shenweichen/DeepMatch/releases/tag/v0.3.0) released.Support different negative sampling strategies, including `inbatch`, `uniform`, `frequency`, `adaptive`.
 - 06/17/2022 : [v0.2.1](https://github.com/shenweichen/DeepMatch/releases/tag/v0.2.1) released.Fix some bugs.
 - 10/12/2020 : [v0.2.0](https://github.com/shenweichen/DeepMatch/releases/tag/v0.2.0) released.Support different initializers for different embedding weights and loading pretrained embeddings.
