Skip to content

Commit fed35fd

Browse files
authored
[Docs] Update Sample-awared Graph Compression Document (#747)
- Add Performance result - Remove useless logging
1 parent aea9b3a commit fed35fd

5 files changed

Lines changed: 48 additions & 23 deletions

File tree

docs/docs_en/Sample-awared-Graph-Compression.md

Lines changed: 23 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -38,23 +38,31 @@ TODO
3838
### Inference
3939

4040
```
41+
USER_FEATURE = ['user_feature_0', 'user_feature_1']
42+
ITEM_FEATURE = ['item_feature_0', 'item_feature_1']
43+
ALL_FEATURE = USER_FEATURE + ITEM_FEATURE
44+
4145
def serving_input_receiver_fn():
42-
item_size = tf.placeholder(dtype=tf.int32, shape=[None], name='item_size')
43-
user_tensors=[]
44-
item_tensors=[]
45-
for feature, tensor in feature_map:
46-
if is_user_feature(feature):
47-
user_tensors.append(tensor)
48-
else:
49-
item_tensors.append(tensor)
46+
item_size = tf.placeholder(dtype=tf.int32, shape=[None], name='item_size')
47+
features = {}
48+
inputs = {"item_size": item_size}
49+
user_tensors = []
50+
item_tensors = []
51+
for fea_name in ALL_FEATURE:
52+
features[fea_name] = tf.placeholder(tf.string, [None], name=fea_name)
53+
inputs[fea_name] = features[fea_name]
54+
if fea_name in ITEM_FEATURE:
55+
item_tensors.append(features[fea_name])
56+
else:
57+
user_tensors.append(features[fea_name])
5058
5159
"""Enable Sample-awared Graph Compression"""
5260
tf.graph_optimizer.enable_sample_awared_graph_compression(
5361
user_tensors,
5462
item_tensors,
5563
item_size)
5664
57-
return tf.estimator.export.ServingInputReceiver(feature_map, inputs)
65+
return tf.estimator.export.ServingInputReceiver(features, inputs)
5866
5967
estimator = ...
6068
estimator.export_savedmodel(output_dir, serving_input_receiver_fn)
@@ -63,3 +71,9 @@ estiamtor.export_savedmodel(output_dir, serving_input_receiver_fn)
6371

6472
2. Input data format
6573
Generally, in the inference scenario, the input data is protobuf, which contains the values of each feature required by the model and the tensor indicating the number of items in the sample. The user tensor shape is [Duser], and the item tensor shape is [N, Ditem]
74+
75+
## Performance
76+
77+
Compressing user-side features reduces the end-to-end latency of inference. In one cloud-based online serving case, the performance results are as follows:
78+
79+
![img_1.png](Sample-awared-Graph-Compression/img_1.png)
223 KB
Loading

docs/docs_zh/Sample-awared-Graph-Compression.md

Lines changed: 23 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -11,7 +11,7 @@ user_1_feature, item_2_feature, label_2
1111
user_1_feature, item_N_feature, label_N
1212
```
1313

14-
这导致在样本的存储存在冗余,浪费了存储空间,表达了无效信息量。
14+
这导致在样本的存储存在冗余,浪费了存储/传输空间,表达了无效信息量。
1515
### 模型特点
1616
在这样的样本特点下,读入的冗余样本必然也衍生了计算冗余,针对上面的样本,训练模型的时候,batch内部,user_1_feature会重复的run sub-graph(如:Attention Graph)若干次。这部分计算是完全冗余的,可以在运行时节省掉,只计算一次。
1717
## 功能
@@ -34,23 +34,31 @@ TODO
3434
### Inference
3535

3636
```
37+
USER_FEATURE = ['user_feature_0', 'user_feature_1']
38+
ITEM_FEATURE = ['item_feature_0', 'item_feature_1']
39+
ALL_FEATURE = USER_FEATURE + ITEM_FEATURE
40+
3741
def serving_input_receiver_fn():
38-
item_size = tf.placeholder(dtype=tf.int32, shape=[None], name='item_size')
39-
user_tensors=[]
40-
item_tensors=[]
41-
for feature, tensor in feature_map:
42-
if is_user_feature(feature):
43-
user_tensors.append(tensor)
44-
else:
45-
item_tensors.append(tensor)
42+
item_size = tf.placeholder(dtype=tf.int32, shape=[None], name='item_size')
43+
features = {}
44+
inputs = {"item_size": item_size}
45+
user_tensors = []
46+
item_tensors = []
47+
for fea_name in ALL_FEATURE:
48+
features[fea_name] = tf.placeholder(tf.string, [None], name=fea_name)
49+
inputs[fea_name] = features[fea_name]
50+
if fea_name in ITEM_FEATURE:
51+
item_tensors.append(features[fea_name])
52+
else:
53+
user_tensors.append(features[fea_name])
4654
4755
"""Enable Sample-awared Graph Compression"""
4856
tf.graph_optimizer.enable_sample_awared_graph_compression(
4957
user_tensors,
5058
item_tensors,
5159
item_size)
5260
53-
return tf.estimator.export.ServingInputReceiver(feature_map, inputs)
61+
return tf.estimator.export.ServingInputReceiver(features, inputs)
5462
5563
estimator = ...
5664
estimator.export_savedmodel(output_dir, serving_input_receiver_fn)
@@ -59,3 +67,8 @@ estiamtor.export_savedmodel(output_dir, serving_input_receiver_fn)
5967

6068
2. 输入数据格式
6169
一般在inference场景下,输入数据为protobuf,protobuf中包含模型所需各个特征的值以及指示该样本中item数目的tensor, user tensor shape为[Duser], item tensor shape为[N, Ditem]
70+
71+
## 性能
72+
该功能,将user侧特征进行压缩,减少了Inference端到端时延,在某云上业务线上服务中,性能结果如下:
73+
74+
![img_1.png](Sample-awared-Graph-Compression/img_1.png)
223 KB
Loading

tensorflow/python/graph_optimizer/sample_awared_graph_compression.py

Lines changed: 2 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -76,7 +76,7 @@ def find_boundery_tensors(user_ops, item_ops):
7676
else:
7777
user_sets.add(op2)
7878
queue_user.append(op2)
79-
logging.info("boundery_tensor_sets: %s", boundery_tensor_sets)
79+
logging.info("[SampleAwaredGraphCompression] boundery_tensor_sets: %s", boundery_tensor_sets)
8080
return user_sets, item_sets, boundery_tensor_sets
8181

8282
def is_shape_op(op):
@@ -94,7 +94,6 @@ def add_tile_op(boundery_tensor_sets, item_seq_length, user_sets, seq_mask_resha
9494
# as some constant operations, such as reshape, should not be tiled
9595
if len(t.get_shape().as_list()) > 0 and not t.get_shape().as_list()[0]:
9696
with ops.colocate_with(t.op):
97-
logging.info("add_tile_op [%d]: %s, %s", tiled_num, t, t.consumers())
9897
user_expand = array_ops.expand_dims(t, 1)
9998
tile_shape = array_ops.concat([[1], item_seq_length, [1 for i in range(len(t.get_shape()[1:]))]], axis=0)
10099
user_tiled = array_ops.tile(user_expand, tile_shape)
@@ -113,9 +112,8 @@ def add_tile_op(boundery_tensor_sets, item_seq_length, user_sets, seq_mask_resha
113112
for index, input_t in enumerate(op.inputs):
114113
if input_t is t:
115114
op._update_input(index, seq_user_input)
116-
logging.info("add_tile_op detail: %s, %s, %s", op, index, seq_user_input)
117115
tiled_num += 1
118-
logging.info("add_tile_op: total %d", tiled_num)
116+
logging.info("[SampleAwaredGraphCompression] add %d TileOp", tiled_num)
119117

120118
class SampleAwaredGraph(object):
121119
# user_tensors: list of common tensor

0 commit comments

Comments
 (0)