
Commit 29a1de3

Add vsr (#61)
* add node not found error
* demux example
* feat(application): add basicVSR
* style(basicVSR): lint
* improvement(vsr): update result

Co-authored-by: MegEngine <[email protected]>
1 parent 44151c2 commit 29a1de3

16 files changed: +480 -19 lines changed

docs/download-models.zh.md

+6-7

````diff
@@ -1,16 +1,15 @@
-# Model Download
+# Model and Test Data Download
 
-All MegFlow models are compressed into a single models.zip.
-
-| cloud drive | google drive |
-| - | - |
-| link: https://pan.baidu.com/s/1ZLVBR0igJ1hL6PoYQDtByA  code: 8ajf | [google](https://drive.google.com/file/d/1EwMJFjNp2kuNglutoleZOVsqccSOW2Z4/view?usp=sharing) |
+| application | cloud drive | google drive |
+| - | - | - |
+| cat fence, e-bike detection | link: https://pan.baidu.com/s/1ZLVBR0igJ1hL6PoYQDtByA  code: 8ajf | [google](https://drive.google.com/file/d/1EwMJFjNp2kuNglutoleZOVsqccSOW2Z4/view?usp=sharing) |
+| video super-resolution | link: https://pan.baidu.com/s/131Ul2A9DNxTXbatO1SGKFg?pwd=viy5  code: viy5 | [google](https://drive.google.com/file/d/1oyrVL20MODJOSf7BJ9T5OioE-ZaARDBC/view?usp=sharing) |
 
 Get the latest models_xxx.zip, unzip it, and symlink it as examples/models
 
 ```bash
 $ wget ${URL}/models.zip
-$ cd flow-python/examples
+$ cd flow-python/examples/application
 $ ln -s ${DOWNLOAD_DIR}/models models
 ```
 
````

flow-python/examples/application/cat_finder/README.md

+3-2

````diff
@@ -95,7 +95,9 @@ $ megflow_run -c cat_finder/video_cpu.toml -p cat_finder # for devices without a GPU
 
 Opening one video-stream parsing session needs the stream's url; there are two ways to provide it:
 
-1) Prepare an rtsp video stream address as test input (if deploying a stream address is inconvenient, an offline file's absolute path also works). The model package provides test videos in `models/cat_finder_testdata`; you need to deploy a live555 server yourself. The most direct way:
+1) Offline file. Enter a path like `/mnt/data/stream/file.ts` in the WebUI. Make sure the server can access the file and that its format can be parsed by ffmpeg (e.g. .ts/.mp4/.h264/.h265).
+
+2) Online stream. Prepare an rtsp video stream address as test input. The model package provides test videos in `models/cat_finder_testdata`; you need to deploy a live555 server yourself. The most direct way:
 ```bash
 $ wget https://github.com/aler9/rtsp-simple-server/releases/download/v0.17.2/rtsp-simple-server_v0.17.2_linux_amd64.tar.gz
 $
@@ -108,7 +110,6 @@ $ ffmpeg -re -stream_loop -1 -i ${models}/cat_finder_testdata/test1.ts -c copy -
 
 The related tutorial is consolidated in [how to generate your own rtsp stream address](../../../../docs/02-how-to-run/generate-rtsp.zh.md)
 
-2) If deploying an rtsp stream address is inconvenient, an offline file's absolute path also works, i.e. enter a path like `/mnt/data/stream/file.ts` in the WebUI. Make sure the server can access the file and that its format can be parsed by ffmpeg (e.g. .ts/.mp4/.h264/.h265).
 
 ## VI. Video Recognition FAQ
````
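Since the offline-file option depends on ffmpeg being able to parse the file, a quick pre-check can save a round trip through the WebUI. A minimal sketch, assuming `ffprobe` (shipped with ffmpeg) is on PATH; the sample path is a stand-in:

```python
# quick check that an offline file is ffmpeg-parseable before using it
# as a stream substitute (assumes ffprobe is installed and on PATH)
import subprocess
import sys

path = "/mnt/data/stream/file.ts"  # hypothetical path, as in the README
proc = subprocess.run(
    ["ffprobe", "-v", "error", "-show_format", "-show_streams", path],
    capture_output=True, text=True)
if proc.returncode != 0:
    sys.exit(f"ffmpeg cannot parse {path}: {proc.stderr.strip()}")
print("ok:", path)
```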

flow-python/examples/application/video_super_resolution/README.md

+32

@@ -0,0 +1,32 @@

# Real-Time Video Super-Resolution

## I. [Download the model and test data](../../../../docs/download-models.zh.md)

## II. Run

After symlinking the models, launch with `megflow_run`:

```bash
$ cd ${path/to/MegFlow}/flow-python/examples/application # this line is required
$ megflow_run -c video_super_resolution/config.toml -p video_super_resolution
```

Open [port 8087](http://10.122.101.175:8087/docs#/default/post_start__url_) in a browser and "try it out":

1) Upload `a.mp4` from the test data to get a stream_id.

2) Use the stream_id to query which file the result was saved to, e.g. kj2WAS.flv. (A scripted version of both steps is sketched below.)
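A minimal scripted equivalent, assuming the service runs locally on port 8087 and exposes the `POST /start/{url}` route shown in the swagger link above; the exact response body is not pinned down by this commit, so it is only printed:

```python
# submit a server-visible video file to the VSR service and print the
# response; BASE and the video path are illustrative assumptions
import urllib.parse

import requests

BASE = "http://127.0.0.1:8087"
video = "/mnt/data/stream/a.mp4"  # must be readable by the server

resp = requests.post(f"{BASE}/start/{urllib.parse.quote(video, safe='')}")
resp.raise_for_status()
print(resp.text)  # response = "json" in config.toml, carries the stream_id
```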
## III. How to use your own model

The super-resolution model is trained with [basicVSR_mge](https://github.com/Feynman1999/basicVSR_mge). Once training is done, cherry-pick [this PR](https://github.com/Feynman1999/basicVSR_mge/pull/6), then jit.trace the model into a pure-inference format:

```bash
$ cd ${path/to/basicVSR_mge}
$ python3 tools/dump.py configs/restorers/BasicVSR/basicVSR_test_valid.py
```
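For orientation, tracing and dumping with MegEngine's `jit.trace` generally follows the sketch below; `tools/dump.py` is the authoritative script, and the stand-in `flownet` and shapes here are illustrative. The `arg_names` must match the tensor names that `lite.py` later fetches with `get_io_tensor` (`tenFirst`/`tenSecond`):

```python
# hedged sketch of jit.trace dumping; `flownet` is a stand-in for the
# trained flow network from basicVSR_mge
import numpy as np
import megengine as mge
from megengine import jit


def flownet(first, second):  # stand-in, replace with the real module
    return first - second


@jit.trace(capture_as_const=True)
def infer(first, second):
    return flownet(first, second)


# trace once with representative shapes, then dump a pure-inference graph
x = mge.tensor(np.random.rand(1, 3, 180, 320).astype("float32"))
infer(x, x)
infer.dump("flownet.mge", arg_names=["tenFirst", "tenSecond"])
```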
## IV. Miscellaneous

When constructing test input, **mind the video quality**, e.g.

```bash
$ ffmpeg -i images/%08d.png -q:v 2 -vcodec mpeg4 -r 20 a.mp4
```
flow-python/examples/application/video_super_resolution/__init__.py

+10

@@ -0,0 +1,10 @@

```python
# MegFlow is Licensed under the Apache License, Version 2.0 (the "License")
#
# Copyright (c) 2019-2021 Megvii Inc. All rights reserved.
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

#!/usr/bin/env python
# coding=utf-8
```
flow-python/examples/application/video_super_resolution/config.toml

+38

@@ -0,0 +1,38 @@

```toml
main = "vsr"

[[graphs]]
name = "subgraph"
inputs = [{ name = "inp", cap = 128, ports = ["model:inp"] }]
outputs = [{ name = "out", cap = 128, ports = ["save:out"] }]
connections = [
    { cap = 128, ports = ["model:out", "save:inp"] }
]

[[graphs.nodes]]
name = "model"
ty = "Model"
dir = "models/vsr_models"
device = "gpu"
device_id = 0

[[graphs.nodes]]
name = "save"
ty = "Save"
path = "./"

[[graphs]]
name = "vsr"
connections = [
    { cap = 16, ports = ["source:out", "destination:inp"] },
    { cap = 16, ports = ["source:inp", "destination:out"] }
]

[[graphs.nodes]]
name = "source"
ty = "VideoServer"
port = 8087
response = "json"

[[graphs.nodes]]
name = "destination"
ty = "subgraph"
```
flow-python/examples/application/video_super_resolution/lite.py

+194

@@ -0,0 +1,194 @@

```python
# MegFlow is Licensed under the Apache License, Version 2.0 (the "License")
#
# Copyright (c) 2019-2021 Megvii Inc. All rights reserved.
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

#!/usr/bin/env python
# coding=utf-8

import argparse
import os
import time

import cv2
import numpy as np
import megenginelite as mgelite


class PredictorLite:
    def load(self, fullpath, config, device_id):
        net = mgelite.LiteNetwork(config=config)
        net.device_id = device_id
        print(fullpath)
        net.load(fullpath)
        return net

    def __init__(self, path, device="gpu", device_id=0):
        if "gpu" in device.lower():
            device_type = mgelite.LiteDeviceType.LITE_CUDA
        else:
            device_type = mgelite.LiteDeviceType.LITE_CPU
        net_config = mgelite.LiteConfig(device_type=device_type)

        # basicVSR is split into three traced networks: optical flow,
        # hidden-state generator and the final upsampler
        self.flownet = self.load(os.path.join(path, "flownet.mge"),
                                 net_config, device_id)
        self.gen = self.load(os.path.join(path, "generator.mge"), net_config,
                             device_id)
        self.upsample = self.load(os.path.join(path, "upsample.mge"),
                                  net_config, device_id)
        self.HIDDEN_CHANNELS = 96
        print("basicVSR model loaded.")

    def get_bilinear(self, image):
        # 4x bilinear upsample of every frame with OpenCV; the network
        # output is later added to this as a residual
        B, T, C, h, w = image.shape
        image = image.reshape(-1, C, h, w)
        ret = np.zeros((image.shape[0], C, 4 * h, 4 * w), dtype=np.float32)
        for i in range(image.shape[0]):
            chw = image[i:i + 1].reshape(C, h, w)
            hwc = np.transpose(chw, (1, 2, 0))
            hwc = cv2.resize(hwc, (w * 4, h * 4))
            ret[i:i + 1] = np.transpose(hwc, (2, 0, 1))
        ret = ret.reshape(B, T, C, h * 4, w * 4)
        return ret

    def inference_flownet(self, now_frame, ref):
        begin = time.time()

        data0 = self.flownet.get_io_tensor("tenFirst")
        data0.set_data_by_share(now_frame)

        data1 = self.flownet.get_io_tensor("tenSecond")
        data1.set_data_by_share(ref)
        self.flownet.forward()
        self.flownet.wait()

        tensor = self.flownet.get_io_tensor(
            self.flownet.get_all_output_name()[0])
        timecost = (time.time() - begin) * 1000
        print(f"flownet timecost {timecost:.1f} ms")
        return tensor.to_numpy()

    def inference_gen(self, hidden, flow, now_frame):
        begin = time.time()

        data0 = self.gen.get_io_tensor("hidden")
        data0.set_data_by_share(hidden)

        data1 = self.gen.get_io_tensor("flow")
        data1.set_data_by_share(flow)

        data2 = self.gen.get_io_tensor("nowFrame")
        data2.set_data_by_share(now_frame)

        self.gen.forward()
        self.gen.wait()

        tensor = self.gen.get_io_tensor(self.gen.get_all_output_name()[0])
        timecost = (time.time() - begin) * 1000
        print(f"gen timecost {timecost:.1f} ms")
        return tensor.to_numpy()

    def inference_upsample(self, forward_hidden, backward_hidden):
        begin = time.time()

        data0 = self.upsample.get_io_tensor("forward_hidden")
        data0.set_data_by_share(forward_hidden)

        data1 = self.upsample.get_io_tensor("backward_hidden")
        data1.set_data_by_share(backward_hidden)

        self.upsample.forward()
        self.upsample.wait()

        tensor = self.upsample.get_io_tensor(
            self.upsample.get_all_output_name()[0])
        timecost = (time.time() - begin) * 1000
        print(f"upsample timecost {timecost:.1f} ms")
        return tensor.to_numpy()

    # input: [T, 3, h, w] uint8 RGB frames; returns T BGR HWC images,
    # upsampled 4x
    def inference(self, frames):
        frames = frames.astype(np.float32) / 255.0
        frames = np.expand_dims(frames, axis=0)  # e.g. [1,100,3,180,320]

        image = np.ascontiguousarray(frames, np.float32)

        B, T, _, h, w = image.shape
        biup = self.get_bilinear(image)
        forward_hiddens = []
        backward_hiddens = []
        res = []
        # forward and backward passes share one batch: the first B rows
        # walk the sequence forwards, the last B rows walk it backwards
        hidden = np.zeros((2 * B, self.HIDDEN_CHANNELS, h, w),
                          dtype=np.float32)
        for i in range(T):
            now_frame = np.concatenate(
                [image[:, i, ...], image[:, T - i - 1, ...]], axis=0)
            if i == 0:
                flow = self.inference_flownet(now_frame, now_frame)
            else:
                ref = np.concatenate(
                    [image[:, i - 1, ...], image[:, T - i, ...]], axis=0)
                flow = self.inference_flownet(now_frame, ref)

            hidden = self.inference_gen(hidden, flow, now_frame)
            forward_hiddens.append(hidden[0:B, ...])
            backward_hiddens.append(hidden[B:2 * B, ...])

        # fuse the forward hidden state of frame i with the backward
        # hidden state of the same frame (stored in reverse order)
        for i in range(T):
            res.append(
                self.inference_upsample(forward_hiddens[i],
                                        backward_hiddens[T - i - 1]))

        res = np.stack(res, axis=1)  # [B,T,3,H,W]
        HR_G = res + biup  # network output is a residual over bilinear
        HR_G = (np.clip(HR_G, a_min=0.0, a_max=1.0) * 255.0).round().astype(
            np.uint8)

        ret = []
        for i in range(T):
            x = HR_G[0, i, ...]
            # RGB CHW -> BGR HWC for cv2.imwrite
            img_np = np.transpose(x[[2, 1, 0], :, :], (1, 2, 0))
            ret.append(img_np)
        return ret


def make_parser():
    parser = argparse.ArgumentParser("ModelServing Demo!")
    parser.add_argument("--model",
                        default=None,
                        type=str,
                        help=".mge for eval")
    return parser


if __name__ == "__main__":
    # offline smoke test: read ./images/* as one sequence, run the
    # predictor and dump the upsampled frames next to the script
    imagelist = []
    for parent, _, filenames in os.walk("images"):
        filenames.sort()
        for filename in filenames:
            mat = cv2.imread(os.path.join(parent, filename))
            if mat is None:
                continue
            print(filename)
            mat = cv2.cvtColor(mat, cv2.COLOR_BGR2RGB)
            mat = np.transpose(mat, (2, 0, 1))  # HWC -> CHW
            imagelist.append(np.expand_dims(mat, axis=0))
    batchdata = np.concatenate(imagelist, axis=0)

    predictor = PredictorLite("./")
    result = predictor.inference(batchdata)
    assert len(result) == batchdata.shape[0]

    for idx, image in enumerate(result):
        cv2.imwrite(f"{idx}.jpg", image)
```
