Commit 17a838a
andrewjywang and drcege authored

add 3dcnn search (#8)

* 3dcnn: add 3dcnn search
* add 3dcnn mutator: super_res3d_k1dwk1_mutator.py
* fix typo: fix typo in configs

---------

Co-authored-by: Ce Ge <3213204+drcege@users.noreply.github.com>
1 parent 6a7fd19 commit 17a838a

29 files changed: +2844 −5 lines

README.md

+17 −3
@@ -10,14 +10,15 @@
 **:sunny: Hiring research interns for Neural Architecture Search, Tiny Machine Learning, Computer Vision tasks: [xiuyu.sxy@alibaba-inc.com](xiuyu.sxy@alibaba-inc.com)**

 - :boom: 2023.04: We will give a talk on Zero-Cost NAS at [**IFML Workshop**](https://www.ifml.institute/events/ifml-workshop-2023), April 20, 2023.
+- :boom: 2023.03: Code for [**E3D**](configs/action_recognition/README.md) is now released.
 - :boom: 2023.03: The code is refactored and DeepMAD is supported.
 - :boom: 2023.03: [**DeepMAD: Mathematical Architecture Design for Deep Convolutional Neural Network**](https://arxiv.org/abs/2303.02165) is accepted by CVPR'23.
 - :boom: 2023.02: A demo is available on [**ModelScope**](https://modelscope.cn/studios/damo/TinyNAS/summary).
 - :boom: 2023.01: [**Maximizing Spatio-Temporal Entropy of Deep 3D CNNs for Efficient Video Recognition**](https://openreview.net/pdf?id=lj1Eb1OPeNw) is accepted by ICLR'23.
 - :boom: 2022.11: [**DAMO-YOLO**](https://github.com/tinyvision/DAMO-YOLO) backbone search is now supported! The paper is on [arXiv](https://arxiv.org/abs/2211.15444) now.
-- :boom: 2022.09: [**Mixed-Precision Quantization Search**](scripts/quant/README.md) is now supported! The [**QE-Score**](https://openreview.net/pdf?id=E28hy5isRzC) paper is accepted by NeurIPS'22.
+- :boom: 2022.09: [**Mixed-Precision Quantization Search**](configs/quant/README.md) is now supported! The [**QE-Score**](https://openreview.net/pdf?id=E28hy5isRzC) paper is accepted by NeurIPS'22.
 - :boom: 2022.08: We will give a tutorial on [**Functional View for Zero-Shot NAS**](https://mlsys.org/virtual/2022/tutorial/2201) at MLSys'22.
-- :boom: 2022.06: Code for [**MAE-DET**](scripts/detection/README.md) is now released.
+- :boom: 2022.06: Code for [**MAE-DET**](configs/detection/README.md) is now released.
 - :boom: 2022.05: [**MAE-DET**](https://proceedings.mlr.press/v162/sun22c/sun22c.pdf) is accepted by ICML'22.
 - :boom: 2021.09: Code for [**Zen-NAS**](https://github.com/idstcv/ZenNAS) is now released.
 - :boom: 2021.07: The inspiring training-free paper [**Zen-NAS**](https://openaccess.thecvf.com/content/ICCV2021/papers/Lin_Zen-NAS_A_Zero-Shot_NAS_for_High-Performance_Image_Recognition_ICCV_2021_paper.pdf) has been accepted by ICCV'21.
@@ -33,7 +34,8 @@
 - [Budgets module](tinynas/budgets/README.md)
 - [Latency Module](tinynas/latency/op_profiler/README.md)
 - [Population module](tinynas/evolutions/README.md)
-It manages these modules with the help of [ModelScope](https://github.com/modelscope/modelscope) Registry and Configuration mechanism.
+
+It manages these modules with the help of [ModelScope](https://github.com/modelscope/modelscope) Registry and Configuration mechanism.

 - The `Searcher` is responsible for building and running the entire search process. By combining these modules through the corresponding configuration files, we can run backbone search for different tasks (such as classification, detection, etc.) under different budget constraints (such as the number of parameters, FLOPs, latency, etc.); a minimal sketch of this registry-plus-config pattern follows.
@@ -89,6 +91,18 @@
 | MAE-DET-M | 25.8 | 89.9 | 46.9 | 30.1 | 50.9 | 59.9 | [txt](configs/detection/models/maedet_m.txt) | [model](https://idstcv.oss-cn-zhangjiakou.aliyuncs.com/LightNAS/detection/maedet-m/latest.pth) |
 | MAE-DET-L | 43.9 | 152.9 | 47.8 | 30.3 | 51.9 | 61.1 | [txt](configs/detection/models/maedet_l.txt) | [model](https://idstcv.oss-cn-zhangjiakou.aliyuncs.com/LightNAS/detection/maedet-l/latest.pth) |

+***
+## Results for Action Recognition ([Details](configs/action_recognition/README.md))
+
+| Backbone | size | FLOPs (G) | SSV1 Top-1 | SSV1 Top-5 | Structure |
+|:---------:|:-------:|:-------:|:-------:|:-------:|:--------:|
+| X3D-S | 160 | 1.9 | 44.6 | 74.4 | - |
+| X3D-S | 224 | 1.9 | 47.3 | 76.6 | - |
+| E3D-S | 160 | 1.9 | 47.1 | 75.6 | [txt](configs/action_recognition/models/E3D_S.txt) |
+| E3D-M | 224 | 4.7 | 49.4 | 78.1 | [txt](configs/action_recognition/models/E3D_M.txt) |
+| E3D-L | 312 | 18.3 | 51.1 | 78.7 | [txt](configs/action_recognition/models/E3D_L.txt) |
+
+***
 **Note**
 If you find this useful, please support us by citing them.
 ```
@@ -0,0 +1,51 @@
```python
# Copyright (c) Alibaba, Inc. and its affiliates.
# The implementation is also open-sourced by the authors, and available at
# https://github.com/alibaba/lightweight-neural-architecture-search.

work_dir = './save_model/E3DM_FLOPs_185e8/'
log_level = 'INFO'  # INFO/DEBUG/ERROR
log_freq = 1000

""" video config """
image_size = 312
frames = 16

""" Model config """
model = dict(
    type='Cnn3DNet',
    structure_info=[
        {'class': 'Conv3DKXBNRELU', 'in': 3, 'out': 24, 's': 2, 'kt': 1, 'k': 3},
        {'class': 'SuperRes3DK1DWK1', 'in': 24, 'out': 24, 's': 2, 'kt': 1, 'k': 5, 'L': 1, 'btn': 48},
        {'class': 'SuperRes3DK1DWK1', 'in': 24, 'out': 48, 's': 2, 'kt': 3, 'k': 3, 'L': 1, 'btn': 96},
        {'class': 'SuperRes3DK1DWK1', 'in': 48, 'out': 96, 's': 2, 'kt': 3, 'k': 3, 'L': 1, 'btn': 192},
        {'class': 'SuperRes3DK1DWK1', 'in': 96, 'out': 96, 's': 1, 'kt': 3, 'k': 3, 'L': 1, 'btn': 192},
        {'class': 'SuperRes3DK1DWK1', 'in': 96, 'out': 192, 's': 2, 'kt': 3, 'k': 3, 'L': 1, 'btn': 384},
        {'class': 'Conv3DKXBNRELU', 'in': 192, 'out': 512, 's': 1, 'kt': 1, 'k': 1},
    ],
)

""" Budget config """
budgets = [
    dict(type='flops', budget=185e8),
    dict(type='layers', budget=167),
]

""" Score config """
score = dict(type='stentr', multi_block_ratio=[0, 0, 0, 0, 1], frames=16)

""" Space config """
space = dict(
    type='space_3d_k1dwk1',
    image_size=image_size,
)

""" Search config """
search = dict(
    minor_mutation=False,    # whether to fix the stage layers
    minor_iter=100000,       # iteration at which minor_mutation is enabled
    popu_size=256,
    num_random_nets=100000,  # number of search iterations
    sync_size_ratio=1.0,     # per-thread sync count: ratio * popu_size
    num_network=1,
)
```
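Search configs like the one above are plain Python modules, so they can be inspected without the repo's own configuration loader. A small sketch; the file path is this config's assumed location (the file-name header was lost in this view), and the repo's actual loader may differ:

```python
# Sketch: inspect a search config by executing it as a plain Python file.
import runpy

cfg = runpy.run_path('configs/action_recognition/E3D_X3DL_FLOPs.py')  # assumed path
print(cfg['work_dir'])                      # './save_model/E3DM_FLOPs_185e8/'
print(cfg['budgets'])                       # FLOPs and layer-count budgets
print(len(cfg['model']['structure_info']))  # 7 coarse stages in the initial structure
```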
@@ -0,0 +1,51 @@
```python
# Copyright (c) Alibaba, Inc. and its affiliates.
# The implementation is also open-sourced by the authors, and available at
# https://github.com/alibaba/lightweight-neural-architecture-search.

work_dir = './save_model/E3DM_FLOPs_50e8/'
log_level = 'INFO'  # INFO/DEBUG/ERROR
log_freq = 1000

""" video config """
image_size = 224
frames = 16

""" Model config """
model = dict(
    type='Cnn3DNet',
    structure_info=[
        {'class': 'Conv3DKXBNRELU', 'in': 3, 'out': 24, 's': 2, 'kt': 1, 'k': 3},
        {'class': 'SuperRes3DK1DWK1', 'in': 24, 'out': 24, 's': 2, 'kt': 1, 'k': 5, 'L': 1, 'btn': 48},
        {'class': 'SuperRes3DK1DWK1', 'in': 24, 'out': 48, 's': 2, 'kt': 3, 'k': 3, 'L': 1, 'btn': 96},
        {'class': 'SuperRes3DK1DWK1', 'in': 48, 'out': 96, 's': 2, 'kt': 3, 'k': 3, 'L': 1, 'btn': 192},
        {'class': 'SuperRes3DK1DWK1', 'in': 96, 'out': 96, 's': 1, 'kt': 3, 'k': 3, 'L': 1, 'btn': 192},
        {'class': 'SuperRes3DK1DWK1', 'in': 96, 'out': 192, 's': 2, 'kt': 3, 'k': 3, 'L': 1, 'btn': 384},
        {'class': 'Conv3DKXBNRELU', 'in': 192, 'out': 512, 's': 1, 'kt': 1, 'k': 1},
    ],
)

""" Budget config """
budgets = [
    dict(type='flops', budget=50e8),
    dict(type='layers', budget=83),
]

""" Score config """
score = dict(type='stentr', multi_block_ratio=[0, 0, 0, 0, 1], frames=16)

""" Space config """
space = dict(
    type='space_3d_k1dwk1',
    image_size=image_size,
)

""" Search config """
search = dict(
    minor_mutation=False,    # whether to fix the stage layers
    minor_iter=100000,       # iteration at which minor_mutation is enabled
    popu_size=256,
    num_random_nets=100000,  # number of search iterations
    sync_size_ratio=1.0,     # per-thread sync count: ratio * popu_size
    num_network=1,
)
```
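The `budgets` list above gates candidates during evolutionary search: a mutated network is kept only if it satisfies every constraint. A minimal sketch with a hypothetical helper name (the repo's budgets module implements the real version):

```python
# Hypothetical helper illustrating how a budgets list like the one above
# can gate candidates during search (not the repo's API).
def within_budgets(stats, budgets):
    """stats: measured values for a candidate, e.g. {'flops': 4.7e9, 'layers': 80}."""
    return all(stats[b['type']] <= b['budget'] for b in budgets)

budgets = [dict(type='flops', budget=50e8), dict(type='layers', budget=83)]
print(within_budgets({'flops': 4.7e9, 'layers': 80}, budgets))  # True
print(within_budgets({'flops': 5.3e9, 'layers': 80}, budgets))  # False: exceeds 50e8 FLOPs
```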
@@ -0,0 +1,51 @@
```python
# Copyright (c) Alibaba, Inc. and its affiliates.
# The implementation is also open-sourced by the authors, and available at
# https://github.com/alibaba/lightweight-neural-architecture-search.

work_dir = './save_model/E3DS_FLOPs_20e8/'
log_level = 'INFO'  # INFO/DEBUG/ERROR
log_freq = 1000

""" video config """
image_size = 160
frames = 13

""" Model config """
model = dict(
    type='Cnn3DNet',
    structure_info=[
        {'class': 'Conv3DKXBNRELU', 'in': 3, 'out': 24, 's': 2, 'kt': 1, 'k': 3},
        {'class': 'SuperRes3DK1DWK1', 'in': 24, 'out': 24, 's': 2, 'kt': 1, 'k': 5, 'L': 1, 'btn': 48},
        {'class': 'SuperRes3DK1DWK1', 'in': 24, 'out': 48, 's': 2, 'kt': 3, 'k': 3, 'L': 1, 'btn': 96},
        {'class': 'SuperRes3DK1DWK1', 'in': 48, 'out': 96, 's': 2, 'kt': 3, 'k': 3, 'L': 1, 'btn': 192},
        {'class': 'SuperRes3DK1DWK1', 'in': 96, 'out': 96, 's': 1, 'kt': 3, 'k': 3, 'L': 1, 'btn': 192},
        {'class': 'SuperRes3DK1DWK1', 'in': 96, 'out': 192, 's': 2, 'kt': 3, 'k': 3, 'L': 1, 'btn': 384},
        {'class': 'Conv3DKXBNRELU', 'in': 192, 'out': 512, 's': 1, 'kt': 1, 'k': 1},
    ],
)

""" Budget config """
budgets = [
    dict(type='flops', budget=20e8),
    dict(type='layers', budget=83),
]

""" Score config """
score = dict(type='stentr', multi_block_ratio=[0, 0, 0, 0, 1], frames=13)

""" Space config """
space = dict(
    type='space_3d_k1dwk1',
    image_size=image_size,
)

""" Search config """
search = dict(
    minor_mutation=False,    # whether to fix the stage layers
    minor_iter=500000,       # iteration at which minor_mutation is enabled
    popu_size=256,
    num_random_nets=500000,  # number of search iterations
    sync_size_ratio=1.0,     # per-thread sync count: ratio * popu_size
    num_network=1,
)
```
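The three configs above differ only in input resolution, clip length, and budgets; the initial structure, search space, and score are shared. A short summary, with the caps copied from the configs, the GFLOPs from the results tables, and the S/M/L mapping inferred from the matching input sizes:

```python
# Values copied from the three search configs and the README results table;
# the E3D-S/M/L labels are inferred from the matching input sizes.
targets = {
    'E3D-S (160px)': dict(frames=13, flops_cap=20e8,  layers=83,  reported_gflops=1.9),
    'E3D-M (224px)': dict(frames=16, flops_cap=50e8,  layers=83,  reported_gflops=4.7),
    'E3D-L (312px)': dict(frames=16, flops_cap=185e8, layers=167, reported_gflops=18.3),
}
for name, t in targets.items():
    assert t['reported_gflops'] * 1e9 <= t['flops_cap']  # each searched net fits its cap
    print(f"{name}: {t['frames']} frames, cap {t['flops_cap'] / 1e9:.1f} GFLOPs, "
          f"<= {t['layers']} layers")
```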

configs/action_recognition/README.md

+58
@@ -0,0 +1,58 @@
## Abstract

* **Instruction**

  We search efficient E3D backbones for action recognition; E3D-S/M/L are aligned with X3D-S/M/L.

* **Use the searching configs for action recognition**

  ```shell
  sh tools/dist_search.sh configs/E3D_X3DS_FLOPs.py
  ```

  **`E3D_X3DS_FLOPs.py` is the config for searching an X3D-S-like model within a FLOPs budget using the STEntr score.**

  **`E3D_X3DM_FLOPs.py` is the config for searching an X3D-M-like model within a FLOPs budget using the STEntr score.**

  **`E3D_X3DL_FLOPs.py` is the config for searching an X3D-L-like model within a FLOPs budget using the STEntr score.**

* **Use searched models in your own training pipeline**

  **Copy `tinynas/deploy/cnn3dnet` to your pipeline, then:**

  ```python
  from cnn3dnet import Cnn3DNet

  # for classification
  model = Cnn3DNet(num_classes=classes,
                   structure_txt=structure_txt,
                   out_indices=(4,),
                   classfication=True)

  # to load a pretrained model
  model.init_weights(pretrained=pretrained_pth)
  ```

***

## Results on Sth-Sth V1

| Backbone | size | FLOPs (G) | Top-1 | Top-5 | Structure |
|:---------:|:-------:|:-------:|:-------:|:-------:|:--------:|
| E3D-S | 160 | 1.9 | 47.1 | 75.6 | [txt](models/E3D_S.txt) |
| E3D-M | 224 | 4.7 | 49.4 | 78.1 | [txt](models/E3D_M.txt) |
| E3D-L | 312 | 18.3 | 51.1 | 78.7 | [txt](models/E3D_L.txt) |

***

## Citation

If you find this toolbox useful, please support us by citing this work:

```
@inproceedings{iclr23maxste,
  title     = {Maximizing Spatio-Temporal Entropy of Deep 3D CNNs for Efficient Video Recognition},
  author    = {Junyan Wang and Zhenhong Sun and Yichen Qian and Dong Gong and Xiuyu Sun and Ming Lin and Maurice Pagnucco and Yang Song},
  booktitle = {International Conference on Learning Representations},
  year      = {2023},
}
```
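For a quick smoke test after deployment, a hedged sketch with a dummy clip: the tensor layout `(batch, channels, frames, height, width)` follows the usual 3D-CNN convention and the E3D-M setting above (16 frames at 224x224), but the exact forward signature of `Cnn3DNet` is an assumption here, not confirmed by the source.

```python
# Hedged smoke-test sketch (assumed forward signature and input layout).
import torch
from cnn3dnet import Cnn3DNet  # after copying tinynas/deploy/cnn3dnet (see above)

model = Cnn3DNet(num_classes=174,  # Sth-Sth V1 has 174 classes
                 structure_txt='configs/action_recognition/models/E3D_M.txt',
                 out_indices=(4,),
                 classfication=True)
model.eval()

dummy_clip = torch.randn(1, 3, 16, 224, 224)  # (N, C, T, H, W) for the E3D-M input size
with torch.no_grad():
    out = model(dummy_clip)
```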
@@ -0,0 +1,48 @@
```python
{'best_structures': [[
    {'class': 'Conv3DKXBNRELU', 'in': 3, 'k': 3, 'kt': 1, 'out': 24, 's': 2},
    {'L': 3, 'btn': 32, 'class': 'SuperRes3DK1DWK1', 'in': 24,
     'inner_class': 'Res3DK1DWK1', 'k': 5, 'kt': 1, 'out': 24, 's': 2},
    {'L': 13, 'btn': 120, 'class': 'SuperRes3DK1DWK1', 'in': 24,
     'inner_class': 'Res3DK1DWK1', 'k': 3, 'kt': 3, 'out': 48, 's': 2},
    {'L': 13, 'btn': 176, 'class': 'SuperRes3DK1DWK1', 'in': 48,
     'inner_class': 'Res3DK1DWK1', 'k': 3, 'kt': 3, 'out': 120, 's': 2},
    {'L': 13, 'btn': 176, 'class': 'SuperRes3DK1DWK1', 'in': 120,
     'inner_class': 'Res3DK1DWK1', 'k': 3, 'kt': 3, 'out': 120, 's': 1},
    {'L': 13, 'btn': 480, 'class': 'SuperRes3DK1DWK1', 'in': 120,
     'inner_class': 'Res3DK1DWK1', 'k': 3, 'kt': 3, 'out': 192, 's': 2},
    {'class': 'Conv3DKXBNRELU', 'in': 192, 'k': 1, 'kt': 1, 'out': 512, 's': 1}]],
 'space_arch': 'Cnn3DNet'}
```
@@ -0,0 +1,49 @@
```python
{'best_structures': [[
    {'class': 'Conv3DKXBNRELU', 'in': 3, 'k': 3, 'kt': 1, 'out': 24, 's': 2},
    {'L': 3, 'btn': 32, 'class': 'SuperRes3DK1DWK1', 'in': 24,
     'inner_class': 'Res3DK1DWK1', 'k': 5, 'kt': 1, 'out': 24, 's': 2},
    {'L': 6, 'btn': 96, 'class': 'SuperRes3DK1DWK1', 'in': 24,
     'inner_class': 'Res3DK1DWK1', 'k': 3, 'kt': 3, 'out': 64, 's': 2},
    {'L': 6, 'btn': 176, 'class': 'SuperRes3DK1DWK1', 'in': 64,
     'inner_class': 'Res3DK1DWK1', 'k': 3, 'kt': 3, 'out': 120, 's': 2},
    {'L': 6, 'btn': 176, 'class': 'SuperRes3DK1DWK1', 'in': 120,
     'inner_class': 'Res3DK1DWK1', 'k': 3, 'kt': 3, 'out': 120, 's': 1},
    {'L': 6, 'btn': 464, 'class': 'SuperRes3DK1DWK1', 'in': 120,
     'inner_class': 'Res3DK1DWK1', 'k': 3, 'kt': 3, 'out': 184, 's': 2},
    {'class': 'Conv3DKXBNRELU', 'in': 184, 'k': 1, 'kt': 1, 'out': 512, 's': 1}]],
 'space_arch': 'Cnn3DNet'}
```
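These structure files are Python dict literals rather than JSON (note the single-quoted keys), so `ast.literal_eval` from the standard library is a safe way to load one. The path below is one of the files linked from the results table:

```python
# Sketch: load a searched structure file (a Python dict literal, not JSON).
import ast

with open('configs/action_recognition/models/E3D_M.txt') as f:
    arch = ast.literal_eval(f.read())

blocks = arch['best_structures'][0]
print(arch['space_arch'])                  # 'Cnn3DNet'
print(sum(b.get('L', 1) for b in blocks))  # rough depth: sum of per-stage repeats
```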
