thuml
diff --git a/‎examples/domain_adaptation/image_classification/README.md
+20-18 b/‎examples/domain_adaptation/image_classification/README.md
+20-18
diff --git a/‎examples/domain_adaptation/image_classification/adda.py
+8-2 b/‎examples/domain_adaptation/image_classification/adda.py
+8-2
diff --git a/‎examples/domain_adaptation/image_classification/bsp.py
+8-3 b/‎examples/domain_adaptation/image_classification/bsp.py
+8-3
diff --git a/‎examples/domain_adaptation/image_classification/cdan.py
+6-2 b/‎examples/domain_adaptation/image_classification/cdan.py
+6-2
diff --git a/‎examples/domain_adaptation/image_classification/dan.py
+7-4 b/‎examples/domain_adaptation/image_classification/dan.py
+7-4
diff --git a/‎examples/domain_adaptation/image_classification/dann.py
+8-5 b/‎examples/domain_adaptation/image_classification/dann.py
+8-5
diff --git a/‎examples/domain_adaptation/image_classification/erm.py
+6-2 b/‎examples/domain_adaptation/image_classification/erm.py
+6-2
@@ -1,10 +1,11 @@
 # Unsupervised Domain Adaptation for Image Classification
 
 ## Installation
+
 It’s suggested to use **pytorch==1.7.1** and torchvision==0.8.2 in order to reproduce the benchmark results.
 
-Example scripts support all models in [PyTorch-Image-Models](https://github.com/rwightman/pytorch-image-models).
-You also need to install timm to use PyTorch-Image-Models.
+Example scripts support all models in [PyTorch-Image-Models](https://github.com/rwightman/pytorch-image-models). You
+also need to install timm to use PyTorch-Image-Models.
 
 ```
 pip install timm
@@ -14,19 +15,22 @@ pip install timm
 
 The following datasets can be downloaded automatically:
 
-- [MNIST](http://yann.lecun.com/exdb/mnist/), [SVHN](http://ufldl.stanford.edu/housenumbers/), [USPS](https://www.csie.ntu.edu.tw/~cjlin/libsvmtools/datasets/multiclass.html#usps) 
+- [MNIST](http://yann.lecun.com/exdb/mnist/), [SVHN](http://ufldl.stanford.edu/housenumbers/)
+  , [USPS](https://www.csie.ntu.edu.tw/~cjlin/libsvmtools/datasets/multiclass.html#usps)
 - [Office31](https://www.cc.gatech.edu/~judy/domainadapt/)
 - [OfficeCaltech](https://www.cc.gatech.edu/~judy/domainadapt/)
 - [OfficeHome](https://www.hemanthdv.org/officeHomeDataset.html)
 - [VisDA2017](http://ai.bu.edu/visda-2017/)
 - [DomainNet](http://ai.bu.edu/M3SDA/)
 
 You need to prepare the following datasets manually if you want to use them:
+
 - [ImageNet](https://www.image-net.org/)
 - [ImageNetR](https://github.com/hendrycks/imagenet-r)
 - [ImageNet-Sketch](https://github.com/HaohanWang/ImageNet-Sketch)
 
-and prepare them following [Documentation for ImageNetR](/common/vision/datasets/imagenet_r.py) and [ImageNet-Sketch](/common/vision/datasets/imagenet_sketch.py).
+and prepare them following [Documentation for ImageNetR](/common/vision/datasets/imagenet_r.py)
+and [ImageNet-Sketch](/common/vision/datasets/imagenet_sketch.py).
 
 ## Supported Methods
 
@@ -45,8 +49,8 @@ Supported methods include:
 
 ## Usage
 
-The shell files give the script to reproduce the benchmark with specified hyper-parameters.
-For example, if you want to train DANN on Office31, use the following script
+The shell files give the script to reproduce the benchmark with specified hyper-parameters. For example, if you want to
+train DANN on Office31, use the following script
 
 ```shell script
 # Train a DANN on Office-31 Amazon -> Webcam task using ResNet 50.
@@ -55,16 +59,17 @@ For example, if you want to train DANN on Office31, use the following script
 CUDA_VISIBLE_DEVICES=0 python dann.py data/office31 -d Office31 -s A -t W -a resnet50 --epochs 20 --seed 1 --log logs/dann/Office31_A2W
 ```
 
-Note that ``-s`` specifies the source domain, ``-t`` specifies the target domain, and ``--log`` specifies where to store results.
+Note that ``-s`` specifies the source domain, ``-t`` specifies the target domain, and ``--log`` specifies where to store
+results.
 
-After running the above command, it will download ``Office-31`` datasets from the Internet if it's the first time you run the code. Directory that stores datasets will be named as
+After running the above command, it will download ``Office-31`` datasets from the Internet if it's the first time you
+run the code. The directory that stores the datasets will be named
 ``examples/domain_adaptation/image_classification/data/<dataset name>``.
 
 If everything works fine, you will see results in the following format:
 
     Epoch: [1][ 900/1000]	Time  0.60 ( 0.69)	Data  0.22 ( 0.31)	Loss   0.74 (  0.85)	Cls Acc 96.9 (95.1)	Domain Acc 64.1 (62.6)
 
-
 You can also watch these results in the log file ``logs/dann/Office31_A2W/log.txt``.
 
 After training, you can test your algorithm's performance by passing in ``--phase test``.
@@ -73,21 +78,19 @@ After training, you can test your algorithm's performance by passing in ``--phas
 CUDA_VISIBLE_DEVICES=0 python dann.py data/office31 -d Office31 -s A -t W -a resnet50 --epochs 20 --seed 1 --log logs/dann/Office31_A2W --phase test
 ```
 
-
 ## Experiment and Results
 
 **Notations**
+
 - ``Origin`` means the accuracy reported by the original paper.
 - ``Avg`` is the accuracy reported by `TLlib`.
 - ``ERM`` refers to the model trained with data from the source domain.
 - ``Oracle`` refers to the model trained with data from the target domain.
 
-
-We found that the accuracies of adversarial methods (including DANN, ADDA, CDAN, MCD, BSP and MDD) are not stable
-even after the random seed is fixed, thus we repeat running adversarial methods on *Office-31* and *VisDA-2017*
+We found that the accuracies of adversarial methods (including DANN, ADDA, CDAN, MCD, BSP and MDD) are not stable even
+after the random seed is fixed, so we run the adversarial methods on *Office-31* and *VisDA-2017*
 three times and report their average accuracy.
 
-
 ### Office-31 accuracy on ResNet-50
 
 | Methods | Origin | Avg  | A → W | D → W | W → D | A → D | D → A | W → A |
@@ -162,8 +165,8 @@ for three times and report their average accuracy.
 | MDD         | 42.9 | 59.5 | 47.5 | 48.6 | 59.4 | 42.6 | 58.3 | 53.7 | 46.2 | 58.7 | 46.5 | 57.7 | 51.8 |
 | MCC         | 37.7 | 55.7 | 42.6 | 45.4 | 59.8 | 39.9 | 54.4 | 53.1 | 37.0 | 58.1 | 46.3 | 56.2 | 48.9 |
 
-
 ### DomainNet accuracy on ResNet-101 (Multi-Source)
+
 | Methods     | Origin | Avg  | :c   | :i   | :p   | :q   | :r   | :s   |
 |-------------|--------|------|------|------|------|------|------|------|
 | ERM         | 32.9   | 47.0 | 64.9 | 25.2 | 54.4 | 16.9 | 68.2 | 52.3 |
@@ -185,7 +188,6 @@ for three times and report their average accuracy.
 
 ## Visualization
 
-
 After training `DANN`, run the following command
 
 ```
@@ -200,15 +202,15 @@ Following are the t-SNE of representations from ResNet50 trained on source domai
 <img src="./fig/resnet_A2W.png" width="300"/>
 <img src="./fig/dann_A2W.png" width="300"/>
 
-
 ## TODO
+
 1. Support self-training methods
 2. Support translation methods
 3. Add results on ViT
 4. Add results on ImageNet
-5. Add more data augmentation options
 
 ## Citation
+
 If you use these methods in your research, please consider citing.
 
 ```
 
@@ -58,7 +58,8 @@ def main(args: argparse.Namespace):
     cudnn.benchmark = True
 
     # Data loading code
-    train_transform = utils.get_train_transform(args.train_resizing, random_horizontal_flip=not args.no_hflip,
+    train_transform = utils.get_train_transform(args.train_resizing, scale=args.scale, ratio=args.ratio,
+                                                random_horizontal_flip=not args.no_hflip,
                                                 random_color_jitter=False, resize_size=args.resize_size,
                                                 norm_mean=args.norm_mean, norm_std=args.norm_std)
     val_transform = utils.get_val_transform(args.val_resizing, resize_size=args.resize_size,
@@ -100,7 +101,8 @@ def main(args: argparse.Namespace):
         for epoch in range(args.pretrain_epochs):
             print("lr:", pretrain_lr_scheduler.get_lr())
             # pretrain for one epoch
-            utils.empirical_risk_minimization(train_source_iter, pretrain_model, pretrain_optimizer, pretrain_lr_scheduler, epoch, args,
+            utils.empirical_risk_minimization(train_source_iter, pretrain_model, pretrain_optimizer,
+                                              pretrain_lr_scheduler, epoch, args,
                                               device)
             # validate to show pretrain process
             utils.validate(val_loader, pretrain_model, args, device)
@@ -244,6 +246,10 @@ def train(train_source_iter: ForeverDataIterator, train_target_iter: ForeverData
     parser.add_argument('--val-resizing', type=str, default='default')
     parser.add_argument('--resize-size', type=int, default=224,
                         help='the image size after resizing')
+    parser.add_argument('--scale', type=float, nargs='+', default=[0.08, 1.0], metavar='PCT',
+                        help='Random resize scale (default: 0.08 1.0)')
+    parser.add_argument('--ratio', type=float, nargs='+', default=[3. / 4., 4. / 3.], metavar='RATIO',
+                        help='Random resize aspect ratio (default: 0.75 1.33)')
     parser.add_argument('--no-hflip', action='store_true',
                         help='no random horizontal flipping during training')
     parser.add_argument('--norm-mean', type=float, nargs='+',
 
@@ -28,7 +28,6 @@
 from tllib.utils.logger import CompleteLogger
 from tllib.utils.analysis import collect_feature, tsne, a_distance
 
-
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 
 
@@ -49,7 +48,8 @@ def main(args: argparse.Namespace):
     cudnn.benchmark = True
 
     # Data loading code
-    train_transform = utils.get_train_transform(args.train_resizing, random_horizontal_flip=not args.no_hflip,
+    train_transform = utils.get_train_transform(args.train_resizing, scale=args.scale, ratio=args.ratio,
+                                                random_horizontal_flip=not args.no_hflip,
                                                 random_color_jitter=False, resize_size=args.resize_size,
                                                 norm_mean=args.norm_mean, norm_std=args.norm_std)
     val_transform = utils.get_val_transform(args.val_resizing, resize_size=args.resize_size,
@@ -126,7 +126,8 @@ def main(args: argparse.Namespace):
         for epoch in range(args.pretrain_epochs):
             print("lr:", pretrain_lr_scheduler.get_lr())
             # pretrain for one epoch
-            utils.empirical_risk_minimization(train_source_iter, pretrain_model, pretrain_optimizer, pretrain_lr_scheduler, epoch, args,
+            utils.empirical_risk_minimization(train_source_iter, pretrain_model, pretrain_optimizer,
+                                              pretrain_lr_scheduler, epoch, args,
                                               device)
             # validate to show pretrain process
             utils.validate(val_loader, pretrain_model, args, device)
@@ -237,6 +238,10 @@ def train(train_source_iter: ForeverDataIterator, train_target_iter: ForeverData
     parser.add_argument('-t', '--target', help='target domain(s)', nargs='+')
     parser.add_argument('--train-resizing', type=str, default='default')
     parser.add_argument('--val-resizing', type=str, default='default')
+    parser.add_argument('--scale', type=float, nargs='+', default=[0.08, 1.0], metavar='PCT',
+                        help='Random resize scale (default: 0.08 1.0)')
+    parser.add_argument('--ratio', type=float, nargs='+', default=[3. / 4., 4. / 3.], metavar='RATIO',
+                        help='Random resize aspect ratio (default: 0.75 1.33)')
     parser.add_argument('--resize-size', type=int, default=224,
                         help='the image size after resizing')
     parser.add_argument('--no-hflip', action='store_true',
 
@@ -27,7 +27,6 @@
 from tllib.utils.logger import CompleteLogger
 from tllib.utils.analysis import collect_feature, tsne, a_distance
 
-
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 
 
@@ -48,7 +47,8 @@ def main(args: argparse.Namespace):
     cudnn.benchmark = True
 
     # Data loading code
-    train_transform = utils.get_train_transform(args.train_resizing, random_horizontal_flip=not args.no_hflip,
+    train_transform = utils.get_train_transform(args.train_resizing, scale=args.scale, ratio=args.ratio,
+                                                random_horizontal_flip=not args.no_hflip,
                                                 random_color_jitter=False, resize_size=args.resize_size,
                                                 norm_mean=args.norm_mean, norm_std=args.norm_std)
     val_transform = utils.get_val_transform(args.val_resizing, resize_size=args.resize_size,
@@ -221,6 +221,10 @@ def train(train_source_iter: ForeverDataIterator, train_target_iter: ForeverData
     parser.add_argument('--val-resizing', type=str, default='default')
     parser.add_argument('--resize-size', type=int, default=224,
                         help='the image size after resizing')
+    parser.add_argument('--scale', type=float, nargs='+', default=[0.08, 1.0], metavar='PCT',
+                        help='Random resize scale (default: 0.08 1.0)')
+    parser.add_argument('--ratio', type=float, nargs='+', default=[3. / 4., 4. / 3.], metavar='RATIO',
+                        help='Random resize aspect ratio (default: 0.75 1.33)')
     parser.add_argument('--no-hflip', action='store_true',
                         help='no random horizontal flipping during training')
     parser.add_argument('--norm-mean', type=float, nargs='+',
 
@@ -27,7 +27,6 @@
 from tllib.utils.logger import CompleteLogger
 from tllib.utils.analysis import collect_feature, tsne, a_distance
 
-
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 
 
@@ -48,7 +47,8 @@ def main(args: argparse.Namespace):
     cudnn.benchmark = True
 
     # Data loading code
-    train_transform = utils.get_train_transform(args.train_resizing, random_horizontal_flip=not args.no_hflip,
+    train_transform = utils.get_train_transform(args.train_resizing, scale=args.scale, ratio=args.ratio,
+                                                random_horizontal_flip=not args.no_hflip,
                                                 random_color_jitter=False, resize_size=args.resize_size,
                                                 norm_mean=args.norm_mean, norm_std=args.norm_std)
     val_transform = utils.get_val_transform(args.val_resizing, resize_size=args.resize_size,
@@ -77,7 +77,7 @@ def main(args: argparse.Namespace):
 
     # define optimizer and lr scheduler
     optimizer = SGD(classifier.get_parameters(), args.lr, momentum=args.momentum, weight_decay=args.wd, nesterov=True)
-    lr_scheduler = LambdaLR(optimizer, lambda x:  args.lr * (1. + args.lr_gamma * float(x)) ** (-args.lr_decay))
+    lr_scheduler = LambdaLR(optimizer, lambda x: args.lr * (1. + args.lr_gamma * float(x)) ** (-args.lr_decay))
 
     # define loss function
     mkmmd_loss = MultipleKernelMaximumMeanDiscrepancy(
@@ -207,6 +207,10 @@ def train(train_source_iter: ForeverDataIterator, train_target_iter: ForeverData
     parser.add_argument('--val-resizing', type=str, default='default')
     parser.add_argument('--resize-size', type=int, default=224,
                         help='the image size after resizing')
+    parser.add_argument('--scale', type=float, nargs='+', default=[0.08, 1.0], metavar='PCT',
+                        help='Random resize scale (default: 0.08 1.0)')
+    parser.add_argument('--ratio', type=float, nargs='+', default=[3. / 4., 4. / 3.], metavar='RATIO',
+                        help='Random resize aspect ratio (default: 0.75 1.33)')
     parser.add_argument('--no-hflip', action='store_true',
                         help='no random horizontal flipping during training')
     parser.add_argument('--norm-mean', type=float, nargs='+',
@@ -259,4 +263,3 @@ def train(train_source_iter: ForeverDataIterator, train_target_iter: ForeverData
                              "When phase is 'analysis', only analysis the model.")
     args = parser.parse_args()
     main(args)
-
 
@@ -27,7 +27,6 @@
 from tllib.utils.logger import CompleteLogger
 from tllib.utils.analysis import collect_feature, tsne, a_distance
 
-
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 
 
@@ -48,7 +47,8 @@ def main(args: argparse.Namespace):
     cudnn.benchmark = True
 
     # Data loading code
-    train_transform = utils.get_train_transform(args.train_resizing, random_horizontal_flip=not args.no_hflip,
+    train_transform = utils.get_train_transform(args.train_resizing, scale=args.scale, ratio=args.ratio,
+                                                random_horizontal_flip=not args.no_hflip,
                                                 random_color_jitter=False, resize_size=args.resize_size,
                                                 norm_mean=args.norm_mean, norm_std=args.norm_std)
     val_transform = utils.get_val_transform(args.val_resizing, resize_size=args.resize_size,
@@ -79,7 +79,7 @@ def main(args: argparse.Namespace):
     # define optimizer and lr scheduler
     optimizer = SGD(classifier.get_parameters() + domain_discri.get_parameters(),
                     args.lr, momentum=args.momentum, weight_decay=args.weight_decay, nesterov=True)
-    lr_scheduler = LambdaLR(optimizer, lambda x:  args.lr * (1. + args.lr_gamma * float(x)) ** (-args.lr_decay))
+    lr_scheduler = LambdaLR(optimizer, lambda x: args.lr * (1. + args.lr_gamma * float(x)) ** (-args.lr_decay))
 
     # define loss function
     domain_adv = DomainAdversarialLoss(domain_discri).to(device)
@@ -210,6 +210,10 @@ def train(train_source_iter: ForeverDataIterator, train_target_iter: ForeverData
     parser.add_argument('--val-resizing', type=str, default='default')
     parser.add_argument('--resize-size', type=int, default=224,
                         help='the image size after resizing')
+    parser.add_argument('--scale', type=float, nargs='+', default=[0.08, 1.0], metavar='PCT',
+                        help='Random resize scale (default: 0.08 1.0)')
+    parser.add_argument('--ratio', type=float, nargs='+', default=[3. / 4., 4. / 3.], metavar='RATIO',
+                        help='Random resize aspect ratio (default: 0.75 1.33)')
     parser.add_argument('--no-hflip', action='store_true',
                         help='no random horizontal flipping during training')
     parser.add_argument('--norm-mean', type=float, nargs='+',
@@ -239,7 +243,7 @@ def train(train_source_iter: ForeverDataIterator, train_target_iter: ForeverData
     parser.add_argument('--lr-decay', default=0.75, type=float, help='parameter for lr scheduler')
     parser.add_argument('--momentum', default=0.9, type=float, metavar='M',
                         help='momentum')
-    parser.add_argument('--wd', '--weight-decay',default=1e-3, type=float,
+    parser.add_argument('--wd', '--weight-decay', default=1e-3, type=float,
                         metavar='W', help='weight decay (default: 1e-3)',
                         dest='weight_decay')
     parser.add_argument('-j', '--workers', default=2, type=int, metavar='N',
@@ -261,4 +265,3 @@ def train(train_source_iter: ForeverDataIterator, train_target_iter: ForeverData
                              "When phase is 'analysis', only analysis the model.")
     args = parser.parse_args()
     main(args)
-
 
@@ -21,7 +21,6 @@
 from tllib.utils.analysis import collect_feature, tsne, a_distance
 from tllib.utils.data import ForeverDataIterator
 
-
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 
 
@@ -42,7 +41,8 @@ def main(args):
     cudnn.benchmark = True
 
     # Data loading code
-    train_transform = utils.get_train_transform(args.train_resizing, random_horizontal_flip=not args.no_hflip,
+    train_transform = utils.get_train_transform(args.train_resizing, scale=args.scale, ratio=args.ratio,
+                                                random_horizontal_flip=not args.no_hflip,
                                                 random_color_jitter=False, resize_size=args.resize_size,
                                                 norm_mean=args.norm_mean, norm_std=args.norm_std)
     val_transform = utils.get_val_transform(args.val_resizing, resize_size=args.resize_size,
@@ -136,6 +136,10 @@ def main(args):
     parser.add_argument('--val-resizing', type=str, default='default')
     parser.add_argument('--resize-size', type=int, default=224,
                         help='the image size after resizing')
+    parser.add_argument('--scale', type=float, nargs='+', default=[0.08, 1.0], metavar='PCT',
+                        help='Random resize scale (default: 0.08 1.0)')
+    parser.add_argument('--ratio', type=float, nargs='+', default=[3. / 4., 4. / 3.], metavar='RATIO',
+                        help='Random resize aspect ratio (default: 0.75 1.33)')
     parser.add_argument('--no-hflip', action='store_true',
                         help='no random horizontal flipping during training')
     parser.add_argument('--norm-mean', type=float, nargs='+',