Fix FasterRcnn and MASS bugs.

linqingke 2020-08-24 22:59:03 +08:00
parent e69a91b6b5
commit 9f5a7939d4
5 changed files with 10 additions and 7 deletions

View File

@@ -493,7 +493,7 @@ void SetTensorDeviceInfo(const kernel::KernelBuildInfo &selected_kernel_info, co
if (AnfAlgo::GetOutputDeviceDataType(real_input_node, 0) == kTypeUnknown || is_ref) {
std::vector<std::string> output_format = {selected_kernel_info.GetInputFormat(input_index)};
builder->SetOutputsFormat(output_format);
-std::vector<TypeId> output_type = {AnfAlgo::GetOutputInferDataType(real_input_node, 0)};
+std::vector<TypeId> output_type = {selected_kernel_info.GetInputDeviceType(input_index)};
builder->SetOutputsDeviceType(output_type);
AnfAlgo::SetSelectKernelBuildInfo(builder->Build(), real_input_node.get());
}
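For context, this fix makes the parameter's output device type follow the data type the selected kernel expects on that input, rather than the inferred data type, so the parameter is laid out exactly as the consuming kernel will read it. A loose Python paraphrase of the intent (illustrative only, not the C++ pass):

```python
def choose_output_device_type(selected_input_type, inferred_type, type_is_unknown):
    """Illustrative sketch: when the input node's device type is still undecided
    (or the input is a ref), adopt the type the selected kernel expects instead
    of the inferred type, avoiding a mismatch between parameter and kernel."""
    if type_is_unknown:
        return selected_input_type  # follow the selected kernel's input type
    return inferred_type
```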

View File

@@ -27,7 +27,7 @@ FasterRcnn proposed that convolution feature maps based on region detectors (suc
[Paper](https://arxiv.org/abs/1506.01497): Ren S , He K , Girshick R , et al. Faster R-CNN: Towards Real-Time Object Detection with Region Proposal Networks[J]. IEEE Transactions on Pattern Analysis and Machine Intelligence, 2015, 39(6).
-#Model Architecture
+# Model Architecture
FasterRcnn is a two-stage target detection network. It uses a region proposal network (RPN) that shares the convolution features of the whole image with the detection network, so the computation of region proposals is almost cost-free. The network further combines RPN and FastRcnn into a single network by sharing these convolution features.
@@ -42,7 +42,7 @@ Dataset used: [COCO2017](<http://images.cocodataset.org/>)
- Data format: image and json files
- Note: Data will be processed in dataset.py
-#Environment Requirements
+# Environment Requirements
- Install [MindSpore](https://www.mindspore.cn/install/en).
@@ -87,6 +87,8 @@ Dataset used: [COCO2017](<http://images.cocodataset.org/>)
After installing MindSpore via the official website, you can start training and evaluation as follows:
Note: 1. The first run will generate the MindRecord files, which takes a long time. 2. The pretrained model is a resnet50 checkpoint trained on ImageNet2012. 3. VALIDATION_JSON_FILE is the label file, and CHECKPOINT_PATH is the checkpoint file saved after training.
```
# standalone training
sh run_standalone_train_ascend.sh [PRETRAINED_MODEL]

View File

@@ -97,7 +97,7 @@ class Rcnn(nn.Cell):
self.relu = P.ReLU()
self.logicaland = P.LogicalAnd()
self.loss_cls = P.SoftmaxCrossEntropyWithLogits()
-self.loss_bbox = P.SmoothL1Loss(sigma=1.0)
+self.loss_bbox = P.SmoothL1Loss(beta=1.0)
self.reshape = P.Reshape()
self.onehot = P.OneHot()
self.greater = P.Greater()
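For reference, this keyword change tracks the rename of SmoothL1Loss's smoothing argument from `sigma` to `beta` in newer MindSpore releases; the loss itself is unchanged. A minimal NumPy sketch of what the parameter controls (illustrative only, not the operator implementation):

```python
import numpy as np

def smooth_l1(pred, target, beta=1.0):
    """Piecewise loss: quadratic for |pred - target| < beta, linear beyond it."""
    diff = np.abs(pred - target)
    return np.where(diff < beta, 0.5 * diff ** 2 / beta, diff - 0.5 * beta)

# Example: a residual of 2.0 already falls in the linear branch when beta=1.0.
print(smooth_l1(np.array([2.0]), np.array([0.0]), beta=1.0))  # [1.5]
```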

View File

@@ -137,7 +137,7 @@ class RPN(nn.Cell):
self.CheckValid = P.CheckValid()
self.sum_loss = P.ReduceSum()
self.loss_cls = P.SigmoidCrossEntropyWithLogits()
-self.loss_bbox = P.SmoothL1Loss(sigma=1.0/9.0)
+self.loss_bbox = P.SmoothL1Loss(beta=1.0/9.0)
self.squeeze = P.Squeeze()
self.cast = P.Cast()
self.tile = P.Tile()
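The RPN applies the same rename with `beta=1.0/9.0`; a smaller beta shrinks the quadratic region, so most box-regression residuals are penalized linearly. A tiny self-contained check with an assumed residual value:

```python
beta = 1.0 / 9.0
residual = 0.5  # hypothetical |prediction - target|

# Smooth L1: quadratic inside the beta window, linear outside it.
if abs(residual) < beta:
    loss = 0.5 * residual ** 2 / beta
else:
    loss = abs(residual) - 0.5 * beta

print(round(loss, 4))  # 0.4444 -- already in the linear branch
```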

View File

@@ -151,7 +151,7 @@ def _build_training_pipeline(config: TransformerConfig,
if dataset is None:
raise ValueError("pre-training dataset or fine-tuning dataset must be provided one.")
-update_steps = dataset.get_repeat_count() * dataset.get_dataset_size()
+update_steps = config.epochs * dataset.get_dataset_size()
if config.lr_scheduler == "isr":
lr = Tensor(square_root_schedule(lr=config.lr,
update_num=update_steps,
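For context, this part of the MASS fix derives the total number of optimizer updates from the configured epoch count rather than the dataset repeat count, so the inverse-square-root ("isr") schedule spans the whole run. A rough sketch of that relationship (function name and values are illustrative assumptions, not the repository's square_root_schedule):

```python
import numpy as np

def isr_schedule(base_lr, update_num, warmup_steps=4000):
    """Illustrative inverse-square-root curve: linear warmup, then 1/sqrt(step) decay."""
    steps = np.arange(1, update_num + 1)
    return base_lr * np.minimum(steps / warmup_steps, np.sqrt(warmup_steps / steps))

epochs = 20             # hypothetical config.epochs
steps_per_epoch = 1500  # hypothetical dataset.get_dataset_size()
update_steps = epochs * steps_per_epoch  # total updates follow the epoch count
lr_curve = isr_schedule(base_lr=1e-4, update_num=update_steps)
```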
@@ -331,7 +331,8 @@ if __name__ == '__main__':
mode=context.GRAPH_MODE,
device_target=args.platform,
reserve_class_name_in_scope=False,
-device_id=device_id)
+device_id=device_id,
+max_call_depth=2000)
_rank_size = os.getenv('RANK_SIZE')
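The other MASS change raises the graph engine's function-call depth limit via `max_call_depth`, which deep Transformer-style cell hierarchies can exceed at the default setting. A minimal, hedged usage sketch mirroring the diff (device target and id are placeholder values; the script reads them from its arguments):

```python
from mindspore import context

# Placeholder values for illustration only.
context.set_context(mode=context.GRAPH_MODE,
                    device_target="Ascend",
                    reserve_class_name_in_scope=False,
                    device_id=0,
                    max_call_depth=2000)  # raise the default call-depth limit
```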