后脑勺

caffe——net.cpp——init（）

上一节讲的是solver的初始化，在其过程中，调用了net.cpp的init函数，下面，来看一下它是
怎么干活的。

template <typename Dtype>
void Net::Init(const NetParameter& in_param) {
//in_param，接solver.cpp的NetParameter
  CHECK(Caffe::root_solver() || root_net_)
      << "root_net_ needs to be set for all non-root solvers";
  // Set phase from the state.
  phase_ = in_param.state().phase();
  //phase_ = caffe::TRAIN
  // Filter layers based on their include/exclude rules and
  // the current NetState.
  NetParameter filtered_param;
  FilterNet(in_param, &filtered_param);
  //这个函数的作用就是检查in_param，如果in_param的layer符合要求，就赋给filtered_param
  //否则就不赋给filtered_param，你也可以认为这个函数的作用是移除in_param的指定层，将剩下
  //的复制给filtered_param(这里面主要是针对included和exclude)
  LOG_IF(INFO, Caffe::root_solver())
      << "Initializing net from parameters: " << std::endl
      << filtered_param.DebugString();
  // Create a copy of filtered_param with splits added where necessary.
  NetParameter param;
  InsertSplits(filtered_param, ¶m);
  //函数从filtered_param读入新网络到param
  // Basically, build all the layers and set up their connections.
  name_ = param.name();
  map<string, int> blob_name_to_idx;
  set<string> available_blobs;
  //关于set容器，可以看这个网址http://blog.csdn.net/wangran51/article/details/8836160
  memory_used_ = 0;
  // For each layer, set up its input and output
  bottom_vecs_.resize(param.layer_size());//重置bottom_vecs_的大小，一下是函数前后对比
  // bottom_vecs_ = std::vector of length 0, capacity 0
// bottom_vecs_ = std::vector of length 9, capacity 9 = {
//  std::vector of length 0, capacity 0, std::vector of length 0, capacity 0, 
//  std::vector of length 0, capacity 0, std::vector of length 0, capacity 0, 
//  std::vector of length 0, capacity 0, std::vector of length 0, capacity 0, 
// std::vector of length 0, capacity 0, std::vector of length 0, capacity 0, 
//  std::vector of length 0, capacity 0}
//这里面九个元素指的是网络的train layer共有9个所以需要九个参数

  top_vecs_.resize(param.layer_size());
  bottom_id_vecs_.resize(param.layer_size());
  param_id_vecs_.resize(param.layer_size());
  top_id_vecs_.resize(param.layer_size());
  bottom_need_backward_.resize(param.layer_size());
  //差不多参数后面带‘_’的，代表的都是函数运行过程中的中间变量
  for (int layer_id = 0; layer_id < param.layer_size(); ++layer_id) {
  //对layer的每一层进行处理
    // For non-root solvers, whether this layer is shared from root_net_.
    bool share_from_root = !Caffe::root_solver()
        && root_net_->layers_[layer_id]->ShareInParallel();
    // Inherit phase from net if unset.
    if (!param.layer(layer_id).has_phase()) {
      param.mutable_layer(layer_id)->set_phase(phase_);
    }
    // Setup layer.
    const LayerParameter& layer_param = param.layer(layer_id);//看 caffe.proto去～ 赶紧的
    if (layer_param.propagate_down_size() > 0) {
    //propagate_down：Specifies on which bottoms the backpropagation should 
    //be skipped. The size must be either 0 or equal to the number of bottoms.
      CHECK_EQ(layer_param.propagate_down_size(),
          layer_param.bottom_size())
          << "propagate_down param must be specified "
          << "either 0 or bottom_size times ";
    }
    if (share_from_root) {
      LOG(INFO) << "Sharing layer " << layer_param.name() << " from root net";
      layers_.push_back(root_net_->layers_[layer_id]);
      layers_[layer_id]->SetShared(true);
    } else {
      layers_.push_back(LayerRegistry::CreateLayer(layer_param));
      创建layer并将layer_param的值赋值给layers_（具体见下篇博客）
    }
    layer_names_.push_back(layer_param.name());
    LOG_IF(INFO, Caffe::root_solver())
        << "Creating Layer " << layer_param.name();
    bool need_backward = false;

    // Figure out this layer's input and output
    for (int bottom_id = 0; bottom_id < layer_param.bottom_size();
         ++bottom_id) 
         //上边创建了层，然后就该对bottom/top进行处理了
         {
      const int blob_id = AppendBottom(param, layer_id, bottom_id,
                                       &available_blobs, &blob_name_to_idx);
     //见附1
      // If a blob needs backward, this layer should provide it.
      need_backward |= blob_need_backward_[blob_id];
    }
    int num_top = layer_param.top_size();
    for (int top_id = 0; top_id < num_top; ++top_id) {
      AppendTop(param, layer_id, top_id, &available_blobs, &blob_name_to_idx);
      //见附2
      // Collect Input layer tops as Net inputs.
      if (layer_param.type() == "Input") {
        const int blob_id = blobs_.size() - 1;
        net_input_blob_indices_.push_back(blob_id);
        net_input_blobs_.push_back(blobs_[blob_id].get());
      }
    }
    // If the layer specifies that AutoTopBlobs() -> true and the LayerParameter
    // specified fewer than the required number (as specified by
    // ExactNumTopBlobs() or MinTopBlobs()), allocate them here.
    Layer* layer = layers_[layer_id].get();
    //vector > > layers_;
    if (layer->AutoTopBlobs()) {
      const int needed_num_top =
          std::max(layer->MinTopBlobs(), layer->ExactNumTopBlobs());
      for (; num_top < needed_num_top; ++num_top) {
        // Add "anonymous" top blobs -- do not modify available_blobs or
        // blob_name_to_idx as we don't want these blobs to be usable as input
        // to other layers.
        AppendTop(param, layer_id, num_top, NULL, NULL);
      }
    }
    // After this layer is connected, set it up.
    if (share_from_root) {
      // Set up size of top blobs using root_net_
      const vector*>& base_top = root_net_->top_vecs_[layer_id];
      const vector*>& this_top = this->top_vecs_[layer_id];
      for (int top_id = 0; top_id < base_top.size(); ++top_id) {
        this_top[top_id]->ReshapeLike(*base_top[top_id]);
        LOG(INFO) << "Created top blob " << top_id << " (shape: "
            << this_top[top_id]->shape_string() <<  ") for shared layer "
            << layer_param.name();
      }
    } else {
      layers_[layer_id]->SetUp(bottom_vecs_[layer_id], top_vecs_[layer_id]);
      //调用SetUp这一段的介绍看下一篇啊，要不然东西就太多了
    }
    LOG_IF(INFO, Caffe::root_solver())
        << "Setting up " << layer_names_[layer_id];

        //更新向量blob_loss_weights
    for (int top_id = 0; top_id < top_vecs_[layer_id].size(); ++top_id) {
      if (blob_loss_weights_.size() <= top_id_vecs_[layer_id][top_id]) {
        blob_loss_weights_.resize(top_id_vecs_[layer_id][top_id] + 1, Dtype(0));
        //调整blob_loss_weights_的大小，使其与top_id_vecs_[layer_id][top_id]一样大
      }
      blob_loss_weights_[top_id_vecs_[layer_id][top_id]] = layer->loss(top_id);
      //loss函数返回loss_weight ——> 在模板类的SetUp方法中会调用SetLossWeights来设置
      //其私有数据成员loss_,里面存储的其实是loss_weight  
      LOG_IF(INFO, Caffe::root_solver())
          << "Top shape: " << top_vecs_[layer_id][top_id]->shape_string();
          //  top_vecs_[0][0]->shape_string() = "64 1 28 28 (50176)"
      if (layer->loss(top_id)) {
        LOG_IF(INFO, Caffe::root_solver())
            << "    with loss weight " << layer->loss(top_id);
      }
      memory_used_ += top_vecs_[layer_id][top_id]->count();
    }
    LOG_IF(INFO, Caffe::root_solver())
        << "Memory required for data: " << memory_used_ * sizeof(Dtype);
    const int param_size = layer_param.param_size();
    const int num_param_blobs = layers_[layer_id]->blobs().size();
    //param_size是Layermeter类型对象layer_param中ParamSpec param成员的个数, num_param_blobs是一
//个Layer中learnable parameter blob的个数，param_size <= num_param_blobs  
    CHECK_LE(param_size, num_param_blobs)
        << "Too many params specified for layer " << layer_param.name();
    ParamSpec default_param_spec;
    for (int param_id = 0; param_id < num_param_blobs; ++param_id) {
      const ParamSpec* param_spec = (param_id < param_size) ?
          &layer_param.param(param_id) : &default_param_spec;
      const bool param_need_backward = param_spec->lr_mult() != 0;
      //是否反反向传播，主要看基础学习率，如果其为0，则不传播
      need_backward |= param_need_backward;
      //由param_need_backward来决定need_backward是否为真，并且，只要有一次遍历使得
      //need_backward为真，则这个for循环结束后，need_backward也为真
      layers_[layer_id]->set_param_propagate_down(param_id,
                                                  param_need_backward);
    }
    for (int param_id = 0; param_id < num_param_blobs; ++param_id) {
      AppendParam(param, layer_id, param_id);//附3
    }
    // Finally, set the backward flag
    layer_need_backward_.push_back(need_backwar
    d);
    if (need_backward) {
      for (int top_id = 0; top_id < top_id_vecs_[layer_id].size(); ++top_id) {
        blob_need_backward_[top_id_vecs_[layer_id][top_id]] = true;
      }
    }
  }
  //大循环，对每个层都进行处理。 附4

  // Go through the net backwards to determine which blobs contribute to the
  // loss.  We can skip backward computation for blobs that don't contribute
  // to the loss.
  // Also checks if all bottom blobs don't need backward computation (possible
  // because the skip_propagate_down param) and so we can skip bacward
  // computation for the entire layer
  set<string> blobs_under_loss;
  set<string> blobs_skip_backp;
  //这两个参数你可能不太懂，别着急 往下看
  //从上往下，遍历每一层
  for (int layer_id = layers_.size() - 1; layer_id >= 0; --layer_id) {
    bool layer_contributes_loss = false;
    bool layer_skip_propagate_down = true;
    //为true，则表示当前layer的bottom blob不需要backward computation，即该层不需要backward computation。  
//这个局部变量所表示的意义与caffe.proto里message Layerparameter的propagate_down的定义恰好相反。  
    //对于每一层的 top
    for (int top_id = 0; top_id < top_vecs_[layer_id].size(); ++top_id) {
      const string& blob_name = blob_names_[top_id_vecs_[layer_id][top_id]];
      if (layers_[layer_id]->loss(top_id) ||
          (blobs_under_loss.find(blob_name) != blobs_under_loss.end())) {
           //blobs_under_loss的赋值是在下面，也就是上几层
        layer_contributes_loss = true;
      }
      if (blobs_skip_backp.find(blob_name) == blobs_skip_backp.end()) {
        layer_skip_propagate_down = false;
      }
      if (layer_contributes_loss && !layer_skip_propagate_down)
        break;
    }
    // If this layer can skip backward computation, also all his bottom blobs
    // don't need backpropagation
    if (layer_need_backward_[layer_id] && layer_skip_propagate_down) {
      layer_need_backward_[layer_id] = false;
      for (int bottom_id = 0; bottom_id < bottom_vecs_[layer_id].size();
               ++bottom_id) {
        bottom_need_backward_[layer_id][bottom_id] = false;
      }
    }
    if (!layer_contributes_loss) { layer_need_backward_[layer_id] = false; }
    if (Caffe::root_solver()) {
      if (layer_need_backward_[layer_id]) {
        LOG(INFO) << layer_names_[layer_id] << " needs backward computation.";
      } else {
        LOG(INFO) << layer_names_[layer_id]
            << " does not need backward computation.";
      }
    }
    for (int bottom_id = 0; bottom_id < bottom_vecs_[layer_id].size();
         ++bottom_id) {
      if (layer_contributes_loss) {
        const string& blob_name =
            blob_names_[bottom_id_vecs_[layer_id][bottom_id]];
        blobs_under_loss.insert(blob_name);
        //判断当前层是否contributions to loss 是的话 就把名字插入 blobs_under_loss中
      } else {
        bottom_need_backward_[layer_id][bottom_id] = false;
      }
      if (!bottom_need_backward_[layer_id][bottom_id]) {
        const string& blob_name =
                   blob_names_[bottom_id_vecs_[layer_id][bottom_id]];
        blobs_skip_backp.insert(blob_name);
        //若本层不需要反反向传播，将名字插入blobs_skip_backp中。
      }
    }
  }
  // Handle force_backward if needed.
  if (param.force_backward()) {
    for (int layer_id = 0; layer_id < layers_.size(); ++layer_id) {
      layer_need_backward_[layer_id] = true;
      for (int bottom_id = 0;
           bottom_id < bottom_need_backward_[layer_id].size(); ++bottom_id) {
        bottom_need_backward_[layer_id][bottom_id] =
            bottom_need_backward_[layer_id][bottom_id] ||
            layers_[layer_id]->AllowForceBackward(bottom_id);
        blob_need_backward_[bottom_id_vecs_[layer_id][bottom_id]] =
            blob_need_backward_[bottom_id_vecs_[layer_id][bottom_id]] ||
            bottom_need_backward_[layer_id][bottom_id];
      }
      for (int param_id = 0; param_id < layers_[layer_id]->blobs().size();
           ++param_id) {
        layers_[layer_id]->set_param_propagate_down(param_id, true);
      }
    }
  }
  // In the end, all remaining blobs are considered output blobs.
  for (set<string>::iterator it = available_blobs.begin();
      it != available_blobs.end(); ++it) {
    LOG_IF(INFO, Caffe::root_solver())
        << "This network produces output " << *it;
    net_output_blobs_.push_back(blobs_[blob_name_to_idx[*it]].get());
    net_output_blob_indices_.push_back(blob_name_to_idx[*it]);
  }

//blob_names_.size() = 9
  for (size_t blob_id = 0; blob_id < blob_names_.size(); ++blob_id) {
    blob_names_index_[blob_names_[blob_id]] = blob_id;
    //向 blob_names_index_里逐一添加元素
  }

//layer_names_.size()= 9
  for (size_t layer_id = 0; layer_id < layer_names_.size(); ++layer_id) {
    layer_names_index_[layer_names_[layer_id]] = layer_id;
  }
/*
(gdb) p blob_names_index_
$95 = std::map with 9 elements = {["conv1"] = 2, ["conv2"] = 4, ["data"] = 0, 
  ["ip1"] = 6, ["ip2"] = 7, ["label"] = 1, ["loss"] = 8, ["pool1"] = 3, 
  ["pool2"] = 5}
(gdb) p  layer_names_index_
$96 = std::map with 9 elements = {["conv1"] = 1, ["conv2"] = 3, ["ip1"] = 5, 
  ["ip2"] = 7, ["loss"] = 8, ["mnist"] = 0, ["pool1"] = 2, ["pool2"] = 4, 
  ["relu1"] = 6}
*/
  ShareWeights();
  debug_info_ = param.debug_info();
  LOG_IF(INFO, Caffe::root_solver()) << "Network initialization done.";
}

template <typename Dtype>
void Net::FilterNet(const NetParameter& param,
    NetParameter* param_filtered) {
  NetState net_state(param.state());
  param_filtered->CopyFrom(param);
  param_filtered->clear_layer();
  for (int i = 0; i < param.layer_size(); ++i) {
    const LayerParameter& layer_param = param.layer(i);
    const string& layer_name = layer_param.name();
    CHECK(layer_param.include_size() == 0 || layer_param.exclude_size() == 0)
          << "Specify either include rules or exclude rules; not both.";
    // If no include rules are specified, the layer is included by default and
    // only excluded if it meets one of the exclude rules.
    bool layer_included = (layer_param.include_size() == 0);
    for (int j = 0; layer_included && j < layer_param.exclude_size(); ++j) {
      if (StateMeetsRule(net_state, layer_param.exclude(j), layer_name)) {
        layer_included = false;
      }
    }
    for (int j = 0; !layer_included && j < layer_param.include_size(); ++j) {
      if (StateMeetsRule(net_state, layer_param.include(j), layer_name)) {
        layer_included = true;
      }
    }
    if (layer_included) {
      param_filtered->add_layer()->CopyFrom(layer_param);
    }
  }
}

template <typename Dtype>
bool Net::StateMeetsRule(const NetState& state,
    const NetStateRule& rule, const string& layer_name) {
  // Check whether the rule is broken due to phase.
  if (rule.has_phase()) {
      if (rule.phase() != state.phase()) {
        LOG_IF(INFO, Caffe::root_solver())
            << "The NetState phase (" << state.phase()
            << ") differed from the phase (" << rule.phase()
            << ") specified by a rule in layer " << layer_name;
        return false;
      }
  }
  // Check whether the rule is broken due to min level.
  if (rule.has_min_level()) {
    if (state.level() < rule.min_level()) {
      LOG_IF(INFO, Caffe::root_solver())
          << "The NetState level (" << state.level()
          << ") is above the min_level (" << rule.min_level()
          << ") specified by a rule in layer " << layer_name;
      return false;
    }
  }
  // Check whether the rule is broken due to max level.
  if (rule.has_max_level()) {
    if (state.level() > rule.max_level()) {
      LOG_IF(INFO, Caffe::root_solver())
          << "The NetState level (" << state.level()
          << ") is above the max_level (" << rule.max_level()
          << ") specified by a rule in layer " << layer_name;
      return false;
    }
  }
  // Check whether the rule is broken due to stage. The NetState must
  // contain ALL of the rule's stages to meet it.
  for (int i = 0; i < rule.stage_size(); ++i) {
    // Check that the NetState contains the rule's ith stage.
    bool has_stage = false;
    for (int j = 0; !has_stage && j < state.stage_size(); ++j) {
      if (rule.stage(i) == state.stage(j)) { has_stage = true; }
    }
    if (!has_stage) {
      LOG_IF(INFO, Caffe::root_solver())
          << "The NetState did not contain stage '" << rule.stage(i)
          << "' specified by a rule in layer " << layer_name;
      return false;
    }
  }
  // Check whether the rule is broken due to not_stage. The NetState must
  // contain NONE of the rule's not_stages to meet it.
  for (int i = 0; i < rule.not_stage_size(); ++i) {
    // Check that the NetState contains the rule's ith not_stage.
    bool has_stage = false;
    for (int j = 0; !has_stage && j < state.stage_size(); ++j) {
      if (rule.not_stage(i) == state.stage(j)) { has_stage = true; }
    }
    if (has_stage) {
      LOG_IF(INFO, Caffe::root_solver())
          << "The NetState contained a not_stage '" << rule.not_stage(i)
          << "' specified by a rule in layer " << layer_name;
      return false;
    }
  }
  return true;
}

附1：AppendBottom
// Helper for Net::Init: add a new bottom blob to the net.
template <typename Dtype>
int Net::AppendBottom(const NetParameter& param, const int layer_id,
    const int bottom_id, set<string>* available_blobs,
    map<string, int>* blob_name_to_idx) {
  const LayerParameter& layer_param = param.layer(layer_id);
  const string& blob_name = layer_param.bottom(bottom_id);
  if (available_blobs->find(blob_name) == available_blobs->end()) {
    LOG(FATAL) << "Unknown bottom blob '" << blob_name << "' (layer '"
               << layer_param.name() << "', bottom index " << bottom_id << ")";
  }
  const int blob_id = (*blob_name_to_idx)[blob_name];
  LOG_IF(INFO, Caffe::root_solver())
      << layer_names_[layer_id] << " <- " << blob_name;
  bottom_vecs_[layer_id].push_back(blobs_[blob_id].get());
  //调用shared_ptr类的get()方法提取存储在blobs_中的中间变量  
  bottom_id_vecs_[layer_id].push_back(blob_id);
  available_blobs->erase(blob_name);
  bool need_backward = blob_need_backward_[blob_id];
  // Check if the backpropagation on bottom_id should be skipped
  if (layer_param.propagate_down_size() > 0) {
    need_backward = layer_param.propagate_down(bottom_id);
    ////propagate_down为true,则表示参与BP;否则，skip bp  
  }  
  bottom_need_backward_[layer_id].push_back(need_backward);
  return blob_id;
}

附2：AppendTop
// Helper for Net::Init: add a new top blob to the net.
template <typename Dtype>
void Net::AppendTop(const NetParameter& param, const int layer_id,
                           const int top_id, set<string>* available_blobs,
                           map<string, int>* blob_name_to_idx) {
  shared_ptr layer_param( 
      new LayerParameter(param.layer(layer_id)));
      //param.layer(layer_id),第layer_id层的layer参数
  const string& blob_name = (layer_param->top_size() > top_id) ?
      layer_param->top(top_id) : "(automatic)";
  // Check if we are doing in-place computation
  if (blob_name_to_idx && layer_param->bottom_size() > top_id &&
      blob_name == layer_param->bottom(top_id)) {
    // In-place computation
    LOG_IF(INFO, Caffe::root_solver())
        << layer_param->name() << " -> " << blob_name << " (in-place)";
    top_vecs_[layer_id].push_back(blobs_[(*blob_name_to_idx)[blob_name]].get());
    top_id_vecs_[layer_id].push_back((*blob_name_to_idx)[blob_name]);
  } else if (blob_name_to_idx &&
             blob_name_to_idx->find(blob_name) != blob_name_to_idx->end()) {
    // If we are not doing in-place computation but have duplicated blobs,
    // raise an error.
    LOG(FATAL) << "Top blob '" << blob_name
               << "' produced by multiple sources.";
  } else {
    // Normal output.
    if (Caffe::root_solver()) {
      LOG(INFO) << layer_param->name() << " -> " << blob_name;
      //这里layer_param->name()指的是层的名字，blob_name指的是top或bottom的名字
    }
    shared_ptr > blob_pointer(new Blob());
    //构造函数 new一个bolb_pointer
    const int blob_id = blobs_.size();
    blobs_.push_back(blob_pointer);
    //blobs_是一个向量，值为vector of length 0, capacity 0
    //在其尾部插入blob_pointer值为vector of length 1, capacity 1 = {{px =
    //0x6af420, pn = {pi_ = 0x6af480}}}
    //感觉一开始的blibs_就是一个向量，里面储存的是可以0指向blob的的只能指针，然后将指向
    //blob_pointer的指针赋给了它
    blob_names_.push_back(blob_name);
    blob_need_backward_.push_back(false);
    if (blob_name_to_idx) { (*blob_name_to_idx)[blob_name] = blob_id; }
    //*blob_name_to_idx= std::map with 1 elements = {["data"] = 0}
/*
blob_name_to_idx是一个局部变量，其实它是在当前layer的top blob 和下一层的bottom blob间起着一个桥梁作用。  
blob_name_to_idx中元素的pair是从网络最开始一层一层搭建的过程中压入map的，其中的name和id都是不重复的。name是关键字——不重复是map数据结构的必然要求，id也是不重复的——0,1,2...  
blob_name_to_idx和blobs_一样，在"Normal output"的情形下，每次遍历到一个top blob的时候都会更新  参考 http://www.itdaan.com/blog/2016/03/26/726330.html
*/
    /// top_vecs stores the vectors containing the output for each layer
    //vector*> > top_vecs_;
    //vector > top_id_vecs_;
    top_id_vecs_[layer_id].push_back(blob_id);
    top_vecs_[layer_id].push_back(blob_pointer.get());
  }
  if (available_blobs) { available_blobs->insert(blob_name); }
}
/*
总结：AppendTop主要干了以下几件事：
1.new了一个blob，并用智能指针（shared_ptr）持有它；
2.将blob的指针、名字等分别压入blobs_、blob_names_等向量；
3.更新map类型的blob_name_to_idx以及set类型的available_blobs；
现在只是一个初始化过程，还没有进行数据的处理，只是在搭框架。
*/

附3：

AppendParam函数
    template <typename Dtype>  
    void Net::AppendParam(const NetParameter& param, const int layer_id,  
                                 const int param_id) {  
      const LayerParameter& layer_param = layers_[layer_id]->layer_param();//模板类Layer的layer_param方法，返回Layerparameter类型成员  
      const int param_size = layer_param.param_size();  
      string param_name =  
          (param_size > param_id) ? layer_param.param(param_id).name() : "";  
      if (param_name.size()) {  
        param_display_names_.push_back(param_name);//vector param_display_names_ 这里param_name获取的是PaParamSpec类型中的name成员，如果有name且非空,就把name压入该向量，否则就压入param_id  
      } else {  
        ostringstream param_display_name;  
        param_display_name << param_id;  
        param_display_names_.push_back(param_display_name.str());  
      }  
      //Append 参数blob 每一次循环，net_param_id和param_id_vecs_都会更新  
      const int net_param_id = params_.size();//vector > > params_--->The parameters in the network,整个网络的参数的id,!!!不管这个参数有没有non-emty name，是否参与share!!!  
      params_.push_back(layers_[layer_id]->blobs()[param_id]);//将当前layer当前"参数blob"压入params_ --->vector > > params_  
      param_id_vecs_[layer_id].push_back(net_param_id);//将整个网络的参数按层的形式来存储，存储的元素可以理解为params_这个向量的下标值（类型为整型）  
      param_layer_indices_.push_back(make_pair(layer_id, param_id));//param_layer_indices_是向量，其元素为当layer_id 与当前param_id 组成的pair.vector > param_layer_indices_  
      //获取每个param_id所对应的Paramspec类型成员，如果param_id >= param_size 则返回default_param_spec。注意param_size <= num_param_blobs  
      ParamSpec default_param_spec;  
      const ParamSpec* param_spec = (layer_param.param_size() > param_id) ?  
          &layer_param.param(param_id) : &default_param_spec;  
      if (!param_size || !param_name.size() || (param_name.size() &&  
          param_names_index_.find(param_name) == param_names_index_.end())) {  
        // This layer "owns" this parameter blob -- it is either anonymous  
        // (i.e., not given a param_name) or explicitly given a name that we  
        // haven't already seen.  
        // 相反，如果param_name不为空，而且能够在param_names_index_中找到，说明这个parameter已经存在于之前的某个或者某些网络层里，说明这个parameter是共享于多个layer  
        // 在caffe.proto的message ParamSpec里关于name的注释——>To share a parameter between two layers, give it a (non-empty) name, 可见，如果一个parameter是共享与多个网络层，那么它会有一个非空的name  
        param_owners_.push_back(-1);//vector param_owners_ 是一个存储parameter "onwer"的一个向量  ——> -1 表示当前Layer就是该parameter的"owner"  
        //添加param_name  
        if (param_name.size()) {  
          //map param_names_index_是整个网络的参数non-empty name与index的映射。  
          //注意，这个name是ParamSpec 类型中的name,而且，""To share a parameter between two layers, give it a (non-empty) name"",所以说这个map中存储的pair是<会被share的parameter_name, 其对应index>  
          param_names_index_[param_name] = net_param_id;//map param_names_index_ 。虽然每一次循环，net_param_id都会更新，但是net_param_id只有当param_name.size()>0时才会被压入向量param_names_index_  
        }  
        //添加learnable_param  
        const int learnable_param_id = learnable_params_.size();//vector*> learnable_params_   
        learnable_params_.push_back(params_[net_param_id].get());//压入learnable parameter ---> 在模板类layer中，定义了一个blobs_成员，其存储的就是learnable parameter。随后压入learnable_param_id  
        learnable_param_ids_.push_back(learnable_param_id);//vector learnable_param_ids_  
        has_params_lr_.push_back(param_spec->has_lr_mult());//vector has_params_lr_  
        has_params_decay_.push_back(param_spec->has_decay_mult());  
        params_lr_.push_back(param_spec->lr_mult());//vector params_lr_  
        params_weight_decay_.push_back(param_spec->decay_mult());  
      } else {  
        // Named param blob with name we've seen before: share params  
        const int owner_net_param_id = param_names_index_[param_name];//因为"To share a parameter between two layers, give it a (non-empty) name",所以这句代码就是获取shared parameter的"owner" net_param_id  
        param_owners_.push_back(owner_net_param_id);//vector param_owners_  
        const pair<int, int>& owner_index =  
            param_layer_indices_[owner_net_param_id];//只获取了那些shared的parameter,即具有non-empty name的parameter的pair  
        const int owner_layer_id = owner_index.first;  
        const int owner_param_id = owner_index.second;  
        LOG_IF(INFO, Caffe::root_solver()) << "Sharing parameters '" << param_name  
            << "' owned by "  
            << "layer '" << layer_names_[owner_layer_id] << "', param "  
            << "index " << owner_param_id;  
        Blob* this_blob = layers_[layer_id]->blobs()[param_id].get();//获取当前层的当前参数Blob  
        Blob* owner_blob =  
            layers_[owner_layer_id]->blobs()[owner_param_id].get();//获取owner layer的对应的参数blob  
        const int param_size = layer_param.param_size();  
        if (param_size > param_id && (layer_param.param(param_id).share_mode() ==  
                                      ParamSpec_DimCheckMode_PERMISSIVE)) {  
          // Permissive dimension checking -- only check counts are the same.  
          CHECK_EQ(this_blob->count(), owner_blob->count())  
              << "Cannot share param '" << param_name << "' owned by layer '"  
              << layer_names_[owner_layer_id] << "' with layer '"  
              << layer_names_[layer_id] << "'; count mismatch.  Owner layer param "  
              << "shape is " << owner_blob->shape_string() << "; sharing layer "  
              << "shape is " << this_blob->shape_string();  
        } else {  
          // Strict dimension checking -- all dims must be the same.  
          CHECK(this_blob->shape() == owner_blob->shape())  
              << "Cannot share param '" << param_name << "' owned by layer '"  
              << layer_names_[owner_layer_id] << "' with layer '"  
              << layer_names_[layer_id] << "'; shape mismatch.  Owner layer param "  
              << "shape is " << owner_blob->shape_string() << "; sharing layer "  
              << "expects shape " << this_blob->shape_string();  
        }  
        //获取owner layer的learnable_param_id，并且压入当前layer的向量learnable_param_ids_。  
        //而且在这里也没有把参数blob压入learnable_params_向量（只是将id压入learnable_param_ids_），从而避免当前layer与sharing layer之间关于shared parameter blob 的重复  
        const int learnable_param_id = learnable_param_ids_[owner_net_param_id];//vector learnable_param_ids_ ; vector params_lr_;  
        learnable_param_ids_.push_back(learnable_param_id);  
        if (param_spec->has_lr_mult()) {  
          if (has_params_lr_[learnable_param_id]) {  
            CHECK_EQ(param_spec->lr_mult(), params_lr_[learnable_param_id])  
                << "Shared param '" << param_name << "' has mismatched lr_mult.";  
          } else {  
            has_params_lr_[learnable_param_id] = true;  
            params_lr_[learnable_param_id] = param_spec->lr_mult();  
          }  
        }  
        if (param_spec->has_decay_mult()) {  
          if (has_params_decay_[learnable_param_id]) {  
            CHECK_EQ(param_spec->decay_mult(),  
                     params_weight_decay_[learnable_param_id])  
                << "Shared param '" << param_name << "' has mismatched decay_mult.";  
          } else {  
            has_params_decay_[learnable_param_id] = true;  
            params_weight_decay_[learnable_param_id] = param_spec->decay_mult();  
          }  
        }  
      }  
    }  
    ps：借鉴的这个网址http://blog.csdn.net/iamzhangzhuping/article/details/50537240

附4：
I0509 15:23:17.999642  6356 layer_factory.hpp:77] Creating layer mnist
[New Thread 0x7ffff0bc6700 (LWP 6357)]
I0509 15:23:18.007805  6356 net.cpp:91] Creating Layer mnist
I0509 15:23:18.007853  6357 db_lmdb.cpp:38] Opened lmdb examples/mnist/mnist_train_lmdb
I0509 15:23:18.007879  6356 net.cpp:399] mnist -> data
I0509 15:23:18.008003  6356 net.cpp:399] mnist -> label
I0509 15:23:18.008141  6356 data_layer.cpp:41] output data size: 64,1,28,28
I0509 15:23:18.008430  6356 base_data_layer.cpp:69] Initializing prefetch
[New Thread 0x7effebfff700 (LWP 6358)]
I0509 15:23:18.009194  6356 base_data_layer.cpp:72] Prefetch initialized.
I0509 15:23:18.009217  6356 net.cpp:141] Setting up mnist
I0509 15:23:18.009263  6356 net.cpp:148] Top shape: 64 1 28 28 (50176)
I0509 15:23:18.009282  6356 net.cpp:148] Top shape: 64 (64)
I0509 15:23:18.009294  6356 net.cpp:156] Memory required for data: 200960
I0509 15:23:18.009320  6356 layer_factory.hpp:77] Creating layer conv1
I0509 15:23:18.009393  6356 net.cpp:91] Creating Layer conv1
I0509 15:23:18.009428  6356 net.cpp:425] conv1 <- data
I0509 15:23:18.009490  6356 net.cpp:399] conv1 -> conv1
I0509 15:23:18.009726  6356 net.cpp:141] Setting up conv1
I0509 15:23:18.009752  6356 net.cpp:148] Top shape: 64 20 24 24 (737280)
I0509 15:23:18.009764  6356 net.cpp:156] Memory required for data: 3150080
I0509 15:23:18.009879  6356 layer_factory.hpp:77] Creating layer pool1
I0509 15:23:18.009918  6356 net.cpp:91] Creating Layer pool1
I0509 15:23:18.009935  6356 net.cpp:425] pool1 <- conv1
I0509 15:23:18.009965  6356 net.cpp:399] pool1 -> pool1
I0509 15:23:18.010017  6356 net.cpp:141] Setting up pool1
I0509 15:23:18.010040  6356 net.cpp:148] Top shape: 64 20 12 12 (184320)
I0509 15:23:18.010063  6356 net.cpp:156] Memory required for data: 3887360
I0509 15:23:18.010081  6356 layer_factory.hpp:77] Creating layer conv2
I0509 15:23:18.010113  6356 net.cpp:91] Creating Layer conv2
I0509 15:23:18.010128  6356 net.cpp:425] conv2 <- pool1
I0509 15:23:18.010161  6356 net.cpp:399] conv2 -> conv2
I0509 15:23:18.010467  6358 data_layer.cpp:102] Prefetch batch: 1 ms.
I0509 15:23:18.010498  6358 data_layer.cpp:103]      Read time: 0.112 ms.
I0509 15:23:18.010507  6358 data_layer.cpp:104] Transform time: 0.714 ms.
I0509 15:23:18.011415  6358 data_layer.cpp:102] Prefetch batch: 0 ms.
I0509 15:23:18.011430  6358 data_layer.cpp:103]      Read time: 0.076 ms.
I0509 15:23:18.011437  6358 data_layer.cpp:104] Transform time: 0.565 ms.
I0509 15:23:18.011806  6356 net.cpp:141] Setting up conv2
I0509 15:23:18.011836  6356 net.cpp:148] Top shape: 64 50 8 8 (204800)
I0509 15:23:18.011848  6356 net.cpp:156] Memory required for data: 4706560
I0509 15:23:18.011881  6356 layer_factory.hpp:77] Creating layer pool2
I0509 15:23:18.011915  6356 net.cpp:91] Creating Layer pool2
I0509 15:23:18.011934  6356 net.cpp:425] pool2 <- conv2
I0509 15:23:18.011976  6356 net.cpp:399] pool2 -> pool2
I0509 15:23:18.012018  6356 net.cpp:141] Setting up pool2
I0509 15:23:18.012035  6356 net.cpp:148] Top shape: 64 50 4 4 (51200)
I0509 15:23:18.012043  6356 net.cpp:156] Memory required for data: 4911360
I0509 15:23:18.012054  6356 layer_factory.hpp:77] Creating layer ip1
I0509 15:23:18.012079  6356 net.cpp:91] Creating Layer ip1
I0509 15:23:18.012122  6356 net.cpp:425] ip1 <- pool2
I0509 15:23:18.012156  6356 net.cpp:399] ip1 -> ip1
I0509 15:23:18.012449  6358 data_layer.cpp:102] Prefetch batch: 0 ms.
I0509 15:23:18.012465  6358 data_layer.cpp:103]      Read time: 0.099 ms.
I0509 15:23:18.012475  6358 data_layer.cpp:104] Transform time: 0.595 ms.
I0509 15:23:18.035526  6356 net.cpp:141] Setting up ip1
I0509 15:23:18.035575  6356 net.cpp:148] Top shape: 64 500 (32000)
I0509 15:23:18.035583  6356 net.cpp:156] Memory required for data: 5039360
I0509 15:23:18.035614  6356 layer_factory.hpp:77] Creating layer relu1
I0509 15:23:18.035656  6356 net.cpp:91] Creating Layer relu1
I0509 15:23:18.035681  6356 net.cpp:425] relu1 <- ip1
I0509 15:23:18.035698  6356 net.cpp:386] relu1 -> ip1 (in-place)
I0509 15:23:18.035717  6356 net.cpp:141] Setting up relu1
I0509 15:23:18.035727  6356 net.cpp:148] Top shape: 64 500 (32000)
I0509 15:23:18.035732  6356 net.cpp:156] Memory required for data: 5167360
I0509 15:23:18.035739  6356 layer_factory.hpp:77] Creating layer ip2
I0509 15:23:18.035755  6356 net.cpp:91] Creating Layer ip2
I0509 15:23:18.035764  6356 net.cpp:425] ip2 <- ip1
I0509 15:23:18.035806  6356 net.cpp:399] ip2 -> ip2
I0509 15:23:18.036211  6356 net.cpp:141] Setting up ip2
I0509 15:23:18.036257  6356 net.cpp:148] Top shape: 64 10 (640)
I0509 15:23:18.036262  6356 net.cpp:156] Memory required for data: 5169920
I0509 15:23:18.036274  6356 layer_factory.hpp:77] Creating layer loss
I0509 15:23:18.036298  6356 net.cpp:91] Creating Layer loss
I0509 15:23:18.036308  6356 net.cpp:425] loss <- ip2
I0509 15:23:18.036320  6356 net.cpp:425] loss <- label
I0509 15:23:18.036336  6356 net.cpp:399] loss -> loss
I0509 15:23:18.036363  6356 layer_factory.hpp:77] Creating layer loss
I0509 15:23:18.036408  6356 net.cpp:141] Setting up loss
I0509 15:23:18.036420  6356 net.cpp:148] Top shape: (1)
I0509 15:23:18.036427  6356 net.cpp:151]     with loss weight 1
I0509 15:23:18.036437  6356 net.cpp:156] Memory required for data: 5169924

你可能感兴趣的:(caffe)

深度学习框架人工智能操作系统训练&前向推理 PyTorch Tensorflow MindSpore caffe 张量加速引擎TBE 深度学习编译器多面体 polyhedral AI集群框架 EwenWanW 深度学习人工智能 pytorch 深度学习编译器
深度学习框架人工智能操作系统训练&前向推理深度学习框架发展到今天，目前在架构上大体已经基本上成熟并且逐渐趋同。无论是国外的Tensorflow、PyTorch，亦或是国内最近开源的MegEngine、MindSpore，目前基本上都是支持EagerMode和GraphMode两种模式。AI嵌入式框架OneFlow&清华计图Jittor&华为深度学习框架MindSpore&旷视深度学习框架MegEn
Caffeine 与 Guava Cache 雨季里的向日葵 java
一、概要1.1背景在项目开发中，为提升系统性能，减少IO开销，本地缓存是必不可少的。最常见的本地缓存是Guava和Caffeine，Caffeine是基于GoogleGuavaCache设计经验改进的结果，相较于Guava在性能和命中率上更具有效率。1.2应用场景愿意消耗一些内存空间来提升速度预料到某些键会被多次查询缓存中存放的数据总量不会超出内存容量二、GuavaCache2.1GuavaCac
OSError: [WinError 126] 找不到指定的模块---caffe2_detectron_ops_gpu.dll 努力的小柚 python运行问题 python pytorch
代码复现记录：问题：OSError:[WinError126]找不到指定的模块。Errorloading"C:\Anaconda\Anaconda3\envs\TIN\lib\site-packages\torch\lib\caffe2_detectron_ops_gpu.dll"oroneofitsdependencies.在搜索很多关于无法查找到caffe2_detectron_ops_gpu
caffe/PyTorch/TensorFlow 在Jupyter Notebook GPU中运用俊俏的萌妹纸 caffe 人工智能深度学习
在JupyterNotebook中使用Caffe框架并利用GPU加速，可以实现多种效果和目的，主要集中在深度学习领域。以下是一些主要的应用场景：快速训练模型：GPU加速可以显著提高模型训练的速度。对于大型数据集和复杂的神经网络结构，使用GPU可以大大减少训练时间。实时数据增强：在训练过程中，可以实时地对输入数据进行变换和增强，以提高模型的泛化能力。GPU加速使得这些操作更加高效。大规模数据处理：深
Linux下Caffe、Docker、Tensorflow、PyTorch环境搭建(CentOS 7) SnailTyan
文章作者：Tyan博客：noahsnail.com|CSDN|注：模型的训练、测试、部署都可以通过Docker环境完成，环境问题会更少。1.CUDA8.0安装CUDA8.0Configenvvariables#CUDAPATHexportPATH="/usr/local/cuda-8.0/bin:$PATH"#CUDALDLIBRARY_PATHexportLD_LIBRARY_PATH="/us
JVM级缓存本地缓存Caffeine 旺仔爱Java JVM专题 jvm JVM缓存本地缓存 Caffeine Guava Cache
JVM级缓存本地缓存Caffeine和GuavaCache前言一、创建缓存的代码逻辑二、Caffeine的优化方面淘汰算法W-TinyLFU三、Caffeine的业务使用总结前言最新的Java面试题，技术栈涉及Java基础、集合、多线程、Mysql、分布式、Spring全家桶、MyBatis、Dubbo、缓存、消息队列、Linux…等等，会持续更新。一、创建缓存的代码逻辑Caffeine：publ
面试redis篇-04缓存雪崩卡搜偶缓存面试 redis
原理缓存雪崩：是指在同一时段大量的缓存key同时失效或者Redis服务宕机，导致大量请求到达数据库，带来巨大压力。解决方案：给不同的Key的TTL添加随机值利用Redis集群提高服务的可用性（哨兵模式、集群模式）给缓存业务添加降级限流策略（nginx或springcloudgateway）给业务添加多级缓存（Guava或Caffeine）问答面试官：什么是缓存雪崩?怎么解决?回答：缓存雪崩意思是设
深度学习主流开源框架：Caffe、TensorFlow、Pytorch、Theano、Keras、MXNet、Chainer seasonsyy 深度学习小知识深度学习开源框架 pytorch
2.6深度学习主流开源框架表2.1深度学习主流框架参数对比框架关键词总结框架关键词基本数据结构（都是高维数组）Caffe“在工业中应用较为广泛”，“编译安装麻烦一点”BlobTensorFlow“安装简单pip”TensorPytorch“定位：快速实验研究”，“简单”，“灵活”TensorTheano×“用于处理大规模神经网络的训练”，“不支持移动设备”，“不能应用于工业环境”，“编译复杂模型时
MMsegmentation-随机初始化 SatVision炼金士 mmalb-炼金术 python
系列文章目录文章目录系列文章目录前言一、初始化单个模块二、初始化多个模块总结前言mmlab下游分支调用权重随机初始化使用参考mmengine的说明文档mmengine支持模型初始化方法包括：BaseInit,Caffe2XavierInit,ConstantInit,KaimingInit,NormalInit,PretrainedInit,TruncNormalInit,UniformInit,
解决：源码安装caffe时遇到libcudnn.so: file not recognized问题 Gracie丹妮
参考教程(19条消息)ubuntu16.04下Detectron+caffe2(Pytorch)安装配置过程_张家坎的博客-CSDN博客_caffe2_detectron_ops_gpu.dllhttps://blog.csdn.net/u014236392/article/details/81117287安装caffe2执行sudomakeinstall之后遇到如下问题:/home/Xdn/cu
进场行礼问候退场东方芭蕾Lily
1.当听到响铃声，按编号排队依次进入考场。tips：面带微笑，优雅自信且有礼貌的边看着考试官边跑到准备问好的位置。步伐轻盈像一阵风样，到位置站好一位脚，保持挺拔向上体态。小仙女就是你们。2.行礼问候Examiner:(考试官)GillianMccafferyGoodmorning/afternoongirlsGoodmorning/afternoonmadamorMs.MccafferyQuesti
YOLOv5独家改进：上采样算子 | 超轻量高效动态上采样DySample，效果秒杀CAFFE，助力小目标检测 AI小怪兽 YOLOv5原创自研 YOLO caffe 目标检测深度学习人工智能
本文独家改进：一种超轻量高效动态上采样DySample，具有更少的参数、FLOPs，效果秒杀CAFFE和YOLOv5网络中的nn.Upsample在多个数据集下验证能够涨点，尤其在小目标检测领域涨点显著。收录YOLOv5原创自研https://blog.csdn.net/m0_63774211/category_12511931.html全网独家首发创新（原创），适合paper！！！2024年计算
caffez转ncnn，及环境配置宁静深远软件安装
一、安装ncnn1、安装protobuf(a)、gitclonehttps://github.com/google/protobuf(b)、自动生成configure配置文件，运行：./autogen.sh(c)、配置环境：./configure(d)、编译源代码:make(e)、安装：sudomakeinstall(f)、刷新动态库:sudoldconfig2、安装ncnn(a)、mkdirco
最新姿态估计研究进展 a微风掠过
最新姿态估计研究进展自上而下：就是先检测包含人的框，即humanproposal，然后对框子中的人进行姿态估计。一般RCNN（区域CNN就是这个思路）自下而上：先检测keypoint，然后根据热力图、点与点之间连接的概率，根据图论知识，基于PAF（部分亲和字段）将关键点连接起来，将关键点分组到人。1、CMU：openpose研究多人的姿态估计运行环境：caffe自下而上，关键点被分组到人的实例时间
智慧云智能教育考试平台展示 barry200890 springboot vue 考试 java vue.js 小程序
智慧云智能教育平台项目简介技术架构1.1后端技术栈:*基于SpringBoot+MybatisPlus+Shiro+mysql5.7+redis+websocket构建.*使用jdk1.8的新特性如:caffeine缓存,lambda表达式.1.2前端技术:*Vue*Vuex*Vxe-Table(文档地址：https://gitee.com/xuliangzhan_admin/vxe-table)
what is SSD|Single Shot MultiBox Detector Woooooooooooooo
文章摘选自多篇文章，仅用于学习，在此表示感谢，若有侵权请联系，感谢论文下载地址：https://arxiv.org/abs/1512.02325论文代码：https://github.com/weiliu89/caffe/tree/ssd省去了区域建议网络，直接使用不同尺度featuremap中的cell得到priorbox（和anchor类似），利用卷积可以直接得到box的回归和score而不需
caffe中的参考模型雨住多一横
RCNNmode_reference_rcnn_ilsvrc13l.pngcaffenet用于Flickrstyle数据集model_finetune_flickr_style.pngAlexNetmodel_alexnet.pnggooglenetmodel_googlenet.pngcaffenetmodel_reference_caffenet.png
RT-DETR算法优化改进：上采样算子 | 超轻量高效动态上采样DySample，效果秒杀CAFFE，助力小目标检测 AI小怪兽 RT-DETR魔术师算法 caffe 目标检测 YOLO 深度学习人工智能
本文独家改进：一种超轻量高效动态上采样DySample，具有更少的参数、FLOPs，效果秒杀CAFFE和YOLOv8网络中的nn.Upsample在多个数据集下验证能够涨点，尤其在小目标检测领域涨点显著。RT-DETR魔术师专栏介绍：https://blog.csdn.net/m0_63774211/category_12497375.html✨✨✨魔改创新RT-DETR引入前沿顶会创新（CVPR
「性能提升」扩展 Spring Cache 支持多级缓存冷冷zz
为什么多级缓存缓存的引入是现在大部分系统所必须考虑的redis作为常用中间件，虽然我们一般业务系统（毕竟业务量有限）不会遇到如下图在随着data-size的增大和数据结构的复杂的造成性能下降，但网络IO消耗会成为整个调用链路中不可忽视的部分。尤其在微服务架构中，一次调用往往会涉及多次调用例如pigoauth2.0的client认证Caffeine来自未来的本地内存缓存,性能比如常见的内存缓存实现性
Spring Cache duration～ spring-boot spring java 后端
目录标题SpringCache1介绍2常用注解3入门SpringCache1介绍SpringCache是一个框架，实现了基于注解的缓存功能，只需要简单地加一个注解，就能实现缓存功能。SpringCache提供了一层抽象，底层可以切换不同的缓存实现，例如：EHCacheCaffeineRedis(常用)起步依赖：org.springframework.bootspring-boot-starter-
Caffeine与Spring cache的各种注解操作 500了 spring java 后端
前言Caffeine是一个基于Java8的进程内缓存框架，它使用乐观锁技术来提高并发吞吐量，并被誉为最快的缓存之一。Caffeine是内存型缓存，即缓存与调用者属于同一个应用，具体地说是属于同一个JVM。它的设计目标是提供高性能、高命中率以及低内存占用的本地缓存解决方案，被描述为GuavaCache的加强版和“新一代缓存”。关于Caffeine的使用，其提供了多种灵活的配置选项：自动加载数据：可以
缓存组件Caffeine的使用月月大王 Java #工具类缓存
caffeine是一个高性能的缓存组件，在需要缓存数据，但数据量不算太大，不想引入redis的时候，caffeine就是一个不错的选择。可以把caffeine理解为一个简单的redis。1、导入依赖com.github.ben-manes.caffeinecaffeine2.9.3导入时要注意版本，最开始我用的版本是3.1.1，不过启动的时候会报错，这是因为我用的是jdk1.8，需要降低一下版本
Makefile.config walkMAN_aholic
##Refertohttp://caffe.berkeleyvision.org/installation.html#Contributionssimplifyingandimprovingourbuildsystemarewelcome!#cuDNNaccelerationswitch(uncommenttobuildwithcuDNN).USE_CUDNN:=1#CPU-onlyswitch(
缓存Caffeine之W-TinyLFU淘汰策略 georgesnoopy guava 缓存 java 淘汰策略 Caffeine
我们常见的缓存是基于内存的缓存，但是单机的内存是有限的，不能让缓存数据撑爆内存，所以需要缓存淘汰机制。https://mp.csdn.net/editor/html/115872837中大概说明了LRU的缓存淘汰机制，以及基于LRU的著名实现guavacache。除了LRU淘汰策略外，其他常见的还有FIFO以及LFU，只是说目前用的最多的是LRU。LRULRU记录了缓存中数据项的访问时间，在缓存数
Caffeine史上最快的内存缓存奇遇少年缓存 java
引言在现代的Web应用程序中，缓存是提升性能，减少数据库负载，加快响应速度的关键技术之一。SpringBoot作为一个简化Spring应用开发的框架，提供了与多种缓存技术集成的支持。Caffeine是一个高性能，灵活的缓存库，它可以作为本地缓存在Java应用中广泛使用。本文将详细介绍如何在SpringBoot项目中集成Caffeine缓存，并通过一个实例来展示它的使用。什么是Caffeine缓存？
如何解决caffe和video-caffe不能使用cudnn8编译的问题 Arnold-FY-Chen video-caffe 深度学习 Caffe video-caffe caffe 深度学习 cudnn8 cudnn
因为caffe之类的代码很久不更新了，只支持到了使用cudnn7.x，在使用了cudnn8的环境下编译caffe或video-caffe时，会在src/caffe/layers/cudnn_conv_layer.cpp等文件里出错：error:identifier"CUDNN_CONVOLUTION_FWD_SPECIFY_WORKSPACE_LIMIT"isundefinederror:iden
Redis 6.0 客户端缓存极简博客 java redis
不难发现，我们经常将Redis作为系统的缓存服务，但你有没有发现。在我们每次操作Redis时，都需要发送网络请求。这样就避免不了网络的开销。但如何解决这个问题呢？我们引入了本地缓存来解决此问题。查询逻辑从先前的直接查询转变为：先通过查询本地缓存，不存在再去远程查找然后设置到本地缓存-适用于分布式客户端缓存。有没有感觉像我们使用过的本地缓存Guava、Caffeine等一样？有啥特别的？这里Redi
[图像算法]-(yolov5.train)-GPU架构中的半精度fp16与单精度fp32计算蒸饺与白茶
GPU架构中的半精度与单精度计算由于项目原因，我们需要对darknet中卷积层进行优化，然而对于像caffe或者darknet这类深度学习框架来说，都已经将卷积运算转换成了矩阵乘法，从而可以方便调用cublas库函数和cudnn里tiling过的矩阵乘。 CUDA在推出7.5的时候提出了可以计算16位浮点数据的新特性。定义了两种新的数据类型half和half2.之前有师弟已经DEMO过半精度
caffe搭建深度神经网络 A异乡人_7a44
利用Caffe进行深度神经网络训练第一步需要搞懂几个重要文件：solver.prototxttrain_val.prototxttrain.shsolver.prototxtsolver这个文件主要存放模型训练所用到的一些超参数：net:=指定待训练模型结构文件，即train_val.prototxttest_interval:=测试间隔，即每隔多少次迭代进行一次测试test_initializa
deep-visualization-toolbox可视化安装 2014wzy caffe框架
运行环境：Linux+caffe步骤：Step0:Compilemasterbranchofcaffe本代码运行的前提是，配置过caffe。因为配置caffe的过程中会出现一些依赖库，正是本代码所需要的。http://blog.csdn.NET/u011204487/article/details/51596471是配置caffe的过程。注意Makefile.config中的CPU_ONLY:=1
枚举的构造函数中抛出异常会怎样 bylijinnan java enum 单例
首先从使用enum实现单例说起。为什么要用enum来实现单例？这篇文章（ http://javarevisited.blogspot.sg/2012/07/why-enum-singleton-are-better-in-java.html）阐述了三个理由： 1.enum单例简单、容易，只需几行代码： public enum Singleton { INSTANCE;
CMake 教程 aigo C++
转自：http://xiang.lf.blog.163.com/blog/static/127733322201481114456136/ CMake是一个跨平台的程序构建工具，比起自己编写Makefile方便很多。介绍：http://baike.baidu.com/view/1126160.htm 本文件不介绍CMake的基本语法，下面是篇不错的入门教程： http:
cvc-complex-type.2.3: Element 'beans' cannot have character Cb123456 spring Webgis
cvc-complex-type.2.3: Element 'beans' cannot have character Line 33 in XML document from ServletContext resource [/WEB-INF/backend-servlet.xml] is i
jquery实例:随页面滚动条滚动而自动加载内容 120153216 jquery
<script language="javascript"> $(function (){ var i = 4;$(window).bind("scroll", function (event){ //滚动条到网页头部的高度，兼容ie,ff,chrome var top = document.documentElement.s
将数据库中的数据转换成dbs文件何必如此 sql dbs
旗正规则引擎通过数据库配置器（DataBuilder）来管理数据库，无论是Oracle，还是其他主流的数据都支持，操作方式是一样的。旗正规则引擎的数据库配置器是用于编辑数据库结构信息以及管理数据库表数据，并且可以执行SQL 语句，主要功能如下。 1)数据库生成表结构信息：主要生成数据库配置文件(.conf文
在IBATIS中配置SQL语句的IN方式 357029540 ibatis
在使用IBATIS进行SQL语句配置查询时，我们一定会遇到通过IN查询的地方，在使用IN查询时我们可以有两种方式进行配置参数：String和List。具体使用方式如下： 1.String:定义一个String的参数userIds，把这个参数传入IBATIS的sql配置文件，sql语句就可以这样写： <select id="getForms" param
Spring3 MVC 笔记（一） 7454103 spring mvc bean REST JSF
自从 MVC 这个概念提出来之后 struts1.X struts2.X jsf 。。。。。这个view 层的技术一个接一个！都用过！不敢说哪个绝对的强悍！要看业务，和整体的设计！最近公司要求开发个新系统！
Timer与Spring Quartz 定时执行程序 darkranger spring bean 工作 quartz
有时候需要定时触发某一项任务。其实在jdk1.3，java sdk就通过java.util.Timer提供相应的功能。一个简单的例子说明如何使用，很简单： 1、第一步，我们需要建立一项任务，我们的任务需要继承java.util.TimerTask package com.test; import java.text.SimpleDateFormat; import java.util.Date;
大端小端转换，le32_to_cpu 和cpu_to_le32 aijuans C语言相关
大端小端转换，le32_to_cpu 和cpu_to_le32 字节序 http://oss.org.cn/kernel-book/ldd3/ch11s04.html 小心不要假设字节序. PC 存储多字节值是低字节为先(小端为先, 因此是小端), 一些高级的平台以另一种方式(大端)
Nginx负载均衡配置实例详解 avords
[导读] 负载均衡是我们大流量网站要做的一个东西，下面我来给大家介绍在Nginx服务器上进行负载均衡配置方法，希望对有需要的同学有所帮助哦。负载均衡先来简单了解一下什么是负载均衡，单从字面上的意思来理解就可以解负载均衡是我们大流量网站要做的一个东西，下面我来给大家介绍在Nginx服务器上进行负载均衡配置方法，希望对有需要的同学有所帮助哦。负载均衡先来简单了解一下什么是负载均衡
乱说的 houxinyou 框架敏捷开发软件测试
从很久以前，大家就研究框架，开发方法，软件工程，好多！反正我是搞不明白！这两天看好多人研究敏捷模型，瀑布模型！也没太搞明白. 不过感觉和程序开发语言差不多，瀑布就是顺序，敏捷就是循环. 瀑布就是需求、分析、设计、编码、测试一步一步走下来。而敏捷就是按模块或者说迭代做个循环，每个循环中也一样是需求、分析、设计、编码、测试一步一步走下来。也可以把软件开发理
欣赏的价值——一个小故事 bijian1013 有效辅导欣赏欣赏的价值
　　第一次参加家长会，幼儿园的老师说："您的儿子有多动症，在板凳上连三分钟都坐不了，你最好带他去医院看一看。"　　回家的路上，儿子问她老师都说了些什么，她鼻子一酸，差点流下泪来。因为全班30位小朋友，惟有他表现最差；惟有对他，老师表现出不屑，然而她还在告诉她的儿子："老师表扬你了，说宝宝原来在板凳上坐不了一分钟，现在能坐三分钟。其他妈妈都非常羡慕妈妈，因为全班只有宝宝
包冲突问题的解决方法 bingyingao eclipse maven exclusions 包冲突
包冲突是开发过程中很常见的问题：其表现有： 1.明明在eclipse中能够索引到某个类，运行时却报出找不到类。 2.明明在eclipse中能够索引到某个类的方法，运行时却报出找不到方法。 3.类及方法都有，以正确编译成了.class文件，在本机跑的好好的，发到测试或者正式环境就抛如下异常： java.lang.NoClassDefFoundError: Could not in
【Spark七十五】Spark Streaming整合Flume-NG三之接入log4j bit1129 Stream
先来一段废话：实际工作中，业务系统的日志基本上是使用Log4j写入到日志文件中的，问题的关键之处在于业务日志的格式混乱，这给对日志文件中的日志进行统计分析带来了极大的困难，或者说，基本上无法进行分析，每个人写日志的习惯不同，导致日志行的格式五花八门，最后只能通过grep来查找特定的关键词缩小范围，但是在集群环境下，每个机器去grep一遍，分析一遍，这个效率如何可想而知，大好光阴都浪费在这上面了
sudoku solver in Haskell bookjovi sudoku haskell
这几天没太多的事做，想着用函数式语言来写点实用的程序，像fib和prime之类的就不想提了（就一行代码的事），写什么程序呢？在网上闲逛时发现sudoku游戏，sudoku十几年前就知道了，学生生涯时也想过用C/Java来实现个智能求解，但到最后往往没写成，主要是用C/Java写的话会很麻烦。现在写程序，本人总是有一种思维惯性，总是想把程序写的更紧凑，更精致，代码行数最少，所以现
java apache ftpClient bro_feng java
最近使用apache的ftpclient插件实现ftp下载，遇见几个问题，做如下总结。 1. 上传阻塞，一连串的上传，其中一个就阻塞了，或是用storeFile上传时返回false。查了点资料，说是FTP有主动模式和被动模式。将传出模式修改为被动模式ftp.enterLocalPassiveMode();然后就好了。看了网上相关介绍，对主动模式和被动模式区别还是比较的模糊，不太了解被动模
读《研磨设计模式》-代码笔记-工厂方法模式 bylijinnan java 设计模式
声明：本文只为方便我个人查阅和理解，详细的分析以及源代码请移步原作者的博客http://chjavach.iteye.com/ package design.pattern; /* * 工厂方法模式：使一个类的实例化延迟到子类 * 某次，我在工作不知不觉中就用到了工厂方法模式（称为模板方法模式更恰当。2012-10-29）： * 有很多不同的产品，它
面试记录语 chenyu19891124 招聘
或许真的在一个平台上成长成什么样，都必须靠自己去努力。有了好的平台让自己展示，就该好好努力。今天是自己单独一次去面试别人，感觉有点小紧张，说话有点打结。在面试完后写面试情况表，下笔真的好难，尤其是要对面试人的情况说明真的好难。今天面试的是自己同事的同事，现在的这个同事要离职了，介绍了我现在这位同事以前的同事来面试。今天这位求职者面试的是配置管理，期初看了简历觉得应该很适合做配置管理，但是今天面
Fire Workflow 1.0正式版终于发布了 comsci 工作 workflow Google
Fire Workflow 是国内另外一款开源工作流，作者是著名的非也同志，哈哈.... 官方网站是 http://www.fireflow.org 经过大家努力,Fire Workflow 1.0正式版终于发布了正式版主要变化: 1、增加IWorkItem.jumpToEx(...)方法，取消了当前环节和目标环节必须在同一条执行线的限制，使得自由流更加自由 2、增加IT
Python向脚本传参 daizj python 脚本传参
如果想对python脚本传参数，python中对应的argc, argv(c语言的命令行参数)是什么呢？需要模块：sys 参数个数：len(sys.argv) 脚本名： sys.argv[0] 参数1： sys.argv[1] 参数2： sys.argv[
管理用户分组的命令gpasswd dongwei_6688 passwd
NAME： gpasswd - administer the /etc/group file SYNOPSIS： gpasswd group gpasswd -a user group gpasswd -d user group gpasswd -R group gpasswd -r group gpasswd [-A user,...] [-M user,...] g
郝斌老师数据结构课程笔记 dcj3sjt126com 数据结构与算法
<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<
yii2 cgridview加上选择框进行操作 dcj3sjt126com GridView
页面代码 <?=Html::beginForm(['controller/bulk'],'post');?> <?=Html::dropDownList('action','',[''=>'Mark selected as: ','c'=>'Confirmed','nc'=>'No Confirmed'],['class'=>'dropdown',])
linux mysql fypop linux
enquiry mysql version in centos linux yum list installed | grep mysql yum -y remove mysql-libs.x86_64 enquiry mysql version in yum repositoryyum list | grep mysql oryum -y list mysql* install mysq
Scramble String hcx2013 String
Given a string s1, we may represent it as a binary tree by partitioning it to two non-empty substrings recursively. Below is one possible representation of s1 = "great":
跟我学Shiro目录贴 jinnianshilongnian 跟我学shiro
历经三个月左右时间，《跟我学Shiro》系列教程已经完结，暂时没有需要补充的内容，因此生成PDF版供大家下载。最近项目比较紧，没有时间解答一些疑问，暂时无法回复一些问题，很抱歉，不过可以加群（334194438/348194195）一起讨论问题。 ----广告-----------------------------------------------------
nginx日志切割并使用flume-ng收集日志 liyonghui160com
nginx的日志文件没有rotate功能。如果你不处理，日志文件将变得越来越大，还好我们可以写一个nginx日志切割脚本来自动切割日志文件。第一步就是重命名日志文件，不用担心重命名后nginx找不到日志文件而丢失日志。在你未重新打开原名字的日志文件前，nginx还是会向你重命名的文件写日志，linux是靠文件描述符而不是文件名定位文件。第二步向nginx主
Oracle死锁解决方法 pda158 oracle
　select p.spid,c.object_name,b.session_id,b.oracle_username,b.os_user_name from v$process p,v$session a, v$locked_object b,all_objects c where p.addr=a.paddr and a.process=b.process and c.object_id=b.
java之List排序 shiguanghui list排序
在Java Collection Framework中定义的List实现有Vector，ArrayList和LinkedList。这些集合提供了对对象组的索引访问。他们提供了元素的添加与删除支持。然而，它们并没有内置的元素排序支持。　　你能够使用java.util.Collections类中的sort()方法对List元素进行排序。你既可以给方法传递
servlet单例多线程 utopialxw 单例多线程 servlet
转自http://www.cnblogs.com/yjhrem/articles/3160864.html 和 http://blog.chinaunix.net/uid-7374279-id-3687149.html Servlet 单例多线程 Servlet如何处理多个请求访问？Servlet容器默认是采用单实例多线程的方式处理多个请求的：1.当web服务器启动的