zt_1995

cs231 assignment1--KNN

这次作业的主要难点：
1. 计算训练集与测试集之间的距离，尤其是完全向量化（不使用显式循环）的实现；
2. 交叉验证部分。

import numpy as np
from collections import Counter
class KNearestNeighbor(object):
  """A k-nearest-neighbor classifier using the L2 (Euclidean) distance."""

  def __init__(self):
    pass

  def train(self, X, y):
    """
    Train the classifier. For k-nearest neighbors this is just
    memorizing the training data.

    Inputs:
    - X: A numpy array of shape (num_train, D) containing the training data
      consisting of num_train samples each of dimension D.
    - y: A numpy array of shape (num_train,) containing the training labels,
      where y[i] is the label for X[i]. A (num_train, 1) column is accepted
      too; it is flattened when labels are looked up.
    """
    self.X_train = X
    self.y_train = y

  def predict(self, X, k=1, num_loops=0):
    """
    Predict labels for test data using this classifier.

    Inputs:
    - X: A numpy array of shape (num_test, D) containing test data consisting
         of num_test samples each of dimension D.
    - k: The number of nearest neighbors that vote for the predicted labels.
    - num_loops: Determines which implementation to use to compute distances
      between training points and testing points (0, 1 or 2).

    Returns:
    - y: A numpy array of shape (num_test,) containing predicted labels for the
      test data, where y[i] is the predicted label for the test point X[i].

    Raises:
    - ValueError: if num_loops is not 0, 1 or 2.
    """
    if num_loops == 0:
      dists = self.compute_distances_no_loops(X)
    elif num_loops == 1:
      dists = self.compute_distances_one_loop(X)
    elif num_loops == 2:
      dists = self.compute_distances_two_loops(X)
    else:
      raise ValueError('Invalid value %d for num_loops' % num_loops)

    return self.predict_labels(dists, k=k)

  def compute_distances_two_loops(self, X):
    """
    Compute the distance between each test point in X and each training point
    in self.X_train using a nested loop over both the training data and the
    test data. This is the straightforward reference implementation.

    Inputs:
    - X: A numpy array of shape (num_test, D) containing test data.

    Returns:
    - dists: A numpy array of shape (num_test, num_train) where dists[i, j]
      is the Euclidean distance between the ith test point and the jth training
      point.
    """
    num_test = X.shape[0]
    num_train = self.X_train.shape[0]
    dists = np.zeros((num_test, num_train))
    # range (not xrange) so the code runs on both Python 2 and Python 3.
    for i in range(num_test):
      for j in range(num_train):
        diff = self.X_train[j, :] - X[i, :]
        dists[i, j] = np.sqrt(np.sum(np.square(diff)))
    return dists

  def compute_distances_one_loop(self, X):
    """
    Compute the distance between each test point in X and each training point
    in self.X_train using a single loop over the test data.

    Input / Output: Same as compute_distances_two_loops
    """
    num_test = X.shape[0]
    num_train = self.X_train.shape[0]
    dists = np.zeros((num_test, num_train))
    for i in range(num_test):
      # Broadcasting subtracts X[i] from every row of X_train at once.
      diff = self.X_train - X[i, :]
      dists[i, :] = np.sqrt(np.sum(np.square(diff), axis=1))
    return dists

  def compute_distances_no_loops(self, X):
    """
    Compute the distance between each test point in X and each training point
    in self.X_train using no explicit loops.

    Uses the expansion ||a - b||^2 = ||a||^2 + ||b||^2 - 2 a.b, so the whole
    distance matrix comes from one matrix product and two broadcast sums.

    Input / Output: Same as compute_distances_two_loops
    """
    # Note: np.dot is the matrix product; `*` would multiply element-wise.
    cross = np.dot(X, self.X_train.T)                      # (num_test, num_train)
    train_sq = np.sum(np.square(self.X_train), axis=1)     # (num_train,)
    test_sq = np.sum(np.square(X), axis=1, keepdims=True)  # (num_test, 1)
    # (num_test, 1) + (num_train,) broadcasts to (num_test, num_train).
    sq_dists = test_sq + train_sq - 2 * cross
    # Rounding can leave tiny negative values (e.g. for identical points);
    # clamp them so np.sqrt does not produce NaN.
    sq_dists = np.maximum(sq_dists, 0)
    return np.sqrt(sq_dists)

  def predict_labels(self, dists, k=1):
    """
    Given a matrix of distances between test points and training points,
    predict a label for each test point.

    Inputs:
    - dists: A numpy array of shape (num_test, num_train) where dists[i, j]
      gives the distance between the ith test point and the jth training point.
    - k: The number of nearest neighbors that vote (must be >= 1).

    Returns:
    - y: A numpy array of shape (num_test,) containing predicted labels for the
      test data, where y[i] is the predicted label for the test point X[i].
      Ties in the vote are broken by choosing the smaller label.

    Raises:
    - ValueError: if k is smaller than 1.
    """
    if k < 1:
      raise ValueError('k must be at least 1, got %r' % (k,))
    # asarray turns an np.matrix into a plain array so each row is 1-D.
    dists = np.asarray(dists)
    # Accept (num_train,) as well as (num_train, 1) label arrays.
    train_labels = np.asarray(self.y_train).ravel()
    num_test = dists.shape[0]
    y_pred = np.zeros(num_test)
    for i in range(num_test):
      # Labels of the k training points closest to the ith test point.
      nearest = np.argsort(dists[i, :])[:k]
      closest_y = train_labels[nearest]
      # np.unique returns the labels sorted ascending and argmax returns the
      # first maximum, so a tied vote resolves to the smaller label.
      labels, counts = np.unique(closest_y, return_counts=True)
      y_pred[i] = labels[np.argmax(counts)]
    return y_pred

# Run some setup code for this notebook.

import random
import numpy as np
from cs231n.data_utils import load_CIFAR10
import matplotlib.pyplot as plt

# This is a bit of magic to make matplotlib figures appear inline in the notebook
# rather than in a new window.
%matplotlib inline
# Plot defaults for the whole notebook, applied in one call.
plt.rcParams.update({
    'figure.figsize': (10.0, 8.0),     # default size of plots
    'image.interpolation': 'nearest',  # no smoothing between pixels
    'image.cmap': 'gray',
})

# Some more magic so that the notebook will reload external python modules;
# see http://stackoverflow.com/questions/1907993/autoreload-of-modules-in-ipython
%load_ext autoreload
%autoreload 2

# Show a grid of example training images: one column per class, one row per
# randomly drawn sample of that class.
# NOTE(review): X_train / y_train are not assigned anywhere above in this
# listing; presumably a data-loading cell (load_CIFAR10) ran first -- confirm.
classes = ['plane', 'car', 'bird', 'cat', 'deer',
           'dog', 'frog', 'horse', 'ship', 'truck']
num_classes = len(classes)
samples_per_class = 7
for y, cls in enumerate(classes):
    # Draw samples_per_class distinct training indices whose label is y.
    idxs = np.random.choice(np.flatnonzero(y_train == y),
                            samples_per_class, replace=False)
    for i, idx in enumerate(idxs):
        # Subplot numbers run row-major: row i, column y (1-based).
        plt.subplot(samples_per_class, num_classes, i * num_classes + y + 1)
        plt.imshow(X_train[idx].astype('uint8'))
        plt.axis('off')
        if i == 0:
            # Only the first row carries the class name as a column header.
            plt.title(cls)
plt.show()
# Subsample the data for more efficient code execution in this exercise
num_training = 5000
mask = list(range(num_training))
X_train = X_train[mask]
y_train = y_train[mask]

num_test = 500
mask = list(range(num_test))
X_test = X_test[mask]
y_test = y_test[mask]

# Reshape the image data into rows: one flattened image per row.
X_train = np.reshape(X_train, (X_train.shape[0], -1))
X_test = np.reshape(X_test, (X_test.shape[0], -1))
# Formatted as a single string so the output is the same on Python 2 and 3.
print('%s %s' % (X_train.shape, X_test.shape))


from cs231n.classifiers import KNearestNeighbor

# Create a kNN classifier instance.
# Remember that training a kNN classifier is a noop:
# the Classifier simply remembers the data and does no further processing
classifier = KNearestNeighbor()
classifier.train(X_train, y_train)

# Distance matrix from the reference (two-loop) implementation.
dists = classifier.compute_distances_two_loops(X_test)
print(dists.shape)

# We can visualize the distance matrix: each row is a single test example and
# its distances to training examples
plt.imshow(dists, interpolation='none')
plt.show()

# Predict from the precomputed distances and report the fraction of correctly
# predicted test examples, first with k = 1 (plain Nearest Neighbor), then k = 5.
for k in (1, 5):
    y_test_pred = classifier.predict_labels(dists, k=k)
    num_correct = np.sum(y_test_pred == y_test)
    accuracy = float(num_correct) / num_test
    print('Got %d / %d correct => accuracy: %f' % (num_correct, num_test, accuracy))


# Now lets speed up distance matrix computation by using partial vectorization
# with one loop.
dists_one = classifier.compute_distances_one_loop(X_test)

# To ensure that our vectorized implementation is correct, we make sure that it
# agrees with the naive implementation. There are many ways to decide whether
# two matrices are similar; one of the simplest is the Frobenius norm of their
# difference: the square root of the sum of squared element-wise differences,
# i.e. the Euclidean distance between the matrices reshaped into vectors.
difference = np.linalg.norm(dists - dists_one, ord='fro')
print('Difference was: %f' % (difference, ))
if difference < 0.001:
  print('Good! The distance matrices are the same')
else:
  print('Uh-oh! The distance matrices are different')


# Same check for the fully vectorized version (compute_distances_no_loops).
dists_two = classifier.compute_distances_no_loops(X_test)

# check that the distance matrix agrees with the one we computed before:
difference = np.linalg.norm(dists - dists_two, ord='fro')
print('Difference was: %f' % (difference, ))
if difference < 0.001:
  print('Good! The distance matrices are the same')
else:
  print('Uh-oh! The distance matrices are different')


# Let's compare how fast the implementations are
def time_function(f, *args):
  """
  Call a function f with args and return the time (in seconds) that it took to execute.

  Inputs:
  - f: The callable to time.
  - *args: Positional arguments forwarded to f.

  Returns:
  - The elapsed time in seconds, as a float. The return value of f is discarded.
  """
  # default_timer is the clock timeit itself uses for measuring intervals;
  # unlike time.time() it is not meant as a calendar/wall-clock reading.
  from timeit import default_timer
  tic = default_timer()
  f(*args)
  toc = default_timer()
  return toc - tic

# Time each distance implementation once on the same test set.
two_loop_time = time_function(classifier.compute_distances_two_loops, X_test)
print('Two loop version took %f seconds' % two_loop_time)

one_loop_time = time_function(classifier.compute_distances_one_loop, X_test)
print('One loop version took %f seconds' % one_loop_time)

no_loop_time = time_function(classifier.compute_distances_no_loops, X_test)
print('No loop version took %f seconds' % no_loop_time)

# you should see significantly faster performance with the fully vectorized implementation



Cross-validation
We have implemented the k-Nearest Neighbor classifier but we set the value k = 5 arbitrarily. 
We will now determine the best value of this hyperparameter with cross-validation.



num_folds = 5
k_choices = [1, 3, 5, 8, 10, 12, 15, 20, 50, 100]

# Split the training data into num_folds folds. y_train_folds[i] is the label
# vector for the points in X_train_folds[i]. np.array_split also copes with a
# training-set size that is not a multiple of num_folds.
X_train_folds = np.array_split(X_train, num_folds, axis=0)
y_train_folds = np.array_split(y_train, num_folds, axis=0)

# A dictionary holding the accuracies for different values of k that we find
# when running cross-validation. After running cross-validation,
# k_to_accuracies[k] is a list of length num_folds giving the different
# accuracy values that we found when using that value of k.
#
# Cross-validation: the training data is cut into num_folds parts; each part
# takes one turn as the validation set while the remaining parts are used for
# training. The per-fold accuracies are averaged later to compare values of k.
k_to_accuracies = {k: [] for k in k_choices}
classifier = KNearestNeighbor()
for j in range(num_folds):
    # Train on every fold except fold j; validate on fold j.
    X_tr = np.concatenate(X_train_folds[:j] + X_train_folds[j + 1:], axis=0)
    y_tr = np.concatenate(y_train_folds[:j] + y_train_folds[j + 1:], axis=0)
    X_te = X_train_folds[j]
    y_te = y_train_folds[j]
    classifier.train(X_tr, y_tr)
    # The distances depend only on the fold, not on k, so compute them once
    # per fold and reuse them for every k.
    fold_dists = classifier.compute_distances_no_loops(X_te)
    for k in k_choices:
        y_val_pred = classifier.predict_labels(fold_dists, k=k)
        num_correct = np.sum(y_val_pred == y_te)
        accuracy = float(num_correct) / X_te.shape[0]
        k_to_accuracies[k].append(accuracy)

# Print out the computed accuracies, one line per (k, fold), in ascending k.
for k in sorted(k_to_accuracies):
    for accuracy in k_to_accuracies[k]:
        print('k = %d, accuracy = %f' % (k, accuracy))


# Use one sorted list of k values for the x axis, the means and the standard
# deviations, so the three always line up regardless of the order of k_choices.
sorted_ks = sorted(k_to_accuracies)

# plot the raw observations
for k in sorted_ks:
  accuracies = k_to_accuracies[k]
  plt.scatter([k] * len(accuracies), accuracies)

# plot the trend line with error bars that correspond to standard deviation
accuracies_mean = np.array([np.mean(k_to_accuracies[k]) for k in sorted_ks])
accuracies_std = np.array([np.std(k_to_accuracies[k]) for k in sorted_ks])
plt.errorbar(sorted_ks, accuracies_mean, yerr=accuracies_std)
plt.title('Cross-validation on k')
plt.xlabel('k')
plt.ylabel('Cross-validation accuracy')
plt.show()

# Based on the cross-validation results above, choose the best value for k,
# retrain the classifier using all the training data, and test it on the test
# data. You should be able to get above 28% accuracy on the test data.
# NOTE(review): 7 is not one of the values in k_choices, so this k was not
# itself evaluated by the cross-validation run above -- confirm the choice.
best_k = 7
# Take the test-set size from the data instead of repeating the constant 500.
num_test = X_test.shape[0]
classifier = KNearestNeighbor()
classifier.train(X_train, y_train)
y_test_pred = classifier.predict(X_test, k=best_k)

# Compute and display the accuracy
num_correct = np.sum(y_test_pred == y_test)
accuracy = float(num_correct) / num_test
print('Got %d / %d correct => accuracy: %f' % (num_correct, num_test, accuracy))

DL Homework 13 熬夜患者 DL Homework python 开发语言
目录编程实现优化算法，并3D可视化1.函数3D可视化2.加入优化算法，画出轨迹3.复现CS231经典动画4.结合3D动画，用自己的语言，从轨迹、速度等多个角度讲解各个算法优缺点5.总结编程实现优化算法，并3D可视化1.函数3D可视化分别画出和的3D图importtorchimportnumpyasnpimportmatplotlib.pyplotaspltclassOp(object):def__
【23-24 秋学期】NNDL 作业13 优化算法3D可视化 HBU_David 深度学习
编程实现优化算法，并3D可视化1.函数3D可视化分别画出和的3D图NNDL实验优化算法3D轨迹鱼书例题3D版_优化算法3d展示-CSDN博客2.加入优化算法，画出轨迹分别画出和的3D轨迹图NNDL实验优化算法3D轨迹pytorch版-CSDN博客3.复现CS231经典动画NNDL实验优化算法3D轨迹复现cs231经典动画_HBU_David的博客-CSDN博客
Dropout的rescale taoqick 深度学习
dropout有两种实现方式，VanillaDropout和invertedDropout。前者是原始论文中的朴素版后者在AndrewNg的cs231课程中（https://cs231n.github.io/neural-networks-2/#init）有介绍。其实就两个要点：rescale。输入序列为X=[x0,x1,x2,x3]X=[x_0,x_1,x_2,x_3]X=[x0,x1,x2,x
卷积神经网络可视化理解之子无裳深度学习
文章目录设计来源可视化第一层卷积核可视化第一层featuremap底层特征可视化隐层featuremap可视化遮挡、扰动实验GradientAscent、featureinversionDeepDream反卷积可视化设计来源看了CS231的课程，想自己尝试做下可视化，权当加深对卷积神经网络的理解吧。可视化第一层卷积核课程：课程里提到第一层卷积一般做的是传统视觉的工作，主要提取一些有向边，可视化卷积
深度学习中的卷积操作 zyw2002 #深度学习框架深度学习基础计算机视觉基础深度学习神经网络卷积 pytorch Conv1D
本文从信号处理中的互相关运算引入深度学习中的卷积。然后介绍了不同的卷积类型，以及如何在pytorch中使用这些卷积层。（在看pytorch文档中的Conv1D/2D/3D的时候感到比较困惑，又很好奇深度学习中各种各样的卷积操作。于是结合整理几乎包含深度学习中所有的卷积操作，主要参考的有《DiveintoDeeplearning》,cs231,pytorch的官网文档，stackoverflow以及
NNDL实验优化算法3D轨迹鱼书例题3D版 HBU_David DeepLearning 算法 3d python
这张图在网络上很流行。代码源自：深度学习入门：基于Python的理论与实现(ituring.com.cn)2D版讲解：NNDL作业11：优化算法比较调整学习率等超参数，观察动画，可以加深对各种算法的理解。配合实验的模型，CS231的模型，基本可以掌握各类算法特点。NNDL实验优化算法3D轨迹程序改编自《神经网络与深度学习：案例与实践》（Paddle版）https://blog.csdn.net/q
NNDL实验优化算法3D轨迹复现cs231经典动画 HBU_David DeepLearning 算法 3d
这个动画很有名气，学习深度学习的朋友大多都见过，源自于：CS231nConvolutionalNeuralNetworksforVisualRecognition复现动画，向经典致敬~第一版：轨迹版第二版：小球版“轨迹版”不如原图生动，观察后，发现缺少移动的小球~失去了小球，就失去了灵魂~赶紧把灵魂找回来~第三版：综合版这样就有点“高仿”的意思了~收工~俯视效果：放在一起对比下：代码改编自《神经网
[cv231n] Lecture 3 | Loss Functions and Optimization gdtop818 Stanford-cs231n
Lecture3|LossFunctionsandOptimization关于优化方法补充一条2019/2/27新出的论文：AdaBound，论文中该方法被证明比SGD和ADAM有更好的优化速度，并且也更容易在训练中达到最优效果~~本篇文章如果有朋友看不懂的话可以留言给我，我会抽时间把cs231笔记再翻译成中文~Tools:LinearClassificationLossVisualization
Numpy实现大矩阵减去小矩阵的方便运算 brightendavid numpy python
把一个向量加到矩阵的每一行:调用numpy库完成cs231作业1，numpy参考知乎CS231n课程笔记翻译：PythonNumpy教程使用一重循环#Wewilladdthevectorvtoeachrowofthematrixx,#storingtheresultinthematrixyimportnumpyasnpx=np.array([[1,2,3],[4,5,6],[7,8,9],[10,
深度学习学习路线睡觉特早头发特多论文总结深度学习学习 tensorflow
为了搞深度学习，看了《深度学习、优化与识别》，《TensorFlow：实战Google深度学习框架》以及三大牛人的《深度学习》，视频看的16年的cs231，据说和17年差别还是挺大的。谈一点个人经验。深度学习入门的话推荐《TensorFlow：实战Google深度学习框架》，这本书内容比较详细也比较基础，以tensorflow为框架，从搭建网络的每个具体功能讲起，配有示例，逐渐搭起来一个网络，后续
LSTM推导源码分析 vsooda papers LSTM 源码
LSTM推导说是推导，基本上没有一个公式。注重理解。神经网络后向推导cs231上有一篇关于非常好的文章,讲得非常好。一个例子：f(x,y)=x+σ(y)σ(x)+(x+y)2x=3#examplevaluesy=-4#forwardpasssigy=1.0/(1+math.exp(-y))#sigmoidinnumerator#(1)num=x+sigy#numerator#(2)sigx=1.0
cs231学习笔记一图像识别与KNN poorfriend 机器学习 cs231
课程地址：http://cs231n.github.io/classification/图像识别图像识别就是给你一张图，将其分类成一组给定类别中的一种。如图1所示，给定一张图片，以及可能的类别{猫、狗、帽子、杯子}，要求将这张图片识别出到底属于哪一类。一张图片输入计算机中，实际是转化为一个三维张量（宽*高*颜色通道），比如图一就是248x400x3共297,600个数据，每个数据的取值范围都是0到
斯坦福大学计算机视觉课程cs231-01-图像分类 Buaazhangrui 斯坦福大学计算机视觉课程
CS231设计为以计算机视觉解决实现图像分类问题和数据驱动方法的入门课程，课程内容如下：图像分类，数据驱动方法，流水线介绍临近分类器/K-NN验证集，交叉验证，超参数调整最近邻居的优点/缺点概要总结：KNN在现实中的应用图像分类动机.本节中，我们将介绍图像分类问题，即从一个固定的分类集合为输入图像分配一个标签。这是“计算机视觉”中的核心问题之一，尽管其简单，却有着各种各样的实际应用。而且，正如我们
DL4NLP---第一讲 Xiaomin-Wu NLP
第一讲：引言-自然语言处理与深度学习简介(IntrotoNLPandDeepLearning)推荐阅读材料：线性代数相关知识点回顾：[LinearAlgebraReview]概率相关知识点回顾：[ProbabilityReview]凸优化相关知识点回顾:[ConvexOptimizationReview]优化相关的另一篇介绍（来自于斯坦福CS231课程资料），随机梯度下降相关[MoreOptimi
cs231 assignment1--KNN zt_1995
这次作业的主要的难点：实现训练集和测试集之间距离的方法，主要是用向量形式来实现的部分交叉检验的部分importnumpyasnpfromcollectionsimportCounterclassKNearestNeighbor(object):"""akNNclassifierwithL2distance"""def__init__(self):passdeftrain(self,X,y):"""
cs231以及迁移学习 yuki___ cs231n
Normalization的原因以这个2元分类为例，不normalization的话，loss非常敏感，分类器稍微改变一下，对loss的影响很大。Normalization后问题得到解决。在CNN中我们希望每层都normalization，可以用batchnormalizationlearningrate是第一个需要调整的超参数，但当他调好之后再调其他参数可能对learningrate的调整产生影
cs231 学习笔记（一）路漫途远
FirstClassifier:NearestNeighbor训练过程就是记录所有的数据点，在预测阶段对每一条记录（一个图像）与原有数据集进行比较，得出与之最相近的一条记录，其label就是最后的预测值。通常使用的DistanceMetric来比较图像：L1依赖于坐标系，当坐标轴转动时L1值随之改变，而L2不会。KNN选择K个最近的邻居，随着K的值越大，你的决策边界也会越来越光滑，降噪提高robu
cs231神经网络学习笔记轻描没淡写
简介相比于线性分类中的S=W×X，其中W是一个矩阵，X是一个列向量，包含图像的全部像素信息。它们相乘的直接结果就是得到一个得分向量。像数据库CIFAR-10的案例中W是一个10×3072的矩阵，X是一个3072×1的向量，他们的结果就是得到10×1的得分向量》神经元则不同，它的计算法则是其中的W1可以是100×3072的矩阵与X相乘的到一个100×1的过度向量，max（）函数是非线性的，这种非线性
cs231反向传播笔记轻描没淡写
反向传播实践代码示例：函数表达式：代码示例x=3#例子数值y=-4#前向传播sigy=1.0/(1+math.exp(-y))#分子中的sigmoi#(1)num=x+sigy#分子#(2)sigx=1.0/(1+math.exp(-x))#分母中的sigmoid#(3)xpy=x+y#(4)xpysqr=xpy**2#(5)den=sigx+xpysqr#分母#(6)invden=1.0/den
cs231线性分类笔记轻描没淡写
最简单的线性分类器公式每个图像由32×32×3个像素，上述公式中把图像拉伸为一个3072×1的向量。W和b是参数，其中W是一个k×3072的矩阵（k表示类别数），被称为权重，b是一个k×1的偏执向量。1，一个单独的矩阵乘法就高效地并行评估10个不同的分类器，其中每个类的分类器就是W的一个行向量。2，其中的参数是可以控制的，目的就是找到最合适的参数使得准确率做高。3，数据驱动方式，就是利用训练集进行
PyTorch之迁移学习实战 IT派
简介：迁移学习是把一个领域(即源领域)的知识,迁移到另外一个领域(即目标领域),使得目标领域能够取得更好的学习效果。通常，源领域数据量充足，而目标领域数据量较小，迁移学习需要将在数据量充足的情况下学习到的知识，迁移到数据量小的新环境中。本文我们根据PyTorch官网上的例子(作者:SasankChilamkurthy)学习如何使用传输学习来训练网络。关于迁移学习的更多例子：http://cs231
cs231课程---作业1总结 chenxiaocui195
翻译链接：1、http://blog.csdn.net/u010004460/article/details/534325752、http://blog.csdn.net/zhangxb35/article/details/55223825一、安装Jupyter我选择的是在windows下的pip方式。首先安装python3.6和pip。https://jingyan.baidu.com/arti
CS231的一些资源努力的老周 CS231N CS231N资源
官方资源课程主页请参考http://cs231n.stanford.edu/index.html。官方笔记请参考http://cs231n.github.io/。教学大纲syllabus请参考http://cs231n.stanford.edu/syllabus.html。非官方资料课程中文翻译来自知乎。请参考https://zhuanlan.zhihu.com/p/21930884。但是还是建议
CS231对SVM及Softmax分类器的理解 NaLi_champion 深度学习
SVM分类器与Softmax分类器的区别这是针对一个数据，SVM与Softmax分类器的不同处理方式的例子。两个分类器都计算了同样的分值向量f。不同之处在于对f中分值的解释：SVM分类器将它们看作是分类评分，它的损失函数鼓励正确的分类（即图中的蓝色类别2）的分值比其它分类的分值高出至少一个边界值。Softmax分类器将这些数值看作是每个分类没有归一化的对数概率，鼓励正确分类的归一化的对数概率变高，
cs231学习笔记二线性分类器、SVM、Softmax poorfriend 机器学习 cs231
课程地址：http://cs231n.github.io/linear-classify/线性分类器假设样本xi∈RD,i=1…N，对应类标签yi∈1…K。现定义一个线性映射f(xi,W,b)=Wxi+b，W是K∗D的矩阵，b是K维的向量。W和b分别称作权重（或参数）和偏。W的每一行都是一个分类器，每个分类器对应于一个得分。通过学习W和b，我们希望正确类的得分要大于错误类的得分。相对于KNN，一旦
【深度学习】深度学习权重初始化 Shwan_Ma 深度学习
本文对CS231中的TrainingNeuralNetworks的权重更新部分进行记录权重的初始化在深度神经网络中起着比较大的重要，算是一个trick，但在实际应用上确是个大杀器。1.如果一开始把网络中的权重初始化为0，会发生什么？因为权重初始为0，由于网络中的神经元的更新机制完全相同，由于网络的对称性，会产生各个layer中产生相同的梯度更新，导致所有的权重最后值相同，收敛会出现问题。所以在初始
Computer Vision：CS231n CodeForCoffee 计算机视觉 CS321n
CS231n是斯坦福大学SVL实验室（StanfordVisionandLearningLab）主导开设为期10周的计算机视觉课程，主讲为李飞飞教授，相关链接如下：课程主页CS231课程主页：http://cs231n.stanford.edu/CS231GitHub主页（包含课程作业）：https://github.com/cs231n（访问页面：cs231n.github.io）CS231教学
吴恩达斯坦福大学机器学习 CS229 课程学习笔记（一） zcg1942 知乎读书笔记
说到机器学习总绕不过几个鼎鼎大名的人物，他们都创造了不少的机器学习资料，斯坦福吴恩达AndrewNg的公开课CS229；Google李飞飞的CS231、周志华的、李航的《统计学习方法》、林轩田的《机器学习基石》、PeterHarringtond的《机器学习实战》、周志华的《机器学习》（西瓜书，书中都是拿西瓜举例子）。CS229的官方网站是http://cs229.stanford.edu/，网易公
深度学习最基础理论知识总结 (CS231课程总结，持续更新) CAM-TAY 深度学习
因为有在看CS231学习深度学习的简单知识，所以打算整理成blog，持续更新中。。。一、损失函数lossfunction1、SVM：最简单的lossfunction其中为真实label对应的分数，为labelj对应的分数，Li为每个样本的分类损失，目的是最大化真实label对应分数。在初始化时，Li的初始值接近于C-1，其中C为分类的个数，因为所有的分数都接近于0，对应为（C-1）个1相加。所有样
cs231阅读笔记（2）—— 优化方法、正则化、迁移学习、软硬件 yjyjjyjy1231 笔记
文章目录优化方法正则化（防止过拟合）transferlearning迁移学习硬件&软件优化方法随机梯度下降SGD随机梯度下降（SGD,stochasticgradientdescent）：名字中已经体现了核心思想，随机选取一个店做梯度下降，而不是遍历所有样本后进行参数迭代。因为梯度下降法的代价函数计算需要遍历所有样本，而且是每次迭代都要遍历，直至达到局部最优解，在样本量庞大时就显得收敛速度比较慢了
SQL的各种连接查询 xieke90 UNION ALL UNION 外连接内连接 JOIN
一、内连接概念：内连接就是使用比较运算符根据每个表共有的列的值匹配两个表中的行。内连接（join 或者inner join ） SQL语法： select * fron
java编程思想--复用类百合不是茶 java 继承代理组合 final类
复用类看着标题都不知道是什么,再加上java编程思想翻译的比价难懂,所以知道现在才看这本软件界的奇书一:组合语法:就是将对象的引用放到新类中即可代码: package com.wj.reuse; /** * * @author Administrator 组
[开源与生态系统]国产CPU的生态系统 comsci cpu
计算机要从娃娃抓起...而孩子最喜欢玩游戏.... 要让国产CPU在国内市场形成自己的生态系统和产业链,国家和企业就不能够忘记游戏这个非常关键的环节.... 投入一些资金和资源,人力和政策,让游
JVM内存区域划分Eden Space、Survivor Space、Tenured Gen，Perm Gen解释商人shang jvm内存
jvm区域总体分两类，heap区和非heap区。heap区又分：Eden Space（伊甸园）、Survivor Space(幸存者区)、Tenured Gen（老年代-养老区）。非heap区又分：Code Cache(代码缓存区)、Perm Gen（永久代）、Jvm Stack(java虚拟机栈)、Local Method Statck(本地方法栈)。 HotSpot虚拟机GC算法采用分代收
页面上调用 QQ oloz qq
<A href="tencent://message/?uin=707321921&Site=有事Q我&Menu=yes"> <img style="border:0px;" src=http://wpa.qq.com/pa?p=1:707321921:1></a>
一些问题文强chu 问题
1.eclipse 导出 doc 出现“The Javadoc command does not exist.” javadoc command 选择 jdk/bin/javadoc.exe 2.tomcate 配置 web 项目 ..... SQL:3.mysql * 必须得放前面否则 select&nbs
生活没有安全感小桔子生活孤独安全感
圈子好小，身边朋友没几个，交心的更是少之又少。在深圳，除了男朋友，没几个亲密的人。不知不觉男朋友成了唯一的依靠，毫不夸张的说，业余生活的全部。现在感情好，也很幸福的。但是说不准难免人心会变嘛，不发生什么大家都乐融融，发生什么很难处理。我想说如果不幸被分手(无论原因如何)，生活难免变化很大，在深圳，我没交心的朋友。明
php 基础语法 aichenglong php 基本语法
1 .1 php变量必须以$开头 <?php $a=” b”; echo ?> 1 .2 php基本数据库类型 Integer float/double Boolean string 1 .3 复合数据类型数组array和对象 object 1 .4 特殊数据类型 null 资源类型(resource) $co
mybatis tools 配置详解 AILIKES mybatis
MyBatis Generator中文文档 MyBatis Generator中文文档地址： http://generator.sturgeon.mopaas.com/ 该中文文档由于尽可能和原文内容一致，所以有些地方如果不熟悉，看中文版的文档的也会有一定的障碍，所以本章根据该中文文档以及实际应用，使用通俗的语言来讲解详细的配置。本文使用Markdown进行编辑，但是博客显示效
继承与多态的探讨百合不是茶 JAVA面向对象继承对象
继承 extends 多态继承是面向对象最经常使用的特征之一：继承语法是通过继承发、基类的域和方法 //继承就是从现有的类中生成一个新的类，这个新类拥有现有类的所有extends是使用继承的关键字：在A类中定义属性和方法； class A{ //定义属性 int age； //定义方法 public void go
JS的undefined与null的实例 bijian1013 JavaScript JavaScript
<form name="theform" id="theform"> </form> <script language="javascript"> var a alert(typeof(b)); //这里提示undefined if(theform.datas
TDD实践（一） bijian1013 java 敏捷 TDD
一.TDD概述 TDD：测试驱动开发，它的基本思想就是在开发功能代码之前，先编写测试代码。也就是说在明确要开发某个功能后，首先思考如何对这个功能进行测试，并完成测试代码的编写，然后编写相关的代码满足这些测试用例。然后循环进行添加其他功能，直到完全部功能的开发。
[Maven学习笔记十]Maven Profile与资源文件过滤器 bit1129 maven
什么是Maven Profile Maven Profile的含义是针对编译打包环境和编译打包目的配置定制，可以在不同的环境上选择相应的配置，例如DB信息，可以根据是为开发环境编译打包，还是为生产环境编译打包，动态的选择正确的DB配置信息 Profile的激活机制 1.Profile可以手工激活，比如在Intellij Idea的Maven Project视图中可以选择一个P
【Hive八】Hive用户自定义生成表函数(UDTF) bit1129 hive
1. 什么是UDTF UDTF，是User Defined Table-Generating Functions，一眼看上去，貌似是用户自定义生成表函数，这个生成表不应该理解为生成了一个HQL Table，貌似更应该理解为生成了类似关系表的二维行数据集 2. 如何实现UDTF 继承org.apache.hadoop.hive.ql.udf.generic
tfs restful api 加auth 2.0认计 ronin47
　　目前思考如何给tfs的ngx-tfs api增加安全性。有如下两点：　　一是基于客户端的ip设置。这个比较容易实现。　　二是基于OAuth2.0认证，这个需要lua，实现起来相对于一来说，有些难度。　　现在重点介绍第二种方法实现思路。　　前言：我们使用Nginx的Lua中间件建立了OAuth2认证和授权层。如果你也有此打算，阅读下面的文档，实现自动化并获得收益。SeatGe
jdk环境变量配置 byalias java jdk
进行java开发，首先要安装jdk，安装了jdk后还要进行环境变量配置： 1、下载jdk（http://java.sun.com/javase/downloads/index.jsp），我下载的版本是：jdk-7u79-windows-x64.exe 2、安装jdk-7u79-windows-x64.exe 3、配置环境变量：右击"计算机"-->&quo
《代码大全》表驱动法-Table Driven Approach-2 bylijinnan java
package com.ljn.base; import java.io.BufferedReader; import java.io.FileInputStream; import java.io.InputStreamReader; import java.util.ArrayList; import java.util.Collections; import java.uti
SQL 数值四舍五入小数点后保留2位 chicony 四舍五入
1.round() 函数是四舍五入用，第一个参数是我们要被操作的数据，第二个参数是设置我们四舍五入之后小数点后显示几位。 2.numeric 函数的2个参数，第一个表示数据长度，第二个参数表示小数点后位数。例如：　　select cast(round(12.5,2) as numeric(5,2))
c++运算符重载 CrazyMizzz C++
一、加+，减-，乘*，除/ 的运算符重载 Rational operator*(const Rational &x) const{ return Rational(x.a * this->a); } 在这里只写乘法的，加减除的写法类似二、<<输出,>>输入的运算符重载 &nb
hive DDL语法汇总 daizj hive 修改列 DDL 修改表
hive DDL语法汇总１、对表重命名 hive> ALTER TABLE table_name RENAME TO new_table_name; 2、修改表备注 hive> ALTER TABLE table_name SET TBLPROPERTIES ('comment' = new_comm
jbox使用说明 dcj3sjt126com Web
参考网址：http://www.kudystudio.com/jbox/jbox-demo.html jBox v2.3 beta [ 点击下载] 技术交流QQGroup：172543951 100521167 [2011-11-11] jBox v2.3 正式版 - [调整&修复] IE6下有iframe或页面有active、applet控件
UISegmentedControl 开发笔记 dcj3sjt126com
// typedef NS_ENUM(NSInteger, UISegmentedControlStyle) { // UISegmentedControlStylePlain, // large plain &
Slick生成表映射文件 ekian scala
Scala添加SLICK进行数据库操作，需在sbt文件上添加slick-codegen包 "com.typesafe.slick" %% "slick-codegen" % slickVersion 因为我是连接SQL Server数据库，还需添加slick-extensions，jtds包 "com.typesa
ES-TEST gengzg test
package com.MarkNum; import java.io.IOException; import java.util.Date; import java.util.HashMap; import java.util.Map; import javax.servlet.ServletException; import javax.servlet.annotation
为何外键不再推荐使用 hugh.wang mysql DB
表的关联，是一种逻辑关系，并不需要进行物理上的“硬关联”，而且你所期望的关联，其实只是其数据上存在一定的联系而已，而这种联系实际上是在设计之初就定义好的固有逻辑。在业务代码中实现的时候，只要按照设计之初的这种固有关联逻辑来处理数据即可，并不需要在数据库层面进行“硬关联”，因为在数据库层面通过使用外键的方式进行“硬关联”，会带来很多额外的资源消耗来进行一致性和完整性校验，即使很多时候我们并不
领域驱动设计 julyflame VO DAO 设计模式 DTO po
概念： VO（View Object）：视图对象，用于展示层，它的作用是把某个指定页面（或组件）的所有数据封装起来。 DTO（Data Transfer Object）：数据传输对象，这个概念来源于J2EE的设计模式，原来的目的是为了EJB的分布式应用提供粗粒度的数据实体，以减少分布式调用的次数，从而提高分布式调用的性能和降低网络负载，但在这里，我泛指用于展示层与服务层之间的数据传输对
单例设计模式 hm4123660 java Singleton 单例设计模式懒汉式饿汉式
单例模式是一种常用的软件设计模式。在它的核心结构中只包含一个被称为单例类的特殊类。通过单例模式可以保证系统中一个类只有一个实例而且该实例易于外界访问，从而方便对实例个数的控制并节约系统源。如果希望在系统中某个类的对象只能存在一个，单例模式是最好的解决方案。 &nb
logback zhb8015 log logback
一、logback的介绍 Logback是由log4j创始人设计的又一个开源日志组件。logback当前分成三个模块：logback-core,logback- classic和logback-access。logback-core是其它两个模块的基础模块。logback-classic是log4j的一个改良版本。此外logback-class
整合Kafka到Spark Streaming——代码示例和挑战 Stark_Summer spark storm zookeeper PARALLELISM processing
作者Michael G. Noll是瑞士的一位工程师和研究员，效力于Verisign，是Verisign实验室的大规模数据分析基础设施（基础Hadoop）的技术主管。本文，Michael详细的演示了如何将Kafka整合到Spark Streaming中。期间， Michael还提到了将Kafka整合到 Spark Streaming中的一些现状，非常值得阅读，虽然有一些信息在Spark 1.2版
spring-master-slave-commondao 王新春 DAO spring dataSource slave master
互联网的web项目，都有个特点：请求的并发量高，其中请求最耗时的db操作，又是系统优化的重中之重。为此，往往搭建 db的一主多从库的数据库架构。作为web的DAO层，要保证针对主库进行写操作，对多个从库进行读操作。当然在一些请求中，为了避免主从复制的延迟导致的数据不一致性，部分的读操作也要到主库上。（这种需求一般通过业务垂直分开，比如下单业务的代码所部署的机器，读去应该也要从主库读取数

cs231 assignment1--KNN

你可能感兴趣的:(cs231 assignment1--KNN)