C语言 HTTP协议下载文件,实现断点续传,socket通讯,目前只支持ip和port方式连接,有兴趣的读者可完善域名方式。
代码分为 http.c: 实现http协议下载文件 ,socket.c: 封装linux socket函数,移植时只需修改socket.c中的函数即可。
希望对大家有帮助,本人亲测可用!
http.c
//http.c
#include <stdio.h>
#include <stdlib.h>
#include <errno.h>
#include <string.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <fcntl.h>
#include "socket.h"
#include "http.h"
#define MAX_RECV_SIZE 1440//maximum number of bytes the hardware can receive in a single packet; also the size of one download chunk
/* "ip:port" string sent as the Host header; filled in by HTTP_DownloadFile */
char g_host[URL_LEN];
char g_ip[URL_LEN+1];//ip / domain name extracted from the url
/* port as a decimal string: up to 5 digits plus the terminating NUL */
char g_port[5+1];
char g_buf_send[4*1024];//staging buffer for the outgoing request
char g_buf_recv[10*1024];//staging buffer for the incoming response
/* NOTE(review): not referenced by any function visible in this file */
BreakPoint_ST g_break_point;
/*
Purpose: decide whether a saved breakpoint record may be used to resume
         a download. The record is accepted only when it was written for
         exactly this url and with the chunk size (MAX_RECV_SIZE) that is
         in use now.
Params:
  breakpoint - record loaded from the .bp file
  url        - url of the download that is about to start
  file_crc   - unused for now (reserved for a future checksum comparison)
Returns:
  breakpoint->download_size when the record matches
  -1 when breakpoint or url is NULL, or the record does not match
*/
int Get_Breakpoint_Available(BreakPoint_ST *breakpoint,char *url,char *file_crc)
{
    (void)file_crc;

    if (breakpoint == NULL || url == NULL)
        return -1;

    /* Compare the complete strings: a memcmp limited to strlen(url) bytes
       would also accept a stored url that merely starts with url. */
    if (strcmp(breakpoint->url, url) != 0)
        return -1;

    /* Chunk boundaries are derived from MAX_RECV_SIZE, so a record written
       with a different chunk size cannot be resumed. */
    if (breakpoint->recv_size != MAX_RECV_SIZE)
        return -1;

    return breakpoint->download_size;
}
/*
Purpose: look for a breakpoint record ("<filename>.bp") left by an earlier,
         interrupted download of the same file.
Params:
  url      - url of the download that is about to start
  filename - name of the file being downloaded (the record name is
             filename + ".bp")
  file_crc - passed through to Get_Breakpoint_Available
Returns:
  0   no usable breakpoint (none exists, the name is too long, or the
      record is truncated / does not match; in the last two cases both
      filename and the record file are removed)
  >0  number of bytes already downloaded
*/
int Get_Breakpoint(char *url,char *filename,char *file_crc)
{
    char filename_bp[256];
    BreakPoint_ST break_point;
    ssize_t nread;
    int fd;
    int len;
    int ret;

    if (filename == NULL)
        return 0;

    /* Record file name: filename + ".bp". Bounded so that a long name
       cannot overflow the local buffer. */
    len = snprintf(filename_bp, sizeof(filename_bp), "%s.bp", filename);
    if (len < 0 || (size_t)len >= sizeof(filename_bp))
    {
        fprintf(stderr, "ERR:Get_Breakpoint file name too long\n");
        return 0;
    }

    fd = open(filename_bp, O_RDONLY);
    if (fd == -1)
    {
#ifdef DEBUG_HTTP
        printf("no exsit %s\n",filename_bp);
#endif
        return 0;
    }

    nread = read(fd, &break_point, sizeof(break_point));
    close(fd);

    /* A short read means the record is truncated or corrupt. Treat it
       like any other unusable record instead of terminating the process. */
    if (nread == (ssize_t)sizeof(break_point))
    {
        ret = Get_Breakpoint_Available(&break_point, url, file_crc);
        if (ret > 0)
            return ret;
    }

    /* Unusable record: discard it together with the partial data file so
       the download restarts from the beginning. */
    printf("%s not available\n",filename_bp);
    remove(filename);
    remove(filename_bp);
    return 0;
}
/*
Purpose: write the breakpoint record for an interrupted download to
         "<filename>.bp".
Params:
  url           - url being downloaded
  filename      - name of the data file (the record name is filename + ".bp")
  download_size - total number of bytes stored in the data file so far
  file_crc      - unused for now (reserved for a future checksum)
Returns:
  0   record written
  -1  an argument is NULL, or url / filename does not fit in the record
The process exits when the record file cannot be opened or written.
*/
int Save_Breakpoint(char *url,char *filename,int download_size,char *file_crc)
{
    BreakPoint_ST breakpoint;
    char filename_bp[256];/* record file name, may include a directory */
    int fd;
    int len;

    (void)file_crc;

    if (url == NULL || filename == NULL)
        return -1;

    len = snprintf(filename_bp, sizeof(filename_bp), "%s.bp", filename);
    if (len < 0 || (size_t)len >= sizeof(filename_bp))
    {
        fprintf(stderr, "ERR:Save_Breakpoint file name too long\n");
        return -1;
    }

    /* The record is written to disk verbatim, so url and filename are
       expected to be char arrays embedded in BreakPoint_ST (confirm against
       http.h). Refuse strings that would overflow them; a truncated url
       could never match on the next run anyway. */
    memset(&breakpoint,0x0,sizeof(breakpoint));
    if (strlen(url) >= sizeof(breakpoint.url) ||
        strlen(filename) >= sizeof(breakpoint.filename))
    {
        fprintf(stderr, "ERR:Save_Breakpoint url or file name too long\n");
        return -1;
    }
    strcpy(breakpoint.url,url);
    strcpy(breakpoint.filename,filename);
    breakpoint.download_size = download_size;
    breakpoint.recv_size = MAX_RECV_SIZE;

    /* Create (or overwrite in place) the record file. */
    fd = open(filename_bp,O_WRONLY|O_CREAT,S_IRUSR|S_IWUSR);
    if (fd == -1)
    {
        fprintf(stderr,"Open %s Error:%s\n",filename_bp,strerror(errno));
        exit(1);
    }

    if (write(fd,&breakpoint,sizeof(breakpoint)) != (ssize_t)sizeof(breakpoint))
    {
        perror("ERR:Save_Breakpoint");
        exit(1);
    }
    close(fd);
    return 0;
}
/*
Purpose: append filelength bytes from filebuf to filename, creating the
         file when it does not exist.
Params:
  filebuf    - data to append
  filelength - number of bytes to append (0 just creates the file)
  filename   - destination file
Returns:
  0   all bytes were written
  -1  an argument is NULL or filelength is negative
The process exits when the file cannot be opened, written or closed.
*/
int Save_File(char *filebuf,int filelength,char *filename)
{
    int fd;
    int written = 0;

    if (filebuf == NULL || filename == NULL || filelength < 0)
        return -1;

    /* Open for appending; create the file on first use. */
    fd = open(filename,O_WRONLY|O_CREAT|O_APPEND,S_IRUSR|S_IWUSR);
    if (fd == -1)
    {
        fprintf(stderr,"Open %s Error:%s\n",filename,strerror(errno));
        exit(1);
    }

    /* write() may store fewer bytes than requested or be interrupted by a
       signal; keep going until the whole buffer is on its way to disk. */
    while (written < filelength)
    {
        ssize_t n = write(fd, filebuf + written, (size_t)(filelength - written));

        if (n < 0)
        {
            if (errno == EINTR)
                continue;
            perror("ERR:Save_File");
            close(fd);
            exit(1);
        }
        if (n == 0)
        {
            /* No progress and no error: bail out rather than spin. */
            fprintf(stderr, "ERR:Save_File: write made no progress\n");
            close(fd);
            exit(1);
        }
        written += (int)n;
    }

    if (close(fd) == -1)
    {
        perror("ERR:Save_File");
        exit(1);
    }
    return 0;
}
/*
Purpose: placeholder for extracting the status code of an HTTP response.
         It takes no input yet, so there is nothing to parse.
Returns:
  -1 always (not implemented). Previously the body was empty, which made
  the result of any call undefined.
*/
int HTTP_GetResponseCode(void)
{
    return -1;
}
/*
Purpose: compute the total size of an HTTP response, i.e. the header
         section (including the blank line that ends it) plus the entity
         body announced by Content-Length.
Params:
  revbuf - NUL-terminated buffer holding the start of the response
Returns:
  >=0  header length + body length
  -1   Content-Length could not be read or the header terminator
       "\r\n\r\n" is not in the buffer
*/
int HTTP_GetRecvLength(char *revbuf)
{
    int body_len = HTTP_GetContentLength(revbuf);
    char *terminator;

    if (body_len == -1)
        return -1;

    terminator = strstr(revbuf, "\r\n\r\n");
    if (terminator == NULL)
        return -1;

    /* 4 accounts for the "\r\n\r\n" sequence itself */
    return body_len + (int)(terminator - revbuf + 4);
}
/*
Purpose: read the value of the Content-Length header field from an HTTP
         response.
         The field name is matched case-insensitively at the start of a
         header line, any amount of blanks around the ':' is accepted, and
         only the header section (everything before the first "\r\n\r\n",
         or the whole buffer when that marker is absent) is searched, so
         body data can never be mistaken for the field.
Params:
  revbuf - NUL-terminated buffer holding the received data
Returns:
  >=0  value of Content-Length
  -1   revbuf is NULL, the field is missing, or its value is not a
       decimal number that fits in an int
*/
int HTTP_GetContentLength(char *revbuf)
{
    static const char field[] = "content-length";
    const char *head_end;
    const char *line;

    if (revbuf == NULL)
        return -1;

    head_end = strstr(revbuf, "\r\n\r\n");
    if (head_end == NULL)
        head_end = revbuf + strlen(revbuf);

    line = revbuf;
    while (line < head_end)
    {
        const char *p = line;
        const char *eol;
        size_t i;

        /* ASCII case-insensitive comparison of the field name. Reading
           p[i] is safe: the NUL terminator never matches and stops us. */
        for (i = 0; field[i] != '\0'; i++)
        {
            char c = p[i];

            if (c >= 'A' && c <= 'Z')
                c = (char)(c - 'A' + 'a');
            if (c != field[i])
                break;
        }

        if (field[i] == '\0')
        {
            p += i;
            while (*p == ' ' || *p == '\t')
                p++;
            if (*p == ':')
            {
                long value;

                p++;
                while (*p == ' ' || *p == '\t')
                    p++;
                /* Require a digit so that signs and garbage are rejected
                   rather than silently read as 0. */
                if (*p < '0' || *p > '9')
                    return -1;
                errno = 0;
                value = strtol(p, NULL, 10);
                /* The round trip through int detects values an int
                   cannot represent. */
                if (errno == ERANGE || value != (long)(int)value)
                    return -1;
                return (int)value;
            }
        }

        /* Advance to the next header line. */
        eol = strchr(line, '\n');
        if (eol == NULL)
            break;
        line = eol + 1;
    }
    return -1;
}
/*
Purpose: receive one complete HTTP response (header + body) from sockfd
         and copy it into buf_recv.
Params:
  sockfd   - connected socket
  buf_recv - destination; must be able to hold 10*1024 bytes
Returns:
  >0  number of bytes received
  =0  the peer closed the connection
  -1  failure (receive error, or the response does not fit in the
      internal 10k buffer)
Note: responses are staged in an internal 10k buffer, so header + body
      must not exceed 10*1024 bytes.
*/
int HTTP_Recv(int sockfd,char *buf_recv)
{
    char buf_recv_tmp[10*1024+1];
    /* one byte is kept back so the buffer always stays NUL-terminated */
    const int capacity = (int)sizeof(buf_recv_tmp) - 1;
    int recvlen = 0;
    int downloadlen = -1;/* total response size, -1 until the header is complete */
    int ret;

    memset(buf_recv_tmp,0x0,sizeof(buf_recv_tmp));
    while(1)
    {
        if(recvlen >= capacity)
        {
            fprintf(stderr,"ERR:http response larger than %d bytes\n",capacity);
            return -1;
        }

        /* Only ask for what still fits behind the data already stored. */
        ret = Recv(sockfd,buf_recv_tmp+recvlen,capacity-recvlen,0);
        if(ret <= 0)/* receive failed or connection closed */
        {
            perror("ERR:recv fail");
            return ret;
        }
        recvlen += ret;
#ifdef DEBUG_HTTP_RECV
        printf("recv len = %d\n", ret);
        printf("recv = %s\n", buf_recv_tmp);
        printf("total recvlen = %d\n",recvlen);
#endif

        /* The header may be split over several segments: keep trying to
           determine the total length until it is known. */
        if(downloadlen < 0)
        {
            downloadlen = HTTP_GetRecvLength(buf_recv_tmp);
#ifdef DEBUG_HTTP_RECV
            printf("downloadlen = %d\n",downloadlen);
#endif
            if(downloadlen > capacity)
            {
                fprintf(stderr,"ERR:http response larger than %d bytes\n",capacity);
                return -1;
            }
        }

        if(downloadlen >= 0 && recvlen >= downloadlen)/* response complete */
            break;
    }
    memcpy(buf_recv,buf_recv_tmp,downloadlen);
    return recvlen;
}
/*
Purpose: extract the file name from a download url, i.e. everything after
         the last '/'.
Params:
  url      - download url
  filename - destination; must be large enough for the extracted name
             (at most strlen(url) bytes plus the NUL)
Returns:
  0   success
  -1  an argument is NULL, the url contains no '/', or nothing follows
      the last '/'
*/
int HTTP_GetFileName(char *url,char *filename)
{
    char *slash;

    if (url == NULL || filename == NULL)
        return -1;

    /* strrchr also examines url[0] and copes with an empty string. */
    slash = strrchr(url, '/');
    if (slash == NULL)/* malformed download address */
    {
        printf("url not contain '/'\n");
        return -1;
    }
    if (slash[1] == '\0')/* url ends in '/': there is no file name */
    {
        printf("url not contain file name\n");
        return -1;
    }

    strcpy(filename, slash + 1);
#ifdef DEBUG_HTTP
    printf("filename=%s\n",filename);
#endif
    return 0;
}
/*
Purpose: extract the path of a download url: everything from the first
         '/' that follows the host part (the '/' is included).
Params:
  url  - download url, with or without a leading "http://"
  path - destination; must be large enough for the extracted path
Returns:
  0   success
  -1  an argument is NULL or the url has no path
Note: url example "http://host:port/path"
*/
int HTTP_GetPath(char *url,char *path)
{
    static const char scheme[] = "http://";
    const size_t scheme_len = sizeof(scheme) - 1;
    char *host;
    char *slash;

    if (url == NULL || path == NULL)
        return -1;

    /* Skip the scheme only when the url really starts with it; an
       "http://" further along (e.g. inside a query string) belongs to
       the path and must not shift the search position. */
    host = url;
    if (strncmp(url, scheme, scheme_len) == 0)
        host += scheme_len;

    slash = strchr(host, '/');
    if (slash == NULL)
        return -1;

    strcpy(path, slash);
    return 0;
}
/*
Purpose: split the host part of a download url into ip (or domain name)
         and port. The port defaults to "80" when the url has none.
Params:
  url  - download url, with or without a leading "http://"
  ip   - destination for the host; receives at most 127 characters + NUL
  port - destination for the port; receives at most 5 digits + NUL
Returns:
  1   the url carries no port (port set to "80")
  2   the url carries "host:port"
  -1  an argument is NULL, or the url is malformed: no '/' after the host,
      empty or over-long host, empty / non-numeric / out-of-range port
Note: url example "http://host:port/path"
*/
int HTTP_Get_IP_PORT(char *url,char *ip,char *port)
{
    static const char scheme[] = "http://";
    char DOMAIN_NAME[128];
    char *host;
    char *slash;
    char *colon;
    size_t host_len;
    size_t port_len;
    size_t i;

    if (url == NULL || ip == NULL || port == NULL)
        return -1;

    /* Skip the scheme only when the url really starts with it. */
    host = url;
    if (strncmp(url, scheme, sizeof(scheme) - 1) == 0)
        host += sizeof(scheme) - 1;

    slash = strchr(host, '/');
    if (slash == NULL)
    {
        printf("url:%s format error\n",url);
        return -1;
    }

    /* The "host[:port]" part must be non-empty and fit the local buffer. */
    host_len = (size_t)(slash - host);
    if (host_len == 0 || host_len >= sizeof(DOMAIN_NAME))
    {
        printf("url:%s format error\n",url);
        return -1;
    }
    memcpy(DOMAIN_NAME, host, host_len);
    DOMAIN_NAME[host_len] = '\0';

    colon = strchr(DOMAIN_NAME, ':');
    if (colon == NULL)
    {
        strcpy(ip,DOMAIN_NAME);
        strcpy(port,"80");
#ifdef DEBUG_HTTP
        printf("ip=%s,port=%s\n",ip,port);//debug info
#endif
        return 1;
    }

    /* Split at the ':' and validate both halves before copying: the port
       must be 1-5 decimal digits and not exceed 65535. */
    *colon = '\0';
    port_len = strlen(colon + 1);
    if (colon == DOMAIN_NAME || port_len == 0 || port_len > 5)
    {
        printf("url:%s format error\n",url);
        return -1;
    }
    for (i = 0; i < port_len; i++)
    {
        if (colon[1 + i] < '0' || colon[1 + i] > '9')
        {
            printf("url:%s format error\n",url);
            return -1;
        }
    }
    if (atoi(colon + 1) > 65535)
    {
        printf("url:%s format error\n",url);
        return -1;
    }

    strcpy(ip,DOMAIN_NAME);
    strcpy(port,colon + 1);
#ifdef DEBUG_HTTP
    printf("ip=%s,port=%s\n",ip,port);//debug info
#endif
    return 2;
}
/*
Purpose: build in g_buf_send the GET request that fetches one byte range
         of a file.
Params:
  path  - request target (path part of the url)
  range - byte range in the form "first-last"
Result:
  g_buf_send holds the NUL-terminated request. When the request does not
  fit, an error is reported on stderr and g_buf_send is left empty, so
  that a truncated request is never sent.
*/
void Package_Url_Get_File(char *path, char *range)
{
    int len;

    memset(g_buf_send,0x0,sizeof(g_buf_send));
    /* One bounded format call instead of a chain of sprintf/strcat: the
       bytes produced are the same, but the buffer cannot be overrun. */
    len = snprintf(g_buf_send, sizeof(g_buf_send),
                   "GET %s HTTP/1.1\r\n"
                   "Host: %s\r\n"
                   "Range: bytes=%s\r\n"
                   "Keep-Alive: 200\r\n"
                   "Connection: Keep-Alive\r\n"
                   "\r\n",
                   path, g_host, range);
    if (len < 0 || (size_t)len >= sizeof(g_buf_send))
    {
        fprintf(stderr, "ERR:GET request does not fit in send buffer\n");
        memset(g_buf_send,0x0,sizeof(g_buf_send));
    }
}
/*
Purpose: build in g_buf_send the HEAD request used to query the size of a
         file.
Params:
  url - request target (the caller passes the path part of the url)
Returns:
  0   g_buf_send holds the NUL-terminated request
  -1  the request does not fit; g_buf_send is left empty
*/
int Package_Url_Get_FileSize(char *url)
{
    int len;

    memset(g_buf_send,0x0,sizeof(g_buf_send));
    /* One bounded format call instead of a chain of sprintf/strcat: the
       bytes produced are the same, but the buffer cannot be overrun. */
    len = snprintf(g_buf_send, sizeof(g_buf_send),
                   "HEAD %s HTTP/1.1\r\n"
                   "Host: %s\r\n"
                   "Connection: Keep-Alive\r\n"
                   "\r\n",
                   url, g_host);
    if (len < 0 || (size_t)len >= sizeof(g_buf_send))
    {
        fprintf(stderr, "ERR:HEAD request does not fit in send buffer\n");
        memset(g_buf_send,0x0,sizeof(g_buf_send));
        return -1;
    }
    return 0;
}
/*
Purpose: ask the server for the size of a file by sending a HEAD request
         and reading Content-Length from the response header.
Params:
  sockfd - connected socket
  path   - request target (path part of the url)
Returns:
  >0  size of the file in bytes
  -1  failure: the request could not be built, the connection failed or
      was closed, the header exceeds the internal 10k buffer, or
      Content-Length is missing or not positive
*/
int HTTP_GetFileSize(int sockfd,char *path)
{
    char buf_recv_tmp[10*1024+1];
    /* one byte is kept back so the buffer always stays NUL-terminated */
    const int capacity = (int)sizeof(buf_recv_tmp) - 1;
    int total = 0;
    int ret = -1;

    if(Package_Url_Get_FileSize(path) != 0)
        return -1;
#ifdef DEBUG_HTTP
    printf("send = %s \n",g_buf_send);
#endif
    Send(sockfd, g_buf_send, strlen(g_buf_send), 0);

    memset(buf_recv_tmp,0x0,sizeof(buf_recv_tmp));
    /* The header may arrive in several segments: keep receiving until the
       blank line that terminates it has been seen. */
    while(strstr(buf_recv_tmp,"\r\n\r\n") == NULL)
    {
        if(total >= capacity)
        {
            fprintf(stderr,"ERR:http header larger than %d bytes\n",capacity);
            return -1;
        }
        ret = Recv(sockfd,buf_recv_tmp+total,capacity-total,0);
#ifdef DEBUG_HTTP
        printf("recv len = %d\n", ret);
        printf("recv = %s\n", buf_recv_tmp);
#endif
        if(ret <= 0)
        {
            perror("ERR:recv fail GetFileSize()");
            return -1;
        }
        total += ret;
    }

    ret = HTTP_GetContentLength(buf_recv_tmp);
    if(ret <= 0)
        return -1;
    return ret;
}
/*
Purpose: download a file in chunks of MAX_RECV_SIZE bytes using HTTP range
         requests, starting at the chunk that contains download_size.
Params:
  sockfd        - connected socket
  path          - request target (path part of the url)
  filelength    - total size of the file
  download_size - bytes already stored by an earlier run; expected to be a
                  multiple of MAX_RECV_SIZE (or the full file size)
  filebuf       - destination for the newly downloaded bytes, written from
                  offset 0; must hold filelength bytes
Returns:
  number of bytes downloaded by this call (not counting download_size).
  The value is smaller than filelength-download_size when the transfer
  stopped early (receive error, too many reconnects, unexpected response).
*/
int HTTP_GetFile(int sockfd,char *path,int filelength,int download_size,char *filebuf)
{
    enum { MAX_RECONNECT = 3 };/* consecutive reconnects tolerated per chunk */
    int count;
    char range[32];
    int i;
    int j = 0;/* number of chunks stored in filebuf */
    int ret = -1;
    int retries = 0;
    int status;
    int chunk_len;
    int body_avail;
    char *p = NULL;
    int download_index;/* index of the first chunk to fetch */

    count = (filelength%MAX_RECV_SIZE)?(filelength/MAX_RECV_SIZE +1):(filelength/MAX_RECV_SIZE);
    download_index = download_size/MAX_RECV_SIZE;
    for(i=download_index;i<count;i++)
    {
        /* Every chunk is MAX_RECV_SIZE bytes except possibly the last. */
        if((i == (count-1))&&(filelength%MAX_RECV_SIZE))
            chunk_len = filelength%MAX_RECV_SIZE;
        else
            chunk_len = MAX_RECV_SIZE;
        snprintf(range,sizeof(range),"%d-%d",i*MAX_RECV_SIZE,i*MAX_RECV_SIZE+chunk_len-1);

        Package_Url_Get_File(path,range);
#ifdef DEBUG_HTTP
        printf("send = %s \n",g_buf_send);
#endif
        Send(sockfd, g_buf_send, strlen(g_buf_send), 0);

        memset(g_buf_recv,0x0,sizeof(g_buf_recv));
        ret = HTTP_Recv(sockfd,g_buf_recv);
        if(ret < 0)
            break;
        if(ret == 0 )/* server closed the connection: reconnect and retry this chunk */
        {
            if(++retries > MAX_RECONNECT)
            {
                fprintf(stderr,"ERR:server keeps closing the connection\n");
                break;
            }
            sockfd = Socket_Connect(g_ip,g_port);
            i--;
            continue;
        }
        retries = 0;

        /* Only a range response carries the bytes that were asked for;
           a plain 200 is acceptable only when the range is the whole file. */
        if(sscanf(g_buf_recv,"HTTP/%*d.%*d %d",&status) != 1 ||
           !(status == 206 || (status == 200 && count == 1)))
        {
            fprintf(stderr,"ERR:unexpected http response\n");
            break;
        }

        /* Locate the body and store it behind the chunks already copied. */
        p = strstr(g_buf_recv,"\r\n\r\n");
        if(p == NULL)
        {
            printf("ERR:g_buf_recv not contain end flag\n");
            break;
        }
        body_avail = ret - (int)(p + 4 - g_buf_recv);
        if(body_avail < chunk_len)
        {
            fprintf(stderr,"ERR:http body shorter than requested range\n");
            break;
        }
        /* Copy exactly the chunk length: copying MAX_RECV_SIZE for a short
           final chunk would write past the end of filebuf. */
        memcpy(filebuf+j*MAX_RECV_SIZE,p+4,chunk_len);
        j++;
    }
    if(i == count)
        return (filelength-download_size);
    else
        return (i*MAX_RECV_SIZE-download_size);
}
/*
Purpose: check that every piece HTTP_DownloadFile extracts from url (host,
         port, path, file name) fits the fixed-size buffer it is copied
         into, because the extraction helpers copy without a size limit.
Returns:
  1  everything fits, or the url is malformed in a way the extraction
     helpers reject themselves before copying
  0  some piece is too long
*/
static int HTTP_UrlFitsBuffers(const char *url)
{
    const char *host = (strncmp(url,"http://",7) == 0) ? url+7 : url;
    const char *first_slash = strchr(host,'/');
    const char *last_slash = strrchr(url,'/');
    const char *colon;
    size_t host_len;

    if(first_slash == NULL || last_slash == NULL)
        return 1;

    host_len = (size_t)(first_slash - host);
    colon = memchr(host,':',host_len);
    if(colon != NULL)
    {
        if((size_t)(first_slash - colon - 1) >= sizeof(g_port))
            return 0;
        host_len = (size_t)(colon - host);
    }
    if(host_len >= sizeof(g_ip))
        return 0;
    if(strlen(first_slash) > PATH_LEN)
        return 0;
    if(strlen(last_slash+1) > FILENAME_LEN)
        return 0;
    return 1;
}

/*
Purpose: download the file named by url over HTTP into save_path, resuming
         from a breakpoint left by an earlier interrupted run when there
         is one.
Params:
  url       - "http://ip:port/path/file" (only ip/port connections work)
  save_path - directory prefix prepended to the file name as is ("" saves
              next to the executable's working directory)
Returns:
  0   download complete
  -1  failure
  -2  partially downloaded; a breakpoint record was saved
Note: the data file, its breakpoint record and the breakpoint lookup all
      use the same name (save_path + file name), so a resumed download
      finds the record regardless of save_path.
*/
int HTTP_DownloadFile(char *url,char *save_path)
{
    int ret;
    int result = -1;
    int sockfd;
    int filesize;
    int download_size;
    int len;
    char filename[FILENAME_LEN+1];
    char filename_bp[FILENAME_LEN+3+1];
    char *filebuf = NULL;
    char save_file_path[FILENAME_LEN+1];/* save_path + file name */
    char path[PATH_LEN+1];/* path part of the url */

    if(url == NULL || save_path == NULL)
        return -1;
    if(!HTTP_UrlFitsBuffers(url))
    {
        fprintf(stderr,"ERR:url too long\n");
        return -1;
    }

    /* Extract ip and port (domain names are not resolved). */
    ret = HTTP_Get_IP_PORT(url,g_ip,g_port);
    if(ret == -1)
        return -1;
    len = snprintf(g_host,sizeof(g_host),"%s:%s",g_ip,g_port);
    if(len < 0 || (size_t)len >= sizeof(g_host))
    {
        fprintf(stderr,"ERR:host too long\n");
        return -1;
    }

    /* Extract file name and request path. */
    ret = HTTP_GetFileName(url,filename);
    if(ret == -1)
        return -1;
    ret = HTTP_GetPath(url,path);
    if(ret == -1)
        return -1;

    len = snprintf(save_file_path,sizeof(save_file_path),"%s%s",save_path,filename);
    if(len < 0 || (size_t)len >= sizeof(save_file_path))
    {
        fprintf(stderr,"ERR:save path too long\n");
        return -1;
    }

    /* Connect; from here on every exit goes through cleanup so the
       socket and the buffer are always released. */
    sockfd = Socket_Connect(g_ip,g_port);
    if(sockfd < 0)
        return -1;

    /* Total size of the file on the server. */
    filesize = HTTP_GetFileSize(sockfd,path);
    if(filesize == -1)
        goto cleanup;
    printf("http need download size %d\n",filesize);

    filebuf = (char *)malloc(filesize);
    if(filebuf == NULL)
    {
        perror("malloc filebuf fail");
        goto cleanup;
    }
    memset(filebuf,0x0,filesize);

    download_size = Get_Breakpoint(url,save_file_path,NULL);
#ifdef DEBUG_HTTP
    printf("breakpoint download_size=%d\n",download_size);//debug info
    sleep(3);//debug info
#endif
    /* Starting from scratch: Save_File appends, so a stale file left by an
       earlier run must not stay in front of the new data. */
    if(download_size == 0)
        remove(save_file_path);

    /* Download the remaining chunks. */
    ret = HTTP_GetFile(sockfd,path,filesize,download_size,filebuf);
    if(ret < 0)
        goto cleanup;

#ifdef DEBUG_HTTP
    printf("save_path=%s\n",save_path);
    printf("filename=%s\n",filename);
    printf("save_file_path=%s\n",save_file_path);
    printf("download_size = %d\n",ret);
#endif
    Save_File(filebuf,ret,save_file_path);
    if((ret+download_size) == filesize)/* everything downloaded */
    {
        snprintf(filename_bp,sizeof(filename_bp),"%s.bp",save_file_path);
        remove(filename_bp);
        printf("download success\n");
        result = 0;
    }
    else/* partially downloaded */
    {
        printf("part download success\n");
        Save_Breakpoint(url,save_file_path,ret+download_size,NULL);
        result = -2;
    }

cleanup:
    free(filebuf);
    Close(sockfd);
    return result;
}
socket.c
点击(此处)折叠或打开
//socket.c
//作者:王振
#include <stdio.h>
#include <stdlib.h>
#include <errno.h>
#include <string.h>
#include <unistd.h>
#include <sys/types.h>
#include <sys/socket.h>
#include <sys/wait.h>
#include <netinet/in.h>
#include <arpa/inet.h>
#include "socket.h"
/*
Purpose: connect fd to addr; a thin wrapper around connect() that treats
         failure as fatal.
Params:
  fd   - socket descriptor
  addr - peer address
  len  - size of *addr
Returns:
  0 on success. On failure the error is reported with perror() and the
  process exits.
*/
int Connect(int fd, struct sockaddr *addr, socklen_t len)
{
    if (connect(fd, addr, len) != -1)
        return 0;

    perror("connect");
    exit(EXIT_FAILURE);
}
/*
Purpose: open a TCP connection to ip:port.
Params:
  ip   - IPv4 address in dotted notation (host names are not resolved)
  port - port number as a decimal string, 1..65535
Returns:
  >=0  connected socket descriptor
  -1   an argument is NULL, ip or port is not valid, or no socket could
       be created
The process exits when the connection attempt itself fails (see Connect).
*/
int Socket_Connect(char *ip,char *port)
{
    struct sockaddr_in addr;
    char *end = NULL;
    long port_num;
    int sockfd;

    if(ip == NULL || port == NULL)
        return -1;

    /* strtol instead of atoi so that garbage is detected, not read as 0. */
    port_num = strtol(port,&end,10);
    if(end == port || *end != '\0' || port_num <= 0 || port_num > 65535)
    {
        fprintf(stderr,"invalid port: %s\n",port);
        return -1;
    }

    /* Zero the whole structure so no field is left uninitialised. */
    memset(&addr,0x0,sizeof(addr));
    addr.sin_family = AF_INET;
    addr.sin_port = htons((unsigned short)port_num);
    addr.sin_addr.s_addr = inet_addr(ip);
    if(addr.sin_addr.s_addr == INADDR_NONE)
    {
        fprintf(stderr,"invalid ip: %s\n",ip);
        return -1;
    }

    sockfd = socket(AF_INET, SOCK_STREAM, 0);
    if(sockfd == -1)
    {
        perror("socket");
        return -1;
    }

    Connect(sockfd, (struct sockaddr*)&addr, sizeof(addr));
    return sockfd;
}
/*
Purpose: send exactly len bytes on sockfd, calling send() repeatedly until
         everything has been handed to the socket.
Params:
  sockfd  - descriptor of the connected socket
  sendbuf - data to send
  len     - number of bytes to send
  flags   - flags passed to send(); normally 0
Returns:
  0 on success. On failure the error is reported with perror() and the
  process exits. A send() interrupted by a signal (EINTR) is retried
  rather than treated as a failure.
*/
int Send(int sockfd, char *sendbuf, int len, int flags)
{
    int sendlen = 0;

    while(sendlen < len)
    {
        ssize_t ret = send(sockfd, sendbuf+sendlen, (size_t)(len-sendlen), flags);

        if(ret == -1)
        {
            if(errno == EINTR)
                continue;
            perror("send");
            exit(EXIT_FAILURE);
        }
        sendlen += (int)ret;
    }
    return 0;
}
/*
Purpose: close the socket descriptor sockfd.
Returns: the result of close() unchanged.
*/
int Close(int sockfd)
{
return close(sockfd);
}
/*
Purpose: receive up to len bytes from sockfd into recvbuf.
Params:
  sockfd  - descriptor of the connected socket
  recvbuf - destination buffer
  len     - capacity of recvbuf
  flags   - flags passed to recv(); normally 0
Returns:
  >0  number of bytes received
  =0  the peer closed the connection
On failure the error is reported with perror() and the process exits.
A recv() interrupted by a signal (EINTR) is retried rather than treated
as a failure.
*/
int Recv(int sockfd, char *recvbuf, int len, int flags)
{
    ssize_t recv_len;

    do
    {
        recv_len = recv(sockfd, recvbuf, (size_t)len, flags);
    } while(recv_len < 0 && errno == EINTR);

    if(recv_len < 0)
    {
        perror("recv error");
        exit(EXIT_FAILURE);
    }
    return (int)recv_len;
}