该程序应该打印到终端的网页
用法:./prog www.page.com 80 /folder/index.html
程序始终按预期进行,但始终在最后进行分段
#define _XOPEN_SOURCE 600
#include <stdio.h>
#include <sys/types.h>
#include <sys/socket.h>
#include <stdlib.h>
#include <arpa/inet.h>
#include <netdb.h>
#include <string.h>
#include <strings.h>
#include <unistd.h>
#include <termios.h>
#define HOST "localhost"
#define PAGE "/"
#define PORT "80"
#define USERAGENT "HTML 1.1"
char *build_get_query(char *host,char *page){
char *query;
char *getpage = page;
char *tpl = "GET /%s HTTP/1.1\r\nHost: %s\r\nUser-Agent: %s\r\nConnection: close\r\n\r\n";
if(getpage[0]=='/'){
getpage=getpage + 1; /*Removing leading / */
}
/* -5 is to consider the %s %s %s in tpl and the ending \0 */
query=malloc(strlen(host)+strlen(getpage)+strlen(USERAGENT)+strlen(tpl)-5);
sprintf(query, tpl, getpage, host, USERAGENT);
return query;
}
int main(int argc, char **argv){
int sockfd;
struct addrinfo hints, *servinfo, *p;
int s;
char *page;
char *stringA;
int tmpres;
char *sstr;
if(argc<3){
fprintf(stderr,"\n\tUSAGE:\n\t%s hostname/ip PORTnr /PAGE/index.shtml \n\n",argv[0]);
fprintf(stderr,"\texample:\n\t%s www.anypage.com 80 /folder/index.shtml \n\n",argv[0]);
exit(1);
}
memset(&hints,0,sizeof(struct addrinfo));
hints.ai_family=AF_INET; /* Allow IPv4 or IPv6 */
hints.ai_socktype=SOCK_STREAM; /* stream socket */
hints.ai_flags=0;
hints.ai_protocol=0; /* Any protocol */
if((s=getaddrinfo(argv[1],PORT,&hints,&servinfo))!=0){
fprintf(stderr,"\n\tgetaddrinfo: %s\n",gai_strerror(s));
exit(EXIT_FAILURE);
}
for(p=servinfo; p!=NULL; p=p->ai_next){
if((sockfd=socket(p->ai_family,p->ai_socktype,p->ai_protocol))==-1){
fprintf(stderr,"\n\tSOCKET FAIL\n\n");
continue;
}
if((connect(sockfd,p->ai_addr,p->ai_addrlen))<0){
close(sockfd);
fprintf(stderr,"\n\tCONECTION FAIL\n\n");
continue;
}
break;
}
if(p==NULL){
fprintf(stderr,"\n\tCONECTION FAIL\n\n");
exit(2);
}
freeaddrinfo(servinfo);
if(argc > 3){
page=argv[3];
}else{
page=PAGE;
}
if((stringA=malloc(BUFSIZ))==NULL){
printf("\n\tMEMORY ERROR\n\n");
exit(1);
}
stringA=build_get_query(argv[1],page);
if((write(sockfd,stringA,strlen(stringA)))<0){
printf("\n\tERROR ON SEND\n\n");
}
memset(stringA, 0, sizeof(stringA));
while((tmpres=read(sockfd,stringA,BUFSIZ))>0){
if((sstr=strstr(stringA,"<!DOCTYPE "))!=NULL){
stringA=sstr;
}
if((sstr=strstr(stringA,"</html>"))!=NULL){
strncpy(sstr+7,"\n",(BUFSIZ-strlen(stringA))+5);
}
fprintf(stdout,"%s",stringA);
}
if(tmpres<0){
perror("READ ERROR");
}
close(sockfd);
return 0;
}
gdb信息
Program received signal SIGSEGV, Segmentation fault.
_dl_fini () at dl-fini.c:183
183 dl-fini.c: No such file or directory.
in dl-fini.c
(gdb) bt
#0 _dl_fini () at dl-fini.c:183
#1 0x0015d1ef in __run_exit_handlers (status=0, listp=0x289324, run_list_atexit=true) at exit.c:78
#2 0x0015d25f in *__GI_exit (status=0) at exit.c:100
#3 0x00144bde in __libc_start_main (main=0x804892d <main>, argc=4, ubp_av=0xbffff454, init=0x8048d00 <__libc_csu_init>,
fini=0x8048cf0 <__libc_csu_fini>, rtld_fini=0x11e080 <_dl_fini>, stack_end=0xbffff44c) at libc-start.c:258
#4 0x08048811 in _start ()
(gdb)
我对gdb信息很感兴趣,因为我在大约一年前安装了sudo apt-get install build-essential
,直到今天才出现问题。
答案 0 :(得分:2)
我看到的是你将BUFSIZ
个字节分配给缓冲区,并将最多BUFSIZ
个字节读入缓冲区,但是你试图使用strstr()
和缓冲区上的strlen()
...如果你实际上已经将BUFSIZ
字节读入缓冲区,那么很可能不是一个以空字符结尾的字符串。
我建议您分配BUFSIZ+1
和memset( stringA, 0, BUFSIZ+1 )
以防止strlen()
随机遍历内存,这会在while循环中产生一些非常不确定的行为,并且还可能导致循环中的printf()
表现得很奇怪,或者至少使用printf( "%.*s", BUFSIZ, stringA );
表示输出。
char readBuffer[BUFSIZ+1] = { 0 };
stringA=build_get_query(argv[1],page);
if((write(sockfd,stringA,strlen(stringA)))<0){
printf("\n\tERROR ON SEND\n\n");
}
while((tmpres=read(sockfd,readBuffer,BUFSIZ))>0){
if((sstr=strstr(readBuffer,"<!DOCTYPE "))!=NULL){
strcpy( readBuffer, sstr );
}
if((sstr=strstr(readBuffer,"</html>"))!=NULL){
strncpy(sstr+7,"\n",(BUFSIZ-strlen(readBuffer))+5);
}
fprintf(stdout,"%s",readBuffer);
memset( readBuffer, 0 , BUFSIZ+1 );
}
PS:实际上,在阅读了另一个响应之后,我意识到你犯了一个更大的错误,取决于stringA是一个指向BUFSIZ数组的指针,之后你将它重新分配给其他地址(从构建查询返回)
答案 1 :(得分:2)
分配给stringA的缓冲区大小不是BUFSIZ。毕竟它接收到build_get_query中分配的缓冲区的地址,它甚至可能比BUFSIZ小。 我不知道你为什么使用stringA = malloc(BUFSIZ),并在下一条指令中将stringA指针更改为另一个缓冲区。那里有很多内存泄漏。