http socket request returning trailling characters












0















I am learning network programming in C and tried to create to a toy version of wget.



However, when I run the program, I get the page with some trailing characters at the beginning and at the end (0 & f43 in this case).



The program contains two .c and two .h files.



One for parsing (naïvely) the address and the other to make the network request
and dump the data.



Here are the files for parsing the input:



url.h



#ifndef URL_H
#define URL_H

/* information of an URL*/
struct url_info
{
char* url; //full url
char* protocol; // protocol type: http, ftp, etc...
char* host; // host name
int port; //port number
char* path; //path
};
typedef struct url_info url_info;

static const char P_HTTP = "http";

void parse_url(char* url, url_info *info);

void exit_with_error(char* message);

void print_url_info(url_info info);

#endif //URL_H


url.c



#include<stdio.h>
#include<stdlib.h>
#include<string.h>
#include"url.h"


void parse_url(char* url, url_info *info)
{
// url format: [http://]<hostname>[:<port>]/<path>

char *full_url = malloc((strlen(url) + 1) * sizeof(char));
char *protocol;
char *path;
char *host;
int port;

strcpy(full_url, url);
info->url = full_url;

char *protocol_token = strstr(url, "://");
if (protocol_token){
protocol = url;
*protocol_token = '';
url = protocol_token + 3;
} else {
protocol = "http";
}
info->protocol = protocol;

char *port_token = strstr(url, ":");
char *path_token = strstr(url, "/");

if (port_token && port_token < path_token){
port = atoi(port_token + 1);
*port_token = '';
} else {
port = 80;
}
info->port = port;

if (path_token){
*path_token = '';
host = url;
path = path_token + 1;
info->host = host;
info->path = path;
} else {
exit_with_error("No trailing /.");
}
}


void print_url_info(url_info info){
printf("The URL contains following information: n");
printf("Full url:t%sn", info.url);
printf("Protocol type:t%sn", info.protocol);
printf("Host name:t%sn", info.host);
printf("Port No.:t%dn", info.port);
printf("Path:tt%sn", info.path);
}


void exit_with_error(char *message)
{
fprintf(stderr, "%sn", message);
exit(EXIT_FAILURE);
}


Here are the files for making the request



wgetX.h



#ifndef WGETX_H_
#define WGETX_H_

#define B_SIZE 1024 * 5000

void write_data(const char *path, const char *data);

char* download_page(url_info info, char *buff);

char* http_get_request(char* path, char* host);

char* read_http_reply(char* recv_buf_t);

unsigned long ipfromhost(const char *host);

#endif


wgetX.c



 #include <sys/types.h>
#include <sys/socket.h>
#include <netinet/in.h>
#include <arpa/inet.h>
#include <unistd.h>
#include <netdb.h>
#include <stdio.h>
#include <stdlib.h>
#include <ctype.h>
#include <string.h>

#include "url.h"
#include "wgetX.h"

int main(int argc, char* argv)
{

url_info info;


if (argc != 2) {
exit_with_error("The wgetX must have exactly 1 parameter as input. n");
}
char *url = argv[1];
parse_url(url, &info);

char *buf;
buf = malloc(sizeof(char)*B_SIZE);
bzero(buf, B_SIZE);

download_page(info, buf);
printf("%s", buf);

free(buf);
return (EXIT_SUCCESS);
}

char* download_page(url_info info, char *buf)
{
struct sockaddr_in dest;
int len, sz, mysocket;
char *request = http_get_request(info.path, info.host);

mysocket = socket(AF_INET, SOCK_STREAM, 0);
memset(&dest, 0, sizeof(dest));
dest.sin_family = AF_INET;
dest.sin_addr.s_addr = ipfromhost(info.host);
dest.sin_port = htons(info.port);
connect(mysocket, (struct sockaddr *)&dest, sizeof(struct sockaddr));
send(mysocket, request, strlen(request), 0);

len = 0;
sz = 0;
do {
len = recv(mysocket, buf + sz, B_SIZE - sz, 0);
if (len == -1) {continue;}
sz += len;
} while (len > 0);

*(buf + sz) = '';

close(mysocket);
return buf;
}


char* http_get_request(char* path, char* host) {
char * request_buffer = (char *) malloc(1024);
memset(request_buffer, 0, sizeof(*request_buffer));
snprintf(request_buffer, 1024, "GET /%s HTTP/1.1rnHost: %srnConnection: closernrn",
path, host);
return request_buffer;
}

unsigned long ipfromhost(const char *host){
struct in_addr **addr_list;
struct hostent *he;
if ((he = gethostbyname(host)) != NULL){
addr_list = (struct in_addr **) he->h_addr_list;
int i;
for (i = 0; addr_list[i] != NULL; i++){
return addr_list[i]->s_addr;
}
exit_with_error("Couldn't resolve host to ip adressn");
return 0;
} else {
exit_with_error("Couldn't resolve host to ip adressn");
return 0;
}
}


Makefile



LINK_TARGET = wgetX
OBJS =
wgetX.o
url.o
REBUILDABLES = $(OBJS) $(LINK_TARGET)
all : $(LINK_TARGET)
clean:
rm -f $(REBUILDABLES)

$(LINK_TARGET) : $(OBJS)
cc -g -o $@ $^

%.o : %.c
cc -g -Wall -o $@ -c $<

wgetX.o : wgetX.h url.h
url.o : url.h


When executing the program on one specific url, I get an html output that is different from the source code (as found in Chrome). I get garbage characters: a zero at the end and "f43" just before the start of the html



Commands



make clean
make
./wgetX http://www.polytechnique.fr/


Output



I got the http reply message with the status code and all and just before "










share|improve this question























  • That's way too much code to wade through but I bet you aren't properly zero terminating a string somewhere.

    – Shawn
    Jan 3 at 16:36






  • 1





    Also, why not just use libcurl or the like if you want to talk to a http server?

    – Shawn
    Jan 3 at 16:38











  • I suppose it would be easier. This is for school so I have to use sockets this way. It's for learning purposes!

    – aripy887
    Jan 3 at 18:42











  • regarding: cc -g -Wall -o $@ -c $< strongly suggest: cc -g -Wall -Wextra -Wconversion -pedantic -std=gnu11 -o $@ -c $< This enables the main warning features. Which when applied to the posted code will result in several warning messages being output by the compiler. Those warnings need to be corrected

    – user3629249
    Jan 3 at 18:48











  • OT: regarding function: exit_with_error(), the statement: fprintf(stderr, "%sn", message); this does not tell the user why the error occurred. Suggest using perror() where approporiate.

    – user3629249
    Jan 3 at 18:51
















0















I am learning network programming in C and tried to create to a toy version of wget.



However, when I run the program, I get the page with some trailing characters at the beginning and at the end (0 & f43 in this case).



The program contains two .c and two .h files.



One for parsing (naïvely) the address and the other to make the network request
and dump the data.



Here are the files for parsing the input:



url.h



#ifndef URL_H
#define URL_H

/* information of an URL*/
struct url_info
{
char* url; //full url
char* protocol; // protocol type: http, ftp, etc...
char* host; // host name
int port; //port number
char* path; //path
};
typedef struct url_info url_info;

static const char P_HTTP = "http";

void parse_url(char* url, url_info *info);

void exit_with_error(char* message);

void print_url_info(url_info info);

#endif //URL_H


url.c



#include<stdio.h>
#include<stdlib.h>
#include<string.h>
#include"url.h"


void parse_url(char* url, url_info *info)
{
// url format: [http://]<hostname>[:<port>]/<path>

char *full_url = malloc((strlen(url) + 1) * sizeof(char));
char *protocol;
char *path;
char *host;
int port;

strcpy(full_url, url);
info->url = full_url;

char *protocol_token = strstr(url, "://");
if (protocol_token){
protocol = url;
*protocol_token = '';
url = protocol_token + 3;
} else {
protocol = "http";
}
info->protocol = protocol;

char *port_token = strstr(url, ":");
char *path_token = strstr(url, "/");

if (port_token && port_token < path_token){
port = atoi(port_token + 1);
*port_token = '';
} else {
port = 80;
}
info->port = port;

if (path_token){
*path_token = '';
host = url;
path = path_token + 1;
info->host = host;
info->path = path;
} else {
exit_with_error("No trailing /.");
}
}


void print_url_info(url_info info){
printf("The URL contains following information: n");
printf("Full url:t%sn", info.url);
printf("Protocol type:t%sn", info.protocol);
printf("Host name:t%sn", info.host);
printf("Port No.:t%dn", info.port);
printf("Path:tt%sn", info.path);
}


void exit_with_error(char *message)
{
fprintf(stderr, "%sn", message);
exit(EXIT_FAILURE);
}


Here are the files for making the request



wgetX.h



#ifndef WGETX_H_
#define WGETX_H_

#define B_SIZE 1024 * 5000

void write_data(const char *path, const char *data);

char* download_page(url_info info, char *buff);

char* http_get_request(char* path, char* host);

char* read_http_reply(char* recv_buf_t);

unsigned long ipfromhost(const char *host);

#endif


wgetX.c



 #include <sys/types.h>
#include <sys/socket.h>
#include <netinet/in.h>
#include <arpa/inet.h>
#include <unistd.h>
#include <netdb.h>
#include <stdio.h>
#include <stdlib.h>
#include <ctype.h>
#include <string.h>

#include "url.h"
#include "wgetX.h"

int main(int argc, char* argv)
{

url_info info;


if (argc != 2) {
exit_with_error("The wgetX must have exactly 1 parameter as input. n");
}
char *url = argv[1];
parse_url(url, &info);

char *buf;
buf = malloc(sizeof(char)*B_SIZE);
bzero(buf, B_SIZE);

download_page(info, buf);
printf("%s", buf);

free(buf);
return (EXIT_SUCCESS);
}

char* download_page(url_info info, char *buf)
{
struct sockaddr_in dest;
int len, sz, mysocket;
char *request = http_get_request(info.path, info.host);

mysocket = socket(AF_INET, SOCK_STREAM, 0);
memset(&dest, 0, sizeof(dest));
dest.sin_family = AF_INET;
dest.sin_addr.s_addr = ipfromhost(info.host);
dest.sin_port = htons(info.port);
connect(mysocket, (struct sockaddr *)&dest, sizeof(struct sockaddr));
send(mysocket, request, strlen(request), 0);

len = 0;
sz = 0;
do {
len = recv(mysocket, buf + sz, B_SIZE - sz, 0);
if (len == -1) {continue;}
sz += len;
} while (len > 0);

*(buf + sz) = '';

close(mysocket);
return buf;
}


char* http_get_request(char* path, char* host) {
char * request_buffer = (char *) malloc(1024);
memset(request_buffer, 0, sizeof(*request_buffer));
snprintf(request_buffer, 1024, "GET /%s HTTP/1.1rnHost: %srnConnection: closernrn",
path, host);
return request_buffer;
}

unsigned long ipfromhost(const char *host){
struct in_addr **addr_list;
struct hostent *he;
if ((he = gethostbyname(host)) != NULL){
addr_list = (struct in_addr **) he->h_addr_list;
int i;
for (i = 0; addr_list[i] != NULL; i++){
return addr_list[i]->s_addr;
}
exit_with_error("Couldn't resolve host to ip adressn");
return 0;
} else {
exit_with_error("Couldn't resolve host to ip adressn");
return 0;
}
}


Makefile



LINK_TARGET = wgetX
OBJS =
wgetX.o
url.o
REBUILDABLES = $(OBJS) $(LINK_TARGET)
all : $(LINK_TARGET)
clean:
rm -f $(REBUILDABLES)

$(LINK_TARGET) : $(OBJS)
cc -g -o $@ $^

%.o : %.c
cc -g -Wall -o $@ -c $<

wgetX.o : wgetX.h url.h
url.o : url.h


When executing the program on one specific url, I get an html output that is different from the source code (as found in Chrome). I get garbage characters: a zero at the end and "f43" just before the start of the html



Commands



make clean
make
./wgetX http://www.polytechnique.fr/


Output



I got the http reply message with the status code and all and just before "










share|improve this question























  • That's way too much code to wade through but I bet you aren't properly zero terminating a string somewhere.

    – Shawn
    Jan 3 at 16:36






  • 1





    Also, why not just use libcurl or the like if you want to talk to a http server?

    – Shawn
    Jan 3 at 16:38











  • I suppose it would be easier. This is for school so I have to use sockets this way. It's for learning purposes!

    – aripy887
    Jan 3 at 18:42











  • regarding: cc -g -Wall -o $@ -c $< strongly suggest: cc -g -Wall -Wextra -Wconversion -pedantic -std=gnu11 -o $@ -c $< This enables the main warning features. Which when applied to the posted code will result in several warning messages being output by the compiler. Those warnings need to be corrected

    – user3629249
    Jan 3 at 18:48











  • OT: regarding function: exit_with_error(), the statement: fprintf(stderr, "%sn", message); this does not tell the user why the error occurred. Suggest using perror() where approporiate.

    – user3629249
    Jan 3 at 18:51














0












0








0








I am learning network programming in C and tried to create to a toy version of wget.



However, when I run the program, I get the page with some trailing characters at the beginning and at the end (0 & f43 in this case).



The program contains two .c and two .h files.



One for parsing (naïvely) the address and the other to make the network request
and dump the data.



Here are the files for parsing the input:



url.h



#ifndef URL_H
#define URL_H

/* information of an URL*/
struct url_info
{
char* url; //full url
char* protocol; // protocol type: http, ftp, etc...
char* host; // host name
int port; //port number
char* path; //path
};
typedef struct url_info url_info;

static const char P_HTTP = "http";

void parse_url(char* url, url_info *info);

void exit_with_error(char* message);

void print_url_info(url_info info);

#endif //URL_H


url.c



#include<stdio.h>
#include<stdlib.h>
#include<string.h>
#include"url.h"


void parse_url(char* url, url_info *info)
{
// url format: [http://]<hostname>[:<port>]/<path>

char *full_url = malloc((strlen(url) + 1) * sizeof(char));
char *protocol;
char *path;
char *host;
int port;

strcpy(full_url, url);
info->url = full_url;

char *protocol_token = strstr(url, "://");
if (protocol_token){
protocol = url;
*protocol_token = '';
url = protocol_token + 3;
} else {
protocol = "http";
}
info->protocol = protocol;

char *port_token = strstr(url, ":");
char *path_token = strstr(url, "/");

if (port_token && port_token < path_token){
port = atoi(port_token + 1);
*port_token = '';
} else {
port = 80;
}
info->port = port;

if (path_token){
*path_token = '';
host = url;
path = path_token + 1;
info->host = host;
info->path = path;
} else {
exit_with_error("No trailing /.");
}
}


void print_url_info(url_info info){
printf("The URL contains following information: n");
printf("Full url:t%sn", info.url);
printf("Protocol type:t%sn", info.protocol);
printf("Host name:t%sn", info.host);
printf("Port No.:t%dn", info.port);
printf("Path:tt%sn", info.path);
}


void exit_with_error(char *message)
{
fprintf(stderr, "%sn", message);
exit(EXIT_FAILURE);
}


Here are the files for making the request



wgetX.h



#ifndef WGETX_H_
#define WGETX_H_

#define B_SIZE 1024 * 5000

void write_data(const char *path, const char *data);

char* download_page(url_info info, char *buff);

char* http_get_request(char* path, char* host);

char* read_http_reply(char* recv_buf_t);

unsigned long ipfromhost(const char *host);

#endif


wgetX.c



 #include <sys/types.h>
#include <sys/socket.h>
#include <netinet/in.h>
#include <arpa/inet.h>
#include <unistd.h>
#include <netdb.h>
#include <stdio.h>
#include <stdlib.h>
#include <ctype.h>
#include <string.h>

#include "url.h"
#include "wgetX.h"

int main(int argc, char* argv)
{

url_info info;


if (argc != 2) {
exit_with_error("The wgetX must have exactly 1 parameter as input. n");
}
char *url = argv[1];
parse_url(url, &info);

char *buf;
buf = malloc(sizeof(char)*B_SIZE);
bzero(buf, B_SIZE);

download_page(info, buf);
printf("%s", buf);

free(buf);
return (EXIT_SUCCESS);
}

char* download_page(url_info info, char *buf)
{
struct sockaddr_in dest;
int len, sz, mysocket;
char *request = http_get_request(info.path, info.host);

mysocket = socket(AF_INET, SOCK_STREAM, 0);
memset(&dest, 0, sizeof(dest));
dest.sin_family = AF_INET;
dest.sin_addr.s_addr = ipfromhost(info.host);
dest.sin_port = htons(info.port);
connect(mysocket, (struct sockaddr *)&dest, sizeof(struct sockaddr));
send(mysocket, request, strlen(request), 0);

len = 0;
sz = 0;
do {
len = recv(mysocket, buf + sz, B_SIZE - sz, 0);
if (len == -1) {continue;}
sz += len;
} while (len > 0);

*(buf + sz) = '';

close(mysocket);
return buf;
}


char* http_get_request(char* path, char* host) {
char * request_buffer = (char *) malloc(1024);
memset(request_buffer, 0, sizeof(*request_buffer));
snprintf(request_buffer, 1024, "GET /%s HTTP/1.1rnHost: %srnConnection: closernrn",
path, host);
return request_buffer;
}

unsigned long ipfromhost(const char *host){
struct in_addr **addr_list;
struct hostent *he;
if ((he = gethostbyname(host)) != NULL){
addr_list = (struct in_addr **) he->h_addr_list;
int i;
for (i = 0; addr_list[i] != NULL; i++){
return addr_list[i]->s_addr;
}
exit_with_error("Couldn't resolve host to ip adressn");
return 0;
} else {
exit_with_error("Couldn't resolve host to ip adressn");
return 0;
}
}


Makefile



LINK_TARGET = wgetX
OBJS =
wgetX.o
url.o
REBUILDABLES = $(OBJS) $(LINK_TARGET)
all : $(LINK_TARGET)
clean:
rm -f $(REBUILDABLES)

$(LINK_TARGET) : $(OBJS)
cc -g -o $@ $^

%.o : %.c
cc -g -Wall -o $@ -c $<

wgetX.o : wgetX.h url.h
url.o : url.h


When executing the program on one specific url, I get an html output that is different from the source code (as found in Chrome). I get garbage characters: a zero at the end and "f43" just before the start of the html



Commands



make clean
make
./wgetX http://www.polytechnique.fr/


Output



I got the http reply message with the status code and all and just before "










share|improve this question














I am learning network programming in C and tried to create to a toy version of wget.



However, when I run the program, I get the page with some trailing characters at the beginning and at the end (0 & f43 in this case).



The program contains two .c and two .h files.



One for parsing (naïvely) the address and the other to make the network request
and dump the data.



Here are the files for parsing the input:



url.h



#ifndef URL_H
#define URL_H

/* information of an URL*/
struct url_info
{
char* url; //full url
char* protocol; // protocol type: http, ftp, etc...
char* host; // host name
int port; //port number
char* path; //path
};
typedef struct url_info url_info;

static const char P_HTTP = "http";

void parse_url(char* url, url_info *info);

void exit_with_error(char* message);

void print_url_info(url_info info);

#endif //URL_H


url.c



#include<stdio.h>
#include<stdlib.h>
#include<string.h>
#include"url.h"


void parse_url(char* url, url_info *info)
{
// url format: [http://]<hostname>[:<port>]/<path>

char *full_url = malloc((strlen(url) + 1) * sizeof(char));
char *protocol;
char *path;
char *host;
int port;

strcpy(full_url, url);
info->url = full_url;

char *protocol_token = strstr(url, "://");
if (protocol_token){
protocol = url;
*protocol_token = '';
url = protocol_token + 3;
} else {
protocol = "http";
}
info->protocol = protocol;

char *port_token = strstr(url, ":");
char *path_token = strstr(url, "/");

if (port_token && port_token < path_token){
port = atoi(port_token + 1);
*port_token = '';
} else {
port = 80;
}
info->port = port;

if (path_token){
*path_token = '';
host = url;
path = path_token + 1;
info->host = host;
info->path = path;
} else {
exit_with_error("No trailing /.");
}
}


void print_url_info(url_info info){
printf("The URL contains following information: n");
printf("Full url:t%sn", info.url);
printf("Protocol type:t%sn", info.protocol);
printf("Host name:t%sn", info.host);
printf("Port No.:t%dn", info.port);
printf("Path:tt%sn", info.path);
}


void exit_with_error(char *message)
{
fprintf(stderr, "%sn", message);
exit(EXIT_FAILURE);
}


Here are the files for making the request



wgetX.h



#ifndef WGETX_H_
#define WGETX_H_

#define B_SIZE 1024 * 5000

void write_data(const char *path, const char *data);

char* download_page(url_info info, char *buff);

char* http_get_request(char* path, char* host);

char* read_http_reply(char* recv_buf_t);

unsigned long ipfromhost(const char *host);

#endif


wgetX.c



 #include <sys/types.h>
#include <sys/socket.h>
#include <netinet/in.h>
#include <arpa/inet.h>
#include <unistd.h>
#include <netdb.h>
#include <stdio.h>
#include <stdlib.h>
#include <ctype.h>
#include <string.h>

#include "url.h"
#include "wgetX.h"

int main(int argc, char* argv)
{

url_info info;


if (argc != 2) {
exit_with_error("The wgetX must have exactly 1 parameter as input. n");
}
char *url = argv[1];
parse_url(url, &info);

char *buf;
buf = malloc(sizeof(char)*B_SIZE);
bzero(buf, B_SIZE);

download_page(info, buf);
printf("%s", buf);

free(buf);
return (EXIT_SUCCESS);
}

char* download_page(url_info info, char *buf)
{
struct sockaddr_in dest;
int len, sz, mysocket;
char *request = http_get_request(info.path, info.host);

mysocket = socket(AF_INET, SOCK_STREAM, 0);
memset(&dest, 0, sizeof(dest));
dest.sin_family = AF_INET;
dest.sin_addr.s_addr = ipfromhost(info.host);
dest.sin_port = htons(info.port);
connect(mysocket, (struct sockaddr *)&dest, sizeof(struct sockaddr));
send(mysocket, request, strlen(request), 0);

len = 0;
sz = 0;
do {
len = recv(mysocket, buf + sz, B_SIZE - sz, 0);
if (len == -1) {continue;}
sz += len;
} while (len > 0);

*(buf + sz) = '';

close(mysocket);
return buf;
}


char* http_get_request(char* path, char* host) {
char * request_buffer = (char *) malloc(1024);
memset(request_buffer, 0, sizeof(*request_buffer));
snprintf(request_buffer, 1024, "GET /%s HTTP/1.1rnHost: %srnConnection: closernrn",
path, host);
return request_buffer;
}

unsigned long ipfromhost(const char *host){
struct in_addr **addr_list;
struct hostent *he;
if ((he = gethostbyname(host)) != NULL){
addr_list = (struct in_addr **) he->h_addr_list;
int i;
for (i = 0; addr_list[i] != NULL; i++){
return addr_list[i]->s_addr;
}
exit_with_error("Couldn't resolve host to ip adressn");
return 0;
} else {
exit_with_error("Couldn't resolve host to ip adressn");
return 0;
}
}


Makefile



LINK_TARGET = wgetX
OBJS =
wgetX.o
url.o
REBUILDABLES = $(OBJS) $(LINK_TARGET)
all : $(LINK_TARGET)
clean:
rm -f $(REBUILDABLES)

$(LINK_TARGET) : $(OBJS)
cc -g -o $@ $^

%.o : %.c
cc -g -Wall -o $@ -c $<

wgetX.o : wgetX.h url.h
url.o : url.h


When executing the program on one specific url, I get an html output that is different from the source code (as found in Chrome). I get garbage characters: a zero at the end and "f43" just before the start of the html



Commands



make clean
make
./wgetX http://www.polytechnique.fr/


Output



I got the http reply message with the status code and all and just before "







c sockets http






share|improve this question













share|improve this question











share|improve this question




share|improve this question










asked Jan 3 at 16:04









aripy887aripy887

11




11













  • That's way too much code to wade through but I bet you aren't properly zero terminating a string somewhere.

    – Shawn
    Jan 3 at 16:36






  • 1





    Also, why not just use libcurl or the like if you want to talk to a http server?

    – Shawn
    Jan 3 at 16:38











  • I suppose it would be easier. This is for school so I have to use sockets this way. It's for learning purposes!

    – aripy887
    Jan 3 at 18:42











  • regarding: cc -g -Wall -o $@ -c $< strongly suggest: cc -g -Wall -Wextra -Wconversion -pedantic -std=gnu11 -o $@ -c $< This enables the main warning features. Which when applied to the posted code will result in several warning messages being output by the compiler. Those warnings need to be corrected

    – user3629249
    Jan 3 at 18:48











  • OT: regarding function: exit_with_error(), the statement: fprintf(stderr, "%sn", message); this does not tell the user why the error occurred. Suggest using perror() where approporiate.

    – user3629249
    Jan 3 at 18:51



















  • That's way too much code to wade through but I bet you aren't properly zero terminating a string somewhere.

    – Shawn
    Jan 3 at 16:36






  • 1





    Also, why not just use libcurl or the like if you want to talk to a http server?

    – Shawn
    Jan 3 at 16:38











  • I suppose it would be easier. This is for school so I have to use sockets this way. It's for learning purposes!

    – aripy887
    Jan 3 at 18:42











  • regarding: cc -g -Wall -o $@ -c $< strongly suggest: cc -g -Wall -Wextra -Wconversion -pedantic -std=gnu11 -o $@ -c $< This enables the main warning features. Which when applied to the posted code will result in several warning messages being output by the compiler. Those warnings need to be corrected

    – user3629249
    Jan 3 at 18:48











  • OT: regarding function: exit_with_error(), the statement: fprintf(stderr, "%sn", message); this does not tell the user why the error occurred. Suggest using perror() where approporiate.

    – user3629249
    Jan 3 at 18:51

















That's way too much code to wade through but I bet you aren't properly zero terminating a string somewhere.

– Shawn
Jan 3 at 16:36





That's way too much code to wade through but I bet you aren't properly zero terminating a string somewhere.

– Shawn
Jan 3 at 16:36




1




1





Also, why not just use libcurl or the like if you want to talk to a http server?

– Shawn
Jan 3 at 16:38





Also, why not just use libcurl or the like if you want to talk to a http server?

– Shawn
Jan 3 at 16:38













I suppose it would be easier. This is for school so I have to use sockets this way. It's for learning purposes!

– aripy887
Jan 3 at 18:42





I suppose it would be easier. This is for school so I have to use sockets this way. It's for learning purposes!

– aripy887
Jan 3 at 18:42













regarding: cc -g -Wall -o $@ -c $< strongly suggest: cc -g -Wall -Wextra -Wconversion -pedantic -std=gnu11 -o $@ -c $< This enables the main warning features. Which when applied to the posted code will result in several warning messages being output by the compiler. Those warnings need to be corrected

– user3629249
Jan 3 at 18:48





regarding: cc -g -Wall -o $@ -c $< strongly suggest: cc -g -Wall -Wextra -Wconversion -pedantic -std=gnu11 -o $@ -c $< This enables the main warning features. Which when applied to the posted code will result in several warning messages being output by the compiler. Those warnings need to be corrected

– user3629249
Jan 3 at 18:48













OT: regarding function: exit_with_error(), the statement: fprintf(stderr, "%sn", message); this does not tell the user why the error occurred. Suggest using perror() where approporiate.

– user3629249
Jan 3 at 18:51





OT: regarding function: exit_with_error(), the statement: fprintf(stderr, "%sn", message); this does not tell the user why the error occurred. Suggest using perror() where approporiate.

– user3629249
Jan 3 at 18:51












1 Answer
1






active

oldest

votes


















1















I get garbage characters: a zero at the end and "f43" just before the start of the html




Welcome to the wonderful world of HTTP. Please note that HTTP is not a trivial protocol even though it might look like this. It should say something that the HTTP/1.1 standard as initially published in RFC 2616 has 176 pages text.



What you likely see here is chunked transfer encoding of the content. In this encoding the content is not transferred as one single piece but in several chunks, each prefixed by the length (in hex). I.e. something like this:



 HTTP/1.1 200 ok
Transfer-Encoding: chunked

a
0123456789
12
These are 18 bytes
0


In your specific case the initial f43 "just before the start of the html" is the length of the following chunk (f43 in hex of 3907 in decimal) and the "zero at the end" is the length of the final chunk (0).



For more on this see section 3.6.1 in RFC 2616 or section 4.1 in RFC 7230.






share|improve this answer
























  • Thank you! Can I force that the transfer-encoding not be chunked?

    – aripy887
    Jan 3 at 18:55











  • @aripy887: As long as you claim to support HTTP/1.1 you must support chunked encoding. If you instead only use HTTP/1.0 in your request then the server cannot use chunked encoding since this is only defined with HTTP/1.1.

    – Steffen Ullrich
    Jan 3 at 18:57












Your Answer






StackExchange.ifUsing("editor", function () {
StackExchange.using("externalEditor", function () {
StackExchange.using("snippets", function () {
StackExchange.snippets.init();
});
});
}, "code-snippets");

StackExchange.ready(function() {
var channelOptions = {
tags: "".split(" "),
id: "1"
};
initTagRenderer("".split(" "), "".split(" "), channelOptions);

StackExchange.using("externalEditor", function() {
// Have to fire editor after snippets, if snippets enabled
if (StackExchange.settings.snippets.snippetsEnabled) {
StackExchange.using("snippets", function() {
createEditor();
});
}
else {
createEditor();
}
});

function createEditor() {
StackExchange.prepareEditor({
heartbeatType: 'answer',
autoActivateHeartbeat: false,
convertImagesToLinks: true,
noModals: true,
showLowRepImageUploadWarning: true,
reputationToPostImages: 10,
bindNavPrevention: true,
postfix: "",
imageUploader: {
brandingHtml: "Powered by u003ca class="icon-imgur-white" href="https://imgur.com/"u003eu003c/au003e",
contentPolicyHtml: "User contributions licensed under u003ca href="https://creativecommons.org/licenses/by-sa/3.0/"u003ecc by-sa 3.0 with attribution requiredu003c/au003e u003ca href="https://stackoverflow.com/legal/content-policy"u003e(content policy)u003c/au003e",
allowUrls: true
},
onDemand: true,
discardSelector: ".discard-answer"
,immediatelyShowMarkdownHelp:true
});


}
});














draft saved

draft discarded


















StackExchange.ready(
function () {
StackExchange.openid.initPostLogin('.new-post-login', 'https%3a%2f%2fstackoverflow.com%2fquestions%2f54025860%2fhttp-socket-request-returning-trailling-characters%23new-answer', 'question_page');
}
);

Post as a guest















Required, but never shown

























1 Answer
1






active

oldest

votes








1 Answer
1






active

oldest

votes









active

oldest

votes






active

oldest

votes









1















I get garbage characters: a zero at the end and "f43" just before the start of the html




Welcome to the wonderful world of HTTP. Please note that HTTP is not a trivial protocol even though it might look like this. It should say something that the HTTP/1.1 standard as initially published in RFC 2616 has 176 pages text.



What you likely see here is chunked transfer encoding of the content. In this encoding the content is not transferred as one single piece but in several chunks, each prefixed by the length (in hex). I.e. something like this:



 HTTP/1.1 200 ok
Transfer-Encoding: chunked

a
0123456789
12
These are 18 bytes
0


In your specific case the initial f43 "just before the start of the html" is the length of the following chunk (f43 in hex of 3907 in decimal) and the "zero at the end" is the length of the final chunk (0).



For more on this see section 3.6.1 in RFC 2616 or section 4.1 in RFC 7230.






share|improve this answer
























  • Thank you! Can I force that the transfer-encoding not be chunked?

    – aripy887
    Jan 3 at 18:55











  • @aripy887: As long as you claim to support HTTP/1.1 you must support chunked encoding. If you instead only use HTTP/1.0 in your request then the server cannot use chunked encoding since this is only defined with HTTP/1.1.

    – Steffen Ullrich
    Jan 3 at 18:57
















1















I get garbage characters: a zero at the end and "f43" just before the start of the html




Welcome to the wonderful world of HTTP. Please note that HTTP is not a trivial protocol even though it might look like this. It should say something that the HTTP/1.1 standard as initially published in RFC 2616 has 176 pages text.



What you likely see here is chunked transfer encoding of the content. In this encoding the content is not transferred as one single piece but in several chunks, each prefixed by the length (in hex). I.e. something like this:



 HTTP/1.1 200 ok
Transfer-Encoding: chunked

a
0123456789
12
These are 18 bytes
0


In your specific case the initial f43 "just before the start of the html" is the length of the following chunk (f43 in hex of 3907 in decimal) and the "zero at the end" is the length of the final chunk (0).



For more on this see section 3.6.1 in RFC 2616 or section 4.1 in RFC 7230.






share|improve this answer
























  • Thank you! Can I force that the transfer-encoding not be chunked?

    – aripy887
    Jan 3 at 18:55











  • @aripy887: As long as you claim to support HTTP/1.1 you must support chunked encoding. If you instead only use HTTP/1.0 in your request then the server cannot use chunked encoding since this is only defined with HTTP/1.1.

    – Steffen Ullrich
    Jan 3 at 18:57














1












1








1








I get garbage characters: a zero at the end and "f43" just before the start of the html




Welcome to the wonderful world of HTTP. Please note that HTTP is not a trivial protocol even though it might look like this. It should say something that the HTTP/1.1 standard as initially published in RFC 2616 has 176 pages text.



What you likely see here is chunked transfer encoding of the content. In this encoding the content is not transferred as one single piece but in several chunks, each prefixed by the length (in hex). I.e. something like this:



 HTTP/1.1 200 ok
Transfer-Encoding: chunked

a
0123456789
12
These are 18 bytes
0


In your specific case the initial f43 "just before the start of the html" is the length of the following chunk (f43 in hex of 3907 in decimal) and the "zero at the end" is the length of the final chunk (0).



For more on this see section 3.6.1 in RFC 2616 or section 4.1 in RFC 7230.






share|improve this answer














I get garbage characters: a zero at the end and "f43" just before the start of the html




Welcome to the wonderful world of HTTP. Please note that HTTP is not a trivial protocol even though it might look like this. It should say something that the HTTP/1.1 standard as initially published in RFC 2616 has 176 pages text.



What you likely see here is chunked transfer encoding of the content. In this encoding the content is not transferred as one single piece but in several chunks, each prefixed by the length (in hex). I.e. something like this:



 HTTP/1.1 200 ok
Transfer-Encoding: chunked

a
0123456789
12
These are 18 bytes
0


In your specific case the initial f43 "just before the start of the html" is the length of the following chunk (f43 in hex of 3907 in decimal) and the "zero at the end" is the length of the final chunk (0).



For more on this see section 3.6.1 in RFC 2616 or section 4.1 in RFC 7230.







share|improve this answer












share|improve this answer



share|improve this answer










answered Jan 3 at 17:09









Steffen UllrichSteffen Ullrich

62.5k360102




62.5k360102













  • Thank you! Can I force that the transfer-encoding not be chunked?

    – aripy887
    Jan 3 at 18:55











  • @aripy887: As long as you claim to support HTTP/1.1 you must support chunked encoding. If you instead only use HTTP/1.0 in your request then the server cannot use chunked encoding since this is only defined with HTTP/1.1.

    – Steffen Ullrich
    Jan 3 at 18:57



















  • Thank you! Can I force that the transfer-encoding not be chunked?

    – aripy887
    Jan 3 at 18:55











  • @aripy887: As long as you claim to support HTTP/1.1 you must support chunked encoding. If you instead only use HTTP/1.0 in your request then the server cannot use chunked encoding since this is only defined with HTTP/1.1.

    – Steffen Ullrich
    Jan 3 at 18:57

















Thank you! Can I force that the transfer-encoding not be chunked?

– aripy887
Jan 3 at 18:55





Thank you! Can I force that the transfer-encoding not be chunked?

– aripy887
Jan 3 at 18:55













@aripy887: As long as you claim to support HTTP/1.1 you must support chunked encoding. If you instead only use HTTP/1.0 in your request then the server cannot use chunked encoding since this is only defined with HTTP/1.1.

– Steffen Ullrich
Jan 3 at 18:57





@aripy887: As long as you claim to support HTTP/1.1 you must support chunked encoding. If you instead only use HTTP/1.0 in your request then the server cannot use chunked encoding since this is only defined with HTTP/1.1.

– Steffen Ullrich
Jan 3 at 18:57




















draft saved

draft discarded




















































Thanks for contributing an answer to Stack Overflow!


  • Please be sure to answer the question. Provide details and share your research!

But avoid



  • Asking for help, clarification, or responding to other answers.

  • Making statements based on opinion; back them up with references or personal experience.


To learn more, see our tips on writing great answers.




draft saved


draft discarded














StackExchange.ready(
function () {
StackExchange.openid.initPostLogin('.new-post-login', 'https%3a%2f%2fstackoverflow.com%2fquestions%2f54025860%2fhttp-socket-request-returning-trailling-characters%23new-answer', 'question_page');
}
);

Post as a guest















Required, but never shown





















































Required, but never shown














Required, but never shown












Required, but never shown







Required, but never shown

































Required, but never shown














Required, but never shown












Required, but never shown







Required, but never shown







Popular posts from this blog

Monofisismo

Angular Downloading a file using contenturl with Basic Authentication

Olmecas