http socket request returning trailling characters

I am learning network programming in C and tried to create to a toy version of wget.

However, when I run the program, I get the page with some trailing characters at the beginning and at the end (0 & f43 in this case).

The program contains two .c and two .h files.

One for parsing (naïvely) the address and the other to make the network request
and dump the data.

Here are the files for parsing the input:

url.h

#ifndef URL_H

#define URL_H



/* information of an URL*/

struct url_info

{

    char* url; //full url

    char* protocol; // protocol type: http, ftp, etc...

    char* host; // host name

    int port;   //port number

    char* path; //path

};

typedef struct url_info url_info;



static const char P_HTTP = "http";



void parse_url(char* url, url_info *info);



void exit_with_error(char* message);



void print_url_info(url_info info);



#endif //URL_H

url.c

#include<stdio.h>

#include<stdlib.h>

#include<string.h>

#include"url.h"





void parse_url(char* url, url_info *info)

{

    // url format: [http://]<hostname>[:<port>]/<path>



    char *full_url = malloc((strlen(url) + 1) * sizeof(char));

  char *protocol;

  char *path;

  char *host;

  int port;



  strcpy(full_url, url);

    info->url = full_url;



  char *protocol_token = strstr(url, "://");

  if (protocol_token){

    protocol = url;

    *protocol_token = '';

    url = protocol_token + 3;

  } else {

    protocol = "http";

  }

    info->protocol = protocol;



  char *port_token = strstr(url, ":");

  char *path_token = strstr(url, "/");



  if (port_token && port_token < path_token){

        port = atoi(port_token + 1);

        *port_token = '';

  } else {

    port = 80;

  }

    info->port = port;



  if (path_token){

    *path_token = '';

    host = url;

    path = path_token + 1;

        info->host = host;

        info->path = path;

  } else {

    exit_with_error("No trailing /.");

  }

}





void print_url_info(url_info info){

    printf("The URL contains following information: n");

    printf("Full url:t%sn", info.url);

    printf("Protocol type:t%sn", info.protocol);

    printf("Host name:t%sn", info.host);

    printf("Port No.:t%dn", info.port);

    printf("Path:tt%sn", info.path);

}





void exit_with_error(char *message)

{

    fprintf(stderr, "%sn", message);

    exit(EXIT_FAILURE);

}

Here are the files for making the request

wgetX.h

#ifndef WGETX_H_

#define WGETX_H_



#define B_SIZE 1024 * 5000



void write_data(const char *path, const char *data);



char* download_page(url_info info, char *buff);



char* http_get_request(char* path, char* host);



char* read_http_reply(char* recv_buf_t);



unsigned long ipfromhost(const char *host);



#endif

wgetX.c

 #include <sys/types.h>

 #include <sys/socket.h>

 #include <netinet/in.h>

 #include <arpa/inet.h>

 #include <unistd.h>

 #include <netdb.h>

 #include <stdio.h>

 #include <stdlib.h>

 #include <ctype.h>

 #include <string.h>



#include "url.h"

#include "wgetX.h"



int main(int argc, char* argv)

{



    url_info info;





    if (argc != 2) {

        exit_with_error("The wgetX must have exactly 1 parameter as input. n");

    }

    char *url = argv[1];

    parse_url(url, &info);



    char *buf;

    buf = malloc(sizeof(char)*B_SIZE);

    bzero(buf, B_SIZE);



    download_page(info, buf);

  printf("%s", buf);



    free(buf);

    return (EXIT_SUCCESS);

}



char* download_page(url_info info, char *buf)

{

    struct sockaddr_in dest;

    int len, sz, mysocket;

    char *request = http_get_request(info.path, info.host);



    mysocket = socket(AF_INET, SOCK_STREAM, 0);

    memset(&dest, 0, sizeof(dest));

    dest.sin_family = AF_INET;

    dest.sin_addr.s_addr = ipfromhost(info.host);

    dest.sin_port = htons(info.port);

    connect(mysocket, (struct sockaddr *)&dest, sizeof(struct sockaddr));

    send(mysocket, request, strlen(request), 0);



    len = 0;

    sz = 0;

    do {

        len = recv(mysocket, buf + sz, B_SIZE - sz, 0);

        if (len == -1) {continue;}

        sz += len;

    } while (len > 0);



    *(buf + sz) = '';



  close(mysocket);

    return buf;

}





char* http_get_request(char* path, char* host) {

    char * request_buffer = (char *) malloc(1024);

    memset(request_buffer, 0, sizeof(*request_buffer));

    snprintf(request_buffer, 1024, "GET /%s HTTP/1.1rnHost: %srnConnection: closernrn",

            path, host);

    return request_buffer;

}



unsigned long ipfromhost(const char *host){

  struct in_addr **addr_list;

  struct hostent *he;

  if ((he = gethostbyname(host)) != NULL){

    addr_list = (struct in_addr **) he->h_addr_list;

    int i;

    for (i = 0; addr_list[i] != NULL; i++){

      return addr_list[i]->s_addr;

    }

    exit_with_error("Couldn't resolve host to ip adressn");

    return 0;

  } else {

    exit_with_error("Couldn't resolve host to ip adressn");

    return 0;

  }

}

Makefile

LINK_TARGET = wgetX

OBJS = 

    wgetX.o 

    url.o

REBUILDABLES = $(OBJS) $(LINK_TARGET)

all : $(LINK_TARGET)

clean:

    rm -f $(REBUILDABLES)



$(LINK_TARGET) : $(OBJS)

    cc -g -o $@ $^



%.o : %.c

    cc -g  -Wall -o $@ -c $<



wgetX.o : wgetX.h url.h

url.o : url.h

When executing the program on one specific url, I get an html output that is different from the source code (as found in Chrome). I get garbage characters: a zero at the end and "f43" just before the start of the html

Commands

make clean

make

./wgetX http://www.polytechnique.fr/

Output

I got the http reply message with the status code and all and just before "

asked Jan 3 at 16:04

aripy887

That's way too much code to wade through but I bet you aren't properly zero terminating a string somewhere.

– Shawn
Jan 3 at 16:36

1

Also, why not just use libcurl or the like if you want to talk to a http server?

– Shawn
Jan 3 at 16:38

I suppose it would be easier. This is for school so I have to use sockets this way. It's for learning purposes!

– aripy887
Jan 3 at 18:42

regarding: cc -g -Wall -o $@ -c $< strongly suggest: cc -g -Wall -Wextra -Wconversion -pedantic -std=gnu11 -o $@ -c $< This enables the main warning features. Which when applied to the posted code will result in several warning messages being output by the compiler. Those warnings need to be corrected

– user3629249
Jan 3 at 18:48

OT: regarding function: exit_with_error(), the statement: fprintf(stderr, "%sn", message); this does not tell the user why the error occurred. Suggest using perror() where approporiate.

– user3629249
Jan 3 at 18:51

|
show 9 more comments

I am learning network programming in C and tried to create to a toy version of wget.

However, when I run the program, I get the page with some trailing characters at the beginning and at the end (0 & f43 in this case).

The program contains two .c and two .h files.

One for parsing (naïvely) the address and the other to make the network request
and dump the data.

Here are the files for parsing the input:

url.h

#ifndef URL_H

#define URL_H



/* information of an URL*/

struct url_info

{

    char* url; //full url

    char* protocol; // protocol type: http, ftp, etc...

    char* host; // host name

    int port;   //port number

    char* path; //path

};

typedef struct url_info url_info;



static const char P_HTTP = "http";



void parse_url(char* url, url_info *info);



void exit_with_error(char* message);



void print_url_info(url_info info);



#endif //URL_H

url.c

#include<stdio.h>

#include<stdlib.h>

#include<string.h>

#include"url.h"





void parse_url(char* url, url_info *info)

{

    // url format: [http://]<hostname>[:<port>]/<path>



    char *full_url = malloc((strlen(url) + 1) * sizeof(char));

  char *protocol;

  char *path;

  char *host;

  int port;



  strcpy(full_url, url);

    info->url = full_url;



  char *protocol_token = strstr(url, "://");

  if (protocol_token){

    protocol = url;

    *protocol_token = '';

    url = protocol_token + 3;

  } else {

    protocol = "http";

  }

    info->protocol = protocol;



  char *port_token = strstr(url, ":");

  char *path_token = strstr(url, "/");



  if (port_token && port_token < path_token){

        port = atoi(port_token + 1);

        *port_token = '';

  } else {

    port = 80;

  }

    info->port = port;



  if (path_token){

    *path_token = '';

    host = url;

    path = path_token + 1;

        info->host = host;

        info->path = path;

  } else {

    exit_with_error("No trailing /.");

  }

}





void print_url_info(url_info info){

    printf("The URL contains following information: n");

    printf("Full url:t%sn", info.url);

    printf("Protocol type:t%sn", info.protocol);

    printf("Host name:t%sn", info.host);

    printf("Port No.:t%dn", info.port);

    printf("Path:tt%sn", info.path);

}





void exit_with_error(char *message)

{

    fprintf(stderr, "%sn", message);

    exit(EXIT_FAILURE);

}

Here are the files for making the request

wgetX.h

#ifndef WGETX_H_

#define WGETX_H_



#define B_SIZE 1024 * 5000



void write_data(const char *path, const char *data);



char* download_page(url_info info, char *buff);



char* http_get_request(char* path, char* host);



char* read_http_reply(char* recv_buf_t);



unsigned long ipfromhost(const char *host);



#endif

wgetX.c

 #include <sys/types.h>

 #include <sys/socket.h>

 #include <netinet/in.h>

 #include <arpa/inet.h>

 #include <unistd.h>

 #include <netdb.h>

 #include <stdio.h>

 #include <stdlib.h>

 #include <ctype.h>

 #include <string.h>



#include "url.h"

#include "wgetX.h"



int main(int argc, char* argv)

{



    url_info info;





    if (argc != 2) {

        exit_with_error("The wgetX must have exactly 1 parameter as input. n");

    }

    char *url = argv[1];

    parse_url(url, &info);



    char *buf;

    buf = malloc(sizeof(char)*B_SIZE);

    bzero(buf, B_SIZE);



    download_page(info, buf);

  printf("%s", buf);



    free(buf);

    return (EXIT_SUCCESS);

}



char* download_page(url_info info, char *buf)

{

    struct sockaddr_in dest;

    int len, sz, mysocket;

    char *request = http_get_request(info.path, info.host);



    mysocket = socket(AF_INET, SOCK_STREAM, 0);

    memset(&dest, 0, sizeof(dest));

    dest.sin_family = AF_INET;

    dest.sin_addr.s_addr = ipfromhost(info.host);

    dest.sin_port = htons(info.port);

    connect(mysocket, (struct sockaddr *)&dest, sizeof(struct sockaddr));

    send(mysocket, request, strlen(request), 0);



    len = 0;

    sz = 0;

    do {

        len = recv(mysocket, buf + sz, B_SIZE - sz, 0);

        if (len == -1) {continue;}

        sz += len;

    } while (len > 0);



    *(buf + sz) = '';



  close(mysocket);

    return buf;

}





char* http_get_request(char* path, char* host) {

    char * request_buffer = (char *) malloc(1024);

    memset(request_buffer, 0, sizeof(*request_buffer));

    snprintf(request_buffer, 1024, "GET /%s HTTP/1.1rnHost: %srnConnection: closernrn",

            path, host);

    return request_buffer;

}



unsigned long ipfromhost(const char *host){

  struct in_addr **addr_list;

  struct hostent *he;

  if ((he = gethostbyname(host)) != NULL){

    addr_list = (struct in_addr **) he->h_addr_list;

    int i;

    for (i = 0; addr_list[i] != NULL; i++){

      return addr_list[i]->s_addr;

    }

    exit_with_error("Couldn't resolve host to ip adressn");

    return 0;

  } else {

    exit_with_error("Couldn't resolve host to ip adressn");

    return 0;

  }

}

Makefile

LINK_TARGET = wgetX

OBJS = 

    wgetX.o 

    url.o

REBUILDABLES = $(OBJS) $(LINK_TARGET)

all : $(LINK_TARGET)

clean:

    rm -f $(REBUILDABLES)



$(LINK_TARGET) : $(OBJS)

    cc -g -o $@ $^



%.o : %.c

    cc -g  -Wall -o $@ -c $<



wgetX.o : wgetX.h url.h

url.o : url.h

Commands

make clean

make

./wgetX http://www.polytechnique.fr/

Output

I got the http reply message with the status code and all and just before "

asked Jan 3 at 16:04

aripy887

That's way too much code to wade through but I bet you aren't properly zero terminating a string somewhere.

– Shawn
Jan 3 at 16:36

1

Also, why not just use libcurl or the like if you want to talk to a http server?

– Shawn
Jan 3 at 16:38

I suppose it would be easier. This is for school so I have to use sockets this way. It's for learning purposes!

– aripy887
Jan 3 at 18:42

regarding: cc -g -Wall -o $@ -c $< strongly suggest: cc -g -Wall -Wextra -Wconversion -pedantic -std=gnu11 -o $@ -c $< This enables the main warning features. Which when applied to the posted code will result in several warning messages being output by the compiler. Those warnings need to be corrected

– user3629249
Jan 3 at 18:48

OT: regarding function: exit_with_error(), the statement: fprintf(stderr, "%sn", message); this does not tell the user why the error occurred. Suggest using perror() where approporiate.

– user3629249
Jan 3 at 18:51

|
show 9 more comments

I am learning network programming in C and tried to create to a toy version of wget.

However, when I run the program, I get the page with some trailing characters at the beginning and at the end (0 & f43 in this case).

The program contains two .c and two .h files.

One for parsing (naïvely) the address and the other to make the network request
and dump the data.

Here are the files for parsing the input:

url.h

#ifndef URL_H

#define URL_H



/* information of an URL*/

struct url_info

{

    char* url; //full url

    char* protocol; // protocol type: http, ftp, etc...

    char* host; // host name

    int port;   //port number

    char* path; //path

};

typedef struct url_info url_info;



static const char P_HTTP = "http";



void parse_url(char* url, url_info *info);



void exit_with_error(char* message);



void print_url_info(url_info info);



#endif //URL_H

url.c

#include<stdio.h>

#include<stdlib.h>

#include<string.h>

#include"url.h"





void parse_url(char* url, url_info *info)

{

    // url format: [http://]<hostname>[:<port>]/<path>



    char *full_url = malloc((strlen(url) + 1) * sizeof(char));

  char *protocol;

  char *path;

  char *host;

  int port;



  strcpy(full_url, url);

    info->url = full_url;



  char *protocol_token = strstr(url, "://");

  if (protocol_token){

    protocol = url;

    *protocol_token = '';

    url = protocol_token + 3;

  } else {

    protocol = "http";

  }

    info->protocol = protocol;



  char *port_token = strstr(url, ":");

  char *path_token = strstr(url, "/");



  if (port_token && port_token < path_token){

        port = atoi(port_token + 1);

        *port_token = '';

  } else {

    port = 80;

  }

    info->port = port;



  if (path_token){

    *path_token = '';

    host = url;

    path = path_token + 1;

        info->host = host;

        info->path = path;

  } else {

    exit_with_error("No trailing /.");

  }

}





void print_url_info(url_info info){

    printf("The URL contains following information: n");

    printf("Full url:t%sn", info.url);

    printf("Protocol type:t%sn", info.protocol);

    printf("Host name:t%sn", info.host);

    printf("Port No.:t%dn", info.port);

    printf("Path:tt%sn", info.path);

}





void exit_with_error(char *message)

{

    fprintf(stderr, "%sn", message);

    exit(EXIT_FAILURE);

}

Here are the files for making the request

wgetX.h

#ifndef WGETX_H_

#define WGETX_H_



#define B_SIZE 1024 * 5000



void write_data(const char *path, const char *data);



char* download_page(url_info info, char *buff);



char* http_get_request(char* path, char* host);



char* read_http_reply(char* recv_buf_t);



unsigned long ipfromhost(const char *host);



#endif

wgetX.c

 #include <sys/types.h>

 #include <sys/socket.h>

 #include <netinet/in.h>

 #include <arpa/inet.h>

 #include <unistd.h>

 #include <netdb.h>

 #include <stdio.h>

 #include <stdlib.h>

 #include <ctype.h>

 #include <string.h>



#include "url.h"

#include "wgetX.h"



int main(int argc, char* argv)

{



    url_info info;





    if (argc != 2) {

        exit_with_error("The wgetX must have exactly 1 parameter as input. n");

    }

    char *url = argv[1];

    parse_url(url, &info);



    char *buf;

    buf = malloc(sizeof(char)*B_SIZE);

    bzero(buf, B_SIZE);



    download_page(info, buf);

  printf("%s", buf);



    free(buf);

    return (EXIT_SUCCESS);

}



char* download_page(url_info info, char *buf)

{

    struct sockaddr_in dest;

    int len, sz, mysocket;

    char *request = http_get_request(info.path, info.host);



    mysocket = socket(AF_INET, SOCK_STREAM, 0);

    memset(&dest, 0, sizeof(dest));

    dest.sin_family = AF_INET;

    dest.sin_addr.s_addr = ipfromhost(info.host);

    dest.sin_port = htons(info.port);

    connect(mysocket, (struct sockaddr *)&dest, sizeof(struct sockaddr));

    send(mysocket, request, strlen(request), 0);



    len = 0;

    sz = 0;

    do {

        len = recv(mysocket, buf + sz, B_SIZE - sz, 0);

        if (len == -1) {continue;}

        sz += len;

    } while (len > 0);



    *(buf + sz) = '';



  close(mysocket);

    return buf;

}





char* http_get_request(char* path, char* host) {

    char * request_buffer = (char *) malloc(1024);

    memset(request_buffer, 0, sizeof(*request_buffer));

    snprintf(request_buffer, 1024, "GET /%s HTTP/1.1rnHost: %srnConnection: closernrn",

            path, host);

    return request_buffer;

}



unsigned long ipfromhost(const char *host){

  struct in_addr **addr_list;

  struct hostent *he;

  if ((he = gethostbyname(host)) != NULL){

    addr_list = (struct in_addr **) he->h_addr_list;

    int i;

    for (i = 0; addr_list[i] != NULL; i++){

      return addr_list[i]->s_addr;

    }

    exit_with_error("Couldn't resolve host to ip adressn");

    return 0;

  } else {

    exit_with_error("Couldn't resolve host to ip adressn");

    return 0;

  }

}

Makefile

LINK_TARGET = wgetX

OBJS = 

    wgetX.o 

    url.o

REBUILDABLES = $(OBJS) $(LINK_TARGET)

all : $(LINK_TARGET)

clean:

    rm -f $(REBUILDABLES)



$(LINK_TARGET) : $(OBJS)

    cc -g -o $@ $^



%.o : %.c

    cc -g  -Wall -o $@ -c $<



wgetX.o : wgetX.h url.h

url.o : url.h

Commands

make clean

make

./wgetX http://www.polytechnique.fr/

Output

I got the http reply message with the status code and all and just before "

asked Jan 3 at 16:04

aripy887

I am learning network programming in C and tried to create to a toy version of wget.

However, when I run the program, I get the page with some trailing characters at the beginning and at the end (0 & f43 in this case).

The program contains two .c and two .h files.

One for parsing (naïvely) the address and the other to make the network request
and dump the data.

Here are the files for parsing the input:

url.h

#ifndef URL_H

#define URL_H



/* information of an URL*/

struct url_info

{

    char* url; //full url

    char* protocol; // protocol type: http, ftp, etc...

    char* host; // host name

    int port;   //port number

    char* path; //path

};

typedef struct url_info url_info;



static const char P_HTTP = "http";



void parse_url(char* url, url_info *info);



void exit_with_error(char* message);



void print_url_info(url_info info);



#endif //URL_H

url.c

#include<stdio.h>

#include<stdlib.h>

#include<string.h>

#include"url.h"





void parse_url(char* url, url_info *info)

{

    // url format: [http://]<hostname>[:<port>]/<path>



    char *full_url = malloc((strlen(url) + 1) * sizeof(char));

  char *protocol;

  char *path;

  char *host;

  int port;



  strcpy(full_url, url);

    info->url = full_url;



  char *protocol_token = strstr(url, "://");

  if (protocol_token){

    protocol = url;

    *protocol_token = '';

    url = protocol_token + 3;

  } else {

    protocol = "http";

  }

    info->protocol = protocol;



  char *port_token = strstr(url, ":");

  char *path_token = strstr(url, "/");



  if (port_token && port_token < path_token){

        port = atoi(port_token + 1);

        *port_token = '';

  } else {

    port = 80;

  }

    info->port = port;



  if (path_token){

    *path_token = '';

    host = url;

    path = path_token + 1;

        info->host = host;

        info->path = path;

  } else {

    exit_with_error("No trailing /.");

  }

}





void print_url_info(url_info info){

    printf("The URL contains following information: n");

    printf("Full url:t%sn", info.url);

    printf("Protocol type:t%sn", info.protocol);

    printf("Host name:t%sn", info.host);

    printf("Port No.:t%dn", info.port);

    printf("Path:tt%sn", info.path);

}





void exit_with_error(char *message)

{

    fprintf(stderr, "%sn", message);

    exit(EXIT_FAILURE);

}

Here are the files for making the request

wgetX.h

#ifndef WGETX_H_

#define WGETX_H_



#define B_SIZE 1024 * 5000



void write_data(const char *path, const char *data);



char* download_page(url_info info, char *buff);



char* http_get_request(char* path, char* host);



char* read_http_reply(char* recv_buf_t);



unsigned long ipfromhost(const char *host);



#endif

wgetX.c

 #include <sys/types.h>

 #include <sys/socket.h>

 #include <netinet/in.h>

 #include <arpa/inet.h>

 #include <unistd.h>

 #include <netdb.h>

 #include <stdio.h>

 #include <stdlib.h>

 #include <ctype.h>

 #include <string.h>



#include "url.h"

#include "wgetX.h"



int main(int argc, char* argv)

{



    url_info info;





    if (argc != 2) {

        exit_with_error("The wgetX must have exactly 1 parameter as input. n");

    }

    char *url = argv[1];

    parse_url(url, &info);



    char *buf;

    buf = malloc(sizeof(char)*B_SIZE);

    bzero(buf, B_SIZE);



    download_page(info, buf);

  printf("%s", buf);



    free(buf);

    return (EXIT_SUCCESS);

}



char* download_page(url_info info, char *buf)

{

    struct sockaddr_in dest;

    int len, sz, mysocket;

    char *request = http_get_request(info.path, info.host);



    mysocket = socket(AF_INET, SOCK_STREAM, 0);

    memset(&dest, 0, sizeof(dest));

    dest.sin_family = AF_INET;

    dest.sin_addr.s_addr = ipfromhost(info.host);

    dest.sin_port = htons(info.port);

    connect(mysocket, (struct sockaddr *)&dest, sizeof(struct sockaddr));

    send(mysocket, request, strlen(request), 0);



    len = 0;

    sz = 0;

    do {

        len = recv(mysocket, buf + sz, B_SIZE - sz, 0);

        if (len == -1) {continue;}

        sz += len;

    } while (len > 0);



    *(buf + sz) = '';



  close(mysocket);

    return buf;

}





char* http_get_request(char* path, char* host) {

    char * request_buffer = (char *) malloc(1024);

    memset(request_buffer, 0, sizeof(*request_buffer));

    snprintf(request_buffer, 1024, "GET /%s HTTP/1.1rnHost: %srnConnection: closernrn",

            path, host);

    return request_buffer;

}



unsigned long ipfromhost(const char *host){

  struct in_addr **addr_list;

  struct hostent *he;

  if ((he = gethostbyname(host)) != NULL){

    addr_list = (struct in_addr **) he->h_addr_list;

    int i;

    for (i = 0; addr_list[i] != NULL; i++){

      return addr_list[i]->s_addr;

    }

    exit_with_error("Couldn't resolve host to ip adressn");

    return 0;

  } else {

    exit_with_error("Couldn't resolve host to ip adressn");

    return 0;

  }

}

Makefile

LINK_TARGET = wgetX

OBJS = 

    wgetX.o 

    url.o

REBUILDABLES = $(OBJS) $(LINK_TARGET)

all : $(LINK_TARGET)

clean:

    rm -f $(REBUILDABLES)



$(LINK_TARGET) : $(OBJS)

    cc -g -o $@ $^



%.o : %.c

    cc -g  -Wall -o $@ -c $<



wgetX.o : wgetX.h url.h

url.o : url.h

Commands

make clean

make

./wgetX http://www.polytechnique.fr/

Output

I got the http reply message with the status code and all and just before "

c sockets http

asked Jan 3 at 16:04

aripy887

asked Jan 3 at 16:04

aripy887

asked Jan 3 at 16:04

aripy887

asked Jan 3 at 16:04

aripy887

asked Jan 3 at 16:04

aripy887

That's way too much code to wade through but I bet you aren't properly zero terminating a string somewhere.

– Shawn
Jan 3 at 16:36

1

Also, why not just use libcurl or the like if you want to talk to a http server?

– Shawn
Jan 3 at 16:38

I suppose it would be easier. This is for school so I have to use sockets this way. It's for learning purposes!

– aripy887
Jan 3 at 18:42

regarding: cc -g -Wall -o $@ -c $< strongly suggest: cc -g -Wall -Wextra -Wconversion -pedantic -std=gnu11 -o $@ -c $< This enables the main warning features. Which when applied to the posted code will result in several warning messages being output by the compiler. Those warnings need to be corrected

– user3629249
Jan 3 at 18:48

OT: regarding function: exit_with_error(), the statement: fprintf(stderr, "%sn", message); this does not tell the user why the error occurred. Suggest using perror() where approporiate.

– user3629249
Jan 3 at 18:51

|
show 9 more comments

That's way too much code to wade through but I bet you aren't properly zero terminating a string somewhere.

– Shawn
Jan 3 at 16:36

1

Also, why not just use libcurl or the like if you want to talk to a http server?

– Shawn
Jan 3 at 16:38

I suppose it would be easier. This is for school so I have to use sockets this way. It's for learning purposes!

– aripy887
Jan 3 at 18:42

regarding: cc -g -Wall -o $@ -c $< strongly suggest: cc -g -Wall -Wextra -Wconversion -pedantic -std=gnu11 -o $@ -c $< This enables the main warning features. Which when applied to the posted code will result in several warning messages being output by the compiler. Those warnings need to be corrected

– user3629249
Jan 3 at 18:48

OT: regarding function: exit_with_error(), the statement: fprintf(stderr, "%sn", message); this does not tell the user why the error occurred. Suggest using perror() where approporiate.

– user3629249
Jan 3 at 18:51

That's way too much code to wade through but I bet you aren't properly zero terminating a string somewhere.

– Shawn
Jan 3 at 16:36

Also, why not just use libcurl or the like if you want to talk to a http server?

– Shawn
Jan 3 at 16:38

I suppose it would be easier. This is for school so I have to use sockets this way. It's for learning purposes!

– aripy887
Jan 3 at 18:42

regarding: cc -g -Wall -o $@ -c $< strongly suggest: cc -g -Wall -Wextra -Wconversion -pedantic -std=gnu11 -o $@ -c $< This enables the main warning features. Which when applied to the posted code will result in several warning messages being output by the compiler. Those warnings need to be corrected

– user3629249
Jan 3 at 18:48

OT: regarding function: exit_with_error(), the statement: fprintf(stderr, "%sn", message); this does not tell the user why the error occurred. Suggest using perror() where approporiate.

– user3629249
Jan 3 at 18:51

|
show 9 more comments

1 Answer
1

active

oldest

votes

I get garbage characters: a zero at the end and "f43" just before the start of the html

Welcome to the wonderful world of HTTP. Please note that HTTP is not a trivial protocol even though it might look like this. It should say something that the HTTP/1.1 standard as initially published in RFC 2616 has 176 pages text.

What you likely see here is chunked transfer encoding of the content. In this encoding the content is not transferred as one single piece but in several chunks, each prefixed by the length (in hex). I.e. something like this:

 HTTP/1.1 200 ok

 Transfer-Encoding: chunked



 a

 0123456789

 12

 These are 18 bytes

 0

In your specific case the initial f43 "just before the start of the html" is the length of the following chunk (f43 in hex of 3907 in decimal) and the "zero at the end" is the length of the final chunk (0).

For more on this see section 3.6.1 in RFC 2616 or section 4.1 in RFC 7230.

answered Jan 3 at 17:09

Steffen Ullrich

62.5k360102

Thank you! Can I force that the transfer-encoding not be chunked?

– aripy887
Jan 3 at 18:55

@aripy887: As long as you claim to support HTTP/1.1 you must support chunked encoding. If you instead only use HTTP/1.0 in your request then the server cannot use chunked encoding since this is only defined with HTTP/1.1.

– Steffen Ullrich
Jan 3 at 18:57

add a comment |

StackExchange.ifUsing("editor", function () {
StackExchange.using("externalEditor", function () {
StackExchange.using("snippets", function () {
StackExchange.snippets.init();
});
});
}, "code-snippets");

StackExchange.ready(function() {
var channelOptions = {
tags: "".split(" "),
id: "1"
};
initTagRenderer("".split(" "), "".split(" "), channelOptions);

StackExchange.using("externalEditor", function() {
// Have to fire editor after snippets, if snippets enabled
if (StackExchange.settings.snippets.snippetsEnabled) {
StackExchange.using("snippets", function() {
createEditor();
});
}
else {
createEditor();
}
});

function createEditor() {
StackExchange.prepareEditor({
heartbeatType: 'answer',
autoActivateHeartbeat: false,
convertImagesToLinks: true,
noModals: true,
showLowRepImageUploadWarning: true,
reputationToPostImages: 10,
bindNavPrevention: true,
postfix: "",
imageUploader: {
brandingHtml: "Powered by u003ca class="icon-imgur-white" href="https://imgur.com/"u003eu003c/au003e",
contentPolicyHtml: "User contributions licensed under u003ca href="https://creativecommons.org/licenses/by-sa/3.0/"u003ecc by-sa 3.0 with attribution requiredu003c/au003e u003ca href="https://stackoverflow.com/legal/content-policy"u003e(content policy)u003c/au003e",
allowUrls: true
},
onDemand: true,
discardSelector: ".discard-answer"
,immediatelyShowMarkdownHelp:true
});

}
});

draft saved

draft discarded

Sign up or log in

StackExchange.ready(function () {
StackExchange.helpers.onClickDraftSave('#login-link');
});

Post as a guest

Name

Required, but never shown

StackExchange.ready(
function () {
StackExchange.openid.initPostLogin('.new-post-login', 'https%3a%2f%2fstackoverflow.com%2fquestions%2f54025860%2fhttp-socket-request-returning-trailling-characters%23new-answer', 'question_page');
}
);

Post as a guest

Name

Required, but never shown

1 Answer
1

active

oldest

votes

1 Answer
1

active

oldest

votes

I get garbage characters: a zero at the end and "f43" just before the start of the html

 HTTP/1.1 200 ok

 Transfer-Encoding: chunked



 a

 0123456789

 12

 These are 18 bytes

 0

For more on this see section 3.6.1 in RFC 2616 or section 4.1 in RFC 7230.

answered Jan 3 at 17:09

Steffen Ullrich

62.5k360102

Thank you! Can I force that the transfer-encoding not be chunked?

– aripy887
Jan 3 at 18:55

@aripy887: As long as you claim to support HTTP/1.1 you must support chunked encoding. If you instead only use HTTP/1.0 in your request then the server cannot use chunked encoding since this is only defined with HTTP/1.1.

– Steffen Ullrich
Jan 3 at 18:57

add a comment |

I get garbage characters: a zero at the end and "f43" just before the start of the html

 HTTP/1.1 200 ok

 Transfer-Encoding: chunked



 a

 0123456789

 12

 These are 18 bytes

 0

For more on this see section 3.6.1 in RFC 2616 or section 4.1 in RFC 7230.

answered Jan 3 at 17:09

Steffen Ullrich

62.5k360102

Thank you! Can I force that the transfer-encoding not be chunked?

– aripy887
Jan 3 at 18:55

@aripy887: As long as you claim to support HTTP/1.1 you must support chunked encoding. If you instead only use HTTP/1.0 in your request then the server cannot use chunked encoding since this is only defined with HTTP/1.1.

– Steffen Ullrich
Jan 3 at 18:57

add a comment |

I get garbage characters: a zero at the end and "f43" just before the start of the html

 HTTP/1.1 200 ok

 Transfer-Encoding: chunked



 a

 0123456789

 12

 These are 18 bytes

 0

For more on this see section 3.6.1 in RFC 2616 or section 4.1 in RFC 7230.

answered Jan 3 at 17:09

Steffen Ullrich

62.5k360102

I get garbage characters: a zero at the end and "f43" just before the start of the html

 HTTP/1.1 200 ok

 Transfer-Encoding: chunked



 a

 0123456789

 12

 These are 18 bytes

 0

For more on this see section 3.6.1 in RFC 2616 or section 4.1 in RFC 7230.

answered Jan 3 at 17:09

Steffen Ullrich

62.5k360102

answered Jan 3 at 17:09

Steffen Ullrich

62.5k360102

answered Jan 3 at 17:09

Steffen Ullrich

62.5k360102

answered Jan 3 at 17:09

Steffen Ullrich

62.5k360102

Thank you! Can I force that the transfer-encoding not be chunked?

– aripy887
Jan 3 at 18:55

@aripy887: As long as you claim to support HTTP/1.1 you must support chunked encoding. If you instead only use HTTP/1.0 in your request then the server cannot use chunked encoding since this is only defined with HTTP/1.1.

– Steffen Ullrich
Jan 3 at 18:57

add a comment |

Thank you! Can I force that the transfer-encoding not be chunked?

– aripy887
Jan 3 at 18:55

@aripy887: As long as you claim to support HTTP/1.1 you must support chunked encoding. If you instead only use HTTP/1.0 in your request then the server cannot use chunked encoding since this is only defined with HTTP/1.1.

– Steffen Ullrich
Jan 3 at 18:57

Thank you! Can I force that the transfer-encoding not be chunked?

– aripy887
Jan 3 at 18:55

@aripy887: As long as you claim to support HTTP/1.1 you must support chunked encoding. If you instead only use HTTP/1.0 in your request then the server cannot use chunked encoding since this is only defined with HTTP/1.1.

– Steffen Ullrich
Jan 3 at 18:57

add a comment |

draft saved

draft discarded

Thanks for contributing an answer to Stack Overflow!

Please be sure to answer the question. Provide details and share your research!

But avoid …

Asking for help, clarification, or responding to other answers.

Making statements based on opinion; back them up with references or personal experience.

To learn more, see our tips on writing great answers.

draft saved

draft discarded

Sign up or log in

StackExchange.ready(function () {
StackExchange.helpers.onClickDraftSave('#login-link');
});

Post as a guest

Name

Required, but never shown

Post as a guest

Name

Required, but never shown

Sign up or log in

StackExchange.ready(function () {
StackExchange.helpers.onClickDraftSave('#login-link');
});

Post as a guest

Name

Required, but never shown

Sign up or log in

StackExchange.ready(function () {
StackExchange.helpers.onClickDraftSave('#login-link');
});

Post as a guest

Name

Required, but never shown

Sign up or log in

StackExchange.ready(function () {
StackExchange.helpers.onClickDraftSave('#login-link');
});

Post as a guest

Name

Required, but never shown

Name

Required, but never shown

Name

Required, but never shown

This page is only for reference, If you need detailed information, please check here

搜尋此網誌

Bdtjtk