/*
 * getgbook.c - request one page of a Google Books volume over plain HTTP
 * and print the response body to stdout.
 *
 * Recovered from the patch that created this file:
 *   commit d2be24f0b636d93e1873e27207e841150e9f54bf
 *   From: Nick White
 *   Date: Fri, 15 Jul 2011 22:30:48 +0100
 *   Subject: Basic http working
 *   (cgit v1.2.3 export; 1 file changed, 100 insertions)
 */

/* Expose the POSIX API (getaddrinfo, fdopen, fileno) in strict ISO C modes. */
#ifndef _POSIX_C_SOURCE
#define _POSIX_C_SOURCE 200809L
#endif

#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <unistd.h>
#include <netdb.h>
#include <sys/types.h>
#include <sys/socket.h>

/*
 * Defined after the includes so these lowercase macro names cannot rewrite
 * identifiers that happen to appear inside system headers.
 */
#define usage "getgbook bookid"

#define hostname "books.google.com"

/* Number of bytes the response buffer starts with; it doubles when full. */
enum { CHUNK = 4096 };

/*
 * Print msg to stderr and terminate the process with EXIT_FAILURE.
 * Never returns.
 */
void die(const char *msg)
{
	fputs(msg, stderr);
	exit(EXIT_FAILURE);
}

/*
 * Open a TCP connection to host:port.
 *
 * Every address returned by getaddrinfo() is tried in order until one
 * connect() succeeds.  Returns the connected socket descriptor; the caller
 * owns it.  Calls die() if the name cannot be resolved or no address
 * accepts the connection, so this function only returns on success.
 */
int dial(const char *host, const char *port)
{
	struct addrinfo hints;
	struct addrinfo *res, *r;
	int srv = -1;

	memset(&hints, 0, sizeof hints);
	hints.ai_family = AF_UNSPEC;
	hints.ai_socktype = SOCK_STREAM;
	if (getaddrinfo(host, port, &hints, &res) != 0) {
		die("error: cannot resolve hostname\n");
	}

	for (r = res; r; r = r->ai_next) {
		srv = socket(r->ai_family, r->ai_socktype, r->ai_protocol);
		if (srv == -1) {
			continue;
		}
		if (connect(srv, r->ai_addr, r->ai_addrlen) == 0) {
			break;
		}
		close(srv);
		srv = -1;
	}
	freeaddrinfo(res);

	if (!r) {
		die("error: cannot connect to host\n");
	}
	return srv;
}

/*
 * Send "GET path HTTP/1.0" for host on srv and return the response body.
 *
 * The whole response is read from the descriptor underlying srv until EOF.
 * The body (everything after the first blank line) is returned in a freshly
 * malloc'd buffer that the caller must free().  The buffer is always
 * NUL-terminated so it can be handed to string functions; a body that itself
 * contains NUL bytes will appear truncated to such functions.
 *
 * Returns NULL if the request cannot be sent, a read or allocation fails,
 * the status code is not 200, or the header terminator is missing.
 */
char *get(FILE *srv, const char *host, const char *path)
{
	static const char hdr_end[] = "\r\n\r\n";
	const size_t hdr_end_len = sizeof hdr_end - 1;
	size_t len = 0, cap = CHUNK, off, bodylen;
	ssize_t n;
	int fd;
	char *buf, *tmp, *body;

	if (fprintf(srv, "GET %s HTTP/1.0\r\nUser-Agent: getgbook-prealpha (not mozilla)\r\nHost: %s\r\n\r\n", path, host) < 0) {
		return NULL;
	}
	/* The reply is read with read(2), so the request must leave stdio first. */
	if (fflush(srv) == EOF) {
		return NULL;
	}

	fd = fileno(srv);
	buf = malloc(cap);
	if (!buf) {
		return NULL;
	}

	/* read() returns ssize_t: -1 must be seen as an error, not a huge count. */
	while ((n = read(fd, buf + len, cap - len)) > 0) {
		len += (size_t)n;
		if (len == cap) {
			if (cap > SIZE_MAX / 2) {
				free(buf);
				return NULL;
			}
			cap *= 2;
			tmp = realloc(buf, cap);
			if (!tmp) {
				free(buf);
				return NULL;
			}
			buf = tmp;
		}
	}
	if (n < 0) {
		free(buf);
		return NULL;
	}

	/* Status line is "HTTP/x.y NNN ...": the code starts at offset 9. */
	if (len < 13 || memcmp(buf + 9, "200 ", 4) != 0) {
		free(buf);
		return NULL;
	}

	/* Locate the blank line ending the header, bounded by the bytes read. */
	for (off = 0; off + hdr_end_len <= len; off++) {
		if (memcmp(buf + off, hdr_end, hdr_end_len) == 0) {
			break;
		}
	}
	if (off + hdr_end_len > len) {
		free(buf);
		return NULL;
	}
	off += hdr_end_len;

	bodylen = len - off;
	body = malloc(bodylen + 1);
	if (body) {
		memcpy(body, buf + off, bodylen);
		body[bodylen] = '\0';
	}
	free(buf);

	return body;
}

/*
 * Usage: getgbook bookid
 *
 * Requests /books?id=<bookid>&pg=PA1&jscmd=click3 from books.google.com on
 * port 80 and writes the response body to stdout.  Exits with EXIT_FAILURE
 * on bad usage, an over-long bookid, or any connection/download error.
 */
int main(int argc, char *argv[])
{
	char url[80];
	char *bookid, *curpage;
	FILE *srv;
	int fd, n;
	int rc = EXIT_FAILURE;

	if (argc != 2) {
		die("usage: " usage "\n");
	}
	bookid = argv[1];

	/* Refuse a silently truncated URL rather than request the wrong book. */
	n = snprintf(url, sizeof url, "/books?id=%s&pg=%s&jscmd=click3", bookid, "PA1");
	if (n < 0 || (size_t)n >= sizeof url) {
		die("error: bookid too long\n");
	}

	fd = dial(hostname, "80");
	srv = fdopen(fd, "r+");
	if (!srv) {
		close(fd);
		die("error: cannot open stream on socket\n");
	}

	curpage = get(srv, hostname, url);
	if (curpage == NULL) {
		fprintf(stderr, "Error downloading page\n");
	} else {
		fputs(curpage, stdout);
		free(curpage);
		rc = EXIT_SUCCESS;
	}

	fclose(srv);
	return rc;
}