summaryrefslogtreecommitdiff
path: root/getgbook.c
blob: ae479937ac056f1d0413a5b835e376751ca1dc4f (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
/* See COPYING file for copyright, license and warranty details. */

#define VERSION "prealpha"

#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include "util.c"

/* Usage text passed to die() when the command line is invalid.
 * NOTE(review): the last line advertises reading pages from stdin, but the
 * main() in this file does not read stdin - confirm whether that is still
 * planned or the text should change. */
#define usage "getgbook " VERSION " - a google books downloader\n" \
              "usage: getgbook [-p|-a] isbn\n" \
              "  -p print all available pages\n" \
              "  -a download all available pages\n" \
              "  otherwise, all pages in stdin will be downloaded\n"

/* Host that serves the book data.
 * NOTE(review): the functions in this file pass the literal
 * "books.google.com" to get() rather than this macro. */
#define hostname "books.google.com"

/* Size of the stack buffers used to build request paths. */
#define URLMAX 1024
/* Number of characters copied out of the feed as the book id. */
#define BOOKID_LEN 12

typedef struct {
	char *name;
	char *code;
} pgtype;

/* Table of known page categories and their codes.
 * Presumably the codes are the prefixes of page ids such as "PA2" - TODO
 * confirm; nothing visible in this file reads the table yet.
 * NOTE(review): "postface" carries the same code as "page" ("PA"); verify
 * whether that is intended or a copy-paste slip. */
pgtype pgtypes[] = {
	{"cover", "PP"},
	{"preface", "PR"},
	{"page", "PA"},
	{"postface", "PA"},
};

/* Look up the book id for an ISBN.
 *
 * Requests the volumes feed for "isbn:<isbn>" from books.google.com and
 * copies up to BOOKID_LEN characters that follow the first
 * "<dc:identifier>" tag found in the response.
 *
 * isbn: ISBN string, inserted verbatim into the request path.
 *
 * Returns a newly allocated, NUL-terminated string that the caller must
 * free(), or NULL if the request failed, the tag was not present in the
 * response, or memory could not be allocated. */
char *getbookid(char *isbn)
{
	static const char tag[] = "<dc:identifier>";
	char url[URLMAX];
	char *buf, *bookid, *c;

	/* NOTE: new api returns json, and looks like this:
	 * http://www.googleapis.com/books/v1/volumes?q=isbn:1589235126
	 * (this needs https, which we don't yet support) */

	snprintf(url, URLMAX, "/books/feeds/volumes?q=isbn:%s", isbn);

	/* fetch first, so that nothing is allocated yet if the request fails */
	if((buf = get("books.google.com", url)) == NULL)
		return NULL;

	bookid = NULL;
	/* BOOKID_LEN characters plus one byte for the terminator */
	if((c = strstr(buf, tag)) != NULL &&
	   (bookid = malloc(BOOKID_LEN + 1)) != NULL) {
		/* strncpy stops at a NUL in buf and zero-pads the rest; the
		 * explicit terminator covers the full-length case */
		strncpy(bookid, c + sizeof(tag) - 1, BOOKID_LEN);
		bookid[BOOKID_LEN] = '\0';
	}
	/* the response buffer is released on every path past the fetch */
	free(buf);

	return bookid;
}

/* Find the image URL of a single page of a book.
 *
 * Requests "/books?id=<bookid>&pg=<pg>&jscmd=click3" from
 * books.google.com and searches the response for the entry
 *     "pid":"<pg>"
 * which must be followed, one character later, by "src" and then, at
 * offset 8 from the end of the pid entry, by the URL text running up to
 * the next double quote (i.e. the shape  "pid":"<pg>","src":"<url>" ).
 *
 * bookid: book id, inserted verbatim into the request path.
 * pg:     page id, e.g. "PA2".
 *
 * Returns a newly allocated, NUL-terminated copy of the URL that the
 * caller must free(), or NULL if the request failed, the page entry or
 * its src field was not found, or memory could not be allocated. */
char *getpageurl(char *bookid, char *pg)
{
	char url[URLMAX];
	size_t l;
	char *buf, *c, *d, m[80], *pageurl;

	snprintf(url, URLMAX, "/books?id=%s&pg=%s&jscmd=click3", bookid, pg);

	if((buf = get("books.google.com", url)) == NULL)
		return NULL;

	pageurl = NULL;

	snprintf(m, sizeof(m), "\"pid\":\"%s\"", pg);
	if((c = strstr(buf, m)) == NULL)
		goto out;
	c += strlen(m); /* c now points just past the pid entry */

	/* Every byte up to the start of the URL (c+8) must exist before it is
	 * read; the checks are ordered so that none of them looks past the
	 * terminating NUL of a truncated response. */
	if(c[0] == '\0' || strncmp(c+1, "\"src\"", 5) != 0 ||
	   c[6] == '\0' || c[7] == '\0')
		goto out;
	c += 8; /* skip ,"src":" */

	/* the URL runs up to the closing quote (or the end of the buffer) */
	for(d = c; *d && *d != '"'; d++);
	l = d - c;

	/* one extra byte for the terminator, so an empty URL is safe too */
	if((pageurl = malloc(l + 1)) != NULL) {
		memcpy(pageurl, c, l);
		pageurl[l] = '\0';
	}

out:
	/* the response buffer is released on every path past the fetch */
	free(buf);

	return pageurl;
}

/* Entry point: getgbook [-p|-a] isbn
 *
 * With -p or -a the book id for the given ISBN is looked up and printed.
 * Without an option the book id is looked up and printed, and then the
 * URL of page "PA2" is looked up and printed; if that page cannot be
 * found a message is written to stderr instead.
 *
 * Invalid command lines and failed book lookups are reported through
 * die() (from util.c, presumably terminating the program - confirm).
 * Otherwise returns EXIT_SUCCESS, including when the page URL could not
 * be found. */
int main(int argc, char *argv[])
{
	/* url starts out NULL because the option branch never assigns it,
	 * yet it is freed unconditionally at the end */
	char *bookid, *url = NULL, pg[12];

	if(argc < 2 || argc > 3)
		die(usage);

	if(argv[1][0] == '-') {
		if((argv[1][1] != 'p' && argv[1][1] != 'a') || argc < 3)
			die(usage);

		if((bookid = getbookid(argv[2])) == NULL)
			die("Could not find book\n");
		printf("bookid is %s\n", bookid);
	} else {
		if((bookid = getbookid(argv[1])) == NULL)
			die("Could not find book\n");
		printf("bookid is %s\n", bookid);

		strncpy(pg, "PA2", sizeof(pg));
		if((url = getpageurl(bookid, pg)) != NULL)
			printf("page %s url is %s\n", pg, url);
		else
			fprintf(stderr, "Could not find page %s\n", pg);
	}

	free(bookid);
	free(url); /* free(NULL) is a no-op */
	return EXIT_SUCCESS;
}