/* See COPYING file for copyright, license and warranty details. */
/* Release tag; spliced into the usage banner below. */
#define VERSION "prealpha"
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include "util.c"
/* Help text handed to die() by main() when the arguments are malformed.
 * NOTE(review): the text advertises -p/-a and reading pages from stdin;
 * main() in this file only validates the flag and prints the book id. */
#define usage "getgbook " VERSION " - a google books downloader\n" \
"usage: getgbook [-p|-a] isbn\n" \
" -p print all available pages\n" \
" -a download all available pages\n" \
" otherwise, all pages in stdin will be downloaded\n"
/* Host serving the book data.
 * NOTE(review): getbookid() and getpageurl() pass the same host as a string
 * literal instead of using this macro. */
#define hostname "books.google.com"
/* Size in bytes of the stack buffers used to build request paths. */
#define URLMAX 1024
/* Number of characters copied from the feed as the book id (terminator not
 * included). */
#define BOOKID_LEN 12
/* Pairs a human-readable page category with the two-letter code prefix
 * associated with it. */
typedef struct {
	char *name;	/* category label, e.g. "cover" */
	char *code;	/* two-letter code, e.g. "PP" */
} pgtype;

/* Known page categories.
 * NOTE(review): "postface" carries the same code as "page" ("PA") - confirm
 * this is intended. */
pgtype pgtypes[] = {
	{ .name = "cover",    .code = "PP" },
	{ .name = "preface",  .code = "PR" },
	{ .name = "page",     .code = "PA" },
	{ .name = "postface", .code = "PA" },
};
/*
 * Look up the Google Books volume id for an ISBN.
 *
 * Requests the volumes feed for "isbn:<isbn>" from books.google.com through
 * get() and copies up to BOOKID_LEN characters that follow the first
 * "<dc:identifier>" tag of the response.
 *
 * Returns a newly allocated, NUL-terminated string which the caller must
 * free(), or NULL when isbn is NULL, the request path does not fit in
 * URLMAX bytes, the request fails, the tag is absent, or allocation fails.
 */
char *getbookid(char *isbn)
{
	static const char tag[] = "<dc:identifier>";
	char url[URLMAX];
	char *buf, *bookid, *c;
	size_t len;
	int n;

	if(isbn == NULL)
		return NULL;

	/* NOTE: new api returns json, and looks like this:
	 * http://www.googleapis.com/books/v1/volumes?q=isbn:1589235126
	 * (this needs https, which we don't yet support) */
	n = snprintf(url, URLMAX, "/books/feeds/volumes?q=isbn:%s", isbn);
	if(n < 0 || n >= URLMAX)
		return NULL;	/* refuse to send a silently truncated query */

	if((buf = get("books.google.com", url)) == NULL)
		return NULL;

	bookid = NULL;
	if((c = strstr(buf, tag)) != NULL) {
		c += sizeof(tag) - 1;
		/* take at most BOOKID_LEN chars, never reading past the
		 * end of a short response */
		for(len = 0; len < (size_t)BOOKID_LEN && c[len] != '\0'; len++)
			;
		if((bookid = malloc((size_t)BOOKID_LEN + 1)) != NULL) {
			memcpy(bookid, c, len);
			bookid[len] = '\0';
		}
	}

	/* the response buffer is released on every path past get() */
	free(buf);
	return bookid;
}
/*
 * Find the image URL for one page of a book.
 *
 * Requests "/books?id=<bookid>&pg=<pg>&jscmd=click3" from books.google.com
 * through get(), locates the marker "pid":"<pg>" in the response and
 * expects it to be followed by one separator character and then "src":".
 * Everything from there up to the next double quote (or the end of the
 * response) is returned.
 *
 * Returns a newly allocated, NUL-terminated string which the caller must
 * free(), or NULL when an argument is NULL, the request path or the marker
 * does not fit its buffer, the request fails, the marker/"src" sequence is
 * not present, or allocation fails.
 */
char *getpageurl(char *bookid, char *pg)
{
	static const char srckey[] = "\"src\":\"";
	char url[URLMAX];
	char *buf, *c, *start, *end, m[80], *pageurl;
	size_t l;
	int n;

	if(bookid == NULL || pg == NULL)
		return NULL;

	n = snprintf(url, URLMAX, "/books?id=%s&pg=%s&jscmd=click3", bookid, pg);
	if(n < 0 || n >= URLMAX)
		return NULL;
	n = snprintf(m, sizeof(m), "\"pid\":\"%s\"", pg);
	if(n < 0 || (size_t)n >= sizeof(m))
		return NULL;	/* a truncated marker could match the wrong page */

	if((buf = get("books.google.com", url)) == NULL)
		return NULL;

	pageurl = NULL;
	if((c = strstr(buf, m)) == NULL)
		goto out;
	c += n;	/* n == strlen(m): step past the marker */

	/* One separator character, then "src":" - checked in full so the
	 * scan below never begins beyond the string terminator. */
	if(*c == '\0' || strncmp(c + 1, srckey, sizeof(srckey) - 1) != 0)
		goto out;
	start = c + 1 + (sizeof(srckey) - 1);

	for(end = start; *end && *end != '"'; end++)
		;
	l = (size_t)(end - start);

	/* +1 for the terminator; also keeps an empty URL in bounds */
	if((pageurl = malloc(l + 1)) == NULL)
		goto out;
	memcpy(pageurl, start, l);
	pageurl[l] = '\0';

out:
	/* the response buffer is released on every path past get() */
	free(buf);
	return pageurl;
}
/*
 * Entry point: getgbook [-p|-a] isbn
 *
 * Resolves the ISBN to a book id and prints it. When no option is given,
 * additionally looks up and prints the URL of page "PA2". With -p or -a
 * only the book id is printed; the flag is validated but not acted upon.
 *
 * Malformed arguments and a failed lookup are reported through die()
 * (defined outside this file; presumably it terminates the program -
 * confirm). Returns EXIT_SUCCESS otherwise.
 */
int main(int argc, char *argv[])
{
	/* url starts as NULL so the final free() is well-defined on the
	 * option path, where no page URL is ever fetched */
	char *bookid, *url = NULL, pg[12];
	char *isbn;
	int hasopt;

	if(argc < 2 || argc > 3)
		die(usage);

	hasopt = argv[1][0] == '-';
	if(hasopt && ((argv[1][1] != 'p' && argv[1][1] != 'a') || argc < 3))
		die(usage);
	isbn = hasopt ? argv[2] : argv[1];

	if((bookid = getbookid(isbn)) == NULL)
		die("Could not find book\n");
	printf("bookid is %s\n", bookid);

	if(!hasopt) {
		snprintf(pg, sizeof(pg), "%s", "PA2");
		if((url = getpageurl(bookid, pg)) != NULL)
			printf("page %s url is %s\n", pg, url);
		else
			fprintf(stderr, "Could not find page %s\n", pg);
	}

	free(bookid);
	free(url);
	return EXIT_SUCCESS;
}
|