summaryrefslogtreecommitdiff
path: root/strap.c
diff options
context:
space:
mode:
Diffstat (limited to 'strap.c')
-rw-r--r--strap.c144
1 files changed, 144 insertions, 0 deletions
diff --git a/strap.c b/strap.c
new file mode 100644
index 0000000..eb456c1
--- /dev/null
+++ b/strap.c
@@ -0,0 +1,144 @@
+#include <stdbool.h>
+#include <locale.h>
+#ifdef HAVE_LANGINFO_H
+#include <langinfo.h>
+#endif
+#include <tidy.h>
+#include <tidybuffio.h>
+#include "icclient.h"
+
+extern char *image_dir;
+static locale_t loc = 0;
+
+static void recurse(TidyDoc doc, TidyNode tnod, struct icclient_catalog **catalog, char **category,
+ bool is_sku, bool is_category, bool is_price)
+{
+ struct icclient_product *product;
+ for (TidyNode child = tidyGetChild(tnod); child; child = tidyGetNext(child)) {
+ ctmbstr name = tidyNodeGetName(child);
+ if (name) {
+ if (!strcmp(name, "html")) {
+ char locale[11];
+ for (TidyAttr attr = tidyAttrFirst(child); attr; attr = tidyAttrNext(attr)) {
+ if (!strcmp(tidyAttrValue(attr), "en"))
+ strcpy(locale, "en_US.utf8");
+ else if (!strcmp(tidyAttrValue(attr), "id"))
+ strcpy(locale, "id_ID.utf8");
+ loc = newlocale(LC_MONETARY_MASK | LC_NUMERIC_MASK, locale, 0);
+ }
+ } else if (!strcmp(name, "h3")) {
+ is_sku = false;
+ is_category = true;
+ is_price = false;
+ } else if (!strcmp(name, "img")) {
+ static const char *subdir = "/items/";
+ char prefix[strlen(image_dir) + strlen(subdir) + 1];
+ sprintf(prefix, "%s%s", image_dir, subdir);
+ size_t prefix_len = strlen(prefix);
+ for (TidyAttr attr = tidyAttrFirst(child); attr; attr = tidyAttrNext(attr)) {
+ name = tidyAttrName(attr);
+ ctmbstr value = tidyAttrValue(attr);
+ if (!strcmp(name, "src")) {
+ if (strncmp(value, prefix, prefix_len))
+ break;
+ product = malloc(sizeof(struct icclient_product));
+ memset(product, '\0', sizeof(struct icclient_product));
+ size_t len = strlen(value) - prefix_len;
+ product->image = malloc(len + 1);
+ strncpy(product->image, value + prefix_len, len + 1);
+ }
+ if (strcmp(name, "title"))
+ continue;
+ product->description = malloc(strlen(value) + 1);
+ strcpy(product->description, value);
+ if (*category) {
+ product->category = malloc(strlen(*category) + 1);
+ strcpy(product->category, *category);
+ }
+ (*catalog)->length++;
+ *catalog = realloc(*catalog, sizeof(struct icclient_catalog)
+ + sizeof(struct icclient_product *[(*catalog)->length]));
+ (*catalog)->products[(*catalog)->length - 1] = product;
+ }
+ continue;
+ } else if (!strcmp(name, "h4")) {
+ is_sku = true;
+ is_category = false;
+ is_price = false;
+ } else if (is_sku && !strcmp(name, "a")) {
+ is_sku = false;
+ for (TidyAttr attr = tidyAttrFirst(child); attr; attr = tidyAttrNext(attr)) {
+ char *sku = strrchr(tidyAttrValue(attr), '/');
+ char *session_id = strchr(sku++, '?');
+ if (session_id)
+ *session_id = '\0';
+ product = (*catalog)->products[(*catalog)->length - 1];
+ product->sku = malloc(strlen(sku) + 1);
+ strcpy(product->sku, sku);
+ }
+ } else if (!strcmp(name, "p") && !((*catalog)->products[(*catalog)->length - 1])->price) {
+ is_sku = false;
+ is_category = false;
+ is_price = true;
+ } else {
+ is_sku = false;
+ is_category = false;
+ is_price = false;
+ }
+ recurse(doc, child, catalog, category, is_sku, is_category, is_price);
+ } else if (is_category || is_price) {
+ TidyBuffer buf;
+ tidyBufInit(&buf);
+ tidyNodeGetText(doc, child, &buf);
+ char *text = (char *)buf.bp;
+ product = (*catalog)->products[(*catalog)->length - 1];
+ if (is_category) {
+ is_category = false;
+ text[strlen(text) - 1] = '\0';
+ if (*category)
+ free(*category);
+ *category = malloc(strlen(text) + 1);
+ strcpy(*category, text);
+ } else {
+ is_price = false;
+#ifdef HAVE_LANGINFO_H
+ char *symbol = nl_langinfo_l(CRNCYSTR, loc);
+ size_t symbol_len = strlen(symbol) - 1;
+ if (symbol[0] == '-')
+ text += symbol_len;
+ char *separator = nl_langinfo_l(THOUSEP, loc);
+ if (strstr(text, separator)) {
+ size_t price_len = strlen(text) - symbol_len - 1;
+ char price[price_len];
+ memset(price, '\0', price_len);
+ strcat(price, strtok(text, separator));
+ strcat(price, strtok(NULL, separator));
+ product->price = atof(price);
+ } else
+ product->price = atof(text);
+#endif
+ }
+ tidyBufFree(&buf);
+ }
+ }
+}
+
+void handle_results(icclient_response *response)
+{
+ TidyDoc tdoc = tidyCreate();
+ tidyOptSetBool(tdoc, TidyXhtmlOut, yes);
+ tidyParseString(tdoc, response->data);
+ tidyCleanAndRepair(tdoc);
+ tidyOptSetBool(tdoc, TidyForceOutput, yes);
+ TidyBuffer output = {0};
+ tidyBufInit(&output);
+ tidySaveBuffer(tdoc, &output);
+ struct icclient_catalog *catalog = malloc(sizeof(struct icclient_catalog));
+ catalog->length = 0;
+ recurse(tdoc, tidyGetRoot(tdoc), &catalog, &(char *){NULL}, false, false, false);
+ tidyBufFree(&output);
+ tidyRelease(tdoc);
+ if (loc)
+ freelocale(loc);
+ ((void (*)(struct icclient_catalog *))response->userData)(catalog);
+}