From f3aa7ca0bc2ef7c286609e8f87d07cc2568093af Mon Sep 17 00:00:00 2001 From: frosty Date: Tue, 6 Jan 2026 23:46:24 -0500 Subject: rebase(d) --- src/Scraping/Scraping.h | 34 ++++++++++++++++++++++++++++++++++ 1 file changed, 34 insertions(+) create mode 100644 src/Scraping/Scraping.h (limited to 'src/Scraping/Scraping.h') diff --git a/src/Scraping/Scraping.h b/src/Scraping/Scraping.h new file mode 100644 index 0000000..7ad4d59 --- /dev/null +++ b/src/Scraping/Scraping.h @@ -0,0 +1,34 @@ +#ifndef SCRAPING_H +#define SCRAPING_H + +#include + +#define LOG_INFO(msg, ...) fprintf(stderr, "[INFO] " msg "\n", ##__VA_ARGS__) +#define LOG_WARN(msg, ...) fprintf(stderr, "[WARN] " msg "\n", ##__VA_ARGS__) +#define LOG_DEBUG(msg, ...) fprintf(stderr, "[DEBUG] " msg "\n", ##__VA_ARGS__) +#define LOG_ERROR(msg, ...) fprintf(stderr, "[ERROR] " msg "\n", ##__VA_ARGS__) + +typedef struct { + char *url; + char *title; + char *snippet; +} SearchResult; + +typedef int (*ParserFunc)(const char *engine_name, xmlDocPtr doc, + SearchResult **out_results, int max_results); + +typedef struct { + const char *name; + const char *base_url; + const char *host_header; + const char *referer; + ParserFunc parser; +} SearchEngine; + +extern const SearchEngine ENGINE_REGISTRY[]; +extern const int ENGINE_COUNT; + +int scrape_engine(const SearchEngine *engine, const char *query, + SearchResult **out_results, int max_results); + +#endif -- cgit v1.2.3