aboutsummaryrefslogtreecommitdiff
path: root/src/Infobox
diff options
context:
space:
mode:
Diffstat (limited to 'src/Infobox')
-rw-r--r--src/Infobox/UnitConversion.c500
-rw-r--r--src/Infobox/UnitConversion.h9
2 files changed, 509 insertions, 0 deletions
diff --git a/src/Infobox/UnitConversion.c b/src/Infobox/UnitConversion.c
new file mode 100644
index 0000000..6a08b9c
--- /dev/null
+++ b/src/Infobox/UnitConversion.c
@@ -0,0 +1,500 @@
+#include "UnitConversion.h"
+#include <ctype.h>
+#include <math.h>
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+
+typedef enum {
+ UNIT_LENGTH,
+ UNIT_WEIGHT,
+ UNIT_TEMP,
+ UNIT_VOLUME,
+ UNIT_AREA,
+ UNIT_TIME,
+ UNIT_UNKNOWN
+} UnitType;
+
+typedef struct {
+ const char *name;
+ const char *alias[4];
+ UnitType type;
+ double to_base;
+} UnitDef;
+
+static const UnitDef UNITS[] = {
+ {"metre", {"m", "metres", "meter", "meters"}, UNIT_LENGTH, 1.0},
+ {"kilometre", {"km", "kilometres", "kilometer", "kilometers"}, UNIT_LENGTH, 1000.0},
+ {"centimetre", {"cm", "centimetres", "centimeter", "centimeters"}, UNIT_LENGTH, 0.01},
+ {"millimetre", {"mm", "millimetres", "millimeter", "millimeters"}, UNIT_LENGTH, 0.001},
+ {"mile", {"mi", "miles"}, UNIT_LENGTH, 1609.344},
+ {"yard", {"yd", "yards"}, UNIT_LENGTH, 0.9144},
+ {"foot", {"ft", "feet", "'"}, UNIT_LENGTH, 0.3048},
+ {"inch", {"in", "inches", "\""}, UNIT_LENGTH, 0.0254},
+
+ {"kilogram", {"kg", "kilograms", "kilo", "kilos"}, UNIT_WEIGHT, 1.0},
+ {"gram", {"g", "grams"}, UNIT_WEIGHT, 0.001},
+ {"milligram", {"mg", "milligrams"}, UNIT_WEIGHT, 0.000001},
+ {"pound", {"lb", "lbs", "pounds"}, UNIT_WEIGHT, 0.453592},
+ {"ounce", {"oz", "ounces"}, UNIT_WEIGHT, 0.0283495},
+ {"tonne", {"tonnes", "tons", "ton"}, UNIT_WEIGHT, 1000.0},
+ {"stone", {"st", "stones"}, UNIT_WEIGHT, 6.35029},
+
+ {"celsius", {"c", "°c", "degrees celsius", "degrees c"}, UNIT_TEMP, 1.0},
+ {"fahrenheit", {"f", "°f", "degrees fahrenheit", "degrees f"}, UNIT_TEMP, 1.0},
+ {"kelvin", {"k", "degrees kelvin", "degrees k"}, UNIT_TEMP, 1.0},
+
+ {"litre", {"l", "litres", "liter", "liters"}, UNIT_VOLUME, 1.0},
+ {"millilitre", {"ml", "millilitres", "milliliter", "milliliters"}, UNIT_VOLUME, 0.001},
+ {"gallon", {"gal", "gallons"}, UNIT_VOLUME, 3.78541},
+ {"quart", {"qt", "quarts"}, UNIT_VOLUME, 0.946353},
+ {"pint", {"pt", "pints"}, UNIT_VOLUME, 0.473176},
+ {"cup", {"cups"}, UNIT_VOLUME, 0.236588},
+ {"fluid ounce", {"fl oz", "fluid ounces"}, UNIT_VOLUME, 0.0295735},
+
+ {"square metre", {"sqm", "sq m", "m2", "square metres"}, UNIT_AREA, 1.0},
+ {"square foot", {"sqft", "sq ft", "ft2", "square feet"}, UNIT_AREA, 0.092903},
+ {"square kilometre", {"sqkm", "sq km", "km2", "square kilometres"}, UNIT_AREA, 1000000.0},
+ {"square mile", {"sqmi", "sq mi", "mi2", "square miles"}, UNIT_AREA, 2589988.0},
+ {"acre", {"acres"}, UNIT_AREA, 4046.86},
+ {"hectare", {"ha", "hectares"}, UNIT_AREA, 10000.0},
+
+ {"second", {"sec", "seconds", "s"}, UNIT_TIME, 1.0},
+ {"minute", {"min", "minutes"}, UNIT_TIME, 60.0},
+ {"hour", {"hr", "hours", "h"}, UNIT_TIME, 3600.0},
+ {"day", {"days", "d"}, UNIT_TIME, 86400.0},
+ {"week", {"weeks", "wk"}, UNIT_TIME, 604800.0},
+ {"month", {"months", "mo"}, UNIT_TIME, 2629746.0},
+ {"year", {"years", "yr"}, UNIT_TIME, 31556952.0},
+};
+
+static const int UNIT_COUNT = sizeof(UNITS) / sizeof(UNITS[0]);
+
+static int is_whitespace(char c) {
+ return c == ' ' || c == '\t' || c == '\n' || c == '\r';
+}
+
+static const UnitDef *find_unit(const char *str) {
+ if (!str || !*str) return NULL;
+
+ size_t len = strlen(str);
+ char normalized[64] = {0};
+ size_t j = 0;
+
+ for (size_t i = 0; i < len && j < 63; i++) {
+ if ((unsigned char)str[i] == 0xC2 && (unsigned char)str[i+1] == 0xB0) {
+ i++;
+ continue;
+ }
+ if (str[i] == '^' && i + 1 < len && str[i + 1] == '2') {
+ normalized[j++] = '2';
+ i++;
+ continue;
+ }
+ normalized[j++] = tolower((unsigned char)str[i]);
+ }
+ normalized[j] = '\0';
+
+ for (int i = 0; i < UNIT_COUNT; i++) {
+ if (strcmp(normalized, UNITS[i].name) == 0) return &UNITS[i];
+ for (int k = 0; k < 4 && UNITS[i].alias[k]; k++) {
+ if (strcmp(normalized, UNITS[i].alias[k]) == 0) return &UNITS[i];
+ }
+ }
+ return NULL;
+}
+
+int is_unit_conv_query(const char *query) {
+ if (!query) return 0;
+
+ const char *patterns[] = {
+ " to ", " in ", " into ",
+ " = ", " equals ", " equal ",
+ " convert ", " conversion ",
+ " -> ", " → ",
+ NULL
+ };
+
+ int has_pattern = 0;
+ for (int i = 0; patterns[i]; i++) {
+ if (strstr(query, patterns[i])) {
+ has_pattern = 1;
+ break;
+ }
+ }
+
+ if (!has_pattern) {
+ const char *last_space = strrchr(query, ' ');
+ if (last_space) {
+ const UnitDef *u = find_unit(last_space + 1);
+ if (u) {
+ const char *before = query;
+ while (*before && is_whitespace(*before)) before++;
+ const char *num_end = before;
+ while (*num_end &&
+ (isdigit(*num_end) || *num_end == '.' || *num_end == '-' ||
+ *num_end == '+' || *num_end == '/' || *num_end == '\'' || *num_end == '"')) {
+ num_end++;
+ }
+ if (num_end > before) has_pattern = 1;
+ }
+ }
+ }
+
+ return has_pattern;
+}
+
+static double parse_value(const char **ptr) {
+ const char *p = *ptr;
+ while (*p && is_whitespace(*p)) p++;
+
+ double value = 0.0;
+ int has_num = 0;
+
+ if (*p == '-' || *p == '+') p++;
+ while (*p >= '0' && *p <= '9') {
+ value = value * 10 + (*p - '0');
+ has_num = 1;
+ p++;
+ }
+ if (*p == '.') {
+ p++;
+ double frac = 0.1;
+ while (*p >= '0' && *p <= '9') {
+ value += (*p - '0') * frac;
+ frac *= 0.1;
+ has_num = 1;
+ p++;
+ }
+ }
+
+ if (*p == '/' && has_num) {
+ p++;
+ double denom = 0.0;
+ int has_denom = 0;
+ while (*p >= '0' && *p <= '9') {
+ denom = denom * 10 + (*p - '0');
+ has_denom = 1;
+ p++;
+ }
+ if (has_denom && denom > 0) {
+ value = value / denom;
+ }
+ }
+
+ while (*p == '\'' || *p == '"') {
+ double extra = 0.0;
+ p++;
+ while (*p >= '0' && *p <= '9') {
+ extra = extra * 10 + (*p - '0');
+ p++;
+ }
+ if (*p == '.') {
+ p++;
+ double frac = 0.1;
+ while (*p >= '0' && *p <= '9') {
+ extra += (*p - '0') * frac;
+ frac *= 0.1;
+ p++;
+ }
+ }
+ if (*p == '\'' || *p == '"') p++;
+ value += extra * (p[-1] == '\'' ? 0.3048 : 0.0254);
+ }
+
+ if (!has_num) {
+ *ptr = p;
+ return 0.0;
+ }
+
+ *ptr = p;
+ return value;
+}
+
+static int is_separator(char c) {
+ return is_whitespace(c) || c == ',' || c == '.' || c == '(' || c == ')' || c == '\0';
+}
+
+static int parse_conversion_query(const char *query, double *value, const UnitDef **from_unit, const UnitDef **to_unit) {
+ *value = 0;
+ *from_unit = NULL;
+ *to_unit = NULL;
+
+ const char *value_end = query;
+ *value = parse_value(&value_end);
+
+ if (value_end == query) return 0;
+
+ const char *p = value_end;
+ while (*p && is_whitespace(*p)) p++;
+
+ size_t remaining = strlen(p);
+ if (remaining < 2) return 0;
+
+ const char *to_keywords[] = {" to ", " in ", " into ", " -> ", " → ", " = ", NULL};
+ const char *to_pos = NULL;
+ size_t keyword_len = 0;
+ for (int i = 0; to_keywords[i]; i++) {
+ const char *found = strstr(p, to_keywords[i]);
+ if (found) {
+ to_pos = found + strlen(to_keywords[i]);
+ keyword_len = strlen(to_keywords[i]);
+ break;
+ }
+ }
+
+ if (!to_pos) {
+ const char *last_space = strrchr(p, ' ');
+ if (last_space && last_space > p) {
+ char from_part[64] = {0};
+ size_t len = last_space - p;
+ if (len < 63) {
+ strncpy(from_part, p, len);
+ *from_unit = find_unit(from_part);
+ if (*from_unit) {
+ *to_unit = find_unit(last_space + 1);
+ return *to_unit ? 1 : 0;
+ }
+ }
+ }
+ return 0;
+ }
+
+ char from_part[64] = {0};
+ size_t from_len = to_pos - p - keyword_len;
+ if (from_len > 63) from_len = 63;
+ strncpy(from_part, p, from_len);
+
+ char *end_from = from_part + from_len;
+ while (end_from > from_part && is_whitespace(end_from[-1])) end_from--;
+ *end_from = '\0';
+
+ *from_unit = find_unit(from_part);
+ if (!*from_unit) {
+ char *end = from_part + strlen(from_part);
+ while (end > from_part) {
+ while (end > from_part && is_whitespace(end[-1])) end--;
+ if (end <= from_part) break;
+ char *start = end;
+ while (start > from_part && !is_whitespace(start[-1])) start--;
+ size_t word_len = end - start;
+ memmove(from_part + word_len + 1, from_part, start - from_part);
+ from_part[word_len] = ' ';
+ from_part[word_len + 1] = '\0';
+ *from_unit = find_unit(from_part);
+ if (*from_unit) break;
+ end = start;
+ }
+ }
+
+ if (!*from_unit) return 0;
+
+ while (*to_pos && is_whitespace(*to_pos)) to_pos++;
+
+ if (!*to_pos) return 0;
+
+ char to_part[64] = {0};
+ size_t to_len = 0;
+ const char *tp = to_pos;
+ while (*tp && !is_separator(*tp) && to_len < 63) {
+ to_part[to_len++] = *tp++;
+ }
+ to_part[to_len] = '\0';
+
+ *to_unit = find_unit(to_part);
+ if (!*to_unit) {
+ const char *try_ptr = to_pos;
+ while (*try_ptr && is_whitespace(*try_ptr)) try_ptr++;
+ char try_buf[64] = {0};
+ size_t try_len = 0;
+ while (*try_ptr && try_len < 63) {
+ try_buf[try_len++] = *try_ptr++;
+ }
+ while (try_len > 0) {
+ *to_unit = find_unit(try_buf);
+ if (*to_unit) {
+ strcpy(to_part, try_buf);
+ break;
+ }
+ char *last_space = strrchr(try_buf, ' ');
+ if (!last_space) break;
+ *last_space = '\0';
+ try_len = strlen(try_buf);
+ }
+ }
+
+ return *to_unit ? 1 : 0;
+}
+
+static double convert_temp(double value, const UnitDef *from, const UnitDef *to) {
+ double celsius = 0;
+
+ if (strcmp(from->name, "celsius") == 0) celsius = value;
+ else if (strcmp(from->name, "fahrenheit") == 0) celsius = (value - 32) * 5.0 / 9.0;
+ else if (strcmp(from->name, "kelvin") == 0) celsius = value - 273.15;
+
+ if (strcmp(to->name, "celsius") == 0) return celsius;
+ else if (strcmp(to->name, "fahrenheit") == 0) return celsius * 9.0 / 5.0 + 32;
+ else if (strcmp(to->name, "kelvin") == 0) return celsius + 273.15;
+ return 0;
+}
+
+static double convert_value(double value, const UnitDef *from, const UnitDef *to) {
+ if (from->type != to->type) return 0;
+
+ if (from->type == UNIT_TEMP) {
+ return convert_temp(value, from, to);
+ }
+
+ double base_value = value * from->to_base;
+ return base_value / to->to_base;
+}
+
+static void format_number(double val, char *buf, size_t bufsize) {
+ if (bufsize == 0) return;
+ if (val == 0) {
+ snprintf(buf, bufsize, "0");
+ return;
+ }
+ if (fabs(val) < 0.01 && fabs(val) > 0) {
+ snprintf(buf, bufsize, "%.2g", val);
+ } else if (fabs(val) < 1) {
+ snprintf(buf, bufsize, "%.2f", val);
+ char *p = buf + strlen(buf) - 1;
+ while (p > buf && *p == '0') *p-- = '\0';
+ if (*p == '.') *p = '\0';
+ } else if (fmod(val + 0.0001, 1.0) < 0.0002) {
+ snprintf(buf, bufsize, "%.0f", val);
+ } else {
+ snprintf(buf, bufsize, "%.2f", val);
+ char *p = buf + strlen(buf) - 1;
+ while (p > buf && *p == '0') *p-- = '\0';
+ if (*p == '.') *p = '\0';
+ }
+}
+
+static const char *pluralize(const char *unit, double value, char *buf, size_t bufsize) {
+ int is_one = (fabs(value - 1.0) < 0.0001 || fabs(value + 1.0) < 0.0001);
+
+ size_t len = strlen(unit);
+ if (len == 0 || bufsize == 0) return unit;
+
+ strncpy(buf, unit, bufsize - 1);
+ buf[bufsize - 1] = '\0';
+
+ if (strcmp(unit, "foot") == 0 || strcmp(unit, "square foot") == 0) {
+ if (is_one) strcpy(buf, unit);
+ else strcpy(buf, strcmp(unit, "square foot") == 0 ? "square feet" : "feet");
+ return buf;
+ }
+ if (strcmp(unit, "inch") == 0 || strcmp(unit, "square inch") == 0) {
+ if (is_one) strcpy(buf, unit);
+ else strcpy(buf, strcmp(unit, "square inch") == 0 ? "square inches" : "inches");
+ return buf;
+ }
+ if (strcmp(unit, "stone") == 0) {
+ if (is_one) strcpy(buf, "stone");
+ else strcpy(buf, "stones");
+ return buf;
+ }
+ if (strcmp(unit, "celsius") == 0 ||
+ strcmp(unit, "fahrenheit") == 0 ||
+ strcmp(unit, "kelvin") == 0) {
+ strcpy(buf, unit);
+ return buf;
+ }
+
+ if (unit[len-1] == 's' ||
+ unit[len-1] == 'x' ||
+ unit[len-1] == 'z' ||
+ (len >= 2 && unit[len-2] == 'c' && unit[len-1] == 'h') ||
+ (len >= 2 && unit[len-2] == 's' && unit[len-1] == 'h')) {
+ if (!is_one) {
+ buf[len] = 'e';
+ buf[len+1] = '\0';
+ }
+ } else if (unit[len-1] == 'y' && len >= 2 &&
+ !(unit[len-2] == 'a' || unit[len-2] == 'e' ||
+ unit[len-2] == 'i' || unit[len-2] == 'o' ||
+ unit[len-2] == 'u')) {
+ if (is_one) {
+ buf[len-1] = '\0';
+ } else {
+ buf[len] = 's';
+ buf[len+1] = '\0';
+ }
+ } else if (len >= 2 && unit[len-2] == 'f' && unit[len-1] == 'e') {
+ if (is_one) {
+ buf[len-2] = '\0';
+ } else {
+ buf[len-1] = 's';
+ buf[len] = '\0';
+ }
+ } else if (unit[len-1] == 'f' && len >= 1) {
+ if (is_one) {
+ buf[len-1] = '\0';
+ } else {
+ buf[len-1] = 'v';
+ buf[len] = 'e';
+ buf[len+1] = 's';
+ buf[len+2] = '\0';
+ }
+ } else if (unit[len-1] == 'e' && len >= 2 && unit[len-2] == 'f') {
+ if (is_one) {
+ buf[len-2] = '\0';
+ } else {
+ buf[len-1] = 's';
+ buf[len] = '\0';
+ }
+ } else {
+ if (!is_one) {
+ buf[len] = 's';
+ buf[len+1] = '\0';
+ }
+ }
+
+ return buf;
+}
+
+static char *build_html(double value, const UnitDef *from, double result, const UnitDef *to) {
+ static char html[4096];
+ char val_buf[64], res_buf[64], from_name_buf[64], to_name_buf[64];
+ format_number(value, val_buf, sizeof(val_buf));
+ format_number(result, res_buf, sizeof(res_buf));
+
+ pluralize(from->name, value, from_name_buf, sizeof(from_name_buf));
+ pluralize(to->name, result, to_name_buf, sizeof(to_name_buf));
+
+ int n = snprintf(html, sizeof(html),
+ "<div class='unit-conv-container' style='line-height: 1.6;'>"
+ "<div style='font-size: 1.3em; margin-bottom: 8px;'>"
+ "<b>%s %s</b> = <b>%s %s</b>"
+ "</div>",
+ val_buf, from_name_buf,
+ res_buf, to_name_buf);
+ snprintf(html + n, sizeof(html) - n, "</div>");
+ return html;
+}
+
+InfoBox fetch_unit_conv_data(const char *query) {
+ InfoBox info = {NULL, NULL, NULL, NULL};
+ if (!query) return info;
+
+ double value = 0;
+ const UnitDef *from = NULL;
+ const UnitDef *to = NULL;
+
+ if (!parse_conversion_query(query, &value, &from, &to)) return info;
+ if (!from || !to) return info;
+ if (from->type != to->type) return info;
+
+ double result = convert_value(value, from, to);
+ if (result == 0 && value != 0 && from->type != UNIT_TEMP) return info;
+
+ info.title = strdup("Unit Conversion");
+ info.extract = strdup(build_html(value, from, result, to));
+ info.thumbnail_url = strdup("/static/calculation.svg");
+ info.url = strdup("#");
+
+ return info;
+}
diff --git a/src/Infobox/UnitConversion.h b/src/Infobox/UnitConversion.h
new file mode 100644
index 0000000..b148cb3
--- /dev/null
+++ b/src/Infobox/UnitConversion.h
@@ -0,0 +1,9 @@
+#ifndef UNITCONVERSION_H
+#define UNITCONVERSION_H
+
+#include "Infobox.h"
+
+int is_unit_conv_query(const char *query);
+InfoBox fetch_unit_conv_data(const char *query);
+
+#endif