summaryrefslogtreecommitdiffstats
path: root/src/main.c
blob: f57e3981d119a4507955f3bebc8c2750d547cf43 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
#define _GNU_SOURCE
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <stdarg.h>
#include <printf.h>
#include <ctype.h>
#include <math.h>
#include <time.h>
#include <unistd.h>
#include <signal.h>
#include <pthread.h>
#include <stdatomic.h>
#include <i18n.h>
#include <sys/types.h>
#include <sys/select.h>
#include <sys/socket.h>
#include <libxml/nanohttp.h>
#include <libxml/HTMLparser.h>
#include <libxml/HTMLtree.h>
#include <libxml/tree.h>
#include <libxml/xpath.h>
#include <microhttpd.h>
#ifndef SC_OLD_STORAGE
#include <search.h>
#endif
#include <lib.c>
#include <url.c>
#define ABS(x) (((x) < 0) ? -(x) : (x))
enum sc_return {
	SC_BADCALL = -1,	/* calling the function the wrong way, I could actually just crash */
	SC_EMPTYRESPONSE = -2,	/* something weird, do not retry */
	SC_CAPTCHA = -3,	/* engine responded with a CAPTCHA, redirect to a different server */
	SC_NOIMGCLASS = -4,	/* couldn't find image class name from definition, do not retry */
	SC_NOCLASS = -5,	/* couldn't find result class name from def, do not retry */
	SC_NOHREF = -6		/* a result did not contain a href attribute */
};
const char * sc_return_str (enum sc_return r) {
	switch (r) {
		case SC_BADCALL:
			return "SC_BADCALL";
		case SC_EMPTYRESPONSE:
			return "SC_EMPTYRESPONSE";
		case SC_CAPTCHA:
			return "SC_CAPTCHA";
		case SC_NOIMGCLASS:
			return "SC_NOIMGCLASS";
		case SC_NOCLASS:
			return "SC_NOCLASS";
		case SC_NOHREF:
			return "SC_NOHREF";
	}
	return "SC_BADRETURN";
}
unsigned char sc_hp[] = { /* html page null terminated format string, from file src/hp.html */
#include <hp.xxd>
};
char sc_osdd[] = { /* xml document for opensearch */
#include <osdd.xxd>
};
char sc_robotstxt[] = "User-Agent: *\nDisallow: /\n";
char sc_securitytxt[] = "# This content information is provided by the developer of this opensource application.\n"
	"# The developer is not responsible for the actions of his software\n"
	"# This website IS NOT operated by the developer. Do not use the contact information below in hopes of contacting the webmaster\n"
	"# The following contact information is provided for reporting security bugs regarding the software, not for legal issues\n"
	"Contact: https://www.sijanec.eu/o.html#kontakt\n"
	"Acknowledgments: https://git.sijanec.eu/sijanec/sear.c\n"
	"Encryption: https://www.sijanec.eu/pgp-key.txt\n"
	"Expires: Thu, 31 Dec 2021 18:37:07 -0800\n"
	"Preferred-Languages: sl, en, de, hr\n";
#define SC_HTTP_PORT (getenv("SC_PORT") ? atoi(getenv("SC_PORT")) : 7327) /* SEAR on mobile keyboard */
#define SC_HTTP_RBUFSIZE 4096 /* initial size of http read buffer, increasning by K */
#define SC_HTTP_USER_AGENT "Nokia WAP Gateway 4.1 CD1/ECD13_D/4.1.04)" /* so google and others sends a minimal response */
#define SC_HTTP_HEADERS "User-Agent: " SC_HTTP_USER_AGENT "\r\n"
#include <structs.c>
#include <log.c>
#include <api.c>
#include <httpd.c>
/* this is new in my programs. I am now using _sizeof for the actual alloced size of the array and _length for the count of elements in array. this is done to decrease number of calls to realloc&amis */
void sc_signalhander (int s) {
	return;
}
int main (int argc, char ** argv) {
	int rs = 0;
	struct sc_cache * c = sc_cache_init();
	struct MHD_Daemon * d;
	if (!c) {
		rs = 1;
		goto rc;
	}
	xmlInitParser();
	d = MHD_start_daemon(MHD_USE_THREAD_PER_CONNECTION, SC_HTTP_PORT, NULL, NULL, &sc_httpd, c, MHD_OPTION_END);
	if (!d) {
		rs = 2;
		goto rc;
	}
	signal(SIGTERM, sc_signalhander);
	signal(SIGINT, sc_signalhander);
	pause();
	fprintf(stderr, "cleaning up!\n");
	fflush(stderr);
rc:
	xmlCleanupParser();
	MHD_stop_daemon(d); /* stop the daemon first and the free, threads might still be running */
	sc_cache_free(c);
	return rs;
}