-- register PL/pgSQL; the plpgsql functions defined in this file require it
create language plpgsql;

-- general array sorting functions

-- Returns the elements of the given array in ascending order.
--   original - array to sort (any element type with an ordering)
-- An empty array is returned as is: array_agg() over zero rows yields NULL,
-- so without the coalesce() an empty input would come back as NULL.
-- STRICT: a NULL argument yields NULL.
CREATE FUNCTION sort(original anyarray) RETURNS anyarray
    LANGUAGE sql IMMUTABLE STRICT
    AS $_$
    select coalesce(array_agg(item), $1) as result
    from (select unnest($1) as item order by item) a;
$_$;

-- Returns the distinct elements of the given array in ascending order.
--   original - array to sort and de-duplicate
-- Used to give tag and site arrays one canonical form, so that permutations
-- and repeats of the same elements compare equal (see the unique indexes
-- built on usort(...)).
-- An empty array is returned as is: array_agg() over zero rows yields NULL,
-- so without the coalesce() an empty input would come back as NULL.
-- STRICT: a NULL argument yields NULL.
CREATE FUNCTION usort(original anyarray) RETURNS anyarray
    LANGUAGE sql IMMUTABLE STRICT
    AS $_$
    select coalesce(array_agg(item), $1) as result
    from (select distinct unnest($1) as item order by item) a;
$_$;

-- Adds a tag to a domain, registering the domain in "site" first if needed.
--   domain  - dotted host name; converted with tripdomain() before lookup
--   new_tag - tag to attach to the site
-- STRICT: nothing happens (NULL is returned) when either argument is NULL.
CREATE or replace FUNCTION mark(domain text, new_tag text) RETURNS void
    LANGUAGE plpgsql STRICT
    AS $$
declare
    my_site text[];
    -- integer, matching site.id_site (serial) and the mark(integer, text) overload
    my_id_site integer;
begin
    my_site := tripdomain(domain);

    -- selecting site id from table or adding site to the table
    select id_site from site where site.site = my_site into my_id_site;
    if not found then
        -- RETURNING hands back the generated id without a second lookup
        insert into site (site) values (my_site) returning id_site into my_id_site;
    end if;

    -- tag bookkeeping is the same as for the by-id variant, so delegate to it
    perform mark(my_id_site, new_tag);
end;
$$;

-- Adds a tag to a site identified by its id.
--   my_id_site - id of the site (site.id_site)
--   new_tag    - tag to attach to the site
-- Creates the urls row for the site when there is none yet; otherwise points
-- the existing row at the tag set extended by new_tag.
-- STRICT: nothing happens (NULL is returned) when either argument is NULL.
CREATE or replace FUNCTION mark(my_id_site integer, new_tag text) RETURNS void
    LANGUAGE plpgsql STRICT
    AS $$
declare
    -- TODO: maybe a check should be added to make sure supplied site id really exists
    my_tag text[];
begin
    -- selecting tags the site already has; the left join keeps the urls row
    -- even if its id_tag has no matching tag row (my_tag is then '{}')
    select coalesce(tag.tag, '{}'::text[])
        from urls left join tag using (id_tag)
        where urls.id_site = my_id_site
        into my_tag;
    if not found then
        -- no records found - creating new link with a single tag
        insert into urls (id_site, id_tag) values (my_id_site, get_tag(array[new_tag]));
    else
        -- updating existing record; get_tag() sorts and de-duplicates the
        -- array itself, so the new tag only needs to be appended once
        update urls set id_tag = get_tag(my_tag || array[new_tag]) where id_site = my_id_site;
    end if;
end;
$$;

-- Returns the id of a tag array, creating the tag row when it does not exist.
--   my_tag - tags in any order, duplicates allowed; normalised with usort()
-- Returns tag.id_tag of the row holding the normalised array.
-- STRICT: a NULL argument yields NULL.
create or replace function get_tag(my_tag text[]) returns integer
    language plpgsql strict
    as $$
declare
    tag_id integer;
    -- canonical (sorted, de-duplicated) form, computed once
    sorted_tag text[];
begin
    sorted_tag := usort(my_tag);
    select id_tag from tag where tag.tag = sorted_tag into tag_id;
    if not found then
        -- RETURNING hands back the generated id without a second lookup
        insert into tag (tag) values (sorted_tag) returning id_tag into tag_id;
    end if;
    return tag_id;
end;
$$;

-- Converts a dotted domain into an array of 'label:position' strings for indexing.
--   url - dotted host name
-- The position counts labels from the right starting at 0, so
-- 'www.example.com' becomes {www:2,example:1,com:0}.
-- Returns NULL when the input yields no labels.
-- STRICT: a NULL argument yields NULL.
CREATE FUNCTION tripdomain(url text) RETURNS text[]
    LANGUAGE plpgsql IMMUTABLE STRICT
    AS $_$
declare
    labels text[] := string_to_array($1, '.');
    total integer := array_length(labels, 1);
    tripped text[];
begin
    -- array_length() is NULL for an array without elements; loop zero times then
    for pos in 1 .. coalesce(total, 0) loop
        tripped[pos] := labels[pos] || ':' || (total - pos);
    end loop;
    return tripped;
end;
$_$;

-- Converts an array of 'label:position' strings back into a dotted domain.
--   site - array as produced by tripdomain(); element order does not matter
--          because every label is placed by its own position
-- Returns NULL when the array has no elements.
-- STRICT: a NULL argument yields NULL.
create function untrip(site text[]) returns text
    language plpgsql immutable strict
    as $_$
declare
    idx integer := array_length(site, 1);
    labels text[];
    parts text[];
begin
    -- walk from the last element towards the first, stopping at the first
    -- missing element (also covers idx being NULL for an empty array)
    while site[idx] is not null loop
        parts := string_to_array(site[idx], ':');
        -- negated position as subscript: higher positions end up further
        -- left, so the labels come out in left-to-right domain order
        labels[-(parts[2]::integer)] := parts[1];
        idx := idx - 1;
    end loop;
    return array_to_string(labels, '.');
end;
$_$;

-- table to hold all rules: one rule per client network
create table rules (
    -- client network the rule applies to
    netmask cidr not null,
    -- NOTE(review): the double colon in the default looks like a typo for
    -- 'about:blank' - confirm before changing
    redirect_url text not null default 'about::blank'::text,
    -- weekday window; compared against date_part('dow', now()) in site_rule
    from_weekday smallint not null default 0,
    to_weekday smallint not null default 6,
    -- time-of-day window, both ends inclusive in site_rule
    from_time time without time zone not null default '00:00:00'::time without time zone,
    to_time time without time zone not null default '23:59:59'::time without time zone,
    -- tag set the rule matches (joined to tag.id_tag in site_rule)
    id_tag smallint not null,
    constraint rules_pkey primary key (netmask)
);

-- table to hold site arrays (domains in tripdomain() form)
create table site (
    id_site serial,
    site text[] not null,
    constraint id_site primary key (id_site)
);

-- each set of site elements may be stored only once, whatever its order
create unique index site_s on site (usort(site));

-- gin index over the elements of the site array
create index site_g on site using gin (site);

-- table to hold tag combinations
create table tag (
    id_tag serial,
    tag text[] not null,
    constraint tag_id primary key (id_tag)
);

-- each set of tags may be stored only once, whatever its order
create unique index tag_s on tag (usort(tag));

-- gin index over the elements of the tag array
create index tag_g on tag using gin (tag);

-- table to hold tag - site links: one row per site, pointing at its tag set
CREATE TABLE urls (
    -- time the link was added, truncated to whole seconds; informational
    -- only - several rows may share the same second
    date_added timestamp without time zone DEFAULT ('now'::text)::timestamp(0) without time zone NOT NULL,
    -- integer, not smallint: site.id_site and tag.id_tag are serial columns
    -- and mark()/get_tag() pass integers
    id_site integer NOT NULL,
    id_tag integer NOT NULL,
    regex text
);

-- A site has exactly one row here (mark() updates it in place), so the site
-- id is the key. This replaces the former key on date_added, which rejected
-- rows added within the same second, and makes the separate unique index on
-- id_site unnecessary.
ALTER TABLE ONLY urls
    ADD CONSTRAINT urls_pkey PRIMARY KEY (id_site);

-- Deliberately not unique: many sites may share the same tag set.
CREATE INDEX urls_id_tag ON urls USING btree (id_tag);

-- view to join all tables into one to simplify access
-- automatically uses current day and time data: only rules whose weekday and
-- time-of-day windows contain the current moment are visible
-- a rule applies to a site when their tag arrays share at least one element
CREATE VIEW site_rule AS
SELECT a.redirect_url, a.netmask, b.site, b.regexp
FROM (
    -- rules active right now, with their tag arrays
    SELECT rules.redirect_url, tag.tag AS rule_tag, rules.netmask
    FROM rules
    INNER JOIN tag USING (id_tag)
    WHERE ('now'::text)::time without time zone >= rules.from_time
        AND ('now'::text)::time without time zone <= rules.to_time
        AND date_part('dow'::text, now()) >= (rules.from_weekday)::double precision
        AND date_part('dow'::text, now()) <= (rules.to_weekday)::double precision
) a
INNER JOIN (
    -- sites with their tag arrays; the urls column is named "regex" and is
    -- exposed under the name the view publishes
    SELECT site.site, tag.tag AS url_tag, urls.regex AS regexp
    FROM urls
    INNER JOIN tag USING (id_tag)
    INNER JOIN site USING (id_site)
) b ON (b.url_tag && a.rule_tag);