2022-05-02 17:23:08 -04:00
-- SPDX-License-Identifier: MIT
-- Copyright 2017 J. King, Dustin Wilson et al.
-- See LICENSE and AUTHORS files for details
-- Create a temporary table mapping old article IDs to new article IDs
-- per-user. Any articles which have only one subscription will be unchanged,
-- which will limit the amount of disruption.
create temp table arsse_articles_map(
    article int not null,                   -- ID of the article in the old arsse_articles table
    subscription int not null,              -- ID of the subscription the mapped article belongs to
    id integer primary key autoincrement    -- ID the article receives in the new articles table
);
2022-06-07 13:49:13 -04:00
-- Seed the AUTOINCREMENT counter of the mapping table with the highest
-- existing article ID, so that automatically assigned IDs cannot collide with
-- the IDs of articles which keep their old number. The name must equal the
-- table name exactly (no padding) for SQLite to apply the seed; an empty
-- articles table seeds the counter with zero instead of NULL.
replace into temp.sqlite_sequence(name, seq)
    select 'arsse_articles_map', coalesce(max(id), 0) from arsse_articles;
2022-05-02 17:23:08 -04:00
-- Map the articles of feeds which have more than one subscription: each
-- article yields one row per subscription, and because the id column is
-- omitted AUTOINCREMENT assigns every such row a fresh ID.
insert into arsse_articles_map(article, subscription)
    select
        a.id as article,
        s.id as subscription
    from arsse_articles as a
        join arsse_subscriptions as s using(feed)
    where feed in (
        select feed
        from arsse_subscriptions
        group by feed
        having count(*) > 1
    );
2022-05-30 15:10:09 -04:00
-- Map the articles of feeds which have exactly one subscription: the new ID
-- is set explicitly to the old article ID, so these articles keep their number.
insert into arsse_articles_map(article, subscription, id)
    select
        a.id as article,
        s.id as subscription,
        a.id as id
    from arsse_articles as a
        join arsse_subscriptions as s using(feed)
    where feed in (
        select feed
        from arsse_subscriptions
        group by feed
        having count(*) = 1
    );
2022-05-02 17:23:08 -04:00
2022-05-02 23:35:25 -04:00
-- Create a new articles table which combines the marks table but does not include content
create table arsse_articles_new(
    -- metadata for entries in newsfeeds, including user state
    id integer primary key,                                                                                 -- sequence number
    subscription integer not null references arsse_subscriptions(id) on delete cascade on update cascade,   -- associated subscription
    read int not null default 0,                                                                            -- whether the article has been read
    starred int not null default 0,                                                                         -- whether the article is starred
    hidden int not null default 0,                                                                          -- whether the article should be excluded from selection by default
    published text,                                                                                         -- time of original publication
    edited text,                                                                                            -- time of last edit by author
    modified text not null default CURRENT_TIMESTAMP,                                                       -- time when article was last modified in database pursuant to an authorial edit
    marked text,                                                                                            -- time at which an article was last modified by the user
    url text,                                                                                               -- URL of article
    title text collate nocase,                                                                              -- article title
    author text collate nocase,                                                                             -- author's name
    guid text,                                                                                              -- a nominally globally unique identifier for the article, from the feed
    url_title_hash text not null,                                                                           -- hash of URL + title; used when checking for updates and for identification if there is no guid
    url_content_hash text not null,                                                                         -- hash of URL + content + enclosure URL + enclosure content type; used when checking for updates and for identification if there is no guid
    title_content_hash text not null,                                                                       -- hash of title + content + enclosure URL + enclosure content type; used when checking for updates and for identification if there is no guid
    touched int not null default 0,                                                                         -- field used internally while marking; should normally be left as 0
    note text not null default ''                                                                           -- Tiny Tiny RSS freeform user note
);
-- Populate the new table with one row per mapping entry. Article metadata is
-- taken from the old articles table and user state from the marks row of the
-- same article and subscription; where no marks row exists the state falls
-- back to unread, unstarred, not hidden, never marked, and an empty note.
insert into arsse_articles_new(
    id, subscription, read, starred, hidden,
    published, edited, modified, marked,
    url, title, author, guid,
    url_title_hash, url_content_hash, title_content_hash,
    touched, note
)
    select
        i.id,
        i.subscription,
        coalesce(m.read, 0),
        coalesce(m.starred, 0),
        coalesce(m.hidden, 0),
        a.published,
        a.edited,
        a.modified,
        m.modified,             -- the marks row's modification time becomes "marked"
        a.url,
        a.title,
        a.author,
        a.guid,
        a.url_title_hash,
        a.url_content_hash,
        a.title_content_hash,
        0,                      -- "touched" always starts cleared
        coalesce(m.note, '')
    from arsse_articles_map as i
        left join arsse_articles as a on a.id = i.article
        left join arsse_marks as m on a.id = m.article and m.subscription = i.subscription;
2022-05-02 23:35:25 -04:00
-- Create a new table to hold article content
create table arsse_article_contents(
    -- contents of articles, which is typically large text
    id integer primary key references arsse_articles(id) on delete cascade on update cascade,   -- reference to the article ID
    content text                                                                                -- the contents
);
-- Store the content of every mapped article under its new ID. When the
-- subscription's scrape flag is 0 the feed-supplied content is used;
-- otherwise the scraped content is preferred, falling back to the
-- feed-supplied content when no scraped content is stored.
insert into arsse_article_contents(id, content)
    select
        m.id,
        case
            when s.scrape = 0 then a.content
            else coalesce(a.content_scraped, a.content)
        end
    from arsse_articles_map as m
        left join arsse_articles as a on a.id = m.article
        left join arsse_subscriptions as s on s.id = m.subscription;
2022-05-02 23:35:25 -04:00
2022-05-26 17:33:16 -04:00
-- Copy the editions of every renumbered article to the article's new ID;
-- articles whose ID is unchanged keep their existing editions as they are
insert into arsse_editions(article, modified)
    select
        m.id,
        e.modified
    from arsse_editions as e
        join arsse_articles_map as m using(article)
    where m.id <> m.article
    order by m.id, e.modified;
-- Delete editions which still point at the old ID of a renumbered article,
-- as well as editions of articles which have no entry in the map at all
delete from arsse_editions
where
    article in (select m.article from arsse_articles_map as m where m.id <> m.article)
    or article not in (select m.id from arsse_articles_map as m);
2022-05-02 17:23:08 -04:00
2022-05-26 17:33:16 -04:00
-- Create enclosures for renumbered articles by copying each enclosure of the
-- old article to the article's new ID
insert into arsse_enclosures(article, url, type)
    select
        m.id,
        e.url,
        e.type
    from arsse_articles_map as m
        join arsse_enclosures as e on m.article = e.article
    where m.id <> m.article;
2022-09-27 11:17:06 -04:00
-- Delete enclosures which still point at the old ID of a renumbered article,
-- as well as enclosures of articles which have no entry in the map at all
delete from arsse_enclosures
where
    article in (select m.article from arsse_articles_map as m where m.id <> m.article)
    or article not in (select m.id from arsse_articles_map as m);
2022-05-02 17:23:08 -04:00
2022-05-30 15:10:09 -04:00
-- Create categories for renumbered articles by copying each category of the
-- old article to the article's new ID
insert into arsse_categories(article, name)
    select
        m.id,
        c.name
    from arsse_articles_map as m
        join arsse_categories as c on m.article = c.article
    where m.id <> m.article;
2022-09-27 11:17:06 -04:00
-- Delete categories which still point at the old ID of a renumbered article,
-- as well as categories of articles which have no entry in the map at all
delete from arsse_categories
where
    article in (select m.article from arsse_articles_map as m where m.id <> m.article)
    or article not in (select m.id from arsse_articles_map as m);
2022-05-30 15:10:09 -04:00
2022-05-26 17:33:16 -04:00
-- Create a new label-associations table which omits the subscription column and populate it with new data
create table arsse_label_members_new(
    -- label assignments for articles
    label integer not null references arsse_labels(id) on delete cascade,       -- label ID associated to an article; label IDs belong to a user
    article integer not null references arsse_articles(id) on delete cascade,   -- article associated to a label
    assigned int not null default 1,                                            -- whether the association is current, to support soft deletion
    modified text not null default CURRENT_TIMESTAMP,                           -- time at which the association was last made or unmade
    primary key(label, article)                                                 -- only one association of a given label to a given article
) without rowid;
2022-05-26 17:33:16 -04:00
-- Carry each existing label assignment over to the new ID of the article it
-- was attached to, matching on both the old article ID and the subscription
insert into arsse_label_members_new(label, article, assigned, modified)
    select
        l.label,
        m.id,
        l.assigned,
        l.modified
    from arsse_articles_map as m
        join arsse_label_members as l using(article, subscription);
2022-05-02 17:23:08 -04:00
-- Create a new subscriptions table which combines the feeds table
create table arsse_subscriptions_new(
    -- users' subscriptions to newsfeeds, with settings
    id integer primary key,                                                                 -- sequence number
    owner text not null references arsse_users(id) on delete cascade on update cascade,     -- owner of subscription
    url text not null,                                                                      -- URL of feed
    deleted int not null default 0,                                                         -- soft-delete flag
    feed_title text collate nocase,                                                         -- feed title
    title text collate nocase,                                                              -- user-supplied title, which overrides the feed title when set
    folder integer references arsse_folders(id) on delete cascade,                          -- TT-RSS category (nestable); the first-level category (which acts as Nextcloud folder) is joined in when needed
    modified text not null default CURRENT_TIMESTAMP,                                       -- time at which subscription properties were last modified by the user
    last_mod text,                                                                          -- time at which the feed last actually changed at the foreign host
    etag text not null default '',                                                          -- HTTP ETag hash used for cache validation, changes each time the content changes
    next_fetch text,                                                                        -- time at which the feed should next be fetched
    added text not null default CURRENT_TIMESTAMP,                                          -- time at which feed was added
    source text,                                                                            -- URL of site to which the feed belongs
    updated text,                                                                           -- time at which the feed was last fetched
    err_count integer not null default 0,                                                   -- count of successive times update resulted in error since last successful update
    err_msg text,                                                                           -- last error message
    size integer not null default 0,                                                        -- number of articles in the feed at last fetch
    icon integer references arsse_icons(id) on delete set null,                             -- numeric identifier of any associated icon
    order_type int not null default 0,                                                      -- Nextcloud sort order
    pinned int not null default 0,                                                          -- whether feed is pinned (always sorts at top)
    scrape int not null default 0,                                                          -- whether the user has requested scraping content from source articles
    keep_rule text,                                                                         -- Regular expression the subscription's articles must match to avoid being hidden
    block_rule text,                                                                        -- Regular expression the subscription's articles must not match to avoid being hidden
    unique(owner, url)                                                                      -- a URL with particular credentials should only appear once
);
-- Populate the new subscriptions table: user-controlled settings come from
-- the old subscription row (s) and fetch-related state from the feed row (f)
-- it pointed to. Every migrated subscription starts out not soft-deleted.
insert into arsse_subscriptions_new(
    id, owner, url, deleted, feed_title, title, folder, modified,
    last_mod, etag, next_fetch, added, source, updated,
    err_count, err_msg, size, icon,
    order_type, pinned, scrape, keep_rule, block_rule
)
    select
        s.id,
        s.owner,
        f.url,
        0,              -- "deleted" flag
        f.title,        -- becomes "feed_title"
        s.title,
        s.folder,
        s.modified,
        f.modified,     -- becomes "last_mod"
        f.etag,
        f.next_fetch,
        s.added,
        f.source,
        f.updated,
        f.err_count,
        f.err_msg,
        f.size,
        f.icon,
        s.order_type,
        s.pinned,
        s.scrape,
        s.keep_rule,
        s.block_rule
    from arsse_subscriptions as s
        left join arsse_feeds as f on s.feed = f.id;
2022-05-02 17:23:08 -04:00
-- Delete the old tables and rename the new ones
2022-05-26 17:33:16 -04:00
-- Remove the superseded tables along with the temporary article ID map.
-- NOTE(review): with foreign-key enforcement enabled SQLite performs an
-- implicit delete when dropping a table, which could cascade into tables
-- referencing it; presumably this runs with enforcement off -- confirm.
drop table arsse_label_members;
drop table arsse_subscriptions;
drop table arsse_feeds;
drop table arsse_articles;
drop table arsse_marks;
drop table arsse_articles_map;
-- Give the replacement tables the names of the tables they supersede
alter table arsse_subscriptions_new
    rename to arsse_subscriptions;
alter table arsse_articles_new
    rename to arsse_articles;
alter table arsse_label_members_new
    rename to arsse_label_members;
-- set version marker, both in the database header and in the metadata table;
-- the column is quoted as "key" so that it is always read as an identifier
pragma user_version = 8;
update arsse_meta set value = '8' where "key" = 'schema_version';