PbDbFixer/src/main.rs

343 lines
11 KiB
Rust
Raw Normal View History

2021-02-11 21:58:10 +01:00
mod epub;
2021-01-29 12:47:33 +01:00
mod pocketbook;
2021-02-11 21:58:10 +01:00
use rusqlite::{named_params, Connection, Transaction, NO_PARAMS};
use std::usize;
2021-02-10 10:31:44 +01:00
2021-01-28 17:52:09 +01:00
/// One EPUB row read from the PocketBook library database, carrying the
/// values that are later compared against the metadata stored in the EPUB.
#[derive(Debug, Clone, PartialEq, Eq)]
struct BookEntry {
    /// Primary key of the book (`books_impl.id`).
    id: i32,
    /// Path of the file, built as `"<folder name>/<file name>"`.
    filepath: String,
    /// Author string currently stored in the database.
    author: String,
    /// "First author" string currently stored in the database.
    firstauthor: String,
    /// `true` when the book lives in the `/mnt/ext1/Digital Editions` folder;
    /// such books are skipped instead of being fixed.
    has_drm: bool,
    /// Genre name joined from the `genres` table; empty when none is linked.
    genre: String,
    /// Letter stored in `first_author_letter`; empty when it is not set.
    first_author_letter: String,
    /// Series name stored in the database; empty when it is not set.
    series: String,
}
2021-02-01 14:33:00 +01:00
fn get_epubs_from_database(tx: &Transaction) -> Vec<BookEntry> {
let mut book_entries = Vec::new();
let mut stmt = tx
.prepare(
r#"
SELECT books.id, folders.name, files.filename, books.firstauthor,
2021-02-15 13:05:32 +01:00
books.author, genres.name, first_author_letter, series
2021-02-01 14:33:00 +01:00
FROM books_impl books JOIN files
ON books.id = files.book_id
JOIN folders
ON folders.id = files.folder_id
2021-02-10 10:31:44 +01:00
LEFT OUTER JOIN booktogenre btg
ON books.id = btg.bookid
LEFT OUTER JOIN genres
ON genres.id = btg.genreid
2021-02-01 14:33:00 +01:00
WHERE files.storageid = 1 AND books.ext = 'epub'
ORDER BY books.id"#,
2021-02-01 14:33:00 +01:00
)
.unwrap();
2021-01-29 13:51:36 +01:00
2021-01-30 17:59:00 +01:00
let mut rows = stmt.query(NO_PARAMS).unwrap();
while let Some(row) = rows.next().unwrap() {
let book_id: i32 = row.get(0).unwrap();
let prefix: String = row.get(1).unwrap();
let filename: String = row.get(2).unwrap();
let filepath = format!("{}/{}", prefix, filename);
2021-02-01 19:39:36 +01:00
let firstauthor: String = row.get(3).unwrap();
let author: String = row.get(4).unwrap();
let has_drm = match prefix.as_str() {
"/mnt/ext1/Digital Editions" => true,
_ => false,
};
2021-02-10 10:31:44 +01:00
let genre: String = row.get(5).unwrap_or_default();
let first_author_letter = row.get(6).unwrap_or_default();
2021-02-15 13:05:32 +01:00
let series: String = row.get(7).unwrap_or_default();
2021-02-01 14:33:00 +01:00
let entry = BookEntry {
2021-01-30 17:59:00 +01:00
id: book_id,
filepath,
2021-02-01 19:39:36 +01:00
firstauthor,
author,
has_drm,
2021-02-10 10:31:44 +01:00
genre,
first_author_letter,
2021-02-15 13:05:32 +01:00
series,
2021-02-01 14:33:00 +01:00
};
book_entries.push(entry);
2021-01-30 17:59:00 +01:00
}
2021-01-28 17:52:09 +01:00
2021-02-01 14:33:00 +01:00
book_entries
}
2021-02-01 19:39:36 +01:00
fn remove_ghost_books_from_db(tx: &Transaction) -> usize {
let mut stmt = tx
.prepare(
r#"
2021-02-01 19:39:36 +01:00
DELETE FROM books_impl
WHERE id IN (
SELECT books.id
FROM books_impl books
LEFT OUTER JOIN files
ON books.id = files.book_id
WHERE files.filename is NULL
)"#,
2021-02-01 19:39:36 +01:00
)
.unwrap();
let num = stmt.execute(NO_PARAMS).unwrap();
tx.execute(
r#"DELETE FROM books_settings WHERE bookid NOT IN ( SELECT id FROM books_impl )"#,
2021-02-01 19:39:36 +01:00
NO_PARAMS,
)
.unwrap();
tx.execute(
r#"DELETE FROM books_uids WHERE book_id NOT IN ( SELECT id FROM books_impl )"#,
2021-02-01 19:39:36 +01:00
NO_PARAMS,
)
.unwrap();
tx.execute(
r#"DELETE FROM bookshelfs_books WHERE bookid NOT IN ( SELECT id FROM books_impl )"#,
2021-02-01 19:39:36 +01:00
NO_PARAMS,
)
.unwrap();
tx.execute(
r#"DELETE FROM booktogenre WHERE bookid NOT IN ( SELECT id FROM books_impl )"#,
2021-02-01 19:39:36 +01:00
NO_PARAMS,
)
.unwrap();
tx.execute(
r#"DELETE FROM social WHERE bookid NOT IN ( SELECT id FROM books_impl )"#,
2021-02-01 19:39:36 +01:00
NO_PARAMS,
)
.unwrap();
num
}
2021-02-01 14:33:00 +01:00
/// Counters describing what a repair run did.
#[derive(Debug, Default, Clone, PartialEq, Eq)]
struct Statistics {
    /// Number of author-related updates (`firstauthor` and `author` updates
    /// are each counted separately).
    authors_fixed: i32,
    /// Number of books removed because they had no file entry.
    ghost_books_cleaned: usize,
    /// Number of books skipped because they are flagged as DRM protected.
    drm_skipped: usize,
    /// Number of books that got a genre assigned.
    genres_fixed: usize,
    /// Number of books whose `first_author_letter` was rewritten.
    sorting_fixed: usize,
    /// Number of books that got series information assigned.
    series_fixed: usize,
}

impl Statistics {
    /// Returns `true` when at least one database row was changed or removed.
    ///
    /// `drm_skipped` is deliberately not part of the check: a skipped book is
    /// not a modification.
    fn anything_fixed(&self) -> bool {
        self.authors_fixed > 0
            || self.genres_fixed > 0
            || self.ghost_books_cleaned > 0
            || self.sorting_fixed > 0
            || self.series_fixed > 0
    }
}
2021-02-01 14:33:00 +01:00
fn fix_db_entries(tx: &Transaction, book_entries: &Vec<BookEntry>) -> Statistics {
2021-02-01 19:39:36 +01:00
let mut stat = Statistics {
authors_fixed: 0,
ghost_books_cleaned: 0,
drm_skipped: 0,
2021-02-10 10:31:44 +01:00
genres_fixed: 0,
sorting_fixed: 0,
2021-02-15 13:05:32 +01:00
series_fixed: 0,
2021-02-01 19:39:36 +01:00
};
2021-02-01 14:33:00 +01:00
for entry in book_entries {
if entry.has_drm {
stat.drm_skipped = stat.drm_skipped + 1;
continue;
}
2021-02-11 21:58:10 +01:00
if let Some(epub_metadata) = epub::get_epub_metadata(&entry.filepath) {
// Fix firstauthor…
let mut firstauthors = epub_metadata
2021-02-11 21:58:10 +01:00
.authors
.iter()
.filter(|aut| aut.firstauthor.len() > 0)
.map(|aut| aut.firstauthor.clone())
.collect::<Vec<_>>();
firstauthors.sort();
2021-02-11 21:58:10 +01:00
if !firstauthors.iter().all(|s| entry.firstauthor.contains(s)) {
let mut stmt = tx
.prepare("UPDATE books_impl SET firstauthor = :file_as WHERE id = :book_id")
.unwrap();
stmt.execute_named(
named_params![":file_as": firstauthors.join(" & "), ":book_id": entry.id],
)
.unwrap();
stat.authors_fixed = stat.authors_fixed + 1;
}
// Fix first_author_letter
let first_author_letter = firstauthors
.join(" & ")
.chars()
.next()
.unwrap_or_default()
.to_string()
.to_uppercase();
if entry.first_author_letter != first_author_letter {
let mut stmt = tx
.prepare("UPDATE books_impl SET first_author_letter = :first_letter WHERE id = :book_id")
.unwrap();
stmt.execute_named(
named_params![":first_letter": first_author_letter,":book_id": entry.id],
)
.unwrap();
stat.sorting_fixed = stat.sorting_fixed + 1;
}
2021-02-11 21:58:10 +01:00
// Fix author names…
let authornames = epub_metadata
.authors
2021-02-11 21:58:10 +01:00
.iter()
.map(|aut| aut.name.clone())
.collect::<Vec<_>>();
if !authornames.iter().all(|s| entry.author.contains(s))
|| authornames.join(", ").len() != entry.author.len()
{
2021-02-11 21:58:10 +01:00
let mut stmt = tx
.prepare("UPDATE books_impl SET author = :authors WHERE id = :book_id")
.unwrap();
stmt.execute_named(
named_params![":authors": authornames.join(", "), ":book_id": entry.id],
)
.unwrap();
stat.authors_fixed = stat.authors_fixed + 1;
}
// Fix genre…
2021-02-11 21:58:10 +01:00
if entry.genre.is_empty() && epub_metadata.genre.len() > 0 {
let mut stmt = tx
.prepare(r#"INSERT INTO genres (name) SELECT :genre ON CONFLICT DO NOTHING"#)
.unwrap();
stmt.execute_named(named_params![":genre": &epub_metadata.genre])
.unwrap();
let mut stmt = tx
.prepare(
r#"
INSERT INTO booktogenre (bookid, genreid)
VALUES (:bookid,
(SELECT id FROM genres WHERE name = :genre)
)
ON CONFLICT DO NOTHING"#,
)
.unwrap();
stmt.execute_named(
named_params![":bookid": &entry.id, ":genre": &epub_metadata.genre],
)
.unwrap();
stat.genres_fixed = stat.genres_fixed + 1;
2021-02-10 10:31:44 +01:00
}
2021-02-15 13:05:32 +01:00
// Fix series…
if !epub_metadata.series.name.is_empty() && entry.series.is_empty() {
let mut stmt = tx
.prepare("UPDATE books_impl SET series = :series, numinseries = :series_index WHERE id = :book_id")
.unwrap();
stmt.execute_named(
named_params![":series": &epub_metadata.series.name, ":series_index": &epub_metadata.series.index, ":book_id": entry.id],
)
.unwrap();
stat.series_fixed = stat.series_fixed + 1;
}
2021-01-28 17:52:09 +01:00
}
}
2021-01-30 17:59:00 +01:00
2021-02-01 19:39:36 +01:00
// ghost books
let num = remove_ghost_books_from_db(tx);
stat.ghost_books_cleaned = num;
2021-02-01 14:33:00 +01:00
stat
2021-01-30 17:59:00 +01:00
}
fn main() {
2021-02-02 09:52:50 +01:00
if cfg!(target_arch = "arm") {
let res = pocketbook::dialog(
pocketbook::Icon::None,
"PocketBook has sometimes problems parsing metadata.\n\
This app tries to fix some of these issues.\n\
(Note: The database file explore-3.db will be altered!)\n\
\n\
Please be patient - this might take a while.\n\
You will see a blank screen during the process.\n\
\n\
Proceed?",
&["Cancel", "Yes"],
);
if res == 1 {
return;
}
}
2021-01-30 17:59:00 +01:00
let mut conn = Connection::open("/mnt/ext1/system/explorer-3/explorer-3.db").unwrap();
2021-02-01 19:39:36 +01:00
conn.execute("PRAGMA foreign_keys = 0", NO_PARAMS).unwrap();
2021-01-30 17:59:00 +01:00
let tx = conn.transaction().unwrap();
2021-02-01 14:33:00 +01:00
let book_entries = get_epubs_from_database(&tx);
let stat = fix_db_entries(&tx, &book_entries);
2021-01-28 17:52:09 +01:00
tx.commit().unwrap();
2021-01-29 12:47:33 +01:00
if cfg!(target_arch = "arm") {
2021-02-12 09:34:58 +01:00
if stat.anything_fixed() == false {
2021-02-02 20:11:13 +01:00
if stat.drm_skipped == 0 {
pocketbook::dialog(
pocketbook::Icon::Info,
"The database seems to be ok.\n\
Nothing had to be fixed.",
&["OK"],
);
} else {
pocketbook::dialog(
pocketbook::Icon::Info,
&format!(
"The database seems to be ok.\n\
Nothing had to be fixed.\n\
(Books skipped (DRM): {})",
&stat.drm_skipped
),
&["OK"],
);
}
2021-01-29 12:47:33 +01:00
} else {
pocketbook::dialog(
pocketbook::Icon::Info,
2021-02-01 19:39:36 +01:00
&format!(
"Authors fixed: {}\n\
Sorting fixed: {}\n\
2021-02-10 10:31:44 +01:00
Genres fixed: {}\n\
2021-02-15 13:05:32 +01:00
Series fixed: {}\n\
2021-02-10 10:31:44 +01:00
Books skipped (DRM): {}\n\
Books cleaned from DB: {}",
2021-02-10 10:31:44 +01:00
&stat.authors_fixed,
&stat.sorting_fixed,
2021-02-10 10:31:44 +01:00
&stat.genres_fixed,
2021-02-15 13:05:32 +01:00
&stat.series_fixed,
2021-02-10 10:31:44 +01:00
&stat.drm_skipped,
&stat.ghost_books_cleaned
2021-02-01 19:39:36 +01:00
),
2021-02-02 09:52:50 +01:00
&["OK"],
2021-01-29 12:47:33 +01:00
);
}
2021-02-01 14:33:00 +01:00
} else {
2021-02-01 19:39:36 +01:00
println!(
"Authors fixed: {}\n\
Sorting fixed: {}\n\
2021-02-10 10:31:44 +01:00
Genres fixed: {}\n\
2021-02-15 13:05:32 +01:00
Series fixed: {}\n\
2021-02-10 10:31:44 +01:00
Books skipped (DRM): {}\n\
Books cleaned from DB: {}",
&stat.authors_fixed,
&stat.sorting_fixed,
&stat.genres_fixed,
2021-02-15 13:05:32 +01:00
&stat.series_fixed,
&stat.drm_skipped,
&stat.ghost_books_cleaned
2021-02-01 19:39:36 +01:00
);
2021-01-29 12:47:33 +01:00
}
2021-01-28 17:52:09 +01:00
}