crocodilestick
diff --git a/‎CONTRIBUTORS‎
Lines changed: 2 additions & 2 deletions b/‎CONTRIBUTORS‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎README.md‎
Lines changed: 13 additions & 2 deletions b/‎README.md‎
Lines changed: 13 additions & 2 deletions
diff --git a/‎cps/admin.py‎
Lines changed: 1 addition & 1 deletion b/‎cps/admin.py‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎cps/constants.py‎
Lines changed: 3 additions & 1 deletion b/‎cps/constants.py‎
Lines changed: 3 additions & 1 deletion
diff --git a/‎cps/cwa_functions.py‎
Lines changed: 47 additions & 1 deletion b/‎cps/cwa_functions.py‎
Lines changed: 47 additions & 1 deletion
diff --git a/‎cps/duplicates.py‎
Lines changed: 122 additions & 0 deletions b/‎cps/duplicates.py‎
Lines changed: 122 additions & 0 deletions
diff --git a/‎cps/main.py‎
Lines changed: 2 additions & 0 deletions b/‎cps/main.py‎
Lines changed: 2 additions & 0 deletions
diff --git a/‎cps/render_template.py‎
Lines changed: 5 additions & 0 deletions b/‎cps/render_template.py‎
Lines changed: 5 additions & 0 deletions
@@ -1,7 +1,7 @@
 CONTRIBUTORS
 
 This file is automatically generated. DO NOT EDIT MANUALLY.
-Generated on: 2025-09-01T20:52:42.198138Z
+Generated on: 2025-09-02T13:44:20.914655Z
 
 Upstream project: https://github.com/janeczku/calibre-web
 Fork project (Calibre-Web Automated, since 2024): https://github.com/crocodilestick/calibre-web-automated
@@ -289,7 +289,7 @@ Copyright (C) 2024-2025 Calibre-Web Automated contributors
 - zhiyue (1 commits)
 # Fork Contributors (crocodilestick/calibre-web-automated)
 
-- crocodilestick (587 commits)
+- crocodilestick (588 commits)
 - jmarmstrong1207 (73 commits)
 - demitrix (30 commits)
 - sirwolfgang (22 commits)
 
@@ -7,6 +7,7 @@
 ![Docker Pulls](https://img.shields.io/docker/pulls/crocodilestick/calibre-web-automated)
 ![GitHub Release](https://img.shields.io/github/v/release/crocodilestick/calibre-web-automated)
 ![GitHub commits since latest release](https://img.shields.io/github/commits-since/crocodilestick/calibre-web-automated/latest)
+![OAuth 2.0 + OIDC](https://img.shields.io/badge/OAuth-2.0%20%2B%20OIDC-blue?style=flat&logo=oauth)
 
 
 ## _Quick Access_
@@ -23,6 +24,7 @@
 - [Usage](#usage-) 🔧
   - [Adding Books to Your Library](#adding-books-to-your-library)
   - [KOReader Syncing (KOSync)](#koreader-syncing-kosync-) 📖⚡
+  - [OAuth Authentication Setup](#enhanced-oauth-20oidc-authentication-) 🔐
 - [For Developers](#for-developers---building-custom-docker-image) 🚀
 - [Further Development](#further-development-️) 🏗️
 - [Support / Buy me a Coffee](https://ko-fi.com/crocodilestick) ☕
@@ -107,7 +109,7 @@ This tells CWA to avoid enabling WAL on the Calibre `metadata.db` and the `app.d
 | eBook metadata editing and deletion support | Metadata download from various sources (extensible via plugins) | eBook download restriction to logged-in users |
 | Public user registration support | Send eBooks to E-Readers with a single click | Sync Kobo devices with your Calibre library |
 | In-browser eBook reading support for multiple formats | Content hiding based on categories and Custom Column content per user | "Magic Link" login for easy access on eReaders |
-| LDAP, Google/GitHub OAuth, and proxy authentication support | Advanced search and filtering options | Multilingual user interface supporting 20+ [languages](https://github.com/janeczku/calibre-web/wiki/Translation-Status) |
+| Enhanced OAuth 2.0/OIDC authentication with auto-discovery | Advanced search and filtering options | Multilingual user interface supporting 20+ [languages](https://github.com/janeczku/calibre-web/wiki/Translation-Status) |
 
 ## Plus these _**CWA Specific Features**_ on top:
 
@@ -120,7 +122,7 @@ This tells CWA to avoid enabling WAL on the Calibre `metadata.db` and the `app.d
 | [Automatic EPUB Fixer Service 🔨](#automatic-epub-fixer-service-) | [Multi-Format Conversion Service 🌌](#simple-to-use-multi-format-conversion-service-) | [Library Auto-Detect 📚🕵️](#library-auto-detect-️) |
 | [Server Stats Tracking Page 📍](#server-stats-tracking-page-) | [Server Stats Tracking 📊](#server-stats-tracking-page-) | [Easy Dark/ Light Mode Switching ☀️🌙](#easy-dark-light-mode-switching-️) |
 | [Internal Update Notification System 🛎️](#internal-update-notification-system-️) | [Auto-Compression of Backed Up Files 🤐](#auto-compression-of-backed-up-files-) | [Additional Metadata Providers 🗃️](#additional-metadata-providers-️) |
-| [KOReader Syncing (KOSync) 📖⚡](#koreader-syncing-kosync-) | | |
+| [KOReader Syncing (KOSync) 📖⚡](#koreader-syncing-kosync-) | [Enhanced OAuth 2.0/OIDC Authentication 🔐](#enhanced-oauth-20oidc-authentication-) | |
 
 #### **Automatic Ingest Service** ✨
 - CWA currently supports automatic ingest of 27 different popular ebook formats
@@ -188,6 +190,15 @@ This tells CWA to avoid enabling WAL on the Calibre `metadata.db` and the `app.d
 - **CWA Integration:** Leverages your existing CWA user accounts and permissions - no additional server setup required
 - **Easy Installation:** Plugin and setup instructions are available directly from your CWA instance at `/kosync`
 
+#### **Enhanced OAuth 2.0/OIDC Authentication** 🔐
+- **Auto-Discovery:** Automatic endpoint configuration via OIDC metadata URLs for seamless setup with providers like Keycloak, Authentik, Google, and Azure AD
+- **Manual Override:** Full manual control over OAuth endpoints when auto-discovery isn't available
+- **Field Mapping:** Configurable JWT field extraction for usernames and emails to work with any provider's token structure
+- **Group-Based Roles:** Automatic admin role assignment based on OAuth provider groups
+- **Testing Tools:** Built-in connection testing and validation to ensure your configuration works before going live
+- **Enterprise Ready:** Support for custom scopes, multiple authentication methods, and comprehensive troubleshooting
+- **📖 [Full OAuth Configuration Guide](https://github.com/crocodilestick/Calibre-Web-Automated/wiki/OAuth-Configuration)** for detailed setup instructions
+
 #### **Server Stats Tracking Page** 📍📊
   - Ever wondered how many times CWA has been there for you in the background? Check out the CWA Stats page to see a fun list of statistics showing how many times CWA has been there to make your life just that little bit easier
 - A database also exists to keep track of any and all enforcements, imports, conversions & fixes both for peace of mind and to make the checking of any bugs or weird behaviour easier
 
@@ -548,7 +548,7 @@ def edit_list_user(param):
                     if user.name == "Guest" and value == constants.SIDEBAR_READ_AND_UNREAD:
                         raise Exception(_("Guest can't have this view"))
                     # check for valid value, last on checks for power of 2 value
-                    if value > 0 and value <= constants.SIDEBAR_LIST and (value & value - 1 == 0 or value == 1):
+                    if value > 0 and value <= constants.SIDEBAR_DUPLICATES and (value & value - 1 == 0 or value == 1):
                         if vals['value'] == 'true':
                             user.sidebar_view |= value
                         elif vals['value'] == 'false':
 
@@ -88,6 +88,7 @@
 SIDEBAR_ARCHIVED        = 1 << 15
 SIDEBAR_DOWNLOAD        = 1 << 16
 SIDEBAR_LIST            = 1 << 17
+SIDEBAR_DUPLICATES      = 1 << 18
 
 sidebar_settings = {
                 "detail_random": DETAIL_RANDOM,
@@ -106,11 +107,12 @@
                 "sidebar_archived": SIDEBAR_ARCHIVED,
                 "sidebar_download": SIDEBAR_DOWNLOAD,
                 "sidebar_list": SIDEBAR_LIST,
+                "sidebar_duplicates": SIDEBAR_DUPLICATES,
             }
 
 
 ADMIN_USER_ROLES        = sum(r for r in ALL_ROLES.values()) & ~ROLE_ANONYMOUS
-ADMIN_USER_SIDEBAR      = (SIDEBAR_LIST << 1) - 1
+ADMIN_USER_SIDEBAR      = (SIDEBAR_DUPLICATES << 1) - 1
 
 UPDATE_STABLE       = 0 << 0
 AUTO_UPDATE_STABLE  = 1 << 0
 
@@ -100,6 +100,32 @@ def get_ingest_dir():
         dirs = json.load(f)
         return dirs['ingest_folder']
 
+def get_ingest_status():
+    """Read the current ingest service status.
+
+    Parses ``/config/cwa_ingest_status`` as ``state:filename:timestamp:detail``.
+    Missing trailing fields become ''; an unreadable file yields state 'unknown'.
+    """
+    fields = ('state', 'filename', 'timestamp', 'detail')
+    try:
+        with open('/config/cwa_ingest_status', 'r') as f:
+            status_line = f.read().strip()
+    except OSError:  # covers FileNotFoundError; IOError is an alias of OSError
+        return {'state': 'unknown', 'filename': '', 'timestamp': '', 'detail': ''}
+    # Cap the split at the field count so colons inside the trailing detail are
+    # kept instead of being silently dropped.
+    # NOTE(review): a filename/timestamp containing ':' still shifts fields - confirm the writer's format.
+    parts = status_line.split(':', len(fields) - 1)
+    return dict(zip(fields, parts + [''] * (len(fields) - len(parts))))
+
+def get_ingest_queue_size():
+    """Count the non-blank lines of the ingest retry queue file (0 if it cannot be read)"""
+    try:
+        with open('/config/cwa_ingest_retry_queue', 'r') as queue_file:
+            return sum(1 for entry in queue_file if entry.strip())
+    except (FileNotFoundError, IOError):
+        return 0
+
 def refresh_library(app):
     with app.app_context():  # Create app context for session
         ingest_dir = get_ingest_dir()
@@ -180,8 +206,12 @@ def set_cwa_settings():
     boolean_settings = []
     string_settings = []
     list_settings = []
+    integer_settings = ['ingest_timeout_minutes']  # Special handling for integer settings
+    
     for setting in cwa_default_settings:
-        if isinstance(cwa_default_settings[setting], int):
+        if setting in integer_settings:
+            continue  # Handle separately
+        elif isinstance(cwa_default_settings[setting], int):
             boolean_settings.append(setting)
         elif isinstance(cwa_default_settings[setting], str) and cwa_default_settings[setting] != "":
             string_settings.append(setting)
@@ -229,6 +259,22 @@ def set_cwa_settings():
             if result['auto_convert_target_format'] in result['auto_ingest_ignored_formats']:
                 result['auto_ingest_ignored_formats'].remove(result['auto_convert_target_format'])
 
+            # Handle integer settings
+            for setting in integer_settings:
+                value = request.form.get(setting)
+                if value is not None:
+                    try:
+                        int_value = int(value)
+                        # Validate timeout range
+                        if setting == 'ingest_timeout_minutes':
+                            int_value = max(5, min(120, int_value))  # Clamp between 5 and 120 minutes
+                        result[setting] = int_value
+                    except (ValueError, TypeError):
+                        # Use current value if conversion fails
+                        result[setting] = cwa_db.cwa_settings.get(setting, 15)  # Default to 15 minutes
+                else:
+                    result[setting] = cwa_db.cwa_settings.get(setting, 15)  # Default to 15 minutes
+
             # DEBUGGING
             # with open("/config/post_request" ,"w") as f:
             #     for key in result.keys():
 
@@ -0,0 +1,122 @@
+# Calibre-Web Automated – fork of Calibre-Web
+# Copyright (C) 2018-2025 Calibre-Web contributors
+# Copyright (C) 2024-2025 Calibre-Web Automated contributors
+# SPDX-License-Identifier: GPL-3.0-or-later
+# See CONTRIBUTORS for full list of authors.
+
+from flask import Blueprint
+from flask_babel import gettext as _
+from sqlalchemy import func, and_
+
+from . import db, calibre_db, logger
+from .admin import admin_required  
+from .usermanagement import login_required_if_no_ano
+from .render_template import render_title_template
+from .cw_login import current_user
+
+duplicates = Blueprint('duplicates', __name__)
+log = logger.create()
+
+
+@duplicates.route("/duplicates")
+@login_required_if_no_ano
+@admin_required
+def show_duplicates():
+    """Render the duplicates page from the groups found by find_duplicate_books().
+
+    Any exception raised while collecting or rendering the groups is logged
+    and the same page is rendered with an empty group list instead.
+    """
+    def _render(groups):
+        # Single place that builds the template call used by both outcomes
+        return render_title_template('duplicates.html',
+                                     duplicate_groups=groups,
+                                     title=_("Duplicate Books"),
+                                     page="duplicates")
+
+    print("[cwa-duplicates] Loading duplicates page...", flush=True)
+    log.info("[cwa-duplicates] Loading duplicates page for user: %s", current_user.name)
+    try:
+        duplicate_groups = find_duplicate_books()
+        group_total = len(duplicate_groups)
+        print(f"[cwa-duplicates] Found {group_total} duplicate groups total", flush=True)
+        log.info("[cwa-duplicates] Found %s duplicate groups total", group_total)
+        return _render(duplicate_groups)
+    except Exception as err:
+        print(f"[cwa-duplicates] Critical error loading duplicates page: {str(err)}", flush=True)
+        log.error("[cwa-duplicates] Critical error loading duplicates page: %s", str(err))
+        return _render([])
+
+
+def find_duplicate_books():
+    """Find books that share the same title and primary author.
+
+    Every book passing ``calibre_db.common_filters()`` is loaded and grouped
+    in Python on a lower-cased, stripped (title, primary author) key. Books
+    without authors are skipped.
+
+    Returns:
+        list[dict]: one entry per key shared by more than one book, with the
+        keys ``title``, ``author``, ``count`` and ``books`` (newest first),
+        sorted case-insensitively by title, then author. Each listed book
+        gains ``ordered_authors``, ``author_names`` and ``cover_url``.
+    """
+    books_query = (calibre_db.session.query(db.Books)
+                   .filter(calibre_db.common_filters())  # Respect user permissions and library filtering
+                   .order_by(db.Books.title, db.Books.timestamp.desc()))
+
+    all_books = books_query.all()
+    print(f"[cwa-duplicates] Retrieved {len(all_books)} books with user filtering applied", flush=True)
+
+    # Group books by title + primary author combination (case-insensitive)
+    title_author_groups = {}
+    for book in all_books:
+        if not book.authors:
+            continue
+
+        # Get primary author (use Calibre-Web's standard approach)
+        book.ordered_authors = calibre_db.order_authors([book])
+        primary_author = book.ordered_authors[0].name if book.ordered_authors else "Unknown"
+
+        key = (book.title.lower().strip(), primary_author.lower().strip())
+        title_author_groups.setdefault(key, []).append(book)
+
+    print(f"[cwa-duplicates] Grouped books into {len(title_author_groups)} unique title+author combinations", flush=True)
+
+    # Keep only keys shared by several books and prepare display data
+    duplicate_groups = []
+    for books in title_author_groups.values():
+        if len(books) < 2:
+            continue
+
+        # Sort books by timestamp (newest first)
+        books.sort(key=lambda x: x.timestamp, reverse=True)
+
+        for book in books:
+            # ordered_authors was attached while grouping; '|' in a name is displayed as ','
+            book.author_names = ', '.join(author.name.replace('|', ',') for author in (book.ordered_authors or []))
+            book.cover_url = f"/cover/{book.id}" if book.has_cover else "/static/generic_cover.jpg"
+
+        # Read the primary author from the ordered list itself: splitting the
+        # joined author_names on ',' truncates any name that contains a comma
+        # (e.g. "Doe, John" would be reported as "Doe").
+        newest = books[0]
+        group_author = newest.ordered_authors[0].name.replace('|', ',').strip() if newest.ordered_authors else ''
+        book_ids = [book.id for book in books]
+
+        duplicate_groups.append({
+            'title': newest.title,
+            'author': group_author,
+            'count': len(books),
+            'books': books
+        })
+        print(f"[cwa-duplicates] Found duplicate group: '{newest.title}' by {group_author} ({len(books)} copies) - IDs: {book_ids}", flush=True)
+        log.info("[cwa-duplicates] Found duplicate group: '%s' by %s (%s copies) - IDs: %s",
+                 newest.title, group_author, len(books), book_ids)
+
+    # Sort by title, then author for consistent display
+    duplicate_groups.sort(key=lambda x: (x['title'].lower(), x['author'].lower()))
+
+    print(f"[cwa-duplicates] Found {len(duplicate_groups)} duplicate groups total", flush=True)
+
+    return duplicate_groups
@@ -33,6 +33,7 @@ def main():
     from .error_handler import init_errorhandler
     from .remotelogin import remotelogin
     from .kosync import kosync
+    from .duplicates import duplicates
     try:
         from .kobo import kobo, get_kobo_activated
         from .kobo_auth import kobo_auth
@@ -78,6 +79,7 @@ def main():
     app.register_blueprint(gdrive)
     app.register_blueprint(editbook)
     app.register_blueprint(kosync)
+    app.register_blueprint(duplicates)
     if kobo_available:
         app.register_blueprint(kobo)
         app.register_blueprint(kobo_auth)
 
@@ -99,6 +99,11 @@ def get_sidebar_config(kwargs=None):
             {"glyph": "glyphicon-th-list", "text": _('Books List'), "link": 'web.books_table', "id": "list",
              "visibility": constants.SIDEBAR_LIST, 'public': (not current_user.is_anonymous), "page": "list",
              "show_text": _('Show Books List'), "config_show": content})
+    if current_user.role_admin():
+        sidebar.append(
+            {"glyph": "glyphicon-copy", "text": _('Duplicates'), "link": 'duplicates.show_duplicates', "id": "duplicates",
+             "visibility": constants.SIDEBAR_DUPLICATES, 'public': (not current_user.is_anonymous), "page": "duplicates",
+             "show_text": _('Show Duplicate Books'), "config_show": content})
     g.shelves_access = ub.session.query(ub.Shelf).filter(
         or_(ub.Shelf.is_public == 1, ub.Shelf.user_id == current_user.id)).order_by(ub.Shelf.name).all()