Name: jbaruch/nanoclaw-media
Rating: 73.83 (1 reviews)
Author: jbaruch
jbaruch/nanoclaw-media

Personal entertainment-media skills for NanoClaw: Trakt watch-history sync, TV-show and audiobook recommendations, watchlist release checks, YouTube channel-comment digests, and Audible backup — with a weekly cadence companion. NanoClaw per-chat overlay tile.
Quality
92%
Does it follow best practices?
Impact
—
No eval scenarios have been run
Security
Risky
Do not use without reviewing
#!/usr/bin/env python3
"""
Append new Audible books to books-library.csv.

Reads JSON from stdin (audible_backup tool output).
Deduplicates by ASIN against existing CSV rows AND within the input
payload (duplicate ASINs appearing twice in a single `books` array
collapse to one row). On a brand-new or empty target CSV, the CSV
header row is written before data so the next run's `csv.DictReader`
can parse it correctly.
Outputs JSON summary to stdout.

Concurrency: read-existing → check-new → append is wrapped in an advisory
exclusive file lock (fcntl.flock) so two simultaneous runs can't both see the
same "existing" set and double-write the same books.
"""

import csv
import fcntl
import json
import os
import sys

# Target CSV file; the BOOKS_CSV environment variable overrides the default path.
CSV_PATH = os.environ.get("BOOKS_CSV", "/workspace/group/books-library.csv")


def _lock_path_for(csv_path):
    """Build the lock-file path that sits next to ``csv_path``.

    The lock path is computed from the argument on every call instead of
    being a module-level constant bound to CSV_PATH, so whichever CSV a
    caller hands to `append_books_locked(csv_path=...)` is guarded by its
    own `<csv_path>.lock` file. Production therefore locks
    `<CSV_PATH>.lock`, while tests writing elsewhere lock their own
    sibling file.
    """
    lock_suffix = ".lock"
    return csv_path + lock_suffix


# Column names of books-library.csv, in file order. map_book() seeds every
# one of these with "" and the csv.DictWriter in append_books_locked() uses
# the list as its fieldnames, so this order is the on-disk column order.
HEADERS = [
    "Key",
    "Title",
    "Author",
    "Narrated By",
    "Purchase Date",
    "Duration",
    "Release Date",
    "Ave. Rating",
    "Genre",
    "Series Name",
    "Series Sequence",
    "Product ID",
    "ASIN",
    "Book URL",
    "Summary",
    "Description",
    "Rating Count",
    "Publisher",
    "Short Title",
    "Copyright",
    "Author URL",
    "File name",
    "Series URL",
    "Abridged",
    "Language",
    "PDF URL",
    "Image URL",
    "Region",
    "File Paths",
    "AYCE",
    "Read Status",
    "User ID",
    "Audible (AAX)",
    "MP3",
    "Image",
    "M4B",
    "PDF",
]


def minutes_to_duration(mins):
    """Format a runtime given in minutes as an ``HH:MM:00`` string.

    Falsy input (None, 0, "") and values that ``int()`` rejects with
    ValueError or TypeError produce an empty string.
    """
    if mins:
        try:
            total_minutes = int(mins)
        except (ValueError, TypeError):
            return ""
        hours, minutes = divmod(total_minutes, 60)
        return f"{hours:02d}:{minutes:02d}:00"
    return ""


def _cell(value):
    """Return ``value`` as CSV cell text, rendering None (JSON null) as ""."""
    return "" if value is None else str(value)


def map_book(book):
    """Map one audible_backup JSON book object to a CSV row dict.

    Every column in HEADERS is present in the result; columns the payload
    has no source for stay as "". Language, Region, Abridged and AYCE are
    filled with fixed values, and Key / Product ID reuse the ASIN.

    Args:
        book: dict for one book from the tool output.

    Returns:
        dict keyed by the HEADERS column names.
    """
    row = dict.fromkeys(HEADERS, "")

    asin = book.get("asin", "")
    title = book.get("title", "")

    row["ASIN"] = asin
    row["Title"] = title
    row["Short Title"] = title
    row["Author"] = book.get("authors", "")
    row["Narrated By"] = book.get("narrators", "")
    row["Genre"] = book.get("genres", "")
    # Fields that are stringified go through _cell so an explicit JSON null
    # becomes an empty cell; a bare str() would write the literal text
    # "None" into the CSV.
    row["Ave. Rating"] = _cell(book.get("rating"))
    row["Rating Count"] = _cell(book.get("num_ratings"))
    row["Image URL"] = book.get("cover_url", "")
    row["Series Name"] = book.get("series_title", "")
    row["Series Sequence"] = book.get("series_sequence", "")
    row["Duration"] = minutes_to_duration(book.get("runtime_length_min"))
    row["Language"] = "english"
    row["Region"] = "US"
    row["Abridged"] = "false"
    row["AYCE"] = "false"

    # Purchase date: keep only the part before "T" when a datetime is given.
    row["Purchase Date"] = _cell(book.get("purchase_date")).partition("T")[0]

    row["Release Date"] = _cell(book.get("release_date"))

    # Read status: only finished books are marked.
    row["Read Status"] = "Finished" if book.get("is_finished", False) else ""

    # M4B path from download
    row["M4B"] = book.get("m4b_path", "")

    # Product ID and Key use ASIN as fallback
    row["Key"] = asin
    row["Product ID"] = asin

    return row


def get_existing_asins(csv_path):
    """Return the set of non-empty, whitespace-stripped ASINs in the CSV.

    Args:
        csv_path: Path of the CSV file to scan.

    Returns:
        set of ASIN strings; empty when the file does not exist, has no
        "ASIN" column, or holds no non-blank ASIN values.
    """
    asins = set()
    try:
        f = open(csv_path, newline="", encoding="utf-8")
    except FileNotFoundError:
        # No CSV yet (first run): nothing has been recorded.
        return asins
    with f:
        for row in csv.DictReader(f):
            # DictReader fills the missing trailing fields of a short row
            # with None, so a default passed to .get() is not enough —
            # coerce None to "" before stripping instead of crashing.
            asin = (row.get("ASIN") or "").strip()
            if asin:
                asins.add(asin)
    return asins


def _ends_without_newline(csv_path):
    """Return True when the non-empty file at csv_path lacks a final line break."""
    with open(csv_path, "rb") as fh:
        fh.seek(-1, os.SEEK_END)
        return fh.read(1) not in (b"\n", b"\r")


def append_books_locked(csv_path, books):
    """Append new book rows to the CSV under an exclusive advisory lock.

    Args:
        csv_path: CSV file to append to; it is created (with a header row)
            when missing or empty.
        books: Iterable of book dicts from the audible_backup payload.

    Returns:
        Tuple ``(appended, existing_count, skipped)``: ``appended`` is a
        list of ``{"asin", "title", "author", "series"}`` dicts for the
        rows written, ``existing_count`` is the number of distinct ASINs
        found in the CSV before writing, and ``skipped`` is
        ``len(books) - len(appended)`` (already-present ASINs, duplicates
        within ``books``, and entries without an ASIN).
    """
    # Use a sibling lock file — per csv_path, not a global — so tests or
    # alternative output paths get their own lock and don't contend
    # with readers of the CSV itself. flock is held for the entire
    # read-check-write window.
    lock_path = _lock_path_for(csv_path)
    # Mode "a" instead of "w": "w" would truncate the lockfile on every
    # run. The file content is irrelevant — flock only needs a valid fd —
    # so "a" leaves the file alone and is safe across concurrent openers.
    with open(lock_path, "a") as lock_fh:
        fcntl.flock(lock_fh.fileno(), fcntl.LOCK_EX)
        try:
            existing = get_existing_asins(csv_path)
            # Dedup against BOTH the existing CSV and the input itself so
            # an ASIN that appears twice in `books` lands only once.
            seen = set(existing)
            new_books = []
            for book in books:
                raw_asin = book.get("asin")
                if not raw_asin:
                    continue
                # Compare on the same form the ASIN has when read back
                # from the CSV (a stripped string). Comparing the raw
                # value would let a padded or non-string ASIN miss the
                # existing set and be appended again on every run.
                key = str(raw_asin).strip()
                if not key or key in seen:
                    continue
                seen.add(key)
                new_books.append(book)

            appended = []
            if new_books:
                # If the CSV doesn't exist yet OR is empty, write the
                # header before data rows. Without it the next run's
                # csv.DictReader would treat the first data row as the
                # header and dedup would quietly fail. Checked inside the
                # lock so two concurrent first runs can't both write it.
                needs_header = not os.path.exists(csv_path) or os.path.getsize(csv_path) == 0
                # A file whose last line has no line break (e.g. after a
                # manual edit) would otherwise get the first new record
                # glued onto its last existing record.
                needs_separator = not needs_header and _ends_without_newline(csv_path)
                with open(csv_path, "a", newline="", encoding="utf-8") as f:
                    if needs_separator:
                        # Same terminator the csv writer emits by default.
                        f.write("\r\n")
                    writer = csv.DictWriter(f, fieldnames=HEADERS, quoting=csv.QUOTE_ALL)
                    if needs_header:
                        writer.writeheader()
                    for book in new_books:
                        row = map_book(book)
                        writer.writerow(row)
                        appended.append(
                            {
                                "asin": row["ASIN"],
                                "title": row["Title"],
                                "author": row["Author"],
                                "series": row["Series Name"],
                            }
                        )

            skipped = len(books) - len(appended)
            return appended, len(existing), skipped
        finally:
            fcntl.flock(lock_fh.fileno(), fcntl.LOCK_UN)


def main():
    """Read the tool's JSON from stdin, append new books, print a JSON summary.

    With a missing or empty ``books`` list nothing is written and a zeroed
    summary is printed. Otherwise the books go through
    ``append_books_locked`` against CSV_PATH and the summary reports what
    was appended and skipped.
    """
    payload = json.load(sys.stdin)
    incoming = payload.get("books", [])

    if incoming:
        added, known_before, skipped_count = append_books_locked(CSV_PATH, incoming)
        summary = {
            "appended": len(added),
            "skipped_existing": skipped_count,
            "csv_total": known_before + len(added),
            "books": added,
        }
    else:
        summary = {"appended": 0, "skipped_existing": 0, "books": []}

    print(json.dumps(summary))


# Run main() only when this file is executed as a script, not when imported.
if __name__ == "__main__":
    main()
jbaruch/nanoclaw-media

csv-append.py (skills/audible-backup/scripts/)

csv-append.py (skills/audible-backup/scripts/)